diff --git "a/wandb/run-20220317_145036-3tnpukko/files/wandb-summary.json" "b/wandb/run-20220317_145036-3tnpukko/files/wandb-summary.json" --- "a/wandb/run-20220317_145036-3tnpukko/files/wandb-summary.json" +++ "b/wandb/run-20220317_145036-3tnpukko/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 3.0179, "train/learning_rate": 4.591836734693877e-06, "train/epoch": 1.0, "train/global_step": 892, "_runtime": 5009, "_timestamp": 1647533645, "_step": 892, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 7.0, 197.0, 544.0, 249.0, 18.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7681227922439575, -1.2875614166259766, -0.8070001006126404, -0.3264387845993042, 0.15412259101867676, 0.6346839666366577, 1.1152452230453491, 1.5958067178726196, 2.0763678550720215, 2.556929111480713, 3.0374906063079834, 3.518051862716675, 3.9986133575439453, 4.479174613952637, 4.959735870361328, 5.4402971267700195, 5.920858860015869, 6.4014201164245605, 6.881981372833252, 7.362543106079102, 7.843104362487793, 8.323665618896484, 8.804226875305176, 9.284788131713867, 9.765349388122559, 10.24591064453125, 10.726471900939941, 11.207033157348633, 11.687594413757324, 12.168155670166016, 12.648717880249023, 13.129279136657715, 13.60983943939209, 14.090400695800781, 14.570961952209473, 15.051523208618164, 15.532084465026855, 16.012645721435547, 16.493207931518555, 16.97376823425293, 17.454330444335938, 17.934892654418945, 18.41545295715332, 18.896015167236328, 19.376575469970703, 19.85713768005371, 20.337697982788086, 20.818260192871094, 21.29882049560547, 21.779382705688477, 22.25994300842285, 22.74050521850586, 23.221065521240234, 23.701627731323242, 24.182188034057617, 24.662750244140625, 25.143312454223633, 25.62387466430664, 26.104434967041016, 26.584997177124023, 27.0655574798584, 27.546119689941406, 28.02667999267578, 28.50724220275879, 28.987802505493164]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 6.0, 3.0, 6.0, 9.0, 12.0, 18.0, 16.0, 11.0, 20.0, 17.0, 22.0, 32.0, 28.0, 26.0, 34.0, 36.0, 33.0, 41.0, 41.0, 39.0, 33.0, 39.0, 41.0, 41.0, 46.0, 30.0, 40.0, 37.0, 27.0, 40.0, 25.0, 22.0, 20.0, 14.0, 19.0, 15.0, 20.0, 7.0, 12.0, 8.0, 5.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.695791721343994, -3.598155975341797, -3.5005202293395996, -3.4028844833374023, -3.305248737335205, -3.207612991333008, -3.1099772453308105, -3.012341260910034, -2.914705514907837, -2.8170697689056396, -2.7194340229034424, -2.621798276901245, -2.524162530899048, -2.4265265464782715, -2.328890800476074, -2.231255054473877, -2.1336193084716797, -2.0359835624694824, -1.9383478164672852, -1.840712070465088, -1.743076205253601, -1.6454404592514038, -1.5478047132492065, -1.4501688480377197, -1.3525333404541016, -1.2548975944519043, -1.157261848449707, -1.0596261024475098, -0.961990237236023, -0.8643544912338257, -0.7667187452316284, -0.6690829396247864, -0.5714471340179443, -0.4738113582134247, -0.37617558240890503, -0.27853983640670776, -0.1809040606021881, -0.08326828479766846, 0.014367461204528809, 0.11200326681137085, 0.20963901281356812, 0.30727478861808777, 0.4049105644226074, 0.5025463104248047, 0.600182056427002, 0.697817862033844, 0.7954536080360413, 0.8930894136428833, 0.9907251596450806, 1.0883609056472778, 1.185996651649475, 1.283632516860962, 1.3812682628631592, 1.4789040088653564, 1.5765397548675537, 1.674175500869751, 1.7718112468719482, 1.8694469928741455, 1.9670827388763428, 2.06471848487854, 2.1623542308807373, 2.2599902153015137, 2.357625961303711, 2.455261707305908, 2.5528974533081055]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 1.0, 5.0, 4.0, 7.0, 10.0, 11.0, 32.0, 34.0, 54.0, 72.0, 103.0, 147.0, 290.0, 423.0, 776.0, 1480.0, 2667.0, 5174.0, 10941.0, 24908.0, 57350.0, 134043.0, 304513.0, 687304.0, 1346694.0, 903490.0, 398829.0, 175166.0, 76072.0, 33459.0, 15167.0, 7155.0, 3531.0, 1914.0, 1015.0, 551.0, 325.0, 192.0, 120.0, 83.0, 52.0, 32.0, 18.0, 25.0, 21.0, 12.0, 4.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.310546875, -2.241943359375, -2.17333984375, -2.104736328125, -2.0361328125, -1.967529296875, -1.89892578125, -1.830322265625, -1.76171875, -1.693115234375, -1.62451171875, -1.555908203125, -1.4873046875, -1.418701171875, -1.35009765625, -1.281494140625, -1.212890625, -1.144287109375, -1.07568359375, -1.007080078125, -0.9384765625, -0.869873046875, -0.80126953125, -0.732666015625, -0.6640625, -0.595458984375, -0.52685546875, -0.458251953125, -0.3896484375, -0.321044921875, -0.25244140625, -0.183837890625, -0.115234375, -0.046630859375, 0.02197265625, 0.090576171875, 0.1591796875, 0.227783203125, 0.29638671875, 0.364990234375, 0.43359375, 0.502197265625, 0.57080078125, 0.639404296875, 0.7080078125, 0.776611328125, 0.84521484375, 0.913818359375, 0.982421875, 1.051025390625, 1.11962890625, 1.188232421875, 1.2568359375, 1.325439453125, 1.39404296875, 1.462646484375, 1.53125, 1.599853515625, 1.66845703125, 1.737060546875, 1.8056640625, 1.874267578125, 1.94287109375, 2.011474609375, 2.080078125]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 1.0, 6.0, 6.0, 5.0, 10.0, 6.0, 16.0, 12.0, 17.0, 24.0, 24.0, 31.0, 24.0, 29.0, 35.0, 41.0, 30.0, 33.0, 51.0, 40.0, 38.0, 44.0, 40.0, 58.0, 32.0, 42.0, 34.0, 29.0, 29.0, 24.0, 24.0, 28.0, 27.0, 21.0, 21.0, 10.0, 16.0, 9.0, 8.0, 10.0, 5.0, 4.0, 6.0, 4.0, 1.0, 0.0, 2.0, 2.0], "bins": [-4.015625, -3.90777587890625, -3.7999267578125, -3.69207763671875, -3.584228515625, -3.47637939453125, -3.3685302734375, -3.26068115234375, -3.15283203125, -3.04498291015625, -2.9371337890625, -2.82928466796875, -2.721435546875, -2.61358642578125, -2.5057373046875, -2.39788818359375, -2.2900390625, -2.18218994140625, -2.0743408203125, -1.96649169921875, -1.858642578125, -1.75079345703125, -1.6429443359375, -1.53509521484375, -1.42724609375, -1.31939697265625, -1.2115478515625, -1.10369873046875, -0.995849609375, -0.88800048828125, -0.7801513671875, -0.67230224609375, -0.564453125, -0.45660400390625, -0.3487548828125, -0.24090576171875, -0.133056640625, -0.02520751953125, 0.0826416015625, 0.19049072265625, 0.29833984375, 0.40618896484375, 0.5140380859375, 0.62188720703125, 0.729736328125, 0.83758544921875, 0.9454345703125, 1.05328369140625, 1.1611328125, 1.26898193359375, 1.3768310546875, 1.48468017578125, 1.592529296875, 1.70037841796875, 1.8082275390625, 1.91607666015625, 2.02392578125, 2.13177490234375, 2.2396240234375, 2.34747314453125, 2.455322265625, 2.56317138671875, 2.6710205078125, 2.77886962890625, 2.88671875]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 2.0, 8.0, 12.0, 17.0, 16.0, 45.0, 124.0, 382.0, 56488.0, 4136465.0, 432.0, 150.0, 67.0, 32.0, 27.0, 8.0, 7.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.9375, -72.6748046875, -68.412109375, -64.1494140625, -59.88671875, -55.6240234375, -51.361328125, -47.0986328125, -42.8359375, -38.5732421875, -34.310546875, -30.0478515625, -25.78515625, -21.5224609375, -17.259765625, -12.9970703125, -8.734375, -4.4716796875, -0.208984375, 4.0537109375, 8.31640625, 12.5791015625, 16.841796875, 21.1044921875, 25.3671875, 29.6298828125, 33.892578125, 38.1552734375, 42.41796875, 46.6806640625, 50.943359375, 55.2060546875, 59.46875, 63.7314453125, 67.994140625, 72.2568359375, 76.51953125, 80.7822265625, 85.044921875, 89.3076171875, 93.5703125, 97.8330078125, 102.095703125, 106.3583984375, 110.62109375, 114.8837890625, 119.146484375, 123.4091796875, 127.671875, 131.9345703125, 136.197265625, 140.4599609375, 144.72265625, 148.9853515625, 153.248046875, 157.5107421875, 161.7734375, 166.0361328125, 170.298828125, 174.5615234375, 178.82421875, 183.0869140625, 187.349609375, 191.6123046875, 195.875]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 6.0, 5.0, 14.0, 18.0, 15.0, 43.0, 95.0, 195.0, 549.0, 1536.0, 966.0, 303.0, 156.0, 71.0, 37.0, 29.0, 16.0, 10.0, 7.0, 6.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.849609375, -1.7603759765625, -1.671142578125, -1.5819091796875, -1.49267578125, -1.4034423828125, -1.314208984375, -1.2249755859375, -1.1357421875, -1.0465087890625, -0.957275390625, -0.8680419921875, -0.77880859375, -0.6895751953125, -0.600341796875, -0.5111083984375, -0.421875, -0.3326416015625, -0.243408203125, -0.1541748046875, -0.06494140625, 0.0242919921875, 0.113525390625, 0.2027587890625, 0.2919921875, 0.3812255859375, 0.470458984375, 0.5596923828125, 0.64892578125, 0.7381591796875, 0.827392578125, 0.9166259765625, 1.005859375, 1.0950927734375, 1.184326171875, 1.2735595703125, 1.36279296875, 1.4520263671875, 1.541259765625, 1.6304931640625, 1.7197265625, 1.8089599609375, 1.898193359375, 1.9874267578125, 2.07666015625, 2.1658935546875, 2.255126953125, 2.3443603515625, 2.43359375, 2.5228271484375, 2.612060546875, 2.7012939453125, 2.79052734375, 2.8797607421875, 2.968994140625, 3.0582275390625, 3.1474609375, 3.2366943359375, 3.325927734375, 3.4151611328125, 3.50439453125, 3.5936279296875, 3.682861328125, 3.7720947265625, 3.861328125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 10.0, 14.0, 21.0, 20.0, 36.0, 48.0, 63.0, 82.0, 89.0, 90.0, 117.0, 94.0, 98.0, 61.0, 49.0, 40.0, 23.0, 19.0, 13.0, 7.0, 7.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.2791056632995605, -6.09200382232666, -5.90490198135376, -5.717800140380859, -5.530697822570801, -5.3435959815979, -5.156494140625, -4.9693922996521, -4.782290458679199, -4.595188617706299, -4.408086776733398, -4.220984935760498, -4.033883094787598, -3.846781015396118, -3.6596789360046387, -3.4725770950317383, -3.285475254058838, -3.0983734130859375, -2.911271572113037, -2.7241694927215576, -2.5370676517486572, -2.349965810775757, -2.1628637313842773, -1.975761890411377, -1.7886600494384766, -1.6015582084655762, -1.4144562482833862, -1.2273542881011963, -1.040252447128296, -0.8531505465507507, -0.6660486459732056, -0.4789466857910156, -0.29184436798095703, -0.10474246740341187, 0.0823594331741333, 0.26946133375167847, 0.45656323432922363, 0.6436651349067688, 0.830767035484314, 1.017868995666504, 1.2049708366394043, 1.3920726776123047, 1.5791746377944946, 1.7662765979766846, 1.953378438949585, 2.1404802799224854, 2.327582359313965, 2.5146842002868652, 2.7017860412597656, 2.888887882232666, 3.0759897232055664, 3.263091802597046, 3.4501936435699463, 3.6372954845428467, 3.824397563934326, 4.011499404907227, 4.198601245880127, 4.385703086853027, 4.572804927825928, 4.759906768798828, 4.947009086608887, 5.134110927581787, 5.3212127685546875, 5.508314609527588, 5.695416450500488]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 4.0, 2.0, 4.0, 6.0, 11.0, 14.0, 7.0, 14.0, 18.0, 18.0, 21.0, 22.0, 34.0, 24.0, 32.0, 38.0, 28.0, 39.0, 37.0, 41.0, 44.0, 43.0, 46.0, 39.0, 44.0, 33.0, 37.0, 34.0, 41.0, 32.0, 38.0, 27.0, 30.0, 18.0, 9.0, 20.0, 11.0, 9.0, 13.0, 3.0, 4.0, 7.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0], "bins": [-3.8008768558502197, -3.698765754699707, -3.5966548919677734, -3.49454402923584, -3.392432928085327, -3.2903218269348145, -3.188210964202881, -3.0861001014709473, -2.9839890003204346, -2.881877899169922, -2.7797670364379883, -2.6776561737060547, -2.575545072555542, -2.4734339714050293, -2.3713231086730957, -2.269212245941162, -2.1671011447906494, -2.0649900436401367, -1.9628791809082031, -1.86076819896698, -1.7586572170257568, -1.6565462350845337, -1.5544352531433105, -1.4523242712020874, -1.3502132892608643, -1.2481023073196411, -1.145991325378418, -1.0438803434371948, -0.9417693614959717, -0.8396583795547485, -0.7375473976135254, -0.6354364156723022, -0.5333254337310791, -0.43121445178985596, -0.3291034698486328, -0.22699248790740967, -0.12488150596618652, -0.02277052402496338, 0.07934045791625977, 0.1814514398574829, 0.28356242179870605, 0.3856734037399292, 0.48778438568115234, 0.5898953676223755, 0.6920063495635986, 0.7941173315048218, 0.8962283134460449, 0.9983392953872681, 1.1004502773284912, 1.2025612592697144, 1.3046722412109375, 1.4067832231521606, 1.5088942050933838, 1.611005187034607, 1.71311616897583, 1.8152271509170532, 1.9173381328582764, 2.019449234008789, 2.1215600967407227, 2.2236709594726562, 2.325782060623169, 2.4278931617736816, 2.5300040245056152, 2.632114887237549, 2.7342259883880615]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 3.0, 5.0, 5.0, 8.0, 8.0, 16.0, 16.0, 31.0, 44.0, 62.0, 85.0, 117.0, 196.0, 305.0, 547.0, 863.0, 1654.0, 3220.0, 5935.0, 11773.0, 23152.0, 44878.0, 84487.0, 142148.0, 198286.0, 200993.0, 145669.0, 86844.0, 47050.0, 24402.0, 12192.0, 6203.0, 3253.0, 1693.0, 940.0, 559.0, 307.0, 201.0, 111.0, 82.0, 48.0, 47.0, 39.0, 29.0, 13.0, 12.0, 10.0, 6.0, 3.0, 1.0, 5.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.6669921875, -0.6431961059570312, -0.6194000244140625, -0.5956039428710938, -0.571807861328125, -0.5480117797851562, -0.5242156982421875, -0.5004196166992188, -0.47662353515625, -0.45282745361328125, -0.4290313720703125, -0.40523529052734375, -0.381439208984375, -0.35764312744140625, -0.3338470458984375, -0.31005096435546875, -0.2862548828125, -0.26245880126953125, -0.2386627197265625, -0.21486663818359375, -0.191070556640625, -0.16727447509765625, -0.1434783935546875, -0.11968231201171875, -0.09588623046875, -0.07209014892578125, -0.0482940673828125, -0.02449798583984375, -0.000701904296875, 0.02309417724609375, 0.0468902587890625, 0.07068634033203125, 0.094482421875, 0.11827850341796875, 0.1420745849609375, 0.16587066650390625, 0.189666748046875, 0.21346282958984375, 0.2372589111328125, 0.26105499267578125, 0.28485107421875, 0.30864715576171875, 0.3324432373046875, 0.35623931884765625, 0.380035400390625, 0.40383148193359375, 0.4276275634765625, 0.45142364501953125, 0.4752197265625, 0.49901580810546875, 0.5228118896484375, 0.5466079711914062, 0.570404052734375, 0.5942001342773438, 0.6179962158203125, 0.6417922973632812, 0.66558837890625, 0.6893844604492188, 0.7131805419921875, 0.7369766235351562, 0.760772705078125, 0.7845687866210938, 0.8083648681640625, 0.8321609497070312, 0.85595703125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 5.0, 5.0, 5.0, 2.0, 6.0, 8.0, 7.0, 15.0, 9.0, 24.0, 16.0, 15.0, 26.0, 32.0, 29.0, 33.0, 27.0, 37.0, 42.0, 51.0, 36.0, 53.0, 42.0, 40.0, 46.0, 38.0, 46.0, 40.0, 38.0, 32.0, 33.0, 22.0, 28.0, 22.0, 23.0, 12.0, 15.0, 15.0, 7.0, 7.0, 3.0, 5.0, 1.0, 2.0, 2.0, 3.0, 4.0, 0.0, 0.0, 2.0], "bins": [-2.826171875, -2.748443603515625, -2.67071533203125, -2.592987060546875, -2.5152587890625, -2.437530517578125, -2.35980224609375, -2.282073974609375, -2.204345703125, -2.126617431640625, -2.04888916015625, -1.971160888671875, -1.8934326171875, -1.815704345703125, -1.73797607421875, -1.660247802734375, -1.58251953125, -1.504791259765625, -1.42706298828125, -1.349334716796875, -1.2716064453125, -1.193878173828125, -1.11614990234375, -1.038421630859375, -0.960693359375, -0.882965087890625, -0.80523681640625, -0.727508544921875, -0.6497802734375, -0.572052001953125, -0.49432373046875, -0.416595458984375, -0.3388671875, -0.261138916015625, -0.18341064453125, -0.105682373046875, -0.0279541015625, 0.049774169921875, 0.12750244140625, 0.205230712890625, 0.282958984375, 0.360687255859375, 0.43841552734375, 0.516143798828125, 0.5938720703125, 0.671600341796875, 0.74932861328125, 0.827056884765625, 0.90478515625, 0.982513427734375, 1.06024169921875, 1.137969970703125, 1.2156982421875, 1.293426513671875, 1.37115478515625, 1.448883056640625, 1.526611328125, 1.604339599609375, 1.68206787109375, 1.759796142578125, 1.8375244140625, 1.915252685546875, 1.99298095703125, 2.070709228515625, 2.1484375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 6.0, 5.0, 8.0, 7.0, 12.0, 10.0, 19.0, 40.0, 56.0, 94.0, 160.0, 246.0, 442.0, 1065.0, 2335.0, 5992.0, 16914.0, 52296.0, 154361.0, 318471.0, 297061.0, 131855.0, 43532.0, 14557.0, 5102.0, 2034.0, 896.0, 426.0, 223.0, 118.0, 64.0, 53.0, 30.0, 26.0, 16.0, 8.0, 6.0, 3.0, 1.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0283203125, -0.998870849609375, -0.96942138671875, -0.939971923828125, -0.9105224609375, -0.881072998046875, -0.85162353515625, -0.822174072265625, -0.792724609375, -0.763275146484375, -0.73382568359375, -0.704376220703125, -0.6749267578125, -0.645477294921875, -0.61602783203125, -0.586578369140625, -0.55712890625, -0.527679443359375, -0.49822998046875, -0.468780517578125, -0.4393310546875, -0.409881591796875, -0.38043212890625, -0.350982666015625, -0.321533203125, -0.292083740234375, -0.26263427734375, -0.233184814453125, -0.2037353515625, -0.174285888671875, -0.14483642578125, -0.115386962890625, -0.0859375, -0.056488037109375, -0.02703857421875, 0.002410888671875, 0.0318603515625, 0.061309814453125, 0.09075927734375, 0.120208740234375, 0.149658203125, 0.179107666015625, 0.20855712890625, 0.238006591796875, 0.2674560546875, 0.296905517578125, 0.32635498046875, 0.355804443359375, 0.38525390625, 0.414703369140625, 0.44415283203125, 0.473602294921875, 0.5030517578125, 0.532501220703125, 0.56195068359375, 0.591400146484375, 0.620849609375, 0.650299072265625, 0.67974853515625, 0.709197998046875, 0.7386474609375, 0.768096923828125, 0.79754638671875, 0.826995849609375, 0.8564453125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 13.0, 6.0, 11.0, 29.0, 23.0, 23.0, 26.0, 35.0, 39.0, 51.0, 58.0, 62.0, 55.0, 57.0, 50.0, 62.0, 49.0, 60.0, 51.0, 44.0, 40.0, 37.0, 25.0, 22.0, 13.0, 15.0, 15.0, 11.0, 5.0, 4.0, 5.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.3203125, -7.11517333984375, -6.9100341796875, -6.70489501953125, -6.499755859375, -6.29461669921875, -6.0894775390625, -5.88433837890625, -5.67919921875, -5.47406005859375, -5.2689208984375, -5.06378173828125, -4.858642578125, -4.65350341796875, -4.4483642578125, -4.24322509765625, -4.0380859375, -3.83294677734375, -3.6278076171875, -3.42266845703125, -3.217529296875, -3.01239013671875, -2.8072509765625, -2.60211181640625, -2.39697265625, -2.19183349609375, -1.9866943359375, -1.78155517578125, -1.576416015625, -1.37127685546875, -1.1661376953125, -0.96099853515625, -0.755859375, -0.55072021484375, -0.3455810546875, -0.14044189453125, 0.064697265625, 0.26983642578125, 0.4749755859375, 0.68011474609375, 0.88525390625, 1.09039306640625, 1.2955322265625, 1.50067138671875, 1.705810546875, 1.91094970703125, 2.1160888671875, 2.32122802734375, 2.5263671875, 2.73150634765625, 2.9366455078125, 3.14178466796875, 3.346923828125, 3.55206298828125, 3.7572021484375, 3.96234130859375, 4.16748046875, 4.37261962890625, 4.5777587890625, 4.78289794921875, 4.988037109375, 5.19317626953125, 5.3983154296875, 5.60345458984375, 5.80859375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 7.0, 11.0, 10.0, 8.0, 20.0, 21.0, 36.0, 42.0, 81.0, 109.0, 185.0, 397.0, 710.0, 1601.0, 3501.0, 8691.0, 24165.0, 89788.0, 413188.0, 385531.0, 82533.0, 22962.0, 8336.0, 3359.0, 1584.0, 724.0, 396.0, 262.0, 104.0, 59.0, 43.0, 31.0, 20.0, 8.0, 15.0, 9.0, 9.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2322998046875, -0.22525405883789062, -0.21820831298828125, -0.21116256713867188, -0.2041168212890625, -0.19707107543945312, -0.19002532958984375, -0.18297958374023438, -0.175933837890625, -0.16888809204101562, -0.16184234619140625, -0.15479660034179688, -0.1477508544921875, -0.14070510864257812, -0.13365936279296875, -0.12661361694335938, -0.11956787109375, -0.11252212524414062, -0.10547637939453125, -0.09843063354492188, -0.0913848876953125, -0.08433914184570312, -0.07729339599609375, -0.07024765014648438, -0.063201904296875, -0.056156158447265625, -0.04911041259765625, -0.042064666748046875, -0.0350189208984375, -0.027973175048828125, -0.02092742919921875, -0.013881683349609375, -0.0068359375, 0.000209808349609375, 0.00725555419921875, 0.014301300048828125, 0.0213470458984375, 0.028392791748046875, 0.03543853759765625, 0.042484283447265625, 0.049530029296875, 0.056575775146484375, 0.06362152099609375, 0.07066726684570312, 0.0777130126953125, 0.08475875854492188, 0.09180450439453125, 0.09885025024414062, 0.10589599609375, 0.11294174194335938, 0.11998748779296875, 0.12703323364257812, 0.1340789794921875, 0.14112472534179688, 0.14817047119140625, 0.15521621704101562, 0.162261962890625, 0.16930770874023438, 0.17635345458984375, 0.18339920043945312, 0.1904449462890625, 0.19749069213867188, 0.20453643798828125, 0.21158218383789062, 0.2186279296875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 3.0, 4.0, 6.0, 9.0, 9.0, 17.0, 22.0, 32.0, 53.0, 84.0, 158.0, 150.0, 151.0, 120.0, 71.0, 38.0, 34.0, 14.0, 7.0, 7.0, 5.0, 6.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002765655517578125, -0.0002690330147743225, -0.0002615004777908325, -0.00025396794080734253, -0.00024643540382385254, -0.00023890286684036255, -0.00023137032985687256, -0.00022383779287338257, -0.00021630525588989258, -0.0002087727189064026, -0.0002012401819229126, -0.0001937076449394226, -0.00018617510795593262, -0.00017864257097244263, -0.00017111003398895264, -0.00016357749700546265, -0.00015604496002197266, -0.00014851242303848267, -0.00014097988605499268, -0.00013344734907150269, -0.0001259148120880127, -0.0001183822751045227, -0.00011084973812103271, -0.00010331720113754272, -9.578466415405273e-05, -8.825212717056274e-05, -8.071959018707275e-05, -7.318705320358276e-05, -6.565451622009277e-05, -5.812197923660278e-05, -5.058944225311279e-05, -4.30569052696228e-05, -3.552436828613281e-05, -2.7991831302642822e-05, -2.0459294319152832e-05, -1.2926757335662842e-05, -5.3942203521728516e-06, 2.1383166313171387e-06, 9.670853614807129e-06, 1.720339059829712e-05, 2.473592758178711e-05, 3.22684645652771e-05, 3.980100154876709e-05, 4.733353853225708e-05, 5.486607551574707e-05, 6.239861249923706e-05, 6.993114948272705e-05, 7.746368646621704e-05, 8.499622344970703e-05, 9.252876043319702e-05, 0.00010006129741668701, 0.000107593834400177, 0.00011512637138366699, 0.00012265890836715698, 0.00013019144535064697, 0.00013772398233413696, 0.00014525651931762695, 0.00015278905630111694, 0.00016032159328460693, 0.00016785413026809692, 0.00017538666725158691, 0.0001829192042350769, 0.0001904517412185669, 0.00019798427820205688, 0.00020551681518554688]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 8.0, 5.0, 6.0, 7.0, 22.0, 24.0, 37.0, 52.0, 119.0, 196.0, 900.0, 45684.0, 990458.0, 10126.0, 514.0, 141.0, 86.0, 56.0, 36.0, 24.0, 12.0, 11.0, 9.0, 6.0, 4.0, 2.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2705078125, -1.22998046875, -1.189453125, -1.14892578125, -1.1083984375, -1.06787109375, -1.02734375, -0.98681640625, -0.9462890625, -0.90576171875, -0.865234375, -0.82470703125, -0.7841796875, -0.74365234375, -0.703125, -0.66259765625, -0.6220703125, -0.58154296875, -0.541015625, -0.50048828125, -0.4599609375, -0.41943359375, -0.37890625, -0.33837890625, -0.2978515625, -0.25732421875, -0.216796875, -0.17626953125, -0.1357421875, -0.09521484375, -0.0546875, -0.01416015625, 0.0263671875, 0.06689453125, 0.107421875, 0.14794921875, 0.1884765625, 0.22900390625, 0.26953125, 0.31005859375, 0.3505859375, 0.39111328125, 0.431640625, 0.47216796875, 0.5126953125, 0.55322265625, 0.59375, 0.63427734375, 0.6748046875, 0.71533203125, 0.755859375, 0.79638671875, 0.8369140625, 0.87744140625, 0.91796875, 0.95849609375, 0.9990234375, 1.03955078125, 1.080078125, 1.12060546875, 1.1611328125, 1.20166015625, 1.2421875, 1.28271484375, 1.3232421875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 5.0, 7.0, 5.0, 9.0, 20.0, 20.0, 40.0, 41.0, 71.0, 81.0, 89.0, 106.0, 98.0, 92.0, 84.0, 68.0, 50.0, 38.0, 24.0, 17.0, 11.0, 9.0, 4.0, 1.0, 3.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.092529296875, -0.0892171859741211, -0.08590507507324219, -0.08259296417236328, -0.07928085327148438, -0.07596874237060547, -0.07265663146972656, -0.06934452056884766, -0.06603240966796875, -0.06272029876708984, -0.05940818786621094, -0.05609607696533203, -0.052783966064453125, -0.04947185516357422, -0.04615974426269531, -0.042847633361816406, -0.0395355224609375, -0.036223411560058594, -0.03291130065917969, -0.02959918975830078, -0.026287078857421875, -0.02297496795654297, -0.019662857055664062, -0.016350746154785156, -0.01303863525390625, -0.009726524353027344, -0.0064144134521484375, -0.0031023025512695312, 0.000209808349609375, 0.0035219192504882812, 0.0068340301513671875, 0.010146141052246094, 0.013458251953125, 0.016770362854003906, 0.020082473754882812, 0.02339458465576172, 0.026706695556640625, 0.03001880645751953, 0.03333091735839844, 0.036643028259277344, 0.03995513916015625, 0.043267250061035156, 0.04657936096191406, 0.04989147186279297, 0.053203582763671875, 0.05651569366455078, 0.05982780456542969, 0.0631399154663086, 0.0664520263671875, 0.0697641372680664, 0.07307624816894531, 0.07638835906982422, 0.07970046997070312, 0.08301258087158203, 0.08632469177246094, 0.08963680267333984, 0.09294891357421875, 0.09626102447509766, 0.09957313537597656, 0.10288524627685547, 0.10619735717773438, 0.10950946807861328, 0.11282157897949219, 0.1161336898803711, 0.11944580078125]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 13.0, 35.0, 104.0, 206.0, 306.0, 213.0, 91.0, 25.0, 10.0, 5.0, 3.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.611790418624878, -3.234570026397705, -2.8573496341705322, -2.4801292419433594, -2.1029086112976074, -1.7256883382797241, -1.3484678268432617, -0.9712474346160889, -0.594027042388916, -0.21680662035942078, 0.16041380167007446, 0.5376342535018921, 0.9148546457290649, 1.2920750379562378, 1.6692955493927002, 2.046515941619873, 2.423736333847046, 2.8009567260742188, 3.1781771183013916, 3.5553975105285645, 3.9326181411743164, 4.30983829498291, 4.687058925628662, 5.064279556274414, 5.441499710083008, 5.81872034072876, 6.1959404945373535, 6.5731611251831055, 6.950381278991699, 7.327601909637451, 7.704822540283203, 8.082042694091797, 8.459263801574707, 8.8364839553833, 9.213705062866211, 9.590925216674805, 9.968145370483398, 10.345365524291992, 10.722586631774902, 11.099806785583496, 11.47702693939209, 11.854247093200684, 12.231468200683594, 12.608688354492188, 12.985908508300781, 13.363128662109375, 13.740349769592285, 14.117569923400879, 14.494791030883789, 14.872011184692383, 15.249232292175293, 15.626452445983887, 16.003673553466797, 16.38089370727539, 16.758113861083984, 17.135334014892578, 17.512554168701172, 17.889774322509766, 18.26699447631836, 18.644214630126953, 19.02143669128418, 19.398656845092773, 19.775876998901367, 20.15309715270996, 20.530317306518555]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 6.0, 6.0, 3.0, 12.0, 10.0, 12.0, 15.0, 21.0, 19.0, 24.0, 32.0, 35.0, 31.0, 30.0, 31.0, 39.0, 45.0, 50.0, 54.0, 31.0, 53.0, 36.0, 51.0, 37.0, 40.0, 43.0, 37.0, 34.0, 31.0, 23.0, 14.0, 23.0, 16.0, 14.0, 11.0, 8.0, 5.0, 3.0, 9.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0], "bins": [-2.843140125274658, -2.7669174671173096, -2.69069504737854, -2.6144723892211914, -2.538249969482422, -2.4620273113250732, -2.3858048915863037, -2.309582233428955, -2.2333598136901855, -2.157137155532837, -2.0809147357940674, -2.0046920776367188, -1.9284696578979492, -1.8522469997406006, -1.7760244607925415, -1.6998019218444824, -1.6235792636871338, -1.5473567247390747, -1.4711341857910156, -1.3949116468429565, -1.3186891078948975, -1.2424664497375488, -1.1662439107894897, -1.0900213718414307, -1.0137988328933716, -0.9375762939453125, -0.8613537549972534, -0.7851311564445496, -0.7089086174964905, -0.6326860785484314, -0.5564634799957275, -0.48024094104766846, -0.4040184020996094, -0.3277958631515503, -0.2515732944011688, -0.17535074055194855, -0.09912818670272827, -0.02290564775466919, 0.05331692099571228, 0.12953948974609375, 0.20576202869415283, 0.2819845676422119, 0.3582071363925934, 0.43442970514297485, 0.5106522440910339, 0.586874783039093, 0.6630973815917969, 0.739319920539856, 0.815542459487915, 0.8917649984359741, 0.9679875373840332, 1.0442100763320923, 1.1204326152801514, 1.1966552734375, 1.272877812385559, 1.3491003513336182, 1.4253228902816772, 1.5015454292297363, 1.5777679681777954, 1.6539905071258545, 1.7302131652832031, 1.8064355850219727, 1.8826582431793213, 1.9588807821273804, 2.0351033210754395]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 7.0, 2.0, 11.0, 15.0, 15.0, 34.0, 39.0, 83.0, 121.0, 171.0, 359.0, 604.0, 1162.0, 2069.0, 3968.0, 8068.0, 19325.0, 53139.0, 179875.0, 443132.0, 228104.0, 66000.0, 22863.0, 9596.0, 4541.0, 2301.0, 1261.0, 680.0, 421.0, 260.0, 115.0, 74.0, 45.0, 29.0, 32.0, 15.0, 12.0, 9.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.091796875, -1.0522308349609375, -1.012664794921875, -0.9730987548828125, -0.93353271484375, -0.8939666748046875, -0.854400634765625, -0.8148345947265625, -0.7752685546875, -0.7357025146484375, -0.696136474609375, -0.6565704345703125, -0.61700439453125, -0.5774383544921875, -0.537872314453125, -0.4983062744140625, -0.458740234375, -0.4191741943359375, -0.379608154296875, -0.3400421142578125, -0.30047607421875, -0.2609100341796875, -0.221343994140625, -0.1817779541015625, -0.1422119140625, -0.1026458740234375, -0.063079833984375, -0.0235137939453125, 0.01605224609375, 0.0556182861328125, 0.095184326171875, 0.1347503662109375, 0.17431640625, 0.2138824462890625, 0.253448486328125, 0.2930145263671875, 0.33258056640625, 0.3721466064453125, 0.411712646484375, 0.4512786865234375, 0.4908447265625, 0.5304107666015625, 0.569976806640625, 0.6095428466796875, 0.64910888671875, 0.6886749267578125, 0.728240966796875, 0.7678070068359375, 0.807373046875, 0.8469390869140625, 0.886505126953125, 0.9260711669921875, 0.96563720703125, 1.0052032470703125, 1.044769287109375, 1.0843353271484375, 1.1239013671875, 1.1634674072265625, 1.203033447265625, 1.2425994873046875, 1.28216552734375, 1.3217315673828125, 1.361297607421875, 1.4008636474609375, 1.4404296875]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 3.0, 2.0, 3.0, 2.0, 2.0, 5.0, 8.0, 4.0, 7.0, 11.0, 17.0, 16.0, 21.0, 25.0, 26.0, 30.0, 40.0, 33.0, 37.0, 35.0, 40.0, 39.0, 50.0, 42.0, 57.0, 47.0, 53.0, 39.0, 48.0, 35.0, 37.0, 27.0, 39.0, 22.0, 16.0, 19.0, 13.0, 12.0, 7.0, 11.0, 7.0, 6.0, 3.0, 5.0, 5.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.2421875, -6.05816650390625, -5.8741455078125, -5.69012451171875, -5.506103515625, -5.32208251953125, -5.1380615234375, -4.95404052734375, -4.77001953125, -4.58599853515625, -4.4019775390625, -4.21795654296875, -4.033935546875, -3.84991455078125, -3.6658935546875, -3.48187255859375, -3.2978515625, -3.11383056640625, -2.9298095703125, -2.74578857421875, -2.561767578125, -2.37774658203125, -2.1937255859375, -2.00970458984375, -1.82568359375, -1.64166259765625, -1.4576416015625, -1.27362060546875, -1.089599609375, -0.90557861328125, -0.7215576171875, -0.53753662109375, -0.353515625, -0.16949462890625, 0.0145263671875, 0.19854736328125, 0.382568359375, 0.56658935546875, 0.7506103515625, 0.93463134765625, 1.11865234375, 1.30267333984375, 1.4866943359375, 1.67071533203125, 1.854736328125, 2.03875732421875, 2.2227783203125, 2.40679931640625, 2.5908203125, 2.77484130859375, 2.9588623046875, 3.14288330078125, 3.326904296875, 3.51092529296875, 3.6949462890625, 3.87896728515625, 4.06298828125, 4.24700927734375, 4.4310302734375, 4.61505126953125, 4.799072265625, 4.98309326171875, 5.1671142578125, 5.35113525390625, 5.53515625]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 2.0, 2.0, 4.0, 6.0, 2.0, 6.0, 10.0, 15.0, 17.0, 26.0, 36.0, 64.0, 82.0, 115.0, 159.0, 376.0, 960.0, 8576.0, 668770.0, 361629.0, 5908.0, 871.0, 346.0, 202.0, 114.0, 79.0, 55.0, 35.0, 25.0, 11.0, 7.0, 7.0, 8.0, 8.0, 3.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.11328125, -5.92767333984375, -5.7420654296875, -5.55645751953125, -5.370849609375, -5.18524169921875, -4.9996337890625, -4.81402587890625, -4.62841796875, -4.44281005859375, -4.2572021484375, -4.07159423828125, -3.885986328125, -3.70037841796875, -3.5147705078125, -3.32916259765625, -3.1435546875, -2.95794677734375, -2.7723388671875, -2.58673095703125, -2.401123046875, -2.21551513671875, -2.0299072265625, -1.84429931640625, -1.65869140625, -1.47308349609375, -1.2874755859375, -1.10186767578125, -0.916259765625, -0.73065185546875, -0.5450439453125, -0.35943603515625, -0.173828125, 0.01177978515625, 0.1973876953125, 0.38299560546875, 0.568603515625, 0.75421142578125, 0.9398193359375, 1.12542724609375, 1.31103515625, 1.49664306640625, 1.6822509765625, 1.86785888671875, 2.053466796875, 2.23907470703125, 2.4246826171875, 2.61029052734375, 2.7958984375, 2.98150634765625, 3.1671142578125, 3.35272216796875, 3.538330078125, 3.72393798828125, 3.9095458984375, 4.09515380859375, 4.28076171875, 4.46636962890625, 4.6519775390625, 4.83758544921875, 5.023193359375, 5.20880126953125, 5.3944091796875, 5.58001708984375, 5.765625]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 6.0, 1.0, 2.0, 3.0, 3.0, 4.0, 4.0, 6.0, 9.0, 12.0, 14.0, 7.0, 9.0, 19.0, 20.0, 25.0, 30.0, 25.0, 34.0, 31.0, 24.0, 47.0, 42.0, 39.0, 45.0, 41.0, 48.0, 43.0, 56.0, 45.0, 37.0, 37.0, 24.0, 32.0, 28.0, 28.0, 29.0, 19.0, 12.0, 11.0, 11.0, 13.0, 7.0, 9.0, 8.0, 4.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.35546875, -5.17584228515625, -4.9962158203125, -4.81658935546875, -4.636962890625, -4.45733642578125, -4.2777099609375, -4.09808349609375, -3.91845703125, -3.73883056640625, -3.5592041015625, -3.37957763671875, -3.199951171875, -3.02032470703125, -2.8406982421875, -2.66107177734375, -2.4814453125, -2.30181884765625, -2.1221923828125, -1.94256591796875, -1.762939453125, -1.58331298828125, -1.4036865234375, -1.22406005859375, -1.04443359375, -0.86480712890625, -0.6851806640625, -0.50555419921875, -0.325927734375, -0.14630126953125, 0.0333251953125, 0.21295166015625, 0.392578125, 0.57220458984375, 0.7518310546875, 0.93145751953125, 1.111083984375, 1.29071044921875, 1.4703369140625, 1.64996337890625, 1.82958984375, 2.00921630859375, 2.1888427734375, 2.36846923828125, 2.548095703125, 2.72772216796875, 2.9073486328125, 3.08697509765625, 3.2666015625, 3.44622802734375, 3.6258544921875, 3.80548095703125, 3.985107421875, 4.16473388671875, 4.3443603515625, 4.52398681640625, 4.70361328125, 4.88323974609375, 5.0628662109375, 5.24249267578125, 5.422119140625, 5.60174560546875, 5.7813720703125, 5.96099853515625, 6.140625]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 6.0, 2.0, 6.0, 9.0, 5.0, 10.0, 14.0, 29.0, 34.0, 64.0, 137.0, 278.0, 1103.0, 7395.0, 601973.0, 429093.0, 6751.0, 1081.0, 292.0, 111.0, 61.0, 33.0, 19.0, 20.0, 6.0, 12.0, 4.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6162109375, -1.565673828125, -1.51513671875, -1.464599609375, -1.4140625, -1.363525390625, -1.31298828125, -1.262451171875, -1.2119140625, -1.161376953125, -1.11083984375, -1.060302734375, -1.009765625, -0.959228515625, -0.90869140625, -0.858154296875, -0.8076171875, -0.757080078125, -0.70654296875, -0.656005859375, -0.60546875, -0.554931640625, -0.50439453125, -0.453857421875, -0.4033203125, -0.352783203125, -0.30224609375, -0.251708984375, -0.201171875, -0.150634765625, -0.10009765625, -0.049560546875, 0.0009765625, 0.051513671875, 0.10205078125, 0.152587890625, 0.203125, 0.253662109375, 0.30419921875, 0.354736328125, 0.4052734375, 0.455810546875, 0.50634765625, 0.556884765625, 0.607421875, 0.657958984375, 0.70849609375, 0.759033203125, 0.8095703125, 0.860107421875, 0.91064453125, 0.961181640625, 1.01171875, 1.062255859375, 1.11279296875, 1.163330078125, 1.2138671875, 1.264404296875, 1.31494140625, 1.365478515625, 1.416015625, 1.466552734375, 1.51708984375, 1.567626953125, 1.6181640625]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 9.0, 7.0, 11.0, 11.0, 14.0, 32.0, 32.0, 50.0, 77.0, 109.0, 211.0, 141.0, 86.0, 50.0, 47.0, 24.0, 22.0, 22.0, 13.0, 9.0, 7.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012445449829101562, -0.00012076832354068756, -0.0001170821487903595, -0.00011339597404003143, -0.00010970979928970337, -0.0001060236245393753, -0.00010233744978904724, -9.865127503871918e-05, -9.496510028839111e-05, -9.127892553806305e-05, -8.759275078773499e-05, -8.390657603740692e-05, -8.022040128707886e-05, -7.65342265367508e-05, -7.284805178642273e-05, -6.916187703609467e-05, -6.54757022857666e-05, -6.178952753543854e-05, -5.8103352785110474e-05, -5.441717803478241e-05, -5.0731003284454346e-05, -4.704482853412628e-05, -4.335865378379822e-05, -3.9672479033470154e-05, -3.598630428314209e-05, -3.2300129532814026e-05, -2.8613954782485962e-05, -2.4927780032157898e-05, -2.1241605281829834e-05, -1.755543053150177e-05, -1.3869255781173706e-05, -1.0183081030845642e-05, -6.496906280517578e-06, -2.810731530189514e-06, 8.754432201385498e-07, 4.561617970466614e-06, 8.247792720794678e-06, 1.1933967471122742e-05, 1.5620142221450806e-05, 1.930631697177887e-05, 2.2992491722106934e-05, 2.6678666472434998e-05, 3.036484122276306e-05, 3.4051015973091125e-05, 3.773719072341919e-05, 4.1423365473747253e-05, 4.510954022407532e-05, 4.879571497440338e-05, 5.2481889724731445e-05, 5.616806447505951e-05, 5.985423922538757e-05, 6.354041397571564e-05, 6.72265887260437e-05, 7.091276347637177e-05, 7.459893822669983e-05, 7.828511297702789e-05, 8.197128772735596e-05, 8.565746247768402e-05, 8.934363722801208e-05, 9.302981197834015e-05, 9.671598672866821e-05, 0.00010040216147899628, 0.00010408833622932434, 0.0001077745109796524, 0.00011146068572998047]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 9.0, 10.0, 16.0, 21.0, 26.0, 21.0, 49.0, 100.0, 277.0, 1200.0, 12226.0, 927862.0, 102317.0, 3451.0, 542.0, 171.0, 86.0, 64.0, 23.0, 28.0, 13.0, 12.0, 8.0, 2.0, 3.0, 6.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7314453125, -1.6732635498046875, -1.615081787109375, -1.5569000244140625, -1.49871826171875, -1.4405364990234375, -1.382354736328125, -1.3241729736328125, -1.2659912109375, -1.2078094482421875, -1.149627685546875, -1.0914459228515625, -1.03326416015625, -0.9750823974609375, -0.916900634765625, -0.8587188720703125, -0.800537109375, -0.7423553466796875, -0.684173583984375, -0.6259918212890625, -0.56781005859375, -0.5096282958984375, -0.451446533203125, -0.3932647705078125, -0.3350830078125, -0.2769012451171875, -0.218719482421875, -0.1605377197265625, -0.10235595703125, -0.0441741943359375, 0.014007568359375, 0.0721893310546875, 0.13037109375, 0.1885528564453125, 0.246734619140625, 0.3049163818359375, 0.36309814453125, 0.4212799072265625, 0.479461669921875, 0.5376434326171875, 0.5958251953125, 0.6540069580078125, 0.712188720703125, 0.7703704833984375, 0.82855224609375, 0.8867340087890625, 0.944915771484375, 1.0030975341796875, 1.061279296875, 1.1194610595703125, 1.177642822265625, 1.2358245849609375, 1.29400634765625, 1.3521881103515625, 1.410369873046875, 1.4685516357421875, 1.5267333984375, 1.5849151611328125, 1.643096923828125, 1.7012786865234375, 1.75946044921875, 1.8176422119140625, 1.875823974609375, 1.9340057373046875, 1.9921875]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 3.0, 8.0, 8.0, 6.0, 5.0, 23.0, 16.0, 27.0, 21.0, 47.0, 89.0, 129.0, 216.0, 125.0, 70.0, 72.0, 40.0, 35.0, 17.0, 10.0, 8.0, 9.0, 3.0, 7.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.304443359375, -0.2941169738769531, -0.28379058837890625, -0.2734642028808594, -0.2631378173828125, -0.2528114318847656, -0.24248504638671875, -0.23215866088867188, -0.221832275390625, -0.21150588989257812, -0.20117950439453125, -0.19085311889648438, -0.1805267333984375, -0.17020034790039062, -0.15987396240234375, -0.14954757690429688, -0.13922119140625, -0.12889480590820312, -0.11856842041015625, -0.10824203491210938, -0.0979156494140625, -0.08758926391601562, -0.07726287841796875, -0.06693649291992188, -0.056610107421875, -0.046283721923828125, -0.03595733642578125, -0.025630950927734375, -0.0153045654296875, -0.004978179931640625, 0.00534820556640625, 0.015674591064453125, 0.0260009765625, 0.036327362060546875, 0.04665374755859375, 0.056980133056640625, 0.0673065185546875, 0.07763290405273438, 0.08795928955078125, 0.09828567504882812, 0.108612060546875, 0.11893844604492188, 0.12926483154296875, 0.13959121704101562, 0.1499176025390625, 0.16024398803710938, 0.17057037353515625, 0.18089675903320312, 0.19122314453125, 0.20154953002929688, 0.21187591552734375, 0.22220230102539062, 0.2325286865234375, 0.24285507202148438, 0.25318145751953125, 0.2635078430175781, 0.273834228515625, 0.2841606140136719, 0.29448699951171875, 0.3048133850097656, 0.3151397705078125, 0.3254661560058594, 0.33579254150390625, 0.3461189270019531, 0.3564453125]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 5.0, 34.0, 204.0, 427.0, 274.0, 56.0, 14.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.37736177444458, -3.449653148651123, -2.521944761276245, -1.5942363739013672, -0.6665277481079102, 0.2611808776855469, 1.1888890266418457, 2.1165976524353027, 3.0443062782287598, 3.972014904022217, 4.899723052978516, 5.827431678771973, 6.75514030456543, 7.682848930358887, 8.610557556152344, 9.538265228271484, 10.465974807739258, 11.393683433532715, 12.321392059326172, 13.249099731445312, 14.176809310913086, 15.104516983032227, 16.0322265625, 16.95993423461914, 17.88764190673828, 18.815349578857422, 19.743059158325195, 20.670766830444336, 21.59847640991211, 22.52618408203125, 23.45389175415039, 24.381601333618164, 25.309310913085938, 26.237018585205078, 27.16472816467285, 28.092435836791992, 29.020145416259766, 29.947853088378906, 30.875560760498047, 31.80327033996582, 32.730979919433594, 33.658687591552734, 34.586395263671875, 35.51410675048828, 36.44181442260742, 37.36952209472656, 38.2972297668457, 39.224937438964844, 40.15264892578125, 41.08035659790039, 42.00806427001953, 42.93577575683594, 43.86348342895508, 44.79119110107422, 45.71889877319336, 46.6466064453125, 47.57431411743164, 48.50202178955078, 49.42972946166992, 50.35744094848633, 51.28514862060547, 52.21285629272461, 53.14056396484375, 54.068275451660156, 54.9959831237793]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 8.0, 4.0, 8.0, 11.0, 11.0, 10.0, 15.0, 14.0, 11.0, 24.0, 17.0, 27.0, 30.0, 34.0, 40.0, 26.0, 53.0, 31.0, 41.0, 49.0, 54.0, 46.0, 36.0, 38.0, 32.0, 34.0, 38.0, 29.0, 30.0, 28.0, 25.0, 28.0, 22.0, 21.0, 16.0, 15.0, 7.0, 14.0, 4.0, 5.0, 4.0, 4.0, 3.0, 1.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.70509147644043, -8.427559852600098, -8.150028228759766, -7.87249755859375, -7.594965934753418, -7.317434310913086, -7.039903163909912, -6.762372016906738, -6.484840393066406, -6.207308769226074, -5.9297776222229, -5.652246475219727, -5.3747148513793945, -5.0971832275390625, -4.819652080535889, -4.542120933532715, -4.264589309692383, -3.98705792427063, -3.709526538848877, -3.431995153427124, -3.154463768005371, -2.876932382583618, -2.5994009971618652, -2.3218696117401123, -2.0443382263183594, -1.7668068408966064, -1.4892754554748535, -1.2117440700531006, -0.9342126846313477, -0.6566812992095947, -0.3791499137878418, -0.10161852836608887, 0.17591381072998047, 0.4534451961517334, 0.7309765815734863, 1.0085079669952393, 1.2860393524169922, 1.5635707378387451, 1.841102123260498, 2.118633508682251, 2.396164894104004, 2.673696279525757, 2.9512276649475098, 3.2287590503692627, 3.5062904357910156, 3.7838218212127686, 4.0613532066345215, 4.338884353637695, 4.616415977478027, 4.893947601318359, 5.171478748321533, 5.449009895324707, 5.726541519165039, 6.004073143005371, 6.281604290008545, 6.559135437011719, 6.836667060852051, 7.114198684692383, 7.391729831695557, 7.6692609786987305, 7.9467926025390625, 8.224324226379395, 8.501855850219727, 8.779386520385742, 9.056918144226074]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 4.0, 6.0, 14.0, 18.0, 27.0, 28.0, 54.0, 59.0, 76.0, 118.0, 281.0, 536.0, 1331.0, 4135.0, 16444.0, 91558.0, 704441.0, 2459042.0, 780703.0, 109008.0, 19449.0, 4562.0, 1305.0, 511.0, 240.0, 118.0, 68.0, 44.0, 23.0, 27.0, 16.0, 13.0, 9.0, 4.0, 4.0, 4.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.07421875, -3.95623779296875, -3.8382568359375, -3.72027587890625, -3.602294921875, -3.48431396484375, -3.3663330078125, -3.24835205078125, -3.13037109375, -3.01239013671875, -2.8944091796875, -2.77642822265625, -2.658447265625, -2.54046630859375, -2.4224853515625, -2.30450439453125, -2.1865234375, -2.06854248046875, -1.9505615234375, -1.83258056640625, -1.714599609375, -1.59661865234375, -1.4786376953125, -1.36065673828125, -1.24267578125, -1.12469482421875, -1.0067138671875, -0.88873291015625, -0.770751953125, -0.65277099609375, -0.5347900390625, -0.41680908203125, -0.298828125, -0.18084716796875, -0.0628662109375, 0.05511474609375, 0.173095703125, 0.29107666015625, 0.4090576171875, 0.52703857421875, 0.64501953125, 0.76300048828125, 0.8809814453125, 0.99896240234375, 1.116943359375, 1.23492431640625, 1.3529052734375, 1.47088623046875, 1.5888671875, 1.70684814453125, 1.8248291015625, 1.94281005859375, 2.060791015625, 2.17877197265625, 2.2967529296875, 2.41473388671875, 2.53271484375, 2.65069580078125, 2.7686767578125, 2.88665771484375, 3.004638671875, 3.12261962890625, 3.2406005859375, 3.35858154296875, 3.4765625]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 4.0, 10.0, 9.0, 7.0, 18.0, 28.0, 26.0, 36.0, 38.0, 50.0, 49.0, 77.0, 52.0, 56.0, 50.0, 66.0, 52.0, 58.0, 55.0, 52.0, 50.0, 35.0, 40.0, 24.0, 17.0, 10.0, 9.0, 7.0, 6.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.71484375, -2.612274169921875, -2.50970458984375, -2.407135009765625, -2.3045654296875, -2.201995849609375, -2.09942626953125, -1.996856689453125, -1.894287109375, -1.791717529296875, -1.68914794921875, -1.586578369140625, -1.4840087890625, -1.381439208984375, -1.27886962890625, -1.176300048828125, -1.07373046875, -0.971160888671875, -0.86859130859375, -0.766021728515625, -0.6634521484375, -0.560882568359375, -0.45831298828125, -0.355743408203125, -0.253173828125, -0.150604248046875, -0.04803466796875, 0.054534912109375, 0.1571044921875, 0.259674072265625, 0.36224365234375, 0.464813232421875, 0.5673828125, 0.669952392578125, 0.77252197265625, 0.875091552734375, 0.9776611328125, 1.080230712890625, 1.18280029296875, 1.285369873046875, 1.387939453125, 1.490509033203125, 1.59307861328125, 1.695648193359375, 1.7982177734375, 1.900787353515625, 2.00335693359375, 2.105926513671875, 2.20849609375, 2.311065673828125, 2.41363525390625, 2.516204833984375, 2.6187744140625, 2.721343994140625, 2.82391357421875, 2.926483154296875, 3.029052734375, 3.131622314453125, 3.23419189453125, 3.336761474609375, 3.4393310546875, 3.541900634765625, 3.64447021484375, 3.747039794921875, 3.849609375]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 2.0, 11.0, 14.0, 24.0, 61.0, 169.0, 612.0, 2090622.0, 2101885.0, 637.0, 134.0, 53.0, 22.0, 9.0, 7.0, 5.0, 5.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-28.125, -26.953125, -25.78125, -24.609375, -23.4375, -22.265625, -21.09375, -19.921875, -18.75, -17.578125, -16.40625, -15.234375, -14.0625, -12.890625, -11.71875, -10.546875, -9.375, -8.203125, -7.03125, -5.859375, -4.6875, -3.515625, -2.34375, -1.171875, 0.0, 1.171875, 2.34375, 3.515625, 4.6875, 5.859375, 7.03125, 8.203125, 9.375, 10.546875, 11.71875, 12.890625, 14.0625, 15.234375, 16.40625, 17.578125, 18.75, 19.921875, 21.09375, 22.265625, 23.4375, 24.609375, 25.78125, 26.953125, 28.125, 29.296875, 30.46875, 31.640625, 32.8125, 33.984375, 35.15625, 36.328125, 37.5, 38.671875, 39.84375, 41.015625, 42.1875, 43.359375, 44.53125, 45.703125, 46.875]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 7.0, 1.0, 7.0, 8.0, 5.0, 11.0, 13.0, 16.0, 18.0, 43.0, 42.0, 57.0, 88.0, 114.0, 165.0, 271.0, 377.0, 556.0, 627.0, 487.0, 402.0, 227.0, 161.0, 105.0, 91.0, 45.0, 35.0, 27.0, 25.0, 18.0, 9.0, 10.0, 4.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0576171875, -1.0249176025390625, -0.992218017578125, -0.9595184326171875, -0.92681884765625, -0.8941192626953125, -0.861419677734375, -0.8287200927734375, -0.7960205078125, -0.7633209228515625, -0.730621337890625, -0.6979217529296875, -0.66522216796875, -0.6325225830078125, -0.599822998046875, -0.5671234130859375, -0.534423828125, -0.5017242431640625, -0.469024658203125, -0.4363250732421875, -0.40362548828125, -0.3709259033203125, -0.338226318359375, -0.3055267333984375, -0.2728271484375, -0.2401275634765625, -0.207427978515625, -0.1747283935546875, -0.14202880859375, -0.1093292236328125, -0.076629638671875, -0.0439300537109375, -0.01123046875, 0.0214691162109375, 0.054168701171875, 0.0868682861328125, 0.11956787109375, 0.1522674560546875, 0.184967041015625, 0.2176666259765625, 0.2503662109375, 0.2830657958984375, 0.315765380859375, 0.3484649658203125, 0.38116455078125, 0.4138641357421875, 0.446563720703125, 0.4792633056640625, 0.511962890625, 0.5446624755859375, 0.577362060546875, 0.6100616455078125, 0.64276123046875, 0.6754608154296875, 0.708160400390625, 0.7408599853515625, 0.7735595703125, 0.8062591552734375, 0.838958740234375, 0.8716583251953125, 0.90435791015625, 0.9370574951171875, 0.969757080078125, 1.0024566650390625, 1.03515625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 5.0, 14.0, 28.0, 103.0, 193.0, 288.0, 213.0, 98.0, 33.0, 24.0, 7.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.553400754928589, -3.146216869354248, -2.7390329837799072, -2.3318490982055664, -1.924665093421936, -1.5174810886383057, -1.1102972030639648, -0.703113317489624, -0.2959294319152832, 0.11125448346138, 0.5184383988380432, 0.9256223440170288, 1.3328062295913696, 1.739990234375, 2.147174119949341, 2.5543580055236816, 2.9615418910980225, 3.3687257766723633, 3.775909662246704, 4.183093547821045, 4.590277671813965, 4.997461318969727, 5.4046454429626465, 5.811829566955566, 6.219013214111328, 6.626197338104248, 7.03338098526001, 7.44056510925293, 7.847748756408691, 8.254932403564453, 8.662117004394531, 9.069300651550293, 9.476485252380371, 9.883668899536133, 10.290853500366211, 10.698037147521973, 11.105220794677734, 11.512405395507812, 11.919589042663574, 12.326772689819336, 12.733956336975098, 13.14113998413086, 13.548324584960938, 13.9555082321167, 14.362691879272461, 14.769876480102539, 15.1770601272583, 15.584243774414062, 15.99142837524414, 16.39861297607422, 16.805795669555664, 17.212980270385742, 17.62016487121582, 18.027347564697266, 18.434532165527344, 18.841716766357422, 19.248899459838867, 19.656084060668945, 20.06326675415039, 20.47045135498047, 20.877635955810547, 21.284818649291992, 21.69200325012207, 22.099185943603516, 22.506370544433594]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 3.0, 5.0, 6.0, 7.0, 16.0, 14.0, 16.0, 29.0, 31.0, 38.0, 35.0, 44.0, 40.0, 56.0, 42.0, 57.0, 52.0, 62.0, 55.0, 50.0, 48.0, 43.0, 37.0, 49.0, 42.0, 30.0, 21.0, 23.0, 15.0, 9.0, 12.0, 11.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.143270254135132, -3.042898654937744, -2.9425268173217773, -2.8421552181243896, -2.741783380508423, -2.641411781311035, -2.5410399436950684, -2.4406683444976807, -2.340296745300293, -2.2399251461029053, -2.1395533084869385, -2.039181709289551, -1.938809871673584, -1.8384382724761963, -1.738066554069519, -1.6376948356628418, -1.537322998046875, -1.4369512796401978, -1.3365795612335205, -1.2362079620361328, -1.135836124420166, -1.0354645252227783, -0.9350928068161011, -0.8347210884094238, -0.7343493700027466, -0.6339776515960693, -0.5336059331893921, -0.4332342743873596, -0.3328625559806824, -0.23249083757400513, -0.13211917877197266, -0.03174746036529541, 0.06862449645996094, 0.168996199965477, 0.26936790347099304, 0.3697395920753479, 0.47011131048202515, 0.5704830288887024, 0.6708546876907349, 0.7712264060974121, 0.8715981245040894, 0.9719698429107666, 1.0723415613174438, 1.172713279724121, 1.2730848789215088, 1.3734567165374756, 1.4738283157348633, 1.5742000341415405, 1.6745717525482178, 1.774943470954895, 1.8753151893615723, 1.97568678855896, 2.0760586261749268, 2.1764302253723145, 2.2768020629882812, 2.377173662185669, 2.4775452613830566, 2.5779168605804443, 2.678288698196411, 2.778660297393799, 2.8790321350097656, 2.9794037342071533, 3.079775333404541, 3.180147171020508, 3.2805190086364746]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 4.0, 7.0, 16.0, 13.0, 11.0, 22.0, 32.0, 63.0, 70.0, 118.0, 169.0, 282.0, 463.0, 649.0, 1184.0, 1940.0, 3796.0, 7961.0, 19335.0, 52353.0, 142193.0, 291052.0, 292237.0, 144393.0, 53563.0, 19604.0, 8102.0, 3891.0, 2028.0, 1108.0, 687.0, 418.0, 244.0, 193.0, 118.0, 80.0, 51.0, 34.0, 22.0, 15.0, 7.0, 9.0, 6.0, 4.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.87158203125, -0.8451766967773438, -0.8187713623046875, -0.7923660278320312, -0.765960693359375, -0.7395553588867188, -0.7131500244140625, -0.6867446899414062, -0.66033935546875, -0.6339340209960938, -0.6075286865234375, -0.5811233520507812, -0.554718017578125, -0.5283126831054688, -0.5019073486328125, -0.47550201416015625, -0.4490966796875, -0.42269134521484375, -0.3962860107421875, -0.36988067626953125, -0.343475341796875, -0.31707000732421875, -0.2906646728515625, -0.26425933837890625, -0.23785400390625, -0.21144866943359375, -0.1850433349609375, -0.15863800048828125, -0.132232666015625, -0.10582733154296875, -0.0794219970703125, -0.05301666259765625, -0.026611328125, -0.00020599365234375, 0.0261993408203125, 0.05260467529296875, 0.079010009765625, 0.10541534423828125, 0.1318206787109375, 0.15822601318359375, 0.18463134765625, 0.21103668212890625, 0.2374420166015625, 0.26384735107421875, 0.290252685546875, 0.31665802001953125, 0.3430633544921875, 0.36946868896484375, 0.3958740234375, 0.42227935791015625, 0.4486846923828125, 0.47509002685546875, 0.501495361328125, 0.5279006958007812, 0.5543060302734375, 0.5807113647460938, 0.60711669921875, 0.6335220336914062, 0.6599273681640625, 0.6863327026367188, 0.712738037109375, 0.7391433715820312, 0.7655487060546875, 0.7919540405273438, 0.818359375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 6.0, 7.0, 5.0, 12.0, 15.0, 16.0, 15.0, 24.0, 26.0, 35.0, 25.0, 47.0, 44.0, 42.0, 59.0, 53.0, 49.0, 55.0, 49.0, 51.0, 53.0, 42.0, 49.0, 44.0, 35.0, 35.0, 31.0, 24.0, 12.0, 11.0, 12.0, 5.0, 5.0, 7.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.322265625, -2.2398681640625, -2.157470703125, -2.0750732421875, -1.99267578125, -1.9102783203125, -1.827880859375, -1.7454833984375, -1.6630859375, -1.5806884765625, -1.498291015625, -1.4158935546875, -1.33349609375, -1.2510986328125, -1.168701171875, -1.0863037109375, -1.00390625, -0.9215087890625, -0.839111328125, -0.7567138671875, -0.67431640625, -0.5919189453125, -0.509521484375, -0.4271240234375, -0.3447265625, -0.2623291015625, -0.179931640625, -0.0975341796875, -0.01513671875, 0.0672607421875, 0.149658203125, 0.2320556640625, 0.314453125, 0.3968505859375, 0.479248046875, 0.5616455078125, 0.64404296875, 0.7264404296875, 0.808837890625, 0.8912353515625, 0.9736328125, 1.0560302734375, 1.138427734375, 1.2208251953125, 1.30322265625, 1.3856201171875, 1.468017578125, 1.5504150390625, 1.6328125, 1.7152099609375, 1.797607421875, 1.8800048828125, 1.96240234375, 2.0447998046875, 2.127197265625, 2.2095947265625, 2.2919921875, 2.3743896484375, 2.456787109375, 2.5391845703125, 2.62158203125, 2.7039794921875, 2.786376953125, 2.8687744140625, 2.951171875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 5.0, 6.0, 1.0, 7.0, 6.0, 14.0, 20.0, 18.0, 30.0, 45.0, 85.0, 123.0, 231.0, 430.0, 904.0, 2060.0, 5436.0, 16222.0, 51515.0, 161870.0, 338766.0, 295215.0, 119677.0, 36978.0, 11551.0, 4085.0, 1640.0, 733.0, 381.0, 194.0, 109.0, 72.0, 42.0, 30.0, 18.0, 13.0, 5.0, 5.0, 5.0, 6.0, 5.0, 1.0, 4.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.86962890625, -0.8466567993164062, -0.8236846923828125, -0.8007125854492188, -0.777740478515625, -0.7547683715820312, -0.7317962646484375, -0.7088241577148438, -0.68585205078125, -0.6628799438476562, -0.6399078369140625, -0.6169357299804688, -0.593963623046875, -0.5709915161132812, -0.5480194091796875, -0.5250473022460938, -0.5020751953125, -0.47910308837890625, -0.4561309814453125, -0.43315887451171875, -0.410186767578125, -0.38721466064453125, -0.3642425537109375, -0.34127044677734375, -0.31829833984375, -0.29532623291015625, -0.2723541259765625, -0.24938201904296875, -0.226409912109375, -0.20343780517578125, -0.1804656982421875, -0.15749359130859375, -0.134521484375, -0.11154937744140625, -0.0885772705078125, -0.06560516357421875, -0.042633056640625, -0.01966094970703125, 0.0033111572265625, 0.02628326416015625, 0.04925537109375, 0.07222747802734375, 0.0951995849609375, 0.11817169189453125, 0.141143798828125, 0.16411590576171875, 0.1870880126953125, 0.21006011962890625, 0.2330322265625, 0.25600433349609375, 0.2789764404296875, 0.30194854736328125, 0.324920654296875, 0.34789276123046875, 0.3708648681640625, 0.39383697509765625, 0.41680908203125, 0.43978118896484375, 0.4627532958984375, 0.48572540283203125, 0.508697509765625, 0.5316696166992188, 0.5546417236328125, 0.5776138305664062, 0.6005859375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 7.0, 7.0, 6.0, 10.0, 10.0, 9.0, 9.0, 10.0, 13.0, 23.0, 24.0, 26.0, 19.0, 28.0, 22.0, 24.0, 32.0, 42.0, 48.0, 49.0, 27.0, 34.0, 52.0, 41.0, 38.0, 42.0, 39.0, 27.0, 40.0, 27.0, 24.0, 33.0, 24.0, 23.0, 19.0, 16.0, 15.0, 9.0, 7.0, 15.0, 9.0, 7.0, 6.0, 2.0, 3.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.51953125, -3.406707763671875, -3.29388427734375, -3.181060791015625, -3.0682373046875, -2.955413818359375, -2.84259033203125, -2.729766845703125, -2.616943359375, -2.504119873046875, -2.39129638671875, -2.278472900390625, -2.1656494140625, -2.052825927734375, -1.94000244140625, -1.827178955078125, -1.71435546875, -1.601531982421875, -1.48870849609375, -1.375885009765625, -1.2630615234375, -1.150238037109375, -1.03741455078125, -0.924591064453125, -0.811767578125, -0.698944091796875, -0.58612060546875, -0.473297119140625, -0.3604736328125, -0.247650146484375, -0.13482666015625, -0.022003173828125, 0.0908203125, 0.203643798828125, 0.31646728515625, 0.429290771484375, 0.5421142578125, 0.654937744140625, 0.76776123046875, 0.880584716796875, 0.993408203125, 1.106231689453125, 1.21905517578125, 1.331878662109375, 1.4447021484375, 1.557525634765625, 1.67034912109375, 1.783172607421875, 1.89599609375, 2.008819580078125, 2.12164306640625, 2.234466552734375, 2.3472900390625, 2.460113525390625, 2.57293701171875, 2.685760498046875, 2.798583984375, 2.911407470703125, 3.02423095703125, 3.137054443359375, 3.2498779296875, 3.362701416015625, 3.47552490234375, 3.588348388671875, 3.701171875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 5.0, 7.0, 8.0, 9.0, 15.0, 17.0, 34.0, 42.0, 50.0, 114.0, 141.0, 244.0, 410.0, 715.0, 1420.0, 2844.0, 6438.0, 15754.0, 44853.0, 185088.0, 520004.0, 195037.0, 46393.0, 16110.0, 6573.0, 3003.0, 1388.0, 733.0, 410.0, 248.0, 157.0, 79.0, 61.0, 51.0, 25.0, 19.0, 15.0, 10.0, 11.0, 6.0, 7.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.11376953125, -0.10991477966308594, -0.10606002807617188, -0.10220527648925781, -0.09835052490234375, -0.09449577331542969, -0.09064102172851562, -0.08678627014160156, -0.0829315185546875, -0.07907676696777344, -0.07522201538085938, -0.07136726379394531, -0.06751251220703125, -0.06365776062011719, -0.059803009033203125, -0.05594825744628906, -0.052093505859375, -0.04823875427246094, -0.044384002685546875, -0.04052925109863281, -0.03667449951171875, -0.03281974792480469, -0.028964996337890625, -0.025110244750976562, -0.0212554931640625, -0.017400741577148438, -0.013545989990234375, -0.009691238403320312, -0.00583648681640625, -0.0019817352294921875, 0.001873016357421875, 0.0057277679443359375, 0.00958251953125, 0.013437271118164062, 0.017292022705078125, 0.021146774291992188, 0.02500152587890625, 0.028856277465820312, 0.032711029052734375, 0.03656578063964844, 0.0404205322265625, 0.04427528381347656, 0.048130035400390625, 0.05198478698730469, 0.05583953857421875, 0.05969429016113281, 0.06354904174804688, 0.06740379333496094, 0.071258544921875, 0.07511329650878906, 0.07896804809570312, 0.08282279968261719, 0.08667755126953125, 0.09053230285644531, 0.09438705444335938, 0.09824180603027344, 0.1020965576171875, 0.10595130920410156, 0.10980606079101562, 0.11366081237792969, 0.11751556396484375, 0.12137031555175781, 0.12522506713867188, 0.12907981872558594, 0.1329345703125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 6.0, 5.0, 4.0, 11.0, 5.0, 14.0, 16.0, 16.0, 41.0, 44.0, 72.0, 86.0, 104.0, 129.0, 109.0, 110.0, 74.0, 44.0, 29.0, 15.0, 16.0, 8.0, 7.0, 4.0, 13.0, 3.0, 3.0, 4.0, 7.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00011736154556274414, -0.00011422205716371536, -0.00011108256876468658, -0.0001079430803656578, -0.00010480359196662903, -0.00010166410356760025, -9.852461516857147e-05, -9.53851267695427e-05, -9.224563837051392e-05, -8.910614997148514e-05, -8.596666157245636e-05, -8.282717317342758e-05, -7.96876847743988e-05, -7.654819637537003e-05, -7.340870797634125e-05, -7.026921957731247e-05, -6.712973117828369e-05, -6.399024277925491e-05, -6.0850754380226135e-05, -5.771126598119736e-05, -5.457177758216858e-05, -5.14322891831398e-05, -4.829280078411102e-05, -4.5153312385082245e-05, -4.201382398605347e-05, -3.887433558702469e-05, -3.573484718799591e-05, -3.259535878896713e-05, -2.9455870389938354e-05, -2.6316381990909576e-05, -2.31768935918808e-05, -2.003740519285202e-05, -1.6897916793823242e-05, -1.3758428394794464e-05, -1.0618939995765686e-05, -7.479451596736908e-06, -4.33996319770813e-06, -1.2004747986793518e-06, 1.9390136003494263e-06, 5.078501999378204e-06, 8.217990398406982e-06, 1.135747879743576e-05, 1.4496967196464539e-05, 1.7636455595493317e-05, 2.0775943994522095e-05, 2.3915432393550873e-05, 2.705492079257965e-05, 3.019440919160843e-05, 3.333389759063721e-05, 3.6473385989665985e-05, 3.961287438869476e-05, 4.275236278772354e-05, 4.589185118675232e-05, 4.90313395857811e-05, 5.2170827984809875e-05, 5.5310316383838654e-05, 5.844980478286743e-05, 6.158929318189621e-05, 6.472878158092499e-05, 6.786826997995377e-05, 7.100775837898254e-05, 7.414724677801132e-05, 7.72867351770401e-05, 8.042622357606888e-05, 8.356571197509766e-05]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 4.0, 3.0, 4.0, 2.0, 4.0, 10.0, 9.0, 10.0, 20.0, 18.0, 21.0, 39.0, 43.0, 94.0, 148.0, 281.0, 647.0, 1826.0, 6149.0, 38443.0, 799355.0, 182994.0, 13325.0, 3094.0, 1087.0, 429.0, 207.0, 101.0, 50.0, 37.0, 28.0, 23.0, 10.0, 8.0, 4.0, 8.0, 4.0, 4.0, 5.0, 3.0, 2.0, 0.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.31689453125, -0.30504608154296875, -0.2931976318359375, -0.28134918212890625, -0.269500732421875, -0.25765228271484375, -0.2458038330078125, -0.23395538330078125, -0.22210693359375, -0.21025848388671875, -0.1984100341796875, -0.18656158447265625, -0.174713134765625, -0.16286468505859375, -0.1510162353515625, -0.13916778564453125, -0.1273193359375, -0.11547088623046875, -0.1036224365234375, -0.09177398681640625, -0.079925537109375, -0.06807708740234375, -0.0562286376953125, -0.04438018798828125, -0.03253173828125, -0.02068328857421875, -0.0088348388671875, 0.00301361083984375, 0.014862060546875, 0.02671051025390625, 0.0385589599609375, 0.05040740966796875, 0.062255859375, 0.07410430908203125, 0.0859527587890625, 0.09780120849609375, 0.109649658203125, 0.12149810791015625, 0.1333465576171875, 0.14519500732421875, 0.15704345703125, 0.16889190673828125, 0.1807403564453125, 0.19258880615234375, 0.204437255859375, 0.21628570556640625, 0.2281341552734375, 0.23998260498046875, 0.2518310546875, 0.26367950439453125, 0.2755279541015625, 0.28737640380859375, 0.299224853515625, 0.31107330322265625, 0.3229217529296875, 0.33477020263671875, 0.34661865234375, 0.35846710205078125, 0.3703155517578125, 0.38216400146484375, 0.394012451171875, 0.40586090087890625, 0.4177093505859375, 0.42955780029296875, 0.44140625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 6.0, 7.0, 6.0, 4.0, 6.0, 11.0, 3.0, 11.0, 13.0, 20.0, 16.0, 35.0, 37.0, 64.0, 82.0, 110.0, 136.0, 103.0, 78.0, 52.0, 52.0, 20.0, 28.0, 23.0, 9.0, 14.0, 10.0, 6.0, 6.0, 3.0, 10.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.05810546875, -0.056204795837402344, -0.05430412292480469, -0.05240345001220703, -0.050502777099609375, -0.04860210418701172, -0.04670143127441406, -0.044800758361816406, -0.04290008544921875, -0.040999412536621094, -0.03909873962402344, -0.03719806671142578, -0.035297393798828125, -0.03339672088623047, -0.03149604797363281, -0.029595375061035156, -0.0276947021484375, -0.025794029235839844, -0.023893356323242188, -0.02199268341064453, -0.020092010498046875, -0.01819133758544922, -0.016290664672851562, -0.014389991760253906, -0.01248931884765625, -0.010588645935058594, -0.008687973022460938, -0.006787300109863281, -0.004886627197265625, -0.0029859542846679688, -0.0010852813720703125, 0.0008153915405273438, 0.002716064453125, 0.004616737365722656, 0.0065174102783203125, 0.008418083190917969, 0.010318756103515625, 0.012219429016113281, 0.014120101928710938, 0.016020774841308594, 0.01792144775390625, 0.019822120666503906, 0.021722793579101562, 0.02362346649169922, 0.025524139404296875, 0.02742481231689453, 0.029325485229492188, 0.031226158142089844, 0.0331268310546875, 0.035027503967285156, 0.03692817687988281, 0.03882884979248047, 0.040729522705078125, 0.04263019561767578, 0.04453086853027344, 0.046431541442871094, 0.04833221435546875, 0.050232887268066406, 0.05213356018066406, 0.05403423309326172, 0.055934906005859375, 0.05783557891845703, 0.05973625183105469, 0.061636924743652344, 0.06353759765625]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 4.0, 17.0, 59.0, 192.0, 311.0, 281.0, 90.0, 30.0, 14.0, 8.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.294938802719116, -2.0025463104248047, -1.7101539373397827, -1.4177615642547607, -1.1253690719604492, -0.8329765796661377, -0.5405842065811157, -0.24819183349609375, 0.04420065879821777, 0.3365930914878845, 0.6289855241775513, 0.921377956867218, 1.2137703895568848, 1.5061628818511963, 1.7985552549362183, 2.0909476280212402, 2.3833401203155518, 2.6757326126098633, 2.9681248664855957, 3.2605173587799072, 3.5529098510742188, 3.8453023433685303, 4.137694835662842, 4.430087089538574, 4.722479820251465, 5.014872074127197, 5.307264804840088, 5.59965705871582, 5.892049789428711, 6.184442043304443, 6.476834297180176, 6.769227027893066, 7.061618804931641, 7.354011058807373, 7.646403789520264, 7.938796043395996, 8.231188774108887, 8.523580551147461, 8.815973281860352, 9.108366012573242, 9.400758743286133, 9.693151473999023, 9.985543251037598, 10.277935981750488, 10.570328712463379, 10.862720489501953, 11.155113220214844, 11.447505950927734, 11.739897727966309, 12.0322904586792, 12.324682235717773, 12.617074966430664, 12.909467697143555, 13.201860427856445, 13.49425220489502, 13.78664493560791, 14.079036712646484, 14.371429443359375, 14.66382122039795, 14.95621395111084, 15.24860668182373, 15.540998458862305, 15.833391189575195, 16.125783920288086, 16.418176651000977]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 6.0, 5.0, 7.0, 14.0, 19.0, 20.0, 15.0, 22.0, 38.0, 37.0, 58.0, 43.0, 44.0, 50.0, 64.0, 46.0, 71.0, 68.0, 61.0, 58.0, 45.0, 34.0, 37.0, 37.0, 29.0, 15.0, 21.0, 12.0, 8.0, 11.0, 5.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.471536636352539, -2.3857316970825195, -2.299926519393921, -2.2141215801239014, -2.128316640853882, -2.042511463165283, -1.9567065238952637, -1.8709015846252441, -1.785096526145935, -1.699291467666626, -1.6134865283966064, -1.5276814699172974, -1.4418764114379883, -1.3560714721679688, -1.2702664136886597, -1.1844613552093506, -1.098656415939331, -1.012851357460022, -0.9270464181900024, -0.8412413597106934, -0.755436360836029, -0.6696313619613647, -0.5838263034820557, -0.49802130460739136, -0.41221630573272705, -0.32641130685806274, -0.24060627818107605, -0.15480124950408936, -0.06899625062942505, 0.016808748245239258, 0.10261380672454834, 0.18841880559921265, 0.27422404289245605, 0.36002904176712036, 0.44583407044410706, 0.5316390991210938, 0.6174440979957581, 0.7032490968704224, 0.7890541553497314, 0.8748591542243958, 0.9606641530990601, 1.0464692115783691, 1.1322741508483887, 1.2180792093276978, 1.3038842678070068, 1.3896892070770264, 1.4754942655563354, 1.5612993240356445, 1.647104263305664, 1.7329093217849731, 1.8187142610549927, 1.9045193195343018, 1.9903242588043213, 2.07612943649292, 2.1619343757629395, 2.247739315032959, 2.3335442543029785, 2.419349193572998, 2.5051543712615967, 2.590959310531616, 2.6767642498016357, 2.7625694274902344, 2.848374366760254, 2.9341793060302734, 3.019984483718872]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 2.0, 8.0, 8.0, 12.0, 18.0, 29.0, 43.0, 65.0, 97.0, 162.0, 267.0, 436.0, 841.0, 1612.0, 2903.0, 5764.0, 12090.0, 26409.0, 64647.0, 181539.0, 445215.0, 187727.0, 66555.0, 27205.0, 12460.0, 5908.0, 2929.0, 1571.0, 848.0, 441.0, 306.0, 162.0, 83.0, 58.0, 51.0, 29.0, 19.0, 14.0, 8.0, 3.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.203125, -1.1609344482421875, -1.118743896484375, -1.0765533447265625, -1.03436279296875, -0.9921722412109375, -0.949981689453125, -0.9077911376953125, -0.8656005859375, -0.8234100341796875, -0.781219482421875, -0.7390289306640625, -0.69683837890625, -0.6546478271484375, -0.612457275390625, -0.5702667236328125, -0.528076171875, -0.4858856201171875, -0.443695068359375, -0.4015045166015625, -0.35931396484375, -0.3171234130859375, -0.274932861328125, -0.2327423095703125, -0.1905517578125, -0.1483612060546875, -0.106170654296875, -0.0639801025390625, -0.02178955078125, 0.0204010009765625, 0.062591552734375, 0.1047821044921875, 0.14697265625, 0.1891632080078125, 0.231353759765625, 0.2735443115234375, 0.31573486328125, 0.3579254150390625, 0.400115966796875, 0.4423065185546875, 0.4844970703125, 0.5266876220703125, 0.568878173828125, 0.6110687255859375, 0.65325927734375, 0.6954498291015625, 0.737640380859375, 0.7798309326171875, 0.822021484375, 0.8642120361328125, 0.906402587890625, 0.9485931396484375, 0.99078369140625, 1.0329742431640625, 1.075164794921875, 1.1173553466796875, 1.1595458984375, 1.2017364501953125, 1.243927001953125, 1.2861175537109375, 1.32830810546875, 1.3704986572265625, 1.412689208984375, 1.4548797607421875, 1.4970703125]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 8.0, 7.0, 9.0, 12.0, 12.0, 10.0, 19.0, 14.0, 27.0, 19.0, 19.0, 39.0, 30.0, 37.0, 42.0, 56.0, 38.0, 38.0, 56.0, 47.0, 47.0, 41.0, 50.0, 45.0, 33.0, 31.0, 39.0, 33.0, 20.0, 24.0, 22.0, 13.0, 14.0, 13.0, 7.0, 7.0, 8.0, 8.0, 5.0, 0.0, 6.0, 0.0, 2.0, 1.0], "bins": [-4.671875, -4.55169677734375, -4.4315185546875, -4.31134033203125, -4.191162109375, -4.07098388671875, -3.9508056640625, -3.83062744140625, -3.71044921875, -3.59027099609375, -3.4700927734375, -3.34991455078125, -3.229736328125, -3.10955810546875, -2.9893798828125, -2.86920166015625, -2.7490234375, -2.62884521484375, -2.5086669921875, -2.38848876953125, -2.268310546875, -2.14813232421875, -2.0279541015625, -1.90777587890625, -1.78759765625, -1.66741943359375, -1.5472412109375, -1.42706298828125, -1.306884765625, -1.18670654296875, -1.0665283203125, -0.94635009765625, -0.826171875, -0.70599365234375, -0.5858154296875, -0.46563720703125, -0.345458984375, -0.22528076171875, -0.1051025390625, 0.01507568359375, 0.13525390625, 0.25543212890625, 0.3756103515625, 0.49578857421875, 0.615966796875, 0.73614501953125, 0.8563232421875, 0.97650146484375, 1.0966796875, 1.21685791015625, 1.3370361328125, 1.45721435546875, 1.577392578125, 1.69757080078125, 1.8177490234375, 1.93792724609375, 2.05810546875, 2.17828369140625, 2.2984619140625, 2.41864013671875, 2.538818359375, 2.65899658203125, 2.7791748046875, 2.89935302734375, 3.01953125]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 4.0, 4.0, 4.0, 8.0, 6.0, 11.0, 10.0, 13.0, 23.0, 19.0, 24.0, 27.0, 42.0, 38.0, 57.0, 75.0, 84.0, 102.0, 196.0, 489.0, 9610.0, 1025015.0, 11389.0, 539.0, 187.0, 108.0, 86.0, 66.0, 66.0, 54.0, 35.0, 38.0, 19.0, 26.0, 10.0, 17.0, 12.0, 6.0, 7.0, 8.0, 7.0, 2.0, 5.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.328125, -9.9659423828125, -9.603759765625, -9.2415771484375, -8.87939453125, -8.5172119140625, -8.155029296875, -7.7928466796875, -7.4306640625, -7.0684814453125, -6.706298828125, -6.3441162109375, -5.98193359375, -5.6197509765625, -5.257568359375, -4.8953857421875, -4.533203125, -4.1710205078125, -3.808837890625, -3.4466552734375, -3.08447265625, -2.7222900390625, -2.360107421875, -1.9979248046875, -1.6357421875, -1.2735595703125, -0.911376953125, -0.5491943359375, -0.18701171875, 0.1751708984375, 0.537353515625, 0.8995361328125, 1.26171875, 1.6239013671875, 1.986083984375, 2.3482666015625, 2.71044921875, 3.0726318359375, 3.434814453125, 3.7969970703125, 4.1591796875, 4.5213623046875, 4.883544921875, 5.2457275390625, 5.60791015625, 5.9700927734375, 6.332275390625, 6.6944580078125, 7.056640625, 7.4188232421875, 7.781005859375, 8.1431884765625, 8.50537109375, 8.8675537109375, 9.229736328125, 9.5919189453125, 9.9541015625, 10.3162841796875, 10.678466796875, 11.0406494140625, 11.40283203125, 11.7650146484375, 12.127197265625, 12.4893798828125, 12.8515625]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 5.0, 5.0, 4.0, 10.0, 13.0, 10.0, 14.0, 21.0, 20.0, 16.0, 23.0, 33.0, 34.0, 37.0, 37.0, 50.0, 60.0, 52.0, 58.0, 50.0, 54.0, 51.0, 41.0, 43.0, 30.0, 34.0, 38.0, 36.0, 19.0, 20.0, 15.0, 18.0, 8.0, 12.0, 2.0, 5.0, 9.0, 4.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.46484375, -4.32501220703125, -4.1851806640625, -4.04534912109375, -3.905517578125, -3.76568603515625, -3.6258544921875, -3.48602294921875, -3.34619140625, -3.20635986328125, -3.0665283203125, -2.92669677734375, -2.786865234375, -2.64703369140625, -2.5072021484375, -2.36737060546875, -2.2275390625, -2.08770751953125, -1.9478759765625, -1.80804443359375, -1.668212890625, -1.52838134765625, -1.3885498046875, -1.24871826171875, -1.10888671875, -0.96905517578125, -0.8292236328125, -0.68939208984375, -0.549560546875, -0.40972900390625, -0.2698974609375, -0.13006591796875, 0.009765625, 0.14959716796875, 0.2894287109375, 0.42926025390625, 0.569091796875, 0.70892333984375, 0.8487548828125, 0.98858642578125, 1.12841796875, 1.26824951171875, 1.4080810546875, 1.54791259765625, 1.687744140625, 1.82757568359375, 1.9674072265625, 2.10723876953125, 2.2470703125, 2.38690185546875, 2.5267333984375, 2.66656494140625, 2.806396484375, 2.94622802734375, 3.0860595703125, 3.22589111328125, 3.36572265625, 3.50555419921875, 3.6453857421875, 3.78521728515625, 3.925048828125, 4.06488037109375, 4.2047119140625, 4.34454345703125, 4.484375]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 5.0, 5.0, 7.0, 9.0, 12.0, 15.0, 25.0, 29.0, 53.0, 81.0, 249.0, 2563.0, 898443.0, 145313.0, 1307.0, 185.0, 91.0, 50.0, 22.0, 40.0, 14.0, 10.0, 8.0, 3.0, 5.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.41015625, -3.2833251953125, -3.156494140625, -3.0296630859375, -2.90283203125, -2.7760009765625, -2.649169921875, -2.5223388671875, -2.3955078125, -2.2686767578125, -2.141845703125, -2.0150146484375, -1.88818359375, -1.7613525390625, -1.634521484375, -1.5076904296875, -1.380859375, -1.2540283203125, -1.127197265625, -1.0003662109375, -0.87353515625, -0.7467041015625, -0.619873046875, -0.4930419921875, -0.3662109375, -0.2393798828125, -0.112548828125, 0.0142822265625, 0.14111328125, 0.2679443359375, 0.394775390625, 0.5216064453125, 0.6484375, 0.7752685546875, 0.902099609375, 1.0289306640625, 1.15576171875, 1.2825927734375, 1.409423828125, 1.5362548828125, 1.6630859375, 1.7899169921875, 1.916748046875, 2.0435791015625, 2.17041015625, 2.2972412109375, 2.424072265625, 2.5509033203125, 2.677734375, 2.8045654296875, 2.931396484375, 3.0582275390625, 3.18505859375, 3.3118896484375, 3.438720703125, 3.5655517578125, 3.6923828125, 3.8192138671875, 3.946044921875, 4.0728759765625, 4.19970703125, 4.3265380859375, 4.453369140625, 4.5802001953125, 4.70703125]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 5.0, 6.0, 2.0, 6.0, 15.0, 17.0, 26.0, 38.0, 44.0, 89.0, 148.0, 197.0, 152.0, 85.0, 49.0, 36.0, 33.0, 8.0, 12.0, 9.0, 9.0, 4.0, 1.0, 3.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011819601058959961, -0.0001129666343331337, -0.00010773725807666779, -0.00010250788182020187, -9.727850556373596e-05, -9.204912930727005e-05, -8.681975305080414e-05, -8.159037679433823e-05, -7.636100053787231e-05, -7.11316242814064e-05, -6.590224802494049e-05, -6.067287176847458e-05, -5.544349551200867e-05, -5.0214119255542755e-05, -4.498474299907684e-05, -3.975536674261093e-05, -3.452599048614502e-05, -2.9296614229679108e-05, -2.4067237973213196e-05, -1.8837861716747284e-05, -1.3608485460281372e-05, -8.37910920381546e-06, -3.1497329473495483e-06, 2.0796433091163635e-06, 7.309019565582275e-06, 1.2538395822048187e-05, 1.77677720785141e-05, 2.299714833498001e-05, 2.8226524591445923e-05, 3.3455900847911835e-05, 3.8685277104377747e-05, 4.391465336084366e-05, 4.914402961730957e-05, 5.437340587377548e-05, 5.9602782130241394e-05, 6.48321583867073e-05, 7.006153464317322e-05, 7.529091089963913e-05, 8.052028715610504e-05, 8.574966341257095e-05, 9.097903966903687e-05, 9.620841592550278e-05, 0.00010143779218196869, 0.0001066671684384346, 0.00011189654469490051, 0.00011712592095136642, 0.00012235529720783234, 0.00012758467346429825, 0.00013281404972076416, 0.00013804342597723007, 0.00014327280223369598, 0.0001485021784901619, 0.0001537315547466278, 0.00015896093100309372, 0.00016419030725955963, 0.00016941968351602554, 0.00017464905977249146, 0.00017987843602895737, 0.00018510781228542328, 0.0001903371885418892, 0.0001955665647983551, 0.00020079594105482101, 0.00020602531731128693, 0.00021125469356775284, 0.00021648406982421875]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 3.0, 5.0, 5.0, 5.0, 6.0, 5.0, 14.0, 13.0, 19.0, 25.0, 40.0, 50.0, 91.0, 255.0, 1350.0, 42319.0, 989789.0, 13329.0, 809.0, 172.0, 67.0, 52.0, 33.0, 21.0, 24.0, 14.0, 8.0, 12.0, 3.0, 4.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.455078125, -2.368560791015625, -2.28204345703125, -2.195526123046875, -2.1090087890625, -2.022491455078125, -1.93597412109375, -1.849456787109375, -1.762939453125, -1.676422119140625, -1.58990478515625, -1.503387451171875, -1.4168701171875, -1.330352783203125, -1.24383544921875, -1.157318115234375, -1.07080078125, -0.984283447265625, -0.89776611328125, -0.811248779296875, -0.7247314453125, -0.638214111328125, -0.55169677734375, -0.465179443359375, -0.378662109375, -0.292144775390625, -0.20562744140625, -0.119110107421875, -0.0325927734375, 0.053924560546875, 0.14044189453125, 0.226959228515625, 0.3134765625, 0.399993896484375, 0.48651123046875, 0.573028564453125, 0.6595458984375, 0.746063232421875, 0.83258056640625, 0.919097900390625, 1.005615234375, 1.092132568359375, 1.17864990234375, 1.265167236328125, 1.3516845703125, 1.438201904296875, 1.52471923828125, 1.611236572265625, 1.69775390625, 1.784271240234375, 1.87078857421875, 1.957305908203125, 2.0438232421875, 2.130340576171875, 2.21685791015625, 2.303375244140625, 2.389892578125, 2.476409912109375, 2.56292724609375, 2.649444580078125, 2.7359619140625, 2.822479248046875, 2.90899658203125, 2.995513916015625, 3.08203125]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 2.0, 3.0, 4.0, 8.0, 2.0, 8.0, 16.0, 24.0, 21.0, 41.0, 53.0, 86.0, 119.0, 199.0, 125.0, 76.0, 59.0, 48.0, 29.0, 16.0, 15.0, 11.0, 12.0, 8.0, 6.0, 7.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.387939453125, -0.3763618469238281, -0.36478424072265625, -0.3532066345214844, -0.3416290283203125, -0.3300514221191406, -0.31847381591796875, -0.3068962097167969, -0.295318603515625, -0.2837409973144531, -0.27216339111328125, -0.2605857849121094, -0.2490081787109375, -0.23743057250976562, -0.22585296630859375, -0.21427536010742188, -0.20269775390625, -0.19112014770507812, -0.17954254150390625, -0.16796493530273438, -0.1563873291015625, -0.14480972290039062, -0.13323211669921875, -0.12165451049804688, -0.110076904296875, -0.09849929809570312, -0.08692169189453125, -0.07534408569335938, -0.0637664794921875, -0.052188873291015625, -0.04061126708984375, -0.029033660888671875, -0.0174560546875, -0.005878448486328125, 0.00569915771484375, 0.017276763916015625, 0.0288543701171875, 0.040431976318359375, 0.05200958251953125, 0.06358718872070312, 0.075164794921875, 0.08674240112304688, 0.09832000732421875, 0.10989761352539062, 0.1214752197265625, 0.13305282592773438, 0.14463043212890625, 0.15620803833007812, 0.16778564453125, 0.17936325073242188, 0.19094085693359375, 0.20251846313476562, 0.2140960693359375, 0.22567367553710938, 0.23725128173828125, 0.24882888793945312, 0.260406494140625, 0.2719841003417969, 0.28356170654296875, 0.2951393127441406, 0.3067169189453125, 0.3182945251464844, 0.32987213134765625, 0.3414497375488281, 0.35302734375]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 4.0, 6.0, 7.0, 12.0, 81.0, 226.0, 306.0, 231.0, 95.0, 29.0, 14.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.233728885650635, -3.685295581817627, -3.13686203956604, -2.588428497314453, -2.0399951934814453, -1.4915618896484375, -0.9431283473968506, -0.39469480514526367, 0.15373849868774414, 0.7021719217300415, 1.2506053447723389, 1.7990387678146362, 2.3474721908569336, 2.8959054946899414, 3.4443390369415283, 3.9927725791931152, 4.541205883026123, 5.089639186859131, 5.638072967529297, 6.186506271362305, 6.7349395751953125, 7.28337287902832, 7.831806182861328, 8.380239486694336, 8.928672790527344, 9.477106094360352, 10.02553939819336, 10.573972702026367, 11.122406005859375, 11.670839309692383, 12.219273567199707, 12.767706871032715, 13.316139221191406, 13.864572525024414, 14.413005828857422, 14.96143913269043, 15.509872436523438, 16.058305740356445, 16.606739044189453, 17.155174255371094, 17.70360565185547, 18.252038955688477, 18.800472259521484, 19.348905563354492, 19.8973388671875, 20.445772171020508, 20.994205474853516, 21.542640686035156, 22.091073989868164, 22.639507293701172, 23.18794059753418, 23.736373901367188, 24.284807205200195, 24.833240509033203, 25.38167381286621, 25.93010711669922, 26.47854232788086, 27.026975631713867, 27.575408935546875, 28.123842239379883, 28.67227554321289, 29.2207088470459, 29.769142150878906, 30.317577362060547, 30.866008758544922]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 4.0, 3.0, 3.0, 5.0, 4.0, 10.0, 5.0, 9.0, 9.0, 10.0, 13.0, 7.0, 20.0, 27.0, 18.0, 23.0, 29.0, 34.0, 33.0, 38.0, 40.0, 36.0, 30.0, 34.0, 38.0, 55.0, 37.0, 36.0, 44.0, 31.0, 34.0, 40.0, 27.0, 24.0, 23.0, 20.0, 17.0, 24.0, 20.0, 13.0, 16.0, 12.0, 5.0, 7.0, 9.0, 9.0, 5.0, 8.0, 2.0, 4.0, 3.0, 3.0, 1.0, 3.0], "bins": [-5.967244625091553, -5.800583839416504, -5.633923530578613, -5.4672627449035645, -5.300602436065674, -5.133941650390625, -4.967281341552734, -4.8006205558776855, -4.633959770202637, -4.467298984527588, -4.300638675689697, -4.133977890014648, -3.9673173427581787, -3.800656795501709, -3.6339962482452393, -3.4673357009887695, -3.3006751537323, -3.13401460647583, -2.9673540592193604, -2.8006935119628906, -2.634032726287842, -2.467372179031372, -2.3007116317749023, -2.1340508460998535, -1.9673904180526733, -1.8007298707962036, -1.6340692043304443, -1.4674086570739746, -1.3007481098175049, -1.1340874433517456, -0.9674268960952759, -0.8007662296295166, -0.6341056823730469, -0.4674450755119324, -0.30078449845314026, -0.13412392139434814, 0.03253668546676636, 0.19919729232788086, 0.3658578395843506, 0.5325185060501099, 0.6991790533065796, 0.8658396601676941, 1.0325002670288086, 1.1991608142852783, 1.365821361541748, 1.5324820280075073, 1.699142575263977, 1.8658032417297363, 2.032463788986206, 2.199124336242676, 2.3657848834991455, 2.5324454307556152, 2.699106216430664, 2.865766763687134, 3.0324273109436035, 3.1990880966186523, 3.365748405456543, 3.5324089527130127, 3.6990694999694824, 3.8657302856445312, 4.032390594482422, 4.199051380157471, 4.3657121658325195, 4.53237247467041, 4.699033260345459]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 5.0, 4.0, 7.0, 6.0, 16.0, 17.0, 28.0, 19.0, 39.0, 50.0, 76.0, 58.0, 111.0, 156.0, 284.0, 510.0, 1038.0, 2408.0, 6598.0, 23983.0, 126021.0, 798007.0, 2269360.0, 795141.0, 131666.0, 26974.0, 7144.0, 2432.0, 937.0, 437.0, 250.0, 158.0, 84.0, 54.0, 49.0, 27.0, 32.0, 17.0, 17.0, 12.0, 13.0, 14.0, 6.0, 4.0, 3.0, 4.0, 5.0, 2.0, 3.0, 0.0, 2.0, 1.0], "bins": [-3.455078125, -3.354949951171875, -3.25482177734375, -3.154693603515625, -3.0545654296875, -2.954437255859375, -2.85430908203125, -2.754180908203125, -2.654052734375, -2.553924560546875, -2.45379638671875, -2.353668212890625, -2.2535400390625, -2.153411865234375, -2.05328369140625, -1.953155517578125, -1.85302734375, -1.752899169921875, -1.65277099609375, -1.552642822265625, -1.4525146484375, -1.352386474609375, -1.25225830078125, -1.152130126953125, -1.052001953125, -0.951873779296875, -0.85174560546875, -0.751617431640625, -0.6514892578125, -0.551361083984375, -0.45123291015625, -0.351104736328125, -0.2509765625, -0.150848388671875, -0.05072021484375, 0.049407958984375, 0.1495361328125, 0.249664306640625, 0.34979248046875, 0.449920654296875, 0.550048828125, 0.650177001953125, 0.75030517578125, 0.850433349609375, 0.9505615234375, 1.050689697265625, 1.15081787109375, 1.250946044921875, 1.35107421875, 1.451202392578125, 1.55133056640625, 1.651458740234375, 1.7515869140625, 1.851715087890625, 1.95184326171875, 2.051971435546875, 2.152099609375, 2.252227783203125, 2.35235595703125, 2.452484130859375, 2.5526123046875, 2.652740478515625, 2.75286865234375, 2.852996826171875, 2.953125]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 3.0, 6.0, 5.0, 8.0, 14.0, 19.0, 22.0, 29.0, 35.0, 49.0, 47.0, 74.0, 68.0, 64.0, 87.0, 75.0, 61.0, 66.0, 45.0, 48.0, 50.0, 30.0, 24.0, 24.0, 15.0, 11.0, 17.0, 8.0, 4.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.283203125, -2.186981201171875, -2.09075927734375, -1.994537353515625, -1.8983154296875, -1.802093505859375, -1.70587158203125, -1.609649658203125, -1.513427734375, -1.417205810546875, -1.32098388671875, -1.224761962890625, -1.1285400390625, -1.032318115234375, -0.93609619140625, -0.839874267578125, -0.74365234375, -0.647430419921875, -0.55120849609375, -0.454986572265625, -0.3587646484375, -0.262542724609375, -0.16632080078125, -0.070098876953125, 0.026123046875, 0.122344970703125, 0.21856689453125, 0.314788818359375, 0.4110107421875, 0.507232666015625, 0.60345458984375, 0.699676513671875, 0.7958984375, 0.892120361328125, 0.98834228515625, 1.084564208984375, 1.1807861328125, 1.277008056640625, 1.37322998046875, 1.469451904296875, 1.565673828125, 1.661895751953125, 1.75811767578125, 1.854339599609375, 1.9505615234375, 2.046783447265625, 2.14300537109375, 2.239227294921875, 2.33544921875, 2.431671142578125, 2.52789306640625, 2.624114990234375, 2.7203369140625, 2.816558837890625, 2.91278076171875, 3.009002685546875, 3.105224609375, 3.201446533203125, 3.29766845703125, 3.393890380859375, 3.4901123046875, 3.586334228515625, 3.68255615234375, 3.778778076171875, 3.875]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 8.0, 0.0, 5.0, 8.0, 30.0, 38.0, 86.0, 144.0, 327.0, 900.0, 10572.0, 4126105.0, 53915.0, 1292.0, 429.0, 224.0, 80.0, 50.0, 19.0, 13.0, 7.0, 10.0, 8.0, 1.0, 3.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.28125, -17.7955322265625, -17.309814453125, -16.8240966796875, -16.33837890625, -15.8526611328125, -15.366943359375, -14.8812255859375, -14.3955078125, -13.9097900390625, -13.424072265625, -12.9383544921875, -12.45263671875, -11.9669189453125, -11.481201171875, -10.9954833984375, -10.509765625, -10.0240478515625, -9.538330078125, -9.0526123046875, -8.56689453125, -8.0811767578125, -7.595458984375, -7.1097412109375, -6.6240234375, -6.1383056640625, -5.652587890625, -5.1668701171875, -4.68115234375, -4.1954345703125, -3.709716796875, -3.2239990234375, -2.73828125, -2.2525634765625, -1.766845703125, -1.2811279296875, -0.79541015625, -0.3096923828125, 0.176025390625, 0.6617431640625, 1.1474609375, 1.6331787109375, 2.118896484375, 2.6046142578125, 3.09033203125, 3.5760498046875, 4.061767578125, 4.5474853515625, 5.033203125, 5.5189208984375, 6.004638671875, 6.4903564453125, 6.97607421875, 7.4617919921875, 7.947509765625, 8.4332275390625, 8.9189453125, 9.4046630859375, 9.890380859375, 10.3760986328125, 10.86181640625, 11.3475341796875, 11.833251953125, 12.3189697265625, 12.8046875]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 5.0, 6.0, 6.0, 14.0, 13.0, 21.0, 27.0, 45.0, 62.0, 100.0, 122.0, 175.0, 259.0, 347.0, 458.0, 548.0, 512.0, 406.0, 265.0, 204.0, 148.0, 89.0, 77.0, 55.0, 40.0, 26.0, 11.0, 4.0, 8.0, 6.0, 3.0, 3.0, 5.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.205078125, -1.1721267700195312, -1.1391754150390625, -1.1062240600585938, -1.073272705078125, -1.0403213500976562, -1.0073699951171875, -0.9744186401367188, -0.94146728515625, -0.9085159301757812, -0.8755645751953125, -0.8426132202148438, -0.809661865234375, -0.7767105102539062, -0.7437591552734375, -0.7108078002929688, -0.6778564453125, -0.6449050903320312, -0.6119537353515625, -0.5790023803710938, -0.546051025390625, -0.5130996704101562, -0.4801483154296875, -0.44719696044921875, -0.41424560546875, -0.38129425048828125, -0.3483428955078125, -0.31539154052734375, -0.282440185546875, -0.24948883056640625, -0.2165374755859375, -0.18358612060546875, -0.150634765625, -0.11768341064453125, -0.0847320556640625, -0.05178070068359375, -0.018829345703125, 0.01412200927734375, 0.0470733642578125, 0.08002471923828125, 0.11297607421875, 0.14592742919921875, 0.1788787841796875, 0.21183013916015625, 0.244781494140625, 0.27773284912109375, 0.3106842041015625, 0.34363555908203125, 0.3765869140625, 0.40953826904296875, 0.4424896240234375, 0.47544097900390625, 0.508392333984375, 0.5413436889648438, 0.5742950439453125, 0.6072463989257812, 0.64019775390625, 0.6731491088867188, 0.7061004638671875, 0.7390518188476562, 0.772003173828125, 0.8049545288085938, 0.8379058837890625, 0.8708572387695312, 0.90380859375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 7.0, 14.0, 30.0, 59.0, 82.0, 117.0, 147.0, 165.0, 131.0, 93.0, 65.0, 41.0, 19.0, 10.0, 8.0, 10.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9344077110290527, -3.730466604232788, -3.5265254974365234, -3.3225841522216797, -3.118643045425415, -2.9147019386291504, -2.7107605934143066, -2.506819486618042, -2.3028783798217773, -2.0989372730255127, -1.8949960470199585, -1.6910548210144043, -1.4871137142181396, -1.283172607421875, -1.0792313814163208, -0.8752901554107666, -0.671349048614502, -0.46740788221359253, -0.2634667158126831, -0.05952554941177368, 0.14441561698913574, 0.3483567237854004, 0.5522979497909546, 0.7562391757965088, 0.9601802825927734, 1.164121389389038, 1.3680626153945923, 1.5720038414001465, 1.7759449481964111, 1.9798860549926758, 2.1838274002075195, 2.387768507003784, 2.591710090637207, 2.7956511974334717, 2.9995923042297363, 3.20353364944458, 3.4074747562408447, 3.6114158630371094, 3.815357208251953, 4.019298553466797, 4.223239421844482, 4.427180767059326, 4.631121635437012, 4.8350629806518555, 5.039004325866699, 5.242945194244385, 5.4468865394592285, 5.650827407836914, 5.854768753051758, 6.058710098266602, 6.262650966644287, 6.466592311859131, 6.670533180236816, 6.87447452545166, 7.078415870666504, 7.282357215881348, 7.486298084259033, 7.690239429473877, 7.8941802978515625, 8.098121643066406, 8.30206298828125, 8.506004333496094, 8.709944725036621, 8.913886070251465, 9.117827415466309]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 5.0, 7.0, 7.0, 7.0, 17.0, 14.0, 15.0, 24.0, 21.0, 28.0, 38.0, 39.0, 48.0, 42.0, 61.0, 60.0, 45.0, 61.0, 72.0, 66.0, 54.0, 54.0, 37.0, 29.0, 40.0, 25.0, 18.0, 18.0, 16.0, 9.0, 13.0, 9.0, 3.0, 8.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7118377685546875, -2.6209635734558105, -2.5300893783569336, -2.4392151832580566, -2.3483409881591797, -2.2574665546417236, -2.1665923595428467, -2.0757181644439697, -1.9848439693450928, -1.8939697742462158, -1.8030955791473389, -1.7122212648391724, -1.6213470697402954, -1.5304728746414185, -1.439598560333252, -1.348724365234375, -1.257850170135498, -1.166975975036621, -1.0761017799377441, -0.9852274656295776, -0.8943532705307007, -0.8034790754318237, -0.712604820728302, -0.6217305660247803, -0.5308563709259033, -0.439982146024704, -0.34910792112350464, -0.2582336962223053, -0.16735947132110596, -0.07648524641990662, 0.014388978481292725, 0.10526323318481445, 0.1961374282836914, 0.28701165318489075, 0.3778858780860901, 0.46876010298728943, 0.5596343278884888, 0.6505085229873657, 0.7413827776908875, 0.8322570323944092, 0.9231312274932861, 1.014005422592163, 1.10487961769104, 1.1957539319992065, 1.2866281270980835, 1.3775023221969604, 1.468376636505127, 1.559250831604004, 1.6501250267028809, 1.7409992218017578, 1.8318734169006348, 1.9227477312088013, 2.0136218070983887, 2.1044962406158447, 2.1953704357147217, 2.2862446308135986, 2.3771188259124756, 2.4679930210113525, 2.5588672161102295, 2.6497414112091064, 2.7406158447265625, 2.8314900398254395, 2.9223642349243164, 3.0132384300231934, 3.1041126251220703]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 4.0, 11.0, 12.0, 15.0, 21.0, 32.0, 59.0, 100.0, 156.0, 304.0, 662.0, 1435.0, 3791.0, 13629.0, 76827.0, 427060.0, 427376.0, 76790.0, 13568.0, 3760.0, 1502.0, 681.0, 323.0, 191.0, 94.0, 58.0, 38.0, 16.0, 10.0, 10.0, 7.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.03125, -1.0017852783203125, -0.972320556640625, -0.9428558349609375, -0.91339111328125, -0.8839263916015625, -0.854461669921875, -0.8249969482421875, -0.7955322265625, -0.7660675048828125, -0.736602783203125, -0.7071380615234375, -0.67767333984375, -0.6482086181640625, -0.618743896484375, -0.5892791748046875, -0.559814453125, -0.5303497314453125, -0.500885009765625, -0.4714202880859375, -0.44195556640625, -0.4124908447265625, -0.383026123046875, -0.3535614013671875, -0.3240966796875, -0.2946319580078125, -0.265167236328125, -0.2357025146484375, -0.20623779296875, -0.1767730712890625, -0.147308349609375, -0.1178436279296875, -0.08837890625, -0.0589141845703125, -0.029449462890625, 1.52587890625e-05, 0.02947998046875, 0.0589447021484375, 0.088409423828125, 0.1178741455078125, 0.1473388671875, 0.1768035888671875, 0.206268310546875, 0.2357330322265625, 0.26519775390625, 0.2946624755859375, 0.324127197265625, 0.3535919189453125, 0.383056640625, 0.4125213623046875, 0.441986083984375, 0.4714508056640625, 0.50091552734375, 0.5303802490234375, 0.559844970703125, 0.5893096923828125, 0.6187744140625, 0.6482391357421875, 0.677703857421875, 0.7071685791015625, 0.73663330078125, 0.7660980224609375, 0.795562744140625, 0.8250274658203125, 0.8544921875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 3.0, 13.0, 19.0, 15.0, 26.0, 28.0, 36.0, 44.0, 59.0, 77.0, 74.0, 102.0, 74.0, 78.0, 78.0, 60.0, 64.0, 41.0, 30.0, 27.0, 15.0, 20.0, 11.0, 7.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.255859375, -2.178436279296875, -2.10101318359375, -2.023590087890625, -1.9461669921875, -1.868743896484375, -1.79132080078125, -1.713897705078125, -1.636474609375, -1.559051513671875, -1.48162841796875, -1.404205322265625, -1.3267822265625, -1.249359130859375, -1.17193603515625, -1.094512939453125, -1.01708984375, -0.939666748046875, -0.86224365234375, -0.784820556640625, -0.7073974609375, -0.629974365234375, -0.55255126953125, -0.475128173828125, -0.397705078125, -0.320281982421875, -0.24285888671875, -0.165435791015625, -0.0880126953125, -0.010589599609375, 0.06683349609375, 0.144256591796875, 0.2216796875, 0.299102783203125, 0.37652587890625, 0.453948974609375, 0.5313720703125, 0.608795166015625, 0.68621826171875, 0.763641357421875, 0.841064453125, 0.918487548828125, 0.99591064453125, 1.073333740234375, 1.1507568359375, 1.228179931640625, 1.30560302734375, 1.383026123046875, 1.46044921875, 1.537872314453125, 1.61529541015625, 1.692718505859375, 1.7701416015625, 1.847564697265625, 1.92498779296875, 2.002410888671875, 2.079833984375, 2.157257080078125, 2.23468017578125, 2.312103271484375, 2.3895263671875, 2.466949462890625, 2.54437255859375, 2.621795654296875, 2.69921875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 10.0, 5.0, 10.0, 13.0, 16.0, 21.0, 27.0, 55.0, 87.0, 130.0, 206.0, 398.0, 758.0, 1451.0, 3058.0, 6839.0, 16519.0, 41291.0, 97446.0, 198379.0, 274444.0, 214882.0, 111151.0, 47042.0, 19337.0, 7933.0, 3465.0, 1672.0, 793.0, 413.0, 253.0, 155.0, 96.0, 62.0, 40.0, 23.0, 24.0, 13.0, 18.0, 6.0, 4.0, 2.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.307373046875, -0.297637939453125, -0.28790283203125, -0.278167724609375, -0.2684326171875, -0.258697509765625, -0.24896240234375, -0.239227294921875, -0.2294921875, -0.219757080078125, -0.21002197265625, -0.200286865234375, -0.1905517578125, -0.180816650390625, -0.17108154296875, -0.161346435546875, -0.151611328125, -0.141876220703125, -0.13214111328125, -0.122406005859375, -0.1126708984375, -0.102935791015625, -0.09320068359375, -0.083465576171875, -0.07373046875, -0.063995361328125, -0.05426025390625, -0.044525146484375, -0.0347900390625, -0.025054931640625, -0.01531982421875, -0.005584716796875, 0.004150390625, 0.013885498046875, 0.02362060546875, 0.033355712890625, 0.0430908203125, 0.052825927734375, 0.06256103515625, 0.072296142578125, 0.08203125, 0.091766357421875, 0.10150146484375, 0.111236572265625, 0.1209716796875, 0.130706787109375, 0.14044189453125, 0.150177001953125, 0.159912109375, 0.169647216796875, 0.17938232421875, 0.189117431640625, 0.1988525390625, 0.208587646484375, 0.21832275390625, 0.228057861328125, 0.23779296875, 0.247528076171875, 0.25726318359375, 0.266998291015625, 0.2767333984375, 0.286468505859375, 0.29620361328125, 0.305938720703125, 0.315673828125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 2.0, 4.0, 3.0, 4.0, 11.0, 10.0, 8.0, 5.0, 14.0, 19.0, 21.0, 25.0, 28.0, 37.0, 28.0, 46.0, 44.0, 47.0, 35.0, 62.0, 53.0, 47.0, 55.0, 54.0, 44.0, 52.0, 31.0, 31.0, 32.0, 19.0, 22.0, 26.0, 16.0, 13.0, 13.0, 15.0, 9.0, 4.0, 6.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-2.673828125, -2.595855712890625, -2.51788330078125, -2.439910888671875, -2.3619384765625, -2.283966064453125, -2.20599365234375, -2.128021240234375, -2.050048828125, -1.972076416015625, -1.89410400390625, -1.816131591796875, -1.7381591796875, -1.660186767578125, -1.58221435546875, -1.504241943359375, -1.42626953125, -1.348297119140625, -1.27032470703125, -1.192352294921875, -1.1143798828125, -1.036407470703125, -0.95843505859375, -0.880462646484375, -0.802490234375, -0.724517822265625, -0.64654541015625, -0.568572998046875, -0.4906005859375, -0.412628173828125, -0.33465576171875, -0.256683349609375, -0.1787109375, -0.100738525390625, -0.02276611328125, 0.055206298828125, 0.1331787109375, 0.211151123046875, 0.28912353515625, 0.367095947265625, 0.445068359375, 0.523040771484375, 0.60101318359375, 0.678985595703125, 0.7569580078125, 0.834930419921875, 0.91290283203125, 0.990875244140625, 1.06884765625, 1.146820068359375, 1.22479248046875, 1.302764892578125, 1.3807373046875, 1.458709716796875, 1.53668212890625, 1.614654541015625, 1.692626953125, 1.770599365234375, 1.84857177734375, 1.926544189453125, 2.0045166015625, 2.082489013671875, 2.16046142578125, 2.238433837890625, 2.31640625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 2.0, 9.0, 10.0, 18.0, 22.0, 26.0, 56.0, 84.0, 110.0, 157.0, 325.0, 488.0, 1006.0, 1799.0, 3497.0, 7378.0, 15551.0, 35507.0, 86277.0, 217336.0, 339222.0, 199765.0, 78693.0, 32786.0, 14606.0, 6668.0, 3276.0, 1631.0, 925.0, 526.0, 284.0, 176.0, 123.0, 67.0, 51.0, 28.0, 21.0, 15.0, 13.0, 11.0, 8.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.050537109375, -0.04882097244262695, -0.047104835510253906, -0.04538869857788086, -0.04367256164550781, -0.041956424713134766, -0.04024028778076172, -0.03852415084838867, -0.036808013916015625, -0.03509187698364258, -0.03337574005126953, -0.031659603118896484, -0.029943466186523438, -0.02822732925415039, -0.026511192321777344, -0.024795055389404297, -0.02307891845703125, -0.021362781524658203, -0.019646644592285156, -0.01793050765991211, -0.016214370727539062, -0.014498233795166016, -0.012782096862792969, -0.011065959930419922, -0.009349822998046875, -0.007633686065673828, -0.005917549133300781, -0.004201412200927734, -0.0024852752685546875, -0.0007691383361816406, 0.0009469985961914062, 0.002663135528564453, 0.0043792724609375, 0.006095409393310547, 0.007811546325683594, 0.00952768325805664, 0.011243820190429688, 0.012959957122802734, 0.014676094055175781, 0.016392230987548828, 0.018108367919921875, 0.019824504852294922, 0.02154064178466797, 0.023256778717041016, 0.024972915649414062, 0.02668905258178711, 0.028405189514160156, 0.030121326446533203, 0.03183746337890625, 0.0335536003112793, 0.035269737243652344, 0.03698587417602539, 0.03870201110839844, 0.040418148040771484, 0.04213428497314453, 0.04385042190551758, 0.045566558837890625, 0.04728269577026367, 0.04899883270263672, 0.050714969635009766, 0.05243110656738281, 0.05414724349975586, 0.055863380432128906, 0.05757951736450195, 0.059295654296875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 8.0, 11.0, 13.0, 30.0, 55.0, 98.0, 203.0, 233.0, 162.0, 96.0, 57.0, 25.0, 8.0, 8.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.6862831115722656e-05, -5.2304938435554504e-05, -4.774704575538635e-05, -4.31891530752182e-05, -3.863126039505005e-05, -3.40733677148819e-05, -2.9515475034713745e-05, -2.4957582354545593e-05, -2.039968967437744e-05, -1.584179699420929e-05, -1.1283904314041138e-05, -6.726011633872986e-06, -2.168118953704834e-06, 2.389773726463318e-06, 6.94766640663147e-06, 1.1505559086799622e-05, 1.6063451766967773e-05, 2.0621344447135925e-05, 2.5179237127304077e-05, 2.973712980747223e-05, 3.429502248764038e-05, 3.885291516780853e-05, 4.3410807847976685e-05, 4.7968700528144836e-05, 5.252659320831299e-05, 5.708448588848114e-05, 6.164237856864929e-05, 6.620027124881744e-05, 7.07581639289856e-05, 7.531605660915375e-05, 7.98739492893219e-05, 8.443184196949005e-05, 8.89897346496582e-05, 9.354762732982635e-05, 9.810552000999451e-05, 0.00010266341269016266, 0.00010722130537033081, 0.00011177919805049896, 0.00011633709073066711, 0.00012089498341083527, 0.00012545287609100342, 0.00013001076877117157, 0.00013456866145133972, 0.00013912655413150787, 0.00014368444681167603, 0.00014824233949184418, 0.00015280023217201233, 0.00015735812485218048, 0.00016191601753234863, 0.00016647391021251678, 0.00017103180289268494, 0.0001755896955728531, 0.00018014758825302124, 0.0001847054809331894, 0.00018926337361335754, 0.0001938212662935257, 0.00019837915897369385, 0.000202937051653862, 0.00020749494433403015, 0.0002120528370141983, 0.00021661072969436646, 0.0002211686223745346, 0.00022572651505470276, 0.0002302844077348709, 0.00023484230041503906]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 7.0, 6.0, 14.0, 26.0, 26.0, 51.0, 71.0, 123.0, 251.0, 726.0, 2582.0, 12766.0, 91581.0, 684731.0, 223572.0, 25615.0, 4479.0, 1143.0, 384.0, 181.0, 93.0, 47.0, 25.0, 18.0, 15.0, 10.0, 6.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1683349609375, -0.1630229949951172, -0.15771102905273438, -0.15239906311035156, -0.14708709716796875, -0.14177513122558594, -0.13646316528320312, -0.1311511993408203, -0.1258392333984375, -0.12052726745605469, -0.11521530151367188, -0.10990333557128906, -0.10459136962890625, -0.09927940368652344, -0.09396743774414062, -0.08865547180175781, -0.083343505859375, -0.07803153991699219, -0.07271957397460938, -0.06740760803222656, -0.06209564208984375, -0.05678367614746094, -0.051471710205078125, -0.04615974426269531, -0.0408477783203125, -0.03553581237792969, -0.030223846435546875, -0.024911880493164062, -0.01959991455078125, -0.014287948608398438, -0.008975982666015625, -0.0036640167236328125, 0.00164794921875, 0.0069599151611328125, 0.012271881103515625, 0.017583847045898438, 0.02289581298828125, 0.028207778930664062, 0.033519744873046875, 0.03883171081542969, 0.0441436767578125, 0.04945564270019531, 0.054767608642578125, 0.06007957458496094, 0.06539154052734375, 0.07070350646972656, 0.07601547241210938, 0.08132743835449219, 0.086639404296875, 0.09195137023925781, 0.09726333618164062, 0.10257530212402344, 0.10788726806640625, 0.11319923400878906, 0.11851119995117188, 0.12382316589355469, 0.1291351318359375, 0.1344470977783203, 0.13975906372070312, 0.14507102966308594, 0.15038299560546875, 0.15569496154785156, 0.16100692749023438, 0.1663188934326172, 0.171630859375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 6.0, 11.0, 10.0, 13.0, 15.0, 21.0, 17.0, 24.0, 31.0, 41.0, 59.0, 71.0, 85.0, 95.0, 83.0, 83.0, 81.0, 58.0, 42.0, 31.0, 23.0, 21.0, 25.0, 10.0, 16.0, 3.0, 9.0, 8.0, 4.0, 4.0, 3.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.018829345703125, -0.01824045181274414, -0.01765155792236328, -0.017062664031982422, -0.016473770141601562, -0.015884876251220703, -0.015295982360839844, -0.014707088470458984, -0.014118194580078125, -0.013529300689697266, -0.012940406799316406, -0.012351512908935547, -0.011762619018554688, -0.011173725128173828, -0.010584831237792969, -0.00999593734741211, -0.00940704345703125, -0.00881814956665039, -0.008229255676269531, -0.007640361785888672, -0.0070514678955078125, -0.006462574005126953, -0.005873680114746094, -0.005284786224365234, -0.004695892333984375, -0.004106998443603516, -0.0035181045532226562, -0.002929210662841797, -0.0023403167724609375, -0.0017514228820800781, -0.0011625289916992188, -0.0005736351013183594, 1.52587890625e-05, 0.0006041526794433594, 0.0011930465698242188, 0.0017819404602050781, 0.0023708343505859375, 0.002959728240966797, 0.0035486221313476562, 0.004137516021728516, 0.004726409912109375, 0.005315303802490234, 0.005904197692871094, 0.006493091583251953, 0.0070819854736328125, 0.007670879364013672, 0.008259773254394531, 0.00884866714477539, 0.00943756103515625, 0.01002645492553711, 0.010615348815917969, 0.011204242706298828, 0.011793136596679688, 0.012382030487060547, 0.012970924377441406, 0.013559818267822266, 0.014148712158203125, 0.014737606048583984, 0.015326499938964844, 0.015915393829345703, 0.016504287719726562, 0.017093181610107422, 0.01768207550048828, 0.01827096939086914, 0.01885986328125]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 6.0, 6.0, 17.0, 23.0, 66.0, 114.0, 165.0, 195.0, 174.0, 109.0, 58.0, 33.0, 13.0, 12.0, 4.0, 3.0, 8.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1353538036346436, -2.9968111515045166, -2.8582684993743896, -2.7197258472442627, -2.581183433532715, -2.442640781402588, -2.304098129272461, -2.165555477142334, -2.027012825012207, -1.88847017288208, -1.7499275207519531, -1.6113849878311157, -1.4728423357009888, -1.3342996835708618, -1.1957571506500244, -1.0572144985198975, -0.9186718463897705, -0.7801291942596436, -0.6415866017341614, -0.5030440092086792, -0.36450135707855225, -0.2259587049484253, -0.08741611242294312, 0.05112648010253906, 0.18966913223266602, 0.3282117545604706, 0.46675437688827515, 0.6052969694137573, 0.7438396215438843, 0.8823822736740112, 1.0209248065948486, 1.1594674587249756, 1.2980103492736816, 1.4365530014038086, 1.5750956535339355, 1.713638186454773, 1.8521808385849, 1.9907234907150269, 2.1292660236358643, 2.267808675765991, 2.406351327896118, 2.544893980026245, 2.683436632156372, 2.821979284286499, 2.960521697998047, 3.099064350128174, 3.237607002258301, 3.3761496543884277, 3.5146923065185547, 3.6532349586486816, 3.7917776107788086, 3.9303202629089355, 4.0688629150390625, 4.2074055671691895, 4.345948219299316, 4.484490394592285, 4.62303352355957, 4.761576175689697, 4.900118827819824, 5.038661479949951, 5.177204132080078, 5.315746784210205, 5.454289436340332, 5.592831611633301, 5.731374263763428]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 1.0, 5.0, 8.0, 7.0, 10.0, 11.0, 19.0, 18.0, 23.0, 29.0, 37.0, 45.0, 55.0, 52.0, 73.0, 54.0, 63.0, 91.0, 78.0, 58.0, 59.0, 42.0, 35.0, 37.0, 21.0, 21.0, 18.0, 14.0, 9.0, 6.0, 6.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4924906492233276, -1.4316776990890503, -1.3708648681640625, -1.3100519180297852, -1.2492389678955078, -1.1884260177612305, -1.1276130676269531, -1.0668002367019653, -1.005987286567688, -0.9451743364334106, -0.8843614459037781, -0.8235485553741455, -0.7627356052398682, -0.7019226551055908, -0.6411097645759583, -0.5802968740463257, -0.5194839239120483, -0.4586710035800934, -0.3978580832481384, -0.33704516291618347, -0.2762322425842285, -0.21541932225227356, -0.1546064019203186, -0.09379348158836365, -0.03298056125640869, 0.027832359075546265, 0.08864527940750122, 0.14945819973945618, 0.21027112007141113, 0.2710840404033661, 0.33189696073532104, 0.392709881067276, 0.4535226821899414, 0.5143356323242188, 0.5751485228538513, 0.6359614133834839, 0.6967743635177612, 0.7575873136520386, 0.8184002041816711, 0.8792130947113037, 0.940026044845581, 1.0008389949798584, 1.0616519451141357, 1.1224647760391235, 1.1832777261734009, 1.2440906763076782, 1.304903507232666, 1.3657164573669434, 1.4265294075012207, 1.487342357635498, 1.5481553077697754, 1.6089681386947632, 1.6697810888290405, 1.7305940389633179, 1.7914068698883057, 1.852219820022583, 1.9130327701568604, 1.9738457202911377, 2.034658670425415, 2.0954716205596924, 2.1562843322753906, 2.217097282409668, 2.2779102325439453, 2.3387231826782227, 2.3995361328125]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 2.0, 7.0, 8.0, 14.0, 26.0, 29.0, 42.0, 57.0, 95.0, 206.0, 307.0, 537.0, 856.0, 1747.0, 3681.0, 7167.0, 15532.0, 36859.0, 94162.0, 244345.0, 355018.0, 173339.0, 65332.0, 26368.0, 11569.0, 5416.0, 2672.0, 1317.0, 759.0, 442.0, 247.0, 133.0, 86.0, 52.0, 42.0, 21.0, 18.0, 21.0, 7.0, 10.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.328125, -1.2882537841796875, -1.248382568359375, -1.2085113525390625, -1.16864013671875, -1.1287689208984375, -1.088897705078125, -1.0490264892578125, -1.0091552734375, -0.9692840576171875, -0.929412841796875, -0.8895416259765625, -0.84967041015625, -0.8097991943359375, -0.769927978515625, -0.7300567626953125, -0.690185546875, -0.6503143310546875, -0.610443115234375, -0.5705718994140625, -0.53070068359375, -0.4908294677734375, -0.450958251953125, -0.4110870361328125, -0.3712158203125, -0.3313446044921875, -0.291473388671875, -0.2516021728515625, -0.21173095703125, -0.1718597412109375, -0.131988525390625, -0.0921173095703125, -0.05224609375, -0.0123748779296875, 0.027496337890625, 0.0673675537109375, 0.10723876953125, 0.1471099853515625, 0.186981201171875, 0.2268524169921875, 0.2667236328125, 0.3065948486328125, 0.346466064453125, 0.3863372802734375, 0.42620849609375, 0.4660797119140625, 0.505950927734375, 0.5458221435546875, 0.585693359375, 0.6255645751953125, 0.665435791015625, 0.7053070068359375, 0.74517822265625, 0.7850494384765625, 0.824920654296875, 0.8647918701171875, 0.9046630859375, 0.9445343017578125, 0.984405517578125, 1.0242767333984375, 1.06414794921875, 1.1040191650390625, 1.143890380859375, 1.1837615966796875, 1.2236328125]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 3.0, 6.0, 11.0, 9.0, 12.0, 15.0, 26.0, 26.0, 21.0, 33.0, 45.0, 51.0, 72.0, 62.0, 79.0, 68.0, 80.0, 61.0, 56.0, 55.0, 44.0, 37.0, 27.0, 30.0, 15.0, 22.0, 17.0, 9.0, 6.0, 6.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.08203125, -2.956298828125, -2.83056640625, -2.704833984375, -2.5791015625, -2.453369140625, -2.32763671875, -2.201904296875, -2.076171875, -1.950439453125, -1.82470703125, -1.698974609375, -1.5732421875, -1.447509765625, -1.32177734375, -1.196044921875, -1.0703125, -0.944580078125, -0.81884765625, -0.693115234375, -0.5673828125, -0.441650390625, -0.31591796875, -0.190185546875, -0.064453125, 0.061279296875, 0.18701171875, 0.312744140625, 0.4384765625, 0.564208984375, 0.68994140625, 0.815673828125, 0.94140625, 1.067138671875, 1.19287109375, 1.318603515625, 1.4443359375, 1.570068359375, 1.69580078125, 1.821533203125, 1.947265625, 2.072998046875, 2.19873046875, 2.324462890625, 2.4501953125, 2.575927734375, 2.70166015625, 2.827392578125, 2.953125, 3.078857421875, 3.20458984375, 3.330322265625, 3.4560546875, 3.581787109375, 3.70751953125, 3.833251953125, 3.958984375, 4.084716796875, 4.21044921875, 4.336181640625, 4.4619140625, 4.587646484375, 4.71337890625, 4.839111328125, 4.96484375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 8.0, 3.0, 6.0, 9.0, 6.0, 13.0, 10.0, 13.0, 17.0, 17.0, 14.0, 26.0, 33.0, 20.0, 40.0, 39.0, 49.0, 76.0, 163.0, 578.0, 21767.0, 1019576.0, 5210.0, 373.0, 119.0, 69.0, 39.0, 34.0, 38.0, 28.0, 21.0, 23.0, 18.0, 23.0, 12.0, 10.0, 14.0, 10.0, 6.0, 6.0, 7.0, 4.0, 5.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.9296875, -10.5699462890625, -10.210205078125, -9.8504638671875, -9.49072265625, -9.1309814453125, -8.771240234375, -8.4114990234375, -8.0517578125, -7.6920166015625, -7.332275390625, -6.9725341796875, -6.61279296875, -6.2530517578125, -5.893310546875, -5.5335693359375, -5.173828125, -4.8140869140625, -4.454345703125, -4.0946044921875, -3.73486328125, -3.3751220703125, -3.015380859375, -2.6556396484375, -2.2958984375, -1.9361572265625, -1.576416015625, -1.2166748046875, -0.85693359375, -0.4971923828125, -0.137451171875, 0.2222900390625, 0.58203125, 0.9417724609375, 1.301513671875, 1.6612548828125, 2.02099609375, 2.3807373046875, 2.740478515625, 3.1002197265625, 3.4599609375, 3.8197021484375, 4.179443359375, 4.5391845703125, 4.89892578125, 5.2586669921875, 5.618408203125, 5.9781494140625, 6.337890625, 6.6976318359375, 7.057373046875, 7.4171142578125, 7.77685546875, 8.1365966796875, 8.496337890625, 8.8560791015625, 9.2158203125, 9.5755615234375, 9.935302734375, 10.2950439453125, 10.65478515625, 11.0145263671875, 11.374267578125, 11.7340087890625, 12.09375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 1.0, 5.0, 2.0, 11.0, 9.0, 10.0, 14.0, 8.0, 18.0, 17.0, 20.0, 24.0, 21.0, 27.0, 22.0, 42.0, 51.0, 30.0, 32.0, 52.0, 40.0, 42.0, 56.0, 45.0, 37.0, 42.0, 38.0, 38.0, 29.0, 34.0, 16.0, 29.0, 27.0, 19.0, 12.0, 15.0, 20.0, 11.0, 5.0, 5.0, 6.0, 9.0, 6.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.7890625, -2.698822021484375, -2.60858154296875, -2.518341064453125, -2.4281005859375, -2.337860107421875, -2.24761962890625, -2.157379150390625, -2.067138671875, -1.976898193359375, -1.88665771484375, -1.796417236328125, -1.7061767578125, -1.615936279296875, -1.52569580078125, -1.435455322265625, -1.34521484375, -1.254974365234375, -1.16473388671875, -1.074493408203125, -0.9842529296875, -0.894012451171875, -0.80377197265625, -0.713531494140625, -0.623291015625, -0.533050537109375, -0.44281005859375, -0.352569580078125, -0.2623291015625, -0.172088623046875, -0.08184814453125, 0.008392333984375, 0.0986328125, 0.188873291015625, 0.27911376953125, 0.369354248046875, 0.4595947265625, 0.549835205078125, 0.64007568359375, 0.730316162109375, 0.820556640625, 0.910797119140625, 1.00103759765625, 1.091278076171875, 1.1815185546875, 1.271759033203125, 1.36199951171875, 1.452239990234375, 1.54248046875, 1.632720947265625, 1.72296142578125, 1.813201904296875, 1.9034423828125, 1.993682861328125, 2.08392333984375, 2.174163818359375, 2.264404296875, 2.354644775390625, 2.44488525390625, 2.535125732421875, 2.6253662109375, 2.715606689453125, 2.80584716796875, 2.896087646484375, 2.986328125]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 4.0, 4.0, 7.0, 11.0, 15.0, 12.0, 40.0, 64.0, 135.0, 314.0, 1108.0, 6712.0, 189888.0, 821837.0, 25069.0, 2336.0, 588.0, 212.0, 90.0, 50.0, 20.0, 12.0, 11.0, 6.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.30078125, -2.246307373046875, -2.19183349609375, -2.137359619140625, -2.0828857421875, -2.028411865234375, -1.97393798828125, -1.919464111328125, -1.864990234375, -1.810516357421875, -1.75604248046875, -1.701568603515625, -1.6470947265625, -1.592620849609375, -1.53814697265625, -1.483673095703125, -1.42919921875, -1.374725341796875, -1.32025146484375, -1.265777587890625, -1.2113037109375, -1.156829833984375, -1.10235595703125, -1.047882080078125, -0.993408203125, -0.938934326171875, -0.88446044921875, -0.829986572265625, -0.7755126953125, -0.721038818359375, -0.66656494140625, -0.612091064453125, -0.5576171875, -0.503143310546875, -0.44866943359375, -0.394195556640625, -0.3397216796875, -0.285247802734375, -0.23077392578125, -0.176300048828125, -0.121826171875, -0.067352294921875, -0.01287841796875, 0.041595458984375, 0.0960693359375, 0.150543212890625, 0.20501708984375, 0.259490966796875, 0.31396484375, 0.368438720703125, 0.42291259765625, 0.477386474609375, 0.5318603515625, 0.586334228515625, 0.64080810546875, 0.695281982421875, 0.749755859375, 0.804229736328125, 0.85870361328125, 0.913177490234375, 0.9676513671875, 1.022125244140625, 1.07659912109375, 1.131072998046875, 1.185546875]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 4.0, 6.0, 5.0, 14.0, 15.0, 20.0, 39.0, 47.0, 89.0, 111.0, 128.0, 118.0, 119.0, 83.0, 63.0, 45.0, 30.0, 27.0, 18.0, 13.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013446807861328125, -0.00012985989451408386, -0.00012525171041488647, -0.00012064352631568909, -0.0001160353422164917, -0.00011142715811729431, -0.00010681897401809692, -0.00010221078991889954, -9.760260581970215e-05, -9.299442172050476e-05, -8.838623762130737e-05, -8.377805352210999e-05, -7.91698694229126e-05, -7.456168532371521e-05, -6.995350122451782e-05, -6.534531712532043e-05, -6.073713302612305e-05, -5.612894892692566e-05, -5.152076482772827e-05, -4.6912580728530884e-05, -4.2304396629333496e-05, -3.769621253013611e-05, -3.308802843093872e-05, -2.8479844331741333e-05, -2.3871660232543945e-05, -1.9263476133346558e-05, -1.465529203414917e-05, -1.0047107934951782e-05, -5.4389238357543945e-06, -8.307397365570068e-07, 3.777444362640381e-06, 8.385628461837769e-06, 1.2993812561035156e-05, 1.7601996660232544e-05, 2.221018075942993e-05, 2.681836485862732e-05, 3.142654895782471e-05, 3.6034733057022095e-05, 4.064291715621948e-05, 4.525110125541687e-05, 4.985928535461426e-05, 5.4467469453811646e-05, 5.907565355300903e-05, 6.368383765220642e-05, 6.829202175140381e-05, 7.29002058506012e-05, 7.750838994979858e-05, 8.211657404899597e-05, 8.672475814819336e-05, 9.133294224739075e-05, 9.594112634658813e-05, 0.00010054931044578552, 0.00010515749454498291, 0.0001097656786441803, 0.00011437386274337769, 0.00011898204684257507, 0.00012359023094177246, 0.00012819841504096985, 0.00013280659914016724, 0.00013741478323936462, 0.000142022967338562, 0.0001466311514377594, 0.0001512393355369568, 0.00015584751963615417, 0.00016045570373535156]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 6.0, 1.0, 8.0, 6.0, 20.0, 20.0, 49.0, 87.0, 186.0, 526.0, 2252.0, 22916.0, 752570.0, 259230.0, 8694.0, 1317.0, 361.0, 153.0, 64.0, 36.0, 21.0, 19.0, 10.0, 4.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.107421875, -2.05450439453125, -2.0015869140625, -1.94866943359375, -1.895751953125, -1.84283447265625, -1.7899169921875, -1.73699951171875, -1.68408203125, -1.63116455078125, -1.5782470703125, -1.52532958984375, -1.472412109375, -1.41949462890625, -1.3665771484375, -1.31365966796875, -1.2607421875, -1.20782470703125, -1.1549072265625, -1.10198974609375, -1.049072265625, -0.99615478515625, -0.9432373046875, -0.89031982421875, -0.83740234375, -0.78448486328125, -0.7315673828125, -0.67864990234375, -0.625732421875, -0.57281494140625, -0.5198974609375, -0.46697998046875, -0.4140625, -0.36114501953125, -0.3082275390625, -0.25531005859375, -0.202392578125, -0.14947509765625, -0.0965576171875, -0.04364013671875, 0.00927734375, 0.06219482421875, 0.1151123046875, 0.16802978515625, 0.220947265625, 0.27386474609375, 0.3267822265625, 0.37969970703125, 0.4326171875, 0.48553466796875, 0.5384521484375, 0.59136962890625, 0.644287109375, 0.69720458984375, 0.7501220703125, 0.80303955078125, 0.85595703125, 0.90887451171875, 0.9617919921875, 1.01470947265625, 1.067626953125, 1.12054443359375, 1.1734619140625, 1.22637939453125, 1.279296875]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 7.0, 16.0, 20.0, 55.0, 113.0, 160.0, 234.0, 164.0, 96.0, 58.0, 43.0, 20.0, 6.0, 5.0, 5.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.39208984375, -0.37094879150390625, -0.3498077392578125, -0.32866668701171875, -0.307525634765625, -0.28638458251953125, -0.2652435302734375, -0.24410247802734375, -0.22296142578125, -0.20182037353515625, -0.1806793212890625, -0.15953826904296875, -0.138397216796875, -0.11725616455078125, -0.0961151123046875, -0.07497406005859375, -0.0538330078125, -0.03269195556640625, -0.0115509033203125, 0.00959014892578125, 0.030731201171875, 0.05187225341796875, 0.0730133056640625, 0.09415435791015625, 0.11529541015625, 0.13643646240234375, 0.1575775146484375, 0.17871856689453125, 0.199859619140625, 0.22100067138671875, 0.2421417236328125, 0.26328277587890625, 0.284423828125, 0.30556488037109375, 0.3267059326171875, 0.34784698486328125, 0.368988037109375, 0.39012908935546875, 0.4112701416015625, 0.43241119384765625, 0.45355224609375, 0.47469329833984375, 0.4958343505859375, 0.5169754028320312, 0.538116455078125, 0.5592575073242188, 0.5803985595703125, 0.6015396118164062, 0.6226806640625, 0.6438217163085938, 0.6649627685546875, 0.6861038208007812, 0.707244873046875, 0.7283859252929688, 0.7495269775390625, 0.7706680297851562, 0.79180908203125, 0.8129501342773438, 0.8340911865234375, 0.8552322387695312, 0.876373291015625, 0.8975143432617188, 0.9186553955078125, 0.9397964477539062, 0.9609375]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 3.0, 5.0, 3.0, 6.0, 9.0, 23.0, 37.0, 66.0, 112.0, 174.0, 163.0, 144.0, 96.0, 74.0, 32.0, 22.0, 18.0, 5.0, 4.0, 5.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3319878578186035, -4.098165035247803, -3.8643417358398438, -3.630518913269043, -3.396695613861084, -3.162872791290283, -2.9290497303009033, -2.6952266693115234, -2.4614036083221436, -2.2275805473327637, -1.9937574863433838, -1.7599345445632935, -1.5261114835739136, -1.2922884225845337, -1.0584654808044434, -0.8246424198150635, -0.5908193588256836, -0.3569963276386261, -0.1231732964515686, 0.1106497049331665, 0.3444727659225464, 0.5782958269119263, 0.8121187686920166, 1.0459418296813965, 1.2797648906707764, 1.5135879516601562, 1.7474110126495361, 1.9812339544296265, 2.215056896209717, 2.448880195617676, 2.6827030181884766, 2.9165260791778564, 3.1503496170043945, 3.3841726779937744, 3.6179957389831543, 3.851818561553955, 4.085641860961914, 4.319464683532715, 4.553287506103516, 4.787110805511475, 5.020934104919434, 5.254756927490234, 5.488580226898193, 5.722403049468994, 5.956226348876953, 6.190049171447754, 6.423871994018555, 6.657695293426514, 6.8915181159973145, 7.125340938568115, 7.359164237976074, 7.592987060546875, 7.826810359954834, 8.060633659362793, 8.294456481933594, 8.528279304504395, 8.762102127075195, 8.995924949645996, 9.229747772216797, 9.463571548461914, 9.697394371032715, 9.931217193603516, 10.165040016174316, 10.398862838745117, 10.632686614990234]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 0.0, 2.0, 8.0, 3.0, 7.0, 6.0, 9.0, 12.0, 18.0, 10.0, 22.0, 26.0, 23.0, 18.0, 27.0, 30.0, 36.0, 37.0, 32.0, 33.0, 40.0, 41.0, 46.0, 49.0, 34.0, 57.0, 33.0, 29.0, 33.0, 36.0, 47.0, 23.0, 36.0, 30.0, 23.0, 15.0, 11.0, 15.0, 12.0, 10.0, 7.0, 6.0, 3.0, 3.0, 2.0, 5.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.5542969703674316, -3.4319028854370117, -3.3095085620880127, -3.1871142387390137, -3.0647201538085938, -2.942326068878174, -2.819931745529175, -2.697537422180176, -2.575143337249756, -2.452749252319336, -2.330354928970337, -2.207960605621338, -2.085566520690918, -1.9631723165512085, -1.840778112411499, -1.7183839082717896, -1.59598970413208, -1.4735954999923706, -1.3512012958526611, -1.2288070917129517, -1.1064128875732422, -0.9840186834335327, -0.8616244792938232, -0.7392302751541138, -0.6168360710144043, -0.4944418668746948, -0.37204766273498535, -0.24965345859527588, -0.1272592544555664, -0.004865050315856934, 0.11752915382385254, 0.239923357963562, 0.3623175621032715, 0.48471176624298096, 0.6071059703826904, 0.7295001745223999, 0.8518943786621094, 0.9742885828018188, 1.0966827869415283, 1.2190769910812378, 1.3414711952209473, 1.4638653993606567, 1.5862596035003662, 1.7086538076400757, 1.8310480117797852, 1.9534422159194946, 2.075836420059204, 2.198230743408203, 2.320624828338623, 2.443018913269043, 2.565413236618042, 2.687807559967041, 2.810201644897461, 2.932595729827881, 3.05499005317688, 3.177384376525879, 3.299778461456299, 3.4221725463867188, 3.5445668697357178, 3.666961193084717, 3.7893552780151367, 3.9117493629455566, 4.034143447875977, 4.156538009643555, 4.278932094573975]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 5.0, 4.0, 4.0, 8.0, 1.0, 10.0, 9.0, 11.0, 13.0, 17.0, 21.0, 32.0, 38.0, 51.0, 67.0, 142.0, 206.0, 505.0, 1281.0, 5088.0, 30316.0, 326068.0, 2514240.0, 1191479.0, 106701.0, 13140.0, 2950.0, 903.0, 398.0, 176.0, 110.0, 69.0, 47.0, 46.0, 34.0, 18.0, 20.0, 10.0, 10.0, 7.0, 9.0, 6.0, 6.0, 0.0, 3.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-4.17578125, -4.04833984375, -3.9208984375, -3.79345703125, -3.666015625, -3.53857421875, -3.4111328125, -3.28369140625, -3.15625, -3.02880859375, -2.9013671875, -2.77392578125, -2.646484375, -2.51904296875, -2.3916015625, -2.26416015625, -2.13671875, -2.00927734375, -1.8818359375, -1.75439453125, -1.626953125, -1.49951171875, -1.3720703125, -1.24462890625, -1.1171875, -0.98974609375, -0.8623046875, -0.73486328125, -0.607421875, -0.47998046875, -0.3525390625, -0.22509765625, -0.09765625, 0.02978515625, 0.1572265625, 0.28466796875, 0.412109375, 0.53955078125, 0.6669921875, 0.79443359375, 0.921875, 1.04931640625, 1.1767578125, 1.30419921875, 1.431640625, 1.55908203125, 1.6865234375, 1.81396484375, 1.94140625, 2.06884765625, 2.1962890625, 2.32373046875, 2.451171875, 2.57861328125, 2.7060546875, 2.83349609375, 2.9609375, 3.08837890625, 3.2158203125, 3.34326171875, 3.470703125, 3.59814453125, 3.7255859375, 3.85302734375, 3.98046875]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 1.0, 4.0, 8.0, 10.0, 13.0, 13.0, 10.0, 18.0, 27.0, 26.0, 40.0, 36.0, 50.0, 46.0, 57.0, 76.0, 65.0, 60.0, 60.0, 43.0, 68.0, 43.0, 47.0, 35.0, 42.0, 28.0, 23.0, 15.0, 14.0, 11.0, 6.0, 5.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.091796875, -2.0145263671875, -1.937255859375, -1.8599853515625, -1.78271484375, -1.7054443359375, -1.628173828125, -1.5509033203125, -1.4736328125, -1.3963623046875, -1.319091796875, -1.2418212890625, -1.16455078125, -1.0872802734375, -1.010009765625, -0.9327392578125, -0.85546875, -0.7781982421875, -0.700927734375, -0.6236572265625, -0.54638671875, -0.4691162109375, -0.391845703125, -0.3145751953125, -0.2373046875, -0.1600341796875, -0.082763671875, -0.0054931640625, 0.07177734375, 0.1490478515625, 0.226318359375, 0.3035888671875, 0.380859375, 0.4581298828125, 0.535400390625, 0.6126708984375, 0.68994140625, 0.7672119140625, 0.844482421875, 0.9217529296875, 0.9990234375, 1.0762939453125, 1.153564453125, 1.2308349609375, 1.30810546875, 1.3853759765625, 1.462646484375, 1.5399169921875, 1.6171875, 1.6944580078125, 1.771728515625, 1.8489990234375, 1.92626953125, 2.0035400390625, 2.080810546875, 2.1580810546875, 2.2353515625, 2.3126220703125, 2.389892578125, 2.4671630859375, 2.54443359375, 2.6217041015625, 2.698974609375, 2.7762451171875, 2.853515625]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 4.0, 11.0, 19.0, 31.0, 25.0, 69.0, 125.0, 217.0, 510.0, 2469.0, 59742.0, 4022426.0, 104338.0, 3125.0, 579.0, 265.0, 128.0, 63.0, 42.0, 25.0, 20.0, 14.0, 9.0, 6.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-10.34375, -10.06829833984375, -9.7928466796875, -9.51739501953125, -9.241943359375, -8.96649169921875, -8.6910400390625, -8.41558837890625, -8.14013671875, -7.86468505859375, -7.5892333984375, -7.31378173828125, -7.038330078125, -6.76287841796875, -6.4874267578125, -6.21197509765625, -5.9365234375, -5.66107177734375, -5.3856201171875, -5.11016845703125, -4.834716796875, -4.55926513671875, -4.2838134765625, -4.00836181640625, -3.73291015625, -3.45745849609375, -3.1820068359375, -2.90655517578125, -2.631103515625, -2.35565185546875, -2.0802001953125, -1.80474853515625, -1.529296875, -1.25384521484375, -0.9783935546875, -0.70294189453125, -0.427490234375, -0.15203857421875, 0.1234130859375, 0.39886474609375, 0.67431640625, 0.94976806640625, 1.2252197265625, 1.50067138671875, 1.776123046875, 2.05157470703125, 2.3270263671875, 2.60247802734375, 2.8779296875, 3.15338134765625, 3.4288330078125, 3.70428466796875, 3.979736328125, 4.25518798828125, 4.5306396484375, 4.80609130859375, 5.08154296875, 5.35699462890625, 5.6324462890625, 5.90789794921875, 6.183349609375, 6.45880126953125, 6.7342529296875, 7.00970458984375, 7.28515625]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 7.0, 8.0, 9.0, 15.0, 18.0, 16.0, 37.0, 64.0, 89.0, 121.0, 175.0, 249.0, 404.0, 517.0, 594.0, 537.0, 362.0, 283.0, 188.0, 109.0, 89.0, 70.0, 47.0, 24.0, 17.0, 9.0, 2.0, 4.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.95703125, -0.9234466552734375, -0.889862060546875, -0.8562774658203125, -0.82269287109375, -0.7891082763671875, -0.755523681640625, -0.7219390869140625, -0.6883544921875, -0.6547698974609375, -0.621185302734375, -0.5876007080078125, -0.55401611328125, -0.5204315185546875, -0.486846923828125, -0.4532623291015625, -0.419677734375, -0.3860931396484375, -0.352508544921875, -0.3189239501953125, -0.28533935546875, -0.2517547607421875, -0.218170166015625, -0.1845855712890625, -0.1510009765625, -0.1174163818359375, -0.083831787109375, -0.0502471923828125, -0.01666259765625, 0.0169219970703125, 0.050506591796875, 0.0840911865234375, 0.11767578125, 0.1512603759765625, 0.184844970703125, 0.2184295654296875, 0.25201416015625, 0.2855987548828125, 0.319183349609375, 0.3527679443359375, 0.3863525390625, 0.4199371337890625, 0.453521728515625, 0.4871063232421875, 0.52069091796875, 0.5542755126953125, 0.587860107421875, 0.6214447021484375, 0.655029296875, 0.6886138916015625, 0.722198486328125, 0.7557830810546875, 0.78936767578125, 0.8229522705078125, 0.856536865234375, 0.8901214599609375, 0.9237060546875, 0.9572906494140625, 0.990875244140625, 1.0244598388671875, 1.05804443359375, 1.0916290283203125, 1.125213623046875, 1.1587982177734375, 1.1923828125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 5.0, 6.0, 16.0, 8.0, 20.0, 28.0, 43.0, 47.0, 88.0, 113.0, 121.0, 118.0, 95.0, 93.0, 57.0, 47.0, 33.0, 21.0, 11.0, 11.0, 8.0, 5.0, 1.0, 6.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.443881988525391, -4.306818962097168, -4.169755935668945, -4.032692909240723, -3.8956298828125, -3.7585668563842773, -3.6215038299560547, -3.484440803527832, -3.3473777770996094, -3.2103147506713867, -3.073251724243164, -2.9361886978149414, -2.7991256713867188, -2.662062644958496, -2.5249996185302734, -2.387936592102051, -2.250873565673828, -2.1138105392456055, -1.9767475128173828, -1.8396844863891602, -1.7026214599609375, -1.5655584335327148, -1.4284954071044922, -1.2914323806762695, -1.1543693542480469, -1.0173063278198242, -0.8802433013916016, -0.7431802749633789, -0.6061172485351562, -0.4690542221069336, -0.33199119567871094, -0.19492816925048828, -0.05786561965942383, 0.07919740676879883, 0.21626043319702148, 0.35332345962524414, 0.4903864860534668, 0.6274495124816895, 0.7645125389099121, 0.9015755653381348, 1.0386385917663574, 1.17570161819458, 1.3127646446228027, 1.4498276710510254, 1.586890697479248, 1.7239537239074707, 1.8610167503356934, 1.998079776763916, 2.1351428031921387, 2.2722058296203613, 2.409268856048584, 2.5463318824768066, 2.6833949089050293, 2.820457935333252, 2.9575209617614746, 3.0945839881896973, 3.23164701461792, 3.3687100410461426, 3.5057730674743652, 3.642836093902588, 3.7798991203308105, 3.916962146759033, 4.054025173187256, 4.1910881996154785, 4.328151226043701]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 5.0, 11.0, 7.0, 17.0, 13.0, 13.0, 15.0, 22.0, 25.0, 30.0, 29.0, 46.0, 46.0, 51.0, 46.0, 52.0, 50.0, 56.0, 67.0, 43.0, 44.0, 40.0, 52.0, 28.0, 34.0, 31.0, 27.0, 24.0, 16.0, 19.0, 15.0, 10.0, 3.0, 3.0, 5.0, 1.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.1229019165039062, -2.0435311794281006, -1.9641602039337158, -1.8847893476486206, -1.8054184913635254, -1.7260477542877197, -1.6466768980026245, -1.5673060417175293, -1.487935185432434, -1.4085643291473389, -1.3291934728622437, -1.2498226165771484, -1.1704518795013428, -1.091080904006958, -1.0117101669311523, -0.9323393106460571, -0.8529684543609619, -0.7735975980758667, -0.6942267417907715, -0.614855945110321, -0.5354850888252258, -0.4561142325401306, -0.3767434060573578, -0.29737257957458496, -0.21800172328948975, -0.13863088190555573, -0.059260040521621704, 0.020110800862312317, 0.09948164224624634, 0.17885249853134155, 0.2582233250141144, 0.3375941514968872, 0.4169652462005615, 0.49633610248565674, 0.575706958770752, 0.6550777554512024, 0.7344486117362976, 0.8138194680213928, 0.8931902647018433, 0.9725611209869385, 1.0519319772720337, 1.131302833557129, 1.2106736898422241, 1.2900445461273193, 1.369415283203125, 1.4487862586975098, 1.5281569957733154, 1.6075278520584106, 1.6868987083435059, 1.766269564628601, 1.8456404209136963, 1.9250112771987915, 2.0043821334838867, 2.0837528705596924, 2.163123846054077, 2.242494583129883, 2.3218655586242676, 2.4012362957000732, 2.480607271194458, 2.5599780082702637, 2.6393489837646484, 2.718719720840454, 2.798090696334839, 2.8774614334106445, 2.95683217048645]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 7.0, 14.0, 18.0, 26.0, 48.0, 71.0, 103.0, 207.0, 524.0, 1421.0, 5946.0, 52789.0, 497404.0, 438913.0, 43586.0, 5328.0, 1211.0, 459.0, 213.0, 108.0, 69.0, 37.0, 14.0, 13.0, 14.0, 7.0, 4.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.99560546875, -0.9634475708007812, -0.9312896728515625, -0.8991317749023438, -0.866973876953125, -0.8348159790039062, -0.8026580810546875, -0.7705001831054688, -0.73834228515625, -0.7061843872070312, -0.6740264892578125, -0.6418685913085938, -0.609710693359375, -0.5775527954101562, -0.5453948974609375, -0.5132369995117188, -0.4810791015625, -0.44892120361328125, -0.4167633056640625, -0.38460540771484375, -0.352447509765625, -0.32028961181640625, -0.2881317138671875, -0.25597381591796875, -0.22381591796875, -0.19165802001953125, -0.1595001220703125, -0.12734222412109375, -0.095184326171875, -0.06302642822265625, -0.0308685302734375, 0.00128936767578125, 0.033447265625, 0.06560516357421875, 0.0977630615234375, 0.12992095947265625, 0.162078857421875, 0.19423675537109375, 0.2263946533203125, 0.25855255126953125, 0.29071044921875, 0.32286834716796875, 0.3550262451171875, 0.38718414306640625, 0.419342041015625, 0.45149993896484375, 0.4836578369140625, 0.5158157348632812, 0.5479736328125, 0.5801315307617188, 0.6122894287109375, 0.6444473266601562, 0.676605224609375, 0.7087631225585938, 0.7409210205078125, 0.7730789184570312, 0.80523681640625, 0.8373947143554688, 0.8695526123046875, 0.9017105102539062, 0.933868408203125, 0.9660263061523438, 0.9981842041015625, 1.0303421020507812, 1.0625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 8.0, 5.0, 7.0, 23.0, 26.0, 30.0, 30.0, 47.0, 60.0, 71.0, 92.0, 87.0, 97.0, 70.0, 72.0, 63.0, 53.0, 41.0, 39.0, 33.0, 19.0, 9.0, 4.0, 9.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.126953125, -2.05157470703125, -1.9761962890625, -1.90081787109375, -1.825439453125, -1.75006103515625, -1.6746826171875, -1.59930419921875, -1.52392578125, -1.44854736328125, -1.3731689453125, -1.29779052734375, -1.222412109375, -1.14703369140625, -1.0716552734375, -0.99627685546875, -0.9208984375, -0.84552001953125, -0.7701416015625, -0.69476318359375, -0.619384765625, -0.54400634765625, -0.4686279296875, -0.39324951171875, -0.31787109375, -0.24249267578125, -0.1671142578125, -0.09173583984375, -0.016357421875, 0.05902099609375, 0.1343994140625, 0.20977783203125, 0.28515625, 0.36053466796875, 0.4359130859375, 0.51129150390625, 0.586669921875, 0.66204833984375, 0.7374267578125, 0.81280517578125, 0.88818359375, 0.96356201171875, 1.0389404296875, 1.11431884765625, 1.189697265625, 1.26507568359375, 1.3404541015625, 1.41583251953125, 1.4912109375, 1.56658935546875, 1.6419677734375, 1.71734619140625, 1.792724609375, 1.86810302734375, 1.9434814453125, 2.01885986328125, 2.09423828125, 2.16961669921875, 2.2449951171875, 2.32037353515625, 2.395751953125, 2.47113037109375, 2.5465087890625, 2.62188720703125, 2.697265625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 0.0, 3.0, 3.0, 6.0, 11.0, 16.0, 22.0, 36.0, 35.0, 54.0, 89.0, 136.0, 193.0, 331.0, 595.0, 1086.0, 2052.0, 4106.0, 8215.0, 16555.0, 33947.0, 69115.0, 129129.0, 197742.0, 219849.0, 167539.0, 98142.0, 50293.0, 24854.0, 11937.0, 5966.0, 2986.0, 1525.0, 796.0, 426.0, 274.0, 144.0, 120.0, 69.0, 45.0, 32.0, 24.0, 17.0, 9.0, 11.0, 10.0, 2.0, 4.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2215576171875, -0.21447181701660156, -0.20738601684570312, -0.2003002166748047, -0.19321441650390625, -0.1861286163330078, -0.17904281616210938, -0.17195701599121094, -0.1648712158203125, -0.15778541564941406, -0.15069961547851562, -0.1436138153076172, -0.13652801513671875, -0.1294422149658203, -0.12235641479492188, -0.11527061462402344, -0.108184814453125, -0.10109901428222656, -0.09401321411132812, -0.08692741394042969, -0.07984161376953125, -0.07275581359863281, -0.06567001342773438, -0.05858421325683594, -0.0514984130859375, -0.04441261291503906, -0.037326812744140625, -0.030241012573242188, -0.02315521240234375, -0.016069412231445312, -0.008983612060546875, -0.0018978118896484375, 0.00518798828125, 0.012273788452148438, 0.019359588623046875, 0.026445388793945312, 0.03353118896484375, 0.04061698913574219, 0.047702789306640625, 0.05478858947753906, 0.0618743896484375, 0.06896018981933594, 0.07604598999023438, 0.08313179016113281, 0.09021759033203125, 0.09730339050292969, 0.10438919067382812, 0.11147499084472656, 0.118560791015625, 0.12564659118652344, 0.13273239135742188, 0.1398181915283203, 0.14690399169921875, 0.1539897918701172, 0.16107559204101562, 0.16816139221191406, 0.1752471923828125, 0.18233299255371094, 0.18941879272460938, 0.1965045928955078, 0.20359039306640625, 0.2106761932373047, 0.21776199340820312, 0.22484779357910156, 0.23193359375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 7.0, 7.0, 13.0, 5.0, 15.0, 13.0, 12.0, 12.0, 16.0, 25.0, 29.0, 36.0, 33.0, 29.0, 40.0, 55.0, 37.0, 42.0, 49.0, 39.0, 45.0, 43.0, 36.0, 46.0, 37.0, 38.0, 42.0, 23.0, 25.0, 26.0, 21.0, 19.0, 17.0, 12.0, 13.0, 10.0, 7.0, 9.0, 4.0, 2.0, 4.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.41796875, -2.34393310546875, -2.2698974609375, -2.19586181640625, -2.121826171875, -2.04779052734375, -1.9737548828125, -1.89971923828125, -1.82568359375, -1.75164794921875, -1.6776123046875, -1.60357666015625, -1.529541015625, -1.45550537109375, -1.3814697265625, -1.30743408203125, -1.2333984375, -1.15936279296875, -1.0853271484375, -1.01129150390625, -0.937255859375, -0.86322021484375, -0.7891845703125, -0.71514892578125, -0.64111328125, -0.56707763671875, -0.4930419921875, -0.41900634765625, -0.344970703125, -0.27093505859375, -0.1968994140625, -0.12286376953125, -0.048828125, 0.02520751953125, 0.0992431640625, 0.17327880859375, 0.247314453125, 0.32135009765625, 0.3953857421875, 0.46942138671875, 0.54345703125, 0.61749267578125, 0.6915283203125, 0.76556396484375, 0.839599609375, 0.91363525390625, 0.9876708984375, 1.06170654296875, 1.1357421875, 1.20977783203125, 1.2838134765625, 1.35784912109375, 1.431884765625, 1.50592041015625, 1.5799560546875, 1.65399169921875, 1.72802734375, 1.80206298828125, 1.8760986328125, 1.95013427734375, 2.024169921875, 2.09820556640625, 2.1722412109375, 2.24627685546875, 2.3203125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 5.0, 7.0, 14.0, 8.0, 8.0, 20.0, 37.0, 78.0, 109.0, 199.0, 361.0, 693.0, 1575.0, 4139.0, 14933.0, 79205.0, 443709.0, 412334.0, 70636.0, 13660.0, 3870.0, 1393.0, 721.0, 380.0, 178.0, 106.0, 68.0, 55.0, 23.0, 11.0, 9.0, 4.0, 6.0, 1.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.11553955078125, -0.11241436004638672, -0.10928916931152344, -0.10616397857666016, -0.10303878784179688, -0.0999135971069336, -0.09678840637207031, -0.09366321563720703, -0.09053802490234375, -0.08741283416748047, -0.08428764343261719, -0.0811624526977539, -0.07803726196289062, -0.07491207122802734, -0.07178688049316406, -0.06866168975830078, -0.0655364990234375, -0.06241130828857422, -0.05928611755371094, -0.056160926818847656, -0.053035736083984375, -0.049910545349121094, -0.04678535461425781, -0.04366016387939453, -0.04053497314453125, -0.03740978240966797, -0.03428459167480469, -0.031159400939941406, -0.028034210205078125, -0.024909019470214844, -0.021783828735351562, -0.01865863800048828, -0.015533447265625, -0.012408256530761719, -0.009283065795898438, -0.006157875061035156, -0.003032684326171875, 9.250640869140625e-05, 0.0032176971435546875, 0.006342887878417969, 0.00946807861328125, 0.012593269348144531, 0.015718460083007812, 0.018843650817871094, 0.021968841552734375, 0.025094032287597656, 0.028219223022460938, 0.03134441375732422, 0.0344696044921875, 0.03759479522705078, 0.04071998596191406, 0.043845176696777344, 0.046970367431640625, 0.050095558166503906, 0.05322074890136719, 0.05634593963623047, 0.05947113037109375, 0.06259632110595703, 0.06572151184082031, 0.0688467025756836, 0.07197189331054688, 0.07509708404541016, 0.07822227478027344, 0.08134746551513672, 0.08447265625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 10.0, 6.0, 9.0, 12.0, 12.0, 28.0, 30.0, 60.0, 69.0, 72.0, 87.0, 101.0, 89.0, 98.0, 78.0, 66.0, 43.0, 42.0, 23.0, 18.0, 18.0, 9.0, 4.0, 5.0, 5.0, 0.0, 5.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.4849853515625e-05, -6.323214620351791e-05, -6.161443889141083e-05, -5.999673157930374e-05, -5.8379024267196655e-05, -5.676131695508957e-05, -5.514360964298248e-05, -5.35259023308754e-05, -5.190819501876831e-05, -5.0290487706661224e-05, -4.867278039455414e-05, -4.705507308244705e-05, -4.5437365770339966e-05, -4.381965845823288e-05, -4.2201951146125793e-05, -4.058424383401871e-05, -3.896653652191162e-05, -3.7348829209804535e-05, -3.573112189769745e-05, -3.411341458559036e-05, -3.2495707273483276e-05, -3.087799996137619e-05, -2.9260292649269104e-05, -2.7642585337162018e-05, -2.602487802505493e-05, -2.4407170712947845e-05, -2.278946340084076e-05, -2.1171756088733673e-05, -1.9554048776626587e-05, -1.79363414645195e-05, -1.6318634152412415e-05, -1.4700926840305328e-05, -1.3083219528198242e-05, -1.1465512216091156e-05, -9.84780490398407e-06, -8.230097591876984e-06, -6.6123902797698975e-06, -4.994682967662811e-06, -3.376975655555725e-06, -1.759268343448639e-06, -1.4156103134155273e-07, 1.4761462807655334e-06, 3.0938535928726196e-06, 4.711560904979706e-06, 6.329268217086792e-06, 7.946975529193878e-06, 9.564682841300964e-06, 1.118239015340805e-05, 1.2800097465515137e-05, 1.4417804777622223e-05, 1.603551208972931e-05, 1.7653219401836395e-05, 1.927092671394348e-05, 2.0888634026050568e-05, 2.2506341338157654e-05, 2.412404865026474e-05, 2.5741755962371826e-05, 2.7359463274478912e-05, 2.8977170586586e-05, 3.0594877898693085e-05, 3.221258521080017e-05, 3.383029252290726e-05, 3.544799983501434e-05, 3.706570714712143e-05, 3.8683414459228516e-05]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 5.0, 2.0, 3.0, 2.0, 6.0, 4.0, 7.0, 15.0, 11.0, 11.0, 34.0, 41.0, 70.0, 109.0, 268.0, 611.0, 2009.0, 9102.0, 63773.0, 591315.0, 339637.0, 33709.0, 5653.0, 1300.0, 414.0, 185.0, 89.0, 59.0, 34.0, 23.0, 16.0, 9.0, 10.0, 5.0, 6.0, 3.0, 6.0, 1.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1446533203125, -0.13980674743652344, -0.13496017456054688, -0.1301136016845703, -0.12526702880859375, -0.12042045593261719, -0.11557388305664062, -0.11072731018066406, -0.1058807373046875, -0.10103416442871094, -0.09618759155273438, -0.09134101867675781, -0.08649444580078125, -0.08164787292480469, -0.07680130004882812, -0.07195472717285156, -0.067108154296875, -0.06226158142089844, -0.057415008544921875, -0.05256843566894531, -0.04772186279296875, -0.04287528991699219, -0.038028717041015625, -0.03318214416503906, -0.0283355712890625, -0.023488998413085938, -0.018642425537109375, -0.013795852661132812, -0.00894927978515625, -0.0041027069091796875, 0.000743865966796875, 0.0055904388427734375, 0.01043701171875, 0.015283584594726562, 0.020130157470703125, 0.024976730346679688, 0.02982330322265625, 0.03466987609863281, 0.039516448974609375, 0.04436302185058594, 0.0492095947265625, 0.05405616760253906, 0.058902740478515625, 0.06374931335449219, 0.06859588623046875, 0.07344245910644531, 0.07828903198242188, 0.08313560485839844, 0.087982177734375, 0.09282875061035156, 0.09767532348632812, 0.10252189636230469, 0.10736846923828125, 0.11221504211425781, 0.11706161499023438, 0.12190818786621094, 0.1267547607421875, 0.13160133361816406, 0.13644790649414062, 0.1412944793701172, 0.14614105224609375, 0.1509876251220703, 0.15583419799804688, 0.16068077087402344, 0.16552734375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 5.0, 5.0, 14.0, 6.0, 13.0, 16.0, 22.0, 24.0, 45.0, 44.0, 74.0, 91.0, 102.0, 108.0, 101.0, 60.0, 53.0, 56.0, 33.0, 29.0, 16.0, 17.0, 13.0, 13.0, 7.0, 4.0, 6.0, 7.0, 3.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0298309326171875, -0.028982877731323242, -0.028134822845458984, -0.027286767959594727, -0.02643871307373047, -0.02559065818786621, -0.024742603302001953, -0.023894548416137695, -0.023046493530273438, -0.02219843864440918, -0.021350383758544922, -0.020502328872680664, -0.019654273986816406, -0.01880621910095215, -0.01795816421508789, -0.017110109329223633, -0.016262054443359375, -0.015413999557495117, -0.01456594467163086, -0.013717889785766602, -0.012869834899902344, -0.012021780014038086, -0.011173725128173828, -0.01032567024230957, -0.009477615356445312, -0.008629560470581055, -0.007781505584716797, -0.006933450698852539, -0.006085395812988281, -0.0052373409271240234, -0.004389286041259766, -0.003541231155395508, -0.00269317626953125, -0.0018451213836669922, -0.0009970664978027344, -0.00014901161193847656, 0.0006990432739257812, 0.001547098159790039, 0.002395153045654297, 0.0032432079315185547, 0.0040912628173828125, 0.00493931770324707, 0.005787372589111328, 0.006635427474975586, 0.007483482360839844, 0.008331537246704102, 0.00917959213256836, 0.010027647018432617, 0.010875701904296875, 0.011723756790161133, 0.01257181167602539, 0.013419866561889648, 0.014267921447753906, 0.015115976333618164, 0.015964031219482422, 0.01681208610534668, 0.017660140991210938, 0.018508195877075195, 0.019356250762939453, 0.02020430564880371, 0.02105236053466797, 0.021900415420532227, 0.022748470306396484, 0.023596525192260742, 0.024444580078125]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 6.0, 6.0, 11.0, 16.0, 14.0, 40.0, 58.0, 105.0, 154.0, 158.0, 134.0, 113.0, 77.0, 37.0, 28.0, 19.0, 8.0, 5.0, 6.0, 3.0, 2.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.755671739578247, -3.656165361404419, -3.55665922164917, -3.457152843475342, -3.3576464653015137, -3.2581400871276855, -3.1586339473724365, -3.0591275691986084, -2.9596211910247803, -2.860114812850952, -2.760608673095703, -2.661102294921875, -2.561595916748047, -2.4620895385742188, -2.3625833988189697, -2.2630770206451416, -2.1635708808898926, -2.0640645027160645, -1.9645582437515259, -1.8650519847869873, -1.7655456066131592, -1.6660393476486206, -1.566533088684082, -1.467026710510254, -1.3675203323364258, -1.2680140733718872, -1.168507695198059, -1.0690014362335205, -0.9694950580596924, -0.8699887990951538, -0.7704824805259705, -0.6709761619567871, -0.571469783782959, -0.47196346521377563, -0.3724571466445923, -0.2729508578777313, -0.17344453930854797, -0.07393822073936462, 0.025568068027496338, 0.1250743865966797, 0.22458070516586304, 0.3240870237350464, 0.42359334230422974, 0.5230996608734131, 0.6226059198379517, 0.7221122980117798, 0.8216185569763184, 0.9211248755455017, 1.020631194114685, 1.1201374530792236, 1.2196438312530518, 1.3191500902175903, 1.4186564683914185, 1.518162727355957, 1.6176691055297852, 1.7171753644943237, 1.8166816234588623, 1.9161878824234009, 2.0156941413879395, 2.1152005195617676, 2.2147068977355957, 2.314213275909424, 2.413719415664673, 2.513225793838501, 2.612732172012329]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 4.0, 8.0, 18.0, 14.0, 14.0, 19.0, 17.0, 37.0, 30.0, 51.0, 50.0, 64.0, 65.0, 58.0, 59.0, 85.0, 60.0, 52.0, 57.0, 45.0, 40.0, 32.0, 34.0, 21.0, 24.0, 12.0, 10.0, 9.0, 4.0, 1.0, 2.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3821330070495605, -1.3261218070983887, -1.2701106071472168, -1.2140992879867554, -1.1580880880355835, -1.1020768880844116, -1.0460656881332397, -0.9900544285774231, -0.9340431690216064, -0.8780319690704346, -0.8220207095146179, -0.766009509563446, -0.7099982500076294, -0.6539870500564575, -0.5979758501052856, -0.541964590549469, -0.4859533905982971, -0.42994216084480286, -0.3739309310913086, -0.3179197311401367, -0.26190847158432007, -0.2058972716331482, -0.14988604187965393, -0.09387481212615967, -0.037863582372665405, 0.01814764365553856, 0.07415886968374252, 0.1301700919866562, 0.18618132174015045, 0.24219253659248352, 0.2982037663459778, 0.35421499609947205, 0.4102262258529663, 0.46623745560646057, 0.5222486853599548, 0.5782598853111267, 0.6342711448669434, 0.6902823448181152, 0.7462935447692871, 0.8023048043251038, 0.8583160638809204, 0.9143272638320923, 0.9703385233879089, 1.0263497829437256, 1.0823609828948975, 1.1383721828460693, 1.1943833827972412, 1.250394582748413, 1.306405782699585, 1.3624169826507568, 1.4184281826019287, 1.4744395017623901, 1.530450701713562, 1.5864619016647339, 1.6424731016159058, 1.6984844207763672, 1.754495620727539, 1.810506820678711, 1.8665180206298828, 1.9225293397903442, 1.9785405397415161, 2.0345516204833984, 2.0905630588531494, 2.1465742588043213, 2.202585458755493]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 4.0, 17.0, 21.0, 18.0, 27.0, 61.0, 88.0, 147.0, 221.0, 410.0, 711.0, 1430.0, 2939.0, 6466.0, 14955.0, 35969.0, 89276.0, 208636.0, 316902.0, 212870.0, 91581.0, 37035.0, 15554.0, 6734.0, 3114.0, 1563.0, 809.0, 436.0, 204.0, 123.0, 84.0, 41.0, 34.0, 19.0, 17.0, 4.0, 8.0, 7.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.4453125, -1.4046173095703125, -1.363922119140625, -1.3232269287109375, -1.28253173828125, -1.2418365478515625, -1.201141357421875, -1.1604461669921875, -1.1197509765625, -1.0790557861328125, -1.038360595703125, -0.9976654052734375, -0.95697021484375, -0.9162750244140625, -0.875579833984375, -0.8348846435546875, -0.794189453125, -0.7534942626953125, -0.712799072265625, -0.6721038818359375, -0.63140869140625, -0.5907135009765625, -0.550018310546875, -0.5093231201171875, -0.4686279296875, -0.4279327392578125, -0.387237548828125, -0.3465423583984375, -0.30584716796875, -0.2651519775390625, -0.224456787109375, -0.1837615966796875, -0.14306640625, -0.1023712158203125, -0.061676025390625, -0.0209808349609375, 0.01971435546875, 0.0604095458984375, 0.101104736328125, 0.1417999267578125, 0.1824951171875, 0.2231903076171875, 0.263885498046875, 0.3045806884765625, 0.34527587890625, 0.3859710693359375, 0.426666259765625, 0.4673614501953125, 0.508056640625, 0.5487518310546875, 0.589447021484375, 0.6301422119140625, 0.67083740234375, 0.7115325927734375, 0.752227783203125, 0.7929229736328125, 0.8336181640625, 0.8743133544921875, 0.915008544921875, 0.9557037353515625, 0.99639892578125, 1.0370941162109375, 1.077789306640625, 1.1184844970703125, 1.1591796875]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 3.0, 5.0, 4.0, 15.0, 12.0, 14.0, 23.0, 27.0, 23.0, 33.0, 32.0, 41.0, 50.0, 62.0, 61.0, 45.0, 50.0, 70.0, 52.0, 54.0, 54.0, 45.0, 38.0, 36.0, 28.0, 22.0, 23.0, 21.0, 14.0, 6.0, 11.0, 5.0, 8.0, 3.0, 1.0, 6.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.662109375, -2.56298828125, -2.4638671875, -2.36474609375, -2.265625, -2.16650390625, -2.0673828125, -1.96826171875, -1.869140625, -1.77001953125, -1.6708984375, -1.57177734375, -1.47265625, -1.37353515625, -1.2744140625, -1.17529296875, -1.076171875, -0.97705078125, -0.8779296875, -0.77880859375, -0.6796875, -0.58056640625, -0.4814453125, -0.38232421875, -0.283203125, -0.18408203125, -0.0849609375, 0.01416015625, 0.11328125, 0.21240234375, 0.3115234375, 0.41064453125, 0.509765625, 0.60888671875, 0.7080078125, 0.80712890625, 0.90625, 1.00537109375, 1.1044921875, 1.20361328125, 1.302734375, 1.40185546875, 1.5009765625, 1.60009765625, 1.69921875, 1.79833984375, 1.8974609375, 1.99658203125, 2.095703125, 2.19482421875, 2.2939453125, 2.39306640625, 2.4921875, 2.59130859375, 2.6904296875, 2.78955078125, 2.888671875, 2.98779296875, 3.0869140625, 3.18603515625, 3.28515625, 3.38427734375, 3.4833984375, 3.58251953125, 3.681640625]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 3.0, 6.0, 4.0, 13.0, 9.0, 9.0, 17.0, 11.0, 21.0, 14.0, 29.0, 34.0, 35.0, 35.0, 46.0, 86.0, 140.0, 294.0, 971.0, 54834.0, 982585.0, 8103.0, 567.0, 222.0, 134.0, 62.0, 48.0, 25.0, 28.0, 31.0, 29.0, 12.0, 17.0, 16.0, 12.0, 13.0, 6.0, 10.0, 6.0, 3.0, 3.0, 5.0, 1.0, 1.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.28125, -8.9942626953125, -8.707275390625, -8.4202880859375, -8.13330078125, -7.8463134765625, -7.559326171875, -7.2723388671875, -6.9853515625, -6.6983642578125, -6.411376953125, -6.1243896484375, -5.83740234375, -5.5504150390625, -5.263427734375, -4.9764404296875, -4.689453125, -4.4024658203125, -4.115478515625, -3.8284912109375, -3.54150390625, -3.2545166015625, -2.967529296875, -2.6805419921875, -2.3935546875, -2.1065673828125, -1.819580078125, -1.5325927734375, -1.24560546875, -0.9586181640625, -0.671630859375, -0.3846435546875, -0.09765625, 0.1893310546875, 0.476318359375, 0.7633056640625, 1.05029296875, 1.3372802734375, 1.624267578125, 1.9112548828125, 2.1982421875, 2.4852294921875, 2.772216796875, 3.0592041015625, 3.34619140625, 3.6331787109375, 3.920166015625, 4.2071533203125, 4.494140625, 4.7811279296875, 5.068115234375, 5.3551025390625, 5.64208984375, 5.9290771484375, 6.216064453125, 6.5030517578125, 6.7900390625, 7.0770263671875, 7.364013671875, 7.6510009765625, 7.93798828125, 8.2249755859375, 8.511962890625, 8.7989501953125, 9.0859375]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 4.0, 7.0, 7.0, 5.0, 13.0, 16.0, 10.0, 11.0, 24.0, 16.0, 22.0, 22.0, 17.0, 34.0, 50.0, 36.0, 35.0, 57.0, 45.0, 45.0, 38.0, 39.0, 31.0, 41.0, 45.0, 34.0, 34.0, 32.0, 29.0, 31.0, 26.0, 23.0, 14.0, 19.0, 15.0, 14.0, 10.0, 12.0, 8.0, 3.0, 5.0, 9.0, 3.0, 2.0, 6.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-2.763671875, -2.68017578125, -2.5966796875, -2.51318359375, -2.4296875, -2.34619140625, -2.2626953125, -2.17919921875, -2.095703125, -2.01220703125, -1.9287109375, -1.84521484375, -1.76171875, -1.67822265625, -1.5947265625, -1.51123046875, -1.427734375, -1.34423828125, -1.2607421875, -1.17724609375, -1.09375, -1.01025390625, -0.9267578125, -0.84326171875, -0.759765625, -0.67626953125, -0.5927734375, -0.50927734375, -0.42578125, -0.34228515625, -0.2587890625, -0.17529296875, -0.091796875, -0.00830078125, 0.0751953125, 0.15869140625, 0.2421875, 0.32568359375, 0.4091796875, 0.49267578125, 0.576171875, 0.65966796875, 0.7431640625, 0.82666015625, 0.91015625, 0.99365234375, 1.0771484375, 1.16064453125, 1.244140625, 1.32763671875, 1.4111328125, 1.49462890625, 1.578125, 1.66162109375, 1.7451171875, 1.82861328125, 1.912109375, 1.99560546875, 2.0791015625, 2.16259765625, 2.24609375, 2.32958984375, 2.4130859375, 2.49658203125, 2.580078125]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 5.0, 1.0, 4.0, 2.0, 3.0, 8.0, 5.0, 11.0, 20.0, 28.0, 41.0, 65.0, 117.0, 332.0, 781.0, 2913.0, 21239.0, 495733.0, 501213.0, 21538.0, 2978.0, 807.0, 346.0, 180.0, 83.0, 41.0, 23.0, 10.0, 7.0, 10.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5185546875, -1.4679412841796875, -1.417327880859375, -1.3667144775390625, -1.31610107421875, -1.2654876708984375, -1.214874267578125, -1.1642608642578125, -1.1136474609375, -1.0630340576171875, -1.012420654296875, -0.9618072509765625, -0.91119384765625, -0.8605804443359375, -0.809967041015625, -0.7593536376953125, -0.708740234375, -0.6581268310546875, -0.607513427734375, -0.5569000244140625, -0.50628662109375, -0.4556732177734375, -0.405059814453125, -0.3544464111328125, -0.3038330078125, -0.2532196044921875, -0.202606201171875, -0.1519927978515625, -0.10137939453125, -0.0507659912109375, -0.000152587890625, 0.0504608154296875, 0.10107421875, 0.1516876220703125, 0.202301025390625, 0.2529144287109375, 0.30352783203125, 0.3541412353515625, 0.404754638671875, 0.4553680419921875, 0.5059814453125, 0.5565948486328125, 0.607208251953125, 0.6578216552734375, 0.70843505859375, 0.7590484619140625, 0.809661865234375, 0.8602752685546875, 0.910888671875, 0.9615020751953125, 1.012115478515625, 1.0627288818359375, 1.11334228515625, 1.1639556884765625, 1.214569091796875, 1.2651824951171875, 1.3157958984375, 1.3664093017578125, 1.417022705078125, 1.4676361083984375, 1.51824951171875, 1.5688629150390625, 1.619476318359375, 1.6700897216796875, 1.720703125]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 6.0, 2.0, 3.0, 5.0, 11.0, 11.0, 17.0, 20.0, 30.0, 33.0, 66.0, 79.0, 85.0, 88.0, 112.0, 106.0, 86.0, 60.0, 50.0, 37.0, 31.0, 22.0, 17.0, 9.0, 8.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00017440319061279297, -0.00016973353922367096, -0.00016506388783454895, -0.00016039423644542694, -0.00015572458505630493, -0.00015105493366718292, -0.0001463852822780609, -0.0001417156308889389, -0.0001370459794998169, -0.00013237632811069489, -0.00012770667672157288, -0.00012303702533245087, -0.00011836737394332886, -0.00011369772255420685, -0.00010902807116508484, -0.00010435841977596283, -9.968876838684082e-05, -9.501911699771881e-05, -9.03494656085968e-05, -8.567981421947479e-05, -8.101016283035278e-05, -7.634051144123077e-05, -7.167086005210876e-05, -6.700120866298676e-05, -6.233155727386475e-05, -5.766190588474274e-05, -5.299225449562073e-05, -4.832260310649872e-05, -4.365295171737671e-05, -3.89833003282547e-05, -3.431364893913269e-05, -2.964399755001068e-05, -2.4974346160888672e-05, -2.0304694771766663e-05, -1.5635043382644653e-05, -1.0965391993522644e-05, -6.295740604400635e-06, -1.6260892152786255e-06, 3.043562173843384e-06, 7.713213562965393e-06, 1.2382864952087402e-05, 1.705251634120941e-05, 2.172216773033142e-05, 2.639181911945343e-05, 3.106147050857544e-05, 3.573112189769745e-05, 4.040077328681946e-05, 4.507042467594147e-05, 4.9740076065063477e-05, 5.4409727454185486e-05, 5.9079378843307495e-05, 6.37490302324295e-05, 6.841868162155151e-05, 7.308833301067352e-05, 7.775798439979553e-05, 8.242763578891754e-05, 8.709728717803955e-05, 9.176693856716156e-05, 9.643658995628357e-05, 0.00010110624134540558, 0.00010577589273452759, 0.0001104455441236496, 0.0001151151955127716, 0.00011978484690189362, 0.00012445449829101562]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 7.0, 7.0, 10.0, 11.0, 33.0, 31.0, 71.0, 111.0, 248.0, 828.0, 3602.0, 40604.0, 751949.0, 237242.0, 11258.0, 1648.0, 471.0, 203.0, 89.0, 64.0, 30.0, 17.0, 9.0, 7.0, 4.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.32421875, -1.26849365234375, -1.2127685546875, -1.15704345703125, -1.101318359375, -1.04559326171875, -0.9898681640625, -0.93414306640625, -0.87841796875, -0.82269287109375, -0.7669677734375, -0.71124267578125, -0.655517578125, -0.59979248046875, -0.5440673828125, -0.48834228515625, -0.4326171875, -0.37689208984375, -0.3211669921875, -0.26544189453125, -0.209716796875, -0.15399169921875, -0.0982666015625, -0.04254150390625, 0.01318359375, 0.06890869140625, 0.1246337890625, 0.18035888671875, 0.236083984375, 0.29180908203125, 0.3475341796875, 0.40325927734375, 0.458984375, 0.51470947265625, 0.5704345703125, 0.62615966796875, 0.681884765625, 0.73760986328125, 0.7933349609375, 0.84906005859375, 0.90478515625, 0.96051025390625, 1.0162353515625, 1.07196044921875, 1.127685546875, 1.18341064453125, 1.2391357421875, 1.29486083984375, 1.3505859375, 1.40631103515625, 1.4620361328125, 1.51776123046875, 1.573486328125, 1.62921142578125, 1.6849365234375, 1.74066162109375, 1.79638671875, 1.85211181640625, 1.9078369140625, 1.96356201171875, 2.019287109375, 2.07501220703125, 2.1307373046875, 2.18646240234375, 2.2421875]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 8.0, 6.0, 5.0, 12.0, 18.0, 22.0, 35.0, 43.0, 55.0, 68.0, 75.0, 106.0, 103.0, 90.0, 74.0, 64.0, 65.0, 43.0, 27.0, 24.0, 14.0, 11.0, 9.0, 7.0, 6.0, 4.0, 3.0, 7.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5126953125, -0.4986724853515625, -0.484649658203125, -0.4706268310546875, -0.45660400390625, -0.4425811767578125, -0.428558349609375, -0.4145355224609375, -0.4005126953125, -0.3864898681640625, -0.372467041015625, -0.3584442138671875, -0.34442138671875, -0.3303985595703125, -0.316375732421875, -0.3023529052734375, -0.288330078125, -0.2743072509765625, -0.260284423828125, -0.2462615966796875, -0.23223876953125, -0.2182159423828125, -0.204193115234375, -0.1901702880859375, -0.1761474609375, -0.1621246337890625, -0.148101806640625, -0.1340789794921875, -0.12005615234375, -0.1060333251953125, -0.092010498046875, -0.0779876708984375, -0.06396484375, -0.0499420166015625, -0.035919189453125, -0.0218963623046875, -0.00787353515625, 0.0061492919921875, 0.020172119140625, 0.0341949462890625, 0.0482177734375, 0.0622406005859375, 0.076263427734375, 0.0902862548828125, 0.10430908203125, 0.1183319091796875, 0.132354736328125, 0.1463775634765625, 0.160400390625, 0.1744232177734375, 0.188446044921875, 0.2024688720703125, 0.21649169921875, 0.2305145263671875, 0.244537353515625, 0.2585601806640625, 0.2725830078125, 0.2866058349609375, 0.300628662109375, 0.3146514892578125, 0.32867431640625, 0.3426971435546875, 0.356719970703125, 0.3707427978515625, 0.384765625]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 17.0, 38.0, 117.0, 230.0, 326.0, 170.0, 70.0, 23.0, 6.0, 8.0, 5.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-23.3571834564209, -22.910215377807617, -22.463247299194336, -22.016277313232422, -21.56930923461914, -21.12234115600586, -20.675373077392578, -20.228404998779297, -19.781435012817383, -19.3344669342041, -18.88749885559082, -18.440528869628906, -17.993560791015625, -17.546592712402344, -17.099624633789062, -16.65265655517578, -16.2056884765625, -15.758720397949219, -15.311751365661621, -14.86478328704834, -14.417814254760742, -13.970846176147461, -13.52387809753418, -13.076909065246582, -12.629940032958984, -12.182971954345703, -11.736002922058105, -11.289034843444824, -10.842065811157227, -10.395097732543945, -9.948129653930664, -9.501160621643066, -9.054192543029785, -8.607224464416504, -8.160255432128906, -7.713287353515625, -7.266318321228027, -6.819350242614746, -6.372381687164307, -5.925413131713867, -5.478444576263428, -5.031476020812988, -4.584507465362549, -4.137538909912109, -3.690570592880249, -3.2436020374298096, -2.796633720397949, -2.3496651649475098, -1.9026966094970703, -1.4557280540466309, -1.008759617805481, -0.561791181564331, -0.1148226261138916, 0.33214592933654785, 0.7791142463684082, 1.2260828018188477, 1.673051357269287, 2.1200199127197266, 2.566988468170166, 3.0139567852020264, 3.460925340652466, 3.9078938961029053, 4.354862213134766, 4.801830768585205, 5.2487993240356445]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 3.0, 1.0, 5.0, 4.0, 5.0, 12.0, 12.0, 15.0, 10.0, 18.0, 24.0, 29.0, 24.0, 20.0, 30.0, 24.0, 36.0, 30.0, 40.0, 53.0, 44.0, 40.0, 28.0, 39.0, 39.0, 46.0, 41.0, 27.0, 49.0, 28.0, 31.0, 43.0, 26.0, 28.0, 17.0, 14.0, 15.0, 8.0, 12.0, 8.0, 5.0, 8.0, 1.0, 4.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.125938415527344, -3.9832170009613037, -3.8404955863952637, -3.6977741718292236, -3.5550527572631836, -3.4123313426971436, -3.2696099281311035, -3.1268885135650635, -2.9841670989990234, -2.8414456844329834, -2.6987242698669434, -2.5560028553009033, -2.4132814407348633, -2.2705600261688232, -2.127838611602783, -1.9851171970367432, -1.8423957824707031, -1.699674367904663, -1.556952953338623, -1.414231538772583, -1.271510124206543, -1.128788709640503, -0.9860672950744629, -0.8433458805084229, -0.7006244659423828, -0.5579030513763428, -0.41518163681030273, -0.2724602222442627, -0.12973880767822266, 0.012982606887817383, 0.15570402145385742, 0.29842543601989746, 0.4411473274230957, 0.5838687419891357, 0.7265901565551758, 0.8693115711212158, 1.0120329856872559, 1.154754400253296, 1.297475814819336, 1.440197229385376, 1.582918643951416, 1.725640058517456, 1.868361473083496, 2.011082887649536, 2.153804302215576, 2.296525716781616, 2.4392471313476562, 2.5819685459136963, 2.7246899604797363, 2.8674113750457764, 3.0101327896118164, 3.1528542041778564, 3.2955756187438965, 3.4382970333099365, 3.5810184478759766, 3.7237398624420166, 3.8664612770080566, 4.009182929992676, 4.151904106140137, 4.294625282287598, 4.437346935272217, 4.580068588256836, 4.722789764404297, 4.865510940551758, 5.008232593536377]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 6.0, 2.0, 4.0, 3.0, 11.0, 10.0, 24.0, 29.0, 28.0, 47.0, 66.0, 85.0, 148.0, 265.0, 395.0, 905.0, 2906.0, 16331.0, 200090.0, 2565872.0, 1321199.0, 74314.0, 8218.0, 1831.0, 620.0, 298.0, 182.0, 123.0, 76.0, 63.0, 34.0, 26.0, 22.0, 15.0, 13.0, 6.0, 4.0, 5.0, 1.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.671875, -4.52508544921875, -4.3782958984375, -4.23150634765625, -4.084716796875, -3.93792724609375, -3.7911376953125, -3.64434814453125, -3.49755859375, -3.35076904296875, -3.2039794921875, -3.05718994140625, -2.910400390625, -2.76361083984375, -2.6168212890625, -2.47003173828125, -2.3232421875, -2.17645263671875, -2.0296630859375, -1.88287353515625, -1.736083984375, -1.58929443359375, -1.4425048828125, -1.29571533203125, -1.14892578125, -1.00213623046875, -0.8553466796875, -0.70855712890625, -0.561767578125, -0.41497802734375, -0.2681884765625, -0.12139892578125, 0.025390625, 0.17218017578125, 0.3189697265625, 0.46575927734375, 0.612548828125, 0.75933837890625, 0.9061279296875, 1.05291748046875, 1.19970703125, 1.34649658203125, 1.4932861328125, 1.64007568359375, 1.786865234375, 1.93365478515625, 2.0804443359375, 2.22723388671875, 2.3740234375, 2.52081298828125, 2.6676025390625, 2.81439208984375, 2.961181640625, 3.10797119140625, 3.2547607421875, 3.40155029296875, 3.54833984375, 3.69512939453125, 3.8419189453125, 3.98870849609375, 4.135498046875, 4.28228759765625, 4.4290771484375, 4.57586669921875, 4.72265625]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 11.0, 8.0, 15.0, 14.0, 22.0, 16.0, 32.0, 34.0, 50.0, 36.0, 39.0, 53.0, 44.0, 53.0, 61.0, 59.0, 63.0, 48.0, 47.0, 40.0, 45.0, 28.0, 40.0, 35.0, 29.0, 24.0, 14.0, 14.0, 9.0, 3.0, 5.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.12109375, -2.045166015625, -1.96923828125, -1.893310546875, -1.8173828125, -1.741455078125, -1.66552734375, -1.589599609375, -1.513671875, -1.437744140625, -1.36181640625, -1.285888671875, -1.2099609375, -1.134033203125, -1.05810546875, -0.982177734375, -0.90625, -0.830322265625, -0.75439453125, -0.678466796875, -0.6025390625, -0.526611328125, -0.45068359375, -0.374755859375, -0.298828125, -0.222900390625, -0.14697265625, -0.071044921875, 0.0048828125, 0.080810546875, 0.15673828125, 0.232666015625, 0.30859375, 0.384521484375, 0.46044921875, 0.536376953125, 0.6123046875, 0.688232421875, 0.76416015625, 0.840087890625, 0.916015625, 0.991943359375, 1.06787109375, 1.143798828125, 1.2197265625, 1.295654296875, 1.37158203125, 1.447509765625, 1.5234375, 1.599365234375, 1.67529296875, 1.751220703125, 1.8271484375, 1.903076171875, 1.97900390625, 2.054931640625, 2.130859375, 2.206787109375, 2.28271484375, 2.358642578125, 2.4345703125, 2.510498046875, 2.58642578125, 2.662353515625, 2.73828125]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 3.0, 3.0, 6.0, 5.0, 5.0, 11.0, 17.0, 20.0, 16.0, 25.0, 41.0, 77.0, 151.0, 286.0, 1200.0, 38421.0, 4136008.0, 16419.0, 918.0, 268.0, 119.0, 86.0, 49.0, 45.0, 18.0, 16.0, 8.0, 8.0, 7.0, 5.0, 6.0, 4.0, 5.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.1015625, -9.7042236328125, -9.306884765625, -8.9095458984375, -8.51220703125, -8.1148681640625, -7.717529296875, -7.3201904296875, -6.9228515625, -6.5255126953125, -6.128173828125, -5.7308349609375, -5.33349609375, -4.9361572265625, -4.538818359375, -4.1414794921875, -3.744140625, -3.3468017578125, -2.949462890625, -2.5521240234375, -2.15478515625, -1.7574462890625, -1.360107421875, -0.9627685546875, -0.5654296875, -0.1680908203125, 0.229248046875, 0.6265869140625, 1.02392578125, 1.4212646484375, 1.818603515625, 2.2159423828125, 2.61328125, 3.0106201171875, 3.407958984375, 3.8052978515625, 4.20263671875, 4.5999755859375, 4.997314453125, 5.3946533203125, 5.7919921875, 6.1893310546875, 6.586669921875, 6.9840087890625, 7.38134765625, 7.7786865234375, 8.176025390625, 8.5733642578125, 8.970703125, 9.3680419921875, 9.765380859375, 10.1627197265625, 10.56005859375, 10.9573974609375, 11.354736328125, 11.7520751953125, 12.1494140625, 12.5467529296875, 12.944091796875, 13.3414306640625, 13.73876953125, 14.1361083984375, 14.533447265625, 14.9307861328125, 15.328125]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 6.0, 3.0, 1.0, 8.0, 13.0, 8.0, 21.0, 24.0, 39.0, 57.0, 83.0, 149.0, 235.0, 349.0, 470.0, 607.0, 597.0, 507.0, 319.0, 230.0, 119.0, 96.0, 57.0, 35.0, 22.0, 14.0, 9.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.17578125, -1.1400604248046875, -1.104339599609375, -1.0686187744140625, -1.03289794921875, -0.9971771240234375, -0.961456298828125, -0.9257354736328125, -0.8900146484375, -0.8542938232421875, -0.818572998046875, -0.7828521728515625, -0.74713134765625, -0.7114105224609375, -0.675689697265625, -0.6399688720703125, -0.604248046875, -0.5685272216796875, -0.532806396484375, -0.4970855712890625, -0.46136474609375, -0.4256439208984375, -0.389923095703125, -0.3542022705078125, -0.3184814453125, -0.2827606201171875, -0.247039794921875, -0.2113189697265625, -0.17559814453125, -0.1398773193359375, -0.104156494140625, -0.0684356689453125, -0.03271484375, 0.0030059814453125, 0.038726806640625, 0.0744476318359375, 0.11016845703125, 0.1458892822265625, 0.181610107421875, 0.2173309326171875, 0.2530517578125, 0.2887725830078125, 0.324493408203125, 0.3602142333984375, 0.39593505859375, 0.4316558837890625, 0.467376708984375, 0.5030975341796875, 0.538818359375, 0.5745391845703125, 0.610260009765625, 0.6459808349609375, 0.68170166015625, 0.7174224853515625, 0.753143310546875, 0.7888641357421875, 0.8245849609375, 0.8603057861328125, 0.896026611328125, 0.9317474365234375, 0.96746826171875, 1.0031890869140625, 1.038909912109375, 1.0746307373046875, 1.1103515625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 6.0, 10.0, 9.0, 15.0, 14.0, 37.0, 39.0, 72.0, 90.0, 112.0, 111.0, 108.0, 106.0, 63.0, 61.0, 42.0, 34.0, 23.0, 19.0, 15.0, 6.0, 3.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-5.2290778160095215, -5.0955610275268555, -4.9620442390441895, -4.828527927398682, -4.695011138916016, -4.56149435043335, -4.427977561950684, -4.294461250305176, -4.16094446182251, -4.027427673339844, -3.893911123275757, -3.760394334793091, -3.626877784729004, -3.493360996246338, -3.359844207763672, -3.226327657699585, -3.092810869216919, -2.959294080734253, -2.825777530670166, -2.6922607421875, -2.558744192123413, -2.425227403640747, -2.29171085357666, -2.158194065093994, -2.024677276611328, -1.8911606073379517, -1.7576439380645752, -1.6241271495819092, -1.4906105995178223, -1.3570938110351562, -1.2235771417617798, -1.0900604724884033, -0.9565441608428955, -0.823027491569519, -0.6895108222961426, -0.5559940934181213, -0.4224774241447449, -0.2889607548713684, -0.15544402599334717, -0.021927356719970703, 0.11158931255340576, 0.24510599672794342, 0.3786226809024811, 0.5121393799781799, 0.6456560492515564, 0.7791727185249329, 0.9126894474029541, 1.0462061166763306, 1.179722785949707, 1.3132394552230835, 1.44675612449646, 1.580272912979126, 1.713789463043213, 1.847306251525879, 1.9808229207992554, 2.114339590072632, 2.2478561401367188, 2.3813729286193848, 2.5148894786834717, 2.6484062671661377, 2.7819228172302246, 2.9154396057128906, 3.0489563941955566, 3.1824729442596436, 3.3159897327423096]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 6.0, 1.0, 4.0, 5.0, 10.0, 4.0, 10.0, 17.0, 21.0, 23.0, 29.0, 26.0, 31.0, 33.0, 41.0, 36.0, 50.0, 39.0, 40.0, 52.0, 43.0, 49.0, 44.0, 56.0, 40.0, 50.0, 37.0, 37.0, 31.0, 28.0, 20.0, 15.0, 16.0, 13.0, 13.0, 6.0, 11.0, 5.0, 7.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.4433648586273193, -2.3669867515563965, -2.2906088829040527, -2.21423077583313, -2.137852907180786, -2.0614748001098633, -1.98509681224823, -1.9087188243865967, -1.8323408365249634, -1.75596284866333, -1.6795848608016968, -1.6032068729400635, -1.5268287658691406, -1.4504508972167969, -1.374072790145874, -1.2976948022842407, -1.2213168144226074, -1.1449388265609741, -1.0685608386993408, -0.9921827912330627, -0.9158048033714294, -0.8394268155097961, -0.7630487680435181, -0.6866707801818848, -0.6102927923202515, -0.5339148044586182, -0.4575367867946625, -0.3811587691307068, -0.3047807812690735, -0.22840279340744019, -0.1520247757434845, -0.07564675807952881, 0.0007309913635253906, 0.07710899412631989, 0.15348699688911438, 0.22986499965190887, 0.30624300241470337, 0.38262099027633667, 0.45899900794029236, 0.535377025604248, 0.6117550134658813, 0.6881330013275146, 0.764510989189148, 0.840889036655426, 0.9172670245170593, 0.9936450123786926, 1.0700230598449707, 1.146401047706604, 1.2227790355682373, 1.2991570234298706, 1.375535011291504, 1.4519129991531372, 1.5282909870147705, 1.6046690940856934, 1.6810470819473267, 1.75742506980896, 1.8338030576705933, 1.9101810455322266, 1.9865590333938599, 2.062937021255493, 2.139315128326416, 2.2156929969787598, 2.2920711040496826, 2.3684492111206055, 2.444827079772949]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 9.0, 5.0, 7.0, 13.0, 15.0, 22.0, 29.0, 41.0, 67.0, 104.0, 214.0, 346.0, 712.0, 1842.0, 5448.0, 20140.0, 85015.0, 304037.0, 417804.0, 159603.0, 38304.0, 9709.0, 2872.0, 1043.0, 490.0, 257.0, 123.0, 85.0, 52.0, 44.0, 31.0, 14.0, 18.0, 15.0, 4.0, 7.0, 6.0, 7.0, 3.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59375, -0.5753250122070312, -0.5569000244140625, -0.5384750366210938, -0.520050048828125, -0.5016250610351562, -0.4832000732421875, -0.46477508544921875, -0.44635009765625, -0.42792510986328125, -0.4095001220703125, -0.39107513427734375, -0.372650146484375, -0.35422515869140625, -0.3358001708984375, -0.31737518310546875, -0.2989501953125, -0.28052520751953125, -0.2621002197265625, -0.24367523193359375, -0.225250244140625, -0.20682525634765625, -0.1884002685546875, -0.16997528076171875, -0.15155029296875, -0.13312530517578125, -0.1147003173828125, -0.09627532958984375, -0.077850341796875, -0.05942535400390625, -0.0410003662109375, -0.02257537841796875, -0.004150390625, 0.01427459716796875, 0.0326995849609375, 0.05112457275390625, 0.069549560546875, 0.08797454833984375, 0.1063995361328125, 0.12482452392578125, 0.14324951171875, 0.16167449951171875, 0.1800994873046875, 0.19852447509765625, 0.216949462890625, 0.23537445068359375, 0.2537994384765625, 0.27222442626953125, 0.2906494140625, 0.30907440185546875, 0.3274993896484375, 0.34592437744140625, 0.364349365234375, 0.38277435302734375, 0.4011993408203125, 0.41962432861328125, 0.43804931640625, 0.45647430419921875, 0.4748992919921875, 0.49332427978515625, 0.511749267578125, 0.5301742553710938, 0.5485992431640625, 0.5670242309570312, 0.58544921875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 3.0, 10.0, 6.0, 18.0, 19.0, 21.0, 43.0, 41.0, 49.0, 64.0, 60.0, 88.0, 72.0, 84.0, 76.0, 74.0, 64.0, 52.0, 34.0, 42.0, 20.0, 22.0, 16.0, 6.0, 6.0, 8.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.919921875, -1.84295654296875, -1.7659912109375, -1.68902587890625, -1.612060546875, -1.53509521484375, -1.4581298828125, -1.38116455078125, -1.30419921875, -1.22723388671875, -1.1502685546875, -1.07330322265625, -0.996337890625, -0.91937255859375, -0.8424072265625, -0.76544189453125, -0.6884765625, -0.61151123046875, -0.5345458984375, -0.45758056640625, -0.380615234375, -0.30364990234375, -0.2266845703125, -0.14971923828125, -0.07275390625, 0.00421142578125, 0.0811767578125, 0.15814208984375, 0.235107421875, 0.31207275390625, 0.3890380859375, 0.46600341796875, 0.54296875, 0.61993408203125, 0.6968994140625, 0.77386474609375, 0.850830078125, 0.92779541015625, 1.0047607421875, 1.08172607421875, 1.15869140625, 1.23565673828125, 1.3126220703125, 1.38958740234375, 1.466552734375, 1.54351806640625, 1.6204833984375, 1.69744873046875, 1.7744140625, 1.85137939453125, 1.9283447265625, 2.00531005859375, 2.082275390625, 2.15924072265625, 2.2362060546875, 2.31317138671875, 2.39013671875, 2.46710205078125, 2.5440673828125, 2.62103271484375, 2.697998046875, 2.77496337890625, 2.8519287109375, 2.92889404296875, 3.005859375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 8.0, 3.0, 5.0, 8.0, 11.0, 11.0, 25.0, 29.0, 44.0, 57.0, 98.0, 152.0, 238.0, 414.0, 736.0, 1312.0, 2641.0, 5164.0, 11070.0, 22706.0, 47012.0, 92092.0, 159764.0, 218275.0, 204142.0, 135777.0, 74823.0, 37383.0, 17523.0, 8487.0, 3903.0, 2049.0, 1107.0, 585.0, 317.0, 183.0, 140.0, 87.0, 51.0, 40.0, 19.0, 21.0, 10.0, 9.0, 8.0, 6.0, 4.0, 2.0, 3.0, 1.0, 3.0, 3.0, 2.0, 1.0], "bins": [-0.261474609375, -0.25374794006347656, -0.24602127075195312, -0.2382946014404297, -0.23056793212890625, -0.2228412628173828, -0.21511459350585938, -0.20738792419433594, -0.1996612548828125, -0.19193458557128906, -0.18420791625976562, -0.1764812469482422, -0.16875457763671875, -0.1610279083251953, -0.15330123901367188, -0.14557456970214844, -0.137847900390625, -0.13012123107910156, -0.12239456176757812, -0.11466789245605469, -0.10694122314453125, -0.09921455383300781, -0.09148788452148438, -0.08376121520996094, -0.0760345458984375, -0.06830787658691406, -0.060581207275390625, -0.05285453796386719, -0.04512786865234375, -0.03740119934082031, -0.029674530029296875, -0.021947860717773438, -0.01422119140625, -0.0064945220947265625, 0.001232147216796875, 0.008958816528320312, 0.01668548583984375, 0.024412155151367188, 0.032138824462890625, 0.03986549377441406, 0.0475921630859375, 0.05531883239746094, 0.06304550170898438, 0.07077217102050781, 0.07849884033203125, 0.08622550964355469, 0.09395217895507812, 0.10167884826660156, 0.109405517578125, 0.11713218688964844, 0.12485885620117188, 0.1325855255126953, 0.14031219482421875, 0.1480388641357422, 0.15576553344726562, 0.16349220275878906, 0.1712188720703125, 0.17894554138183594, 0.18667221069335938, 0.1943988800048828, 0.20212554931640625, 0.2098522186279297, 0.21757888793945312, 0.22530555725097656, 0.2330322265625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 7.0, 4.0, 4.0, 6.0, 9.0, 12.0, 16.0, 25.0, 23.0, 19.0, 36.0, 40.0, 41.0, 65.0, 59.0, 70.0, 68.0, 64.0, 59.0, 59.0, 55.0, 48.0, 49.0, 28.0, 32.0, 22.0, 15.0, 18.0, 16.0, 10.0, 9.0, 8.0, 8.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.85546875, -3.73992919921875, -3.6243896484375, -3.50885009765625, -3.393310546875, -3.27777099609375, -3.1622314453125, -3.04669189453125, -2.93115234375, -2.81561279296875, -2.7000732421875, -2.58453369140625, -2.468994140625, -2.35345458984375, -2.2379150390625, -2.12237548828125, -2.0068359375, -1.89129638671875, -1.7757568359375, -1.66021728515625, -1.544677734375, -1.42913818359375, -1.3135986328125, -1.19805908203125, -1.08251953125, -0.96697998046875, -0.8514404296875, -0.73590087890625, -0.620361328125, -0.50482177734375, -0.3892822265625, -0.27374267578125, -0.158203125, -0.04266357421875, 0.0728759765625, 0.18841552734375, 0.303955078125, 0.41949462890625, 0.5350341796875, 0.65057373046875, 0.76611328125, 0.88165283203125, 0.9971923828125, 1.11273193359375, 1.228271484375, 1.34381103515625, 1.4593505859375, 1.57489013671875, 1.6904296875, 1.80596923828125, 1.9215087890625, 2.03704833984375, 2.152587890625, 2.26812744140625, 2.3836669921875, 2.49920654296875, 2.61474609375, 2.73028564453125, 2.8458251953125, 2.96136474609375, 3.076904296875, 3.19244384765625, 3.3079833984375, 3.42352294921875, 3.5390625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 8.0, 6.0, 4.0, 10.0, 9.0, 20.0, 27.0, 28.0, 40.0, 58.0, 114.0, 142.0, 205.0, 376.0, 697.0, 1420.0, 3333.0, 9393.0, 30130.0, 121461.0, 426249.0, 337647.0, 83247.0, 21732.0, 7034.0, 2650.0, 1134.0, 548.0, 279.0, 184.0, 115.0, 66.0, 52.0, 44.0, 17.0, 18.0, 9.0, 8.0, 14.0, 11.0, 7.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.07501220703125, -0.07250118255615234, -0.06999015808105469, -0.06747913360595703, -0.06496810913085938, -0.06245708465576172, -0.05994606018066406, -0.057435035705566406, -0.05492401123046875, -0.052412986755371094, -0.04990196228027344, -0.04739093780517578, -0.044879913330078125, -0.04236888885498047, -0.03985786437988281, -0.037346839904785156, -0.0348358154296875, -0.032324790954589844, -0.029813766479492188, -0.02730274200439453, -0.024791717529296875, -0.02228069305419922, -0.019769668579101562, -0.017258644104003906, -0.01474761962890625, -0.012236595153808594, -0.009725570678710938, -0.007214546203613281, -0.004703521728515625, -0.0021924972534179688, 0.0003185272216796875, 0.0028295516967773438, 0.005340576171875, 0.007851600646972656, 0.010362625122070312, 0.012873649597167969, 0.015384674072265625, 0.01789569854736328, 0.020406723022460938, 0.022917747497558594, 0.02542877197265625, 0.027939796447753906, 0.030450820922851562, 0.03296184539794922, 0.035472869873046875, 0.03798389434814453, 0.04049491882324219, 0.043005943298339844, 0.0455169677734375, 0.048027992248535156, 0.05053901672363281, 0.05305004119873047, 0.055561065673828125, 0.05807209014892578, 0.06058311462402344, 0.0630941390991211, 0.06560516357421875, 0.0681161880493164, 0.07062721252441406, 0.07313823699951172, 0.07564926147460938, 0.07816028594970703, 0.08067131042480469, 0.08318233489990234, 0.085693359375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 1.0, 5.0, 4.0, 9.0, 5.0, 20.0, 12.0, 16.0, 23.0, 32.0, 29.0, 39.0, 73.0, 61.0, 85.0, 69.0, 78.0, 72.0, 79.0, 52.0, 45.0, 47.0, 26.0, 24.0, 21.0, 17.0, 16.0, 8.0, 7.0, 4.0, 6.0, 6.0, 4.0, 0.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.4749507904052734e-05, -3.351643681526184e-05, -3.228336572647095e-05, -3.1050294637680054e-05, -2.981722354888916e-05, -2.8584152460098267e-05, -2.7351081371307373e-05, -2.611801028251648e-05, -2.4884939193725586e-05, -2.3651868104934692e-05, -2.24187970161438e-05, -2.1185725927352905e-05, -1.9952654838562012e-05, -1.8719583749771118e-05, -1.7486512660980225e-05, -1.625344157218933e-05, -1.5020370483398438e-05, -1.3787299394607544e-05, -1.255422830581665e-05, -1.1321157217025757e-05, -1.0088086128234863e-05, -8.85501503944397e-06, -7.621943950653076e-06, -6.388872861862183e-06, -5.155801773071289e-06, -3.9227306842803955e-06, -2.689659595489502e-06, -1.4565885066986084e-06, -2.2351741790771484e-07, 1.0095536708831787e-06, 2.2426247596740723e-06, 3.475695848464966e-06, 4.708766937255859e-06, 5.941838026046753e-06, 7.1749091148376465e-06, 8.40798020362854e-06, 9.641051292419434e-06, 1.0874122381210327e-05, 1.210719347000122e-05, 1.3340264558792114e-05, 1.4573335647583008e-05, 1.58064067363739e-05, 1.7039477825164795e-05, 1.827254891395569e-05, 1.9505620002746582e-05, 2.0738691091537476e-05, 2.197176218032837e-05, 2.3204833269119263e-05, 2.4437904357910156e-05, 2.567097544670105e-05, 2.6904046535491943e-05, 2.8137117624282837e-05, 2.937018871307373e-05, 3.0603259801864624e-05, 3.183633089065552e-05, 3.306940197944641e-05, 3.4302473068237305e-05, 3.55355441570282e-05, 3.676861524581909e-05, 3.8001686334609985e-05, 3.923475742340088e-05, 4.046782851219177e-05, 4.1700899600982666e-05, 4.293397068977356e-05, 4.416704177856445e-05]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 6.0, 8.0, 14.0, 4.0, 15.0, 22.0, 25.0, 44.0, 73.0, 96.0, 195.0, 374.0, 889.0, 2485.0, 7910.0, 29641.0, 152144.0, 569774.0, 227463.0, 41749.0, 10252.0, 3164.0, 1120.0, 520.0, 232.0, 113.0, 68.0, 40.0, 29.0, 15.0, 20.0, 9.0, 10.0, 4.0, 5.0, 7.0, 5.0, 4.0, 2.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.113525390625, -0.1102457046508789, -0.10696601867675781, -0.10368633270263672, -0.10040664672851562, -0.09712696075439453, -0.09384727478027344, -0.09056758880615234, -0.08728790283203125, -0.08400821685791016, -0.08072853088378906, -0.07744884490966797, -0.07416915893554688, -0.07088947296142578, -0.06760978698730469, -0.0643301010131836, -0.0610504150390625, -0.057770729064941406, -0.05449104309082031, -0.05121135711669922, -0.047931671142578125, -0.04465198516845703, -0.04137229919433594, -0.038092613220214844, -0.03481292724609375, -0.031533241271972656, -0.028253555297851562, -0.02497386932373047, -0.021694183349609375, -0.01841449737548828, -0.015134811401367188, -0.011855125427246094, -0.008575439453125, -0.005295753479003906, -0.0020160675048828125, 0.0012636184692382812, 0.004543304443359375, 0.007822990417480469, 0.011102676391601562, 0.014382362365722656, 0.01766204833984375, 0.020941734313964844, 0.024221420288085938, 0.02750110626220703, 0.030780792236328125, 0.03406047821044922, 0.03734016418457031, 0.040619850158691406, 0.0438995361328125, 0.047179222106933594, 0.05045890808105469, 0.05373859405517578, 0.057018280029296875, 0.06029796600341797, 0.06357765197753906, 0.06685733795166016, 0.07013702392578125, 0.07341670989990234, 0.07669639587402344, 0.07997608184814453, 0.08325576782226562, 0.08653545379638672, 0.08981513977050781, 0.0930948257446289, 0.09637451171875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 4.0, 4.0, 2.0, 2.0, 6.0, 5.0, 5.0, 5.0, 6.0, 11.0, 7.0, 14.0, 17.0, 16.0, 43.0, 59.0, 56.0, 56.0, 78.0, 84.0, 91.0, 77.0, 77.0, 50.0, 45.0, 40.0, 30.0, 34.0, 16.0, 12.0, 12.0, 8.0, 7.0, 3.0, 13.0, 3.0, 0.0, 6.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0184478759765625, -0.017822980880737305, -0.01719808578491211, -0.016573190689086914, -0.01594829559326172, -0.015323400497436523, -0.014698505401611328, -0.014073610305786133, -0.013448715209960938, -0.012823820114135742, -0.012198925018310547, -0.011574029922485352, -0.010949134826660156, -0.010324239730834961, -0.009699344635009766, -0.00907444953918457, -0.008449554443359375, -0.00782465934753418, -0.007199764251708984, -0.006574869155883789, -0.005949974060058594, -0.0053250789642333984, -0.004700183868408203, -0.004075288772583008, -0.0034503936767578125, -0.002825498580932617, -0.002200603485107422, -0.0015757083892822266, -0.0009508132934570312, -0.00032591819763183594, 0.0002989768981933594, 0.0009238719940185547, 0.00154876708984375, 0.0021736621856689453, 0.0027985572814941406, 0.003423452377319336, 0.004048347473144531, 0.0046732425689697266, 0.005298137664794922, 0.005923032760620117, 0.0065479278564453125, 0.007172822952270508, 0.007797718048095703, 0.008422613143920898, 0.009047508239746094, 0.009672403335571289, 0.010297298431396484, 0.01092219352722168, 0.011547088623046875, 0.01217198371887207, 0.012796878814697266, 0.013421773910522461, 0.014046669006347656, 0.014671564102172852, 0.015296459197998047, 0.015921354293823242, 0.016546249389648438, 0.017171144485473633, 0.017796039581298828, 0.018420934677124023, 0.01904582977294922, 0.019670724868774414, 0.02029561996459961, 0.020920515060424805, 0.02154541015625]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 15.0, 22.0, 72.0, 216.0, 349.0, 211.0, 80.0, 28.0, 13.0, 2.0, 2.0, 3.0, 2.0, 0.0, 3.0], "bins": [-12.600336074829102, -12.36499309539795, -12.129650115966797, -11.894307136535645, -11.658964157104492, -11.42362117767334, -11.188278198242188, -10.952935218811035, -10.717592239379883, -10.48224925994873, -10.246906280517578, -10.011563301086426, -9.776220321655273, -9.540877342224121, -9.305534362792969, -9.070191383361816, -8.834848403930664, -8.599505424499512, -8.36416244506836, -8.128819465637207, -7.893476486206055, -7.658133506774902, -7.42279052734375, -7.187447547912598, -6.952103614807129, -6.716760635375977, -6.481417655944824, -6.246074676513672, -6.0107316970825195, -5.775388717651367, -5.540045738220215, -5.3047027587890625, -5.06935977935791, -4.834016799926758, -4.5986738204956055, -4.363330841064453, -4.127987861633301, -3.8926448822021484, -3.657301664352417, -3.4219586849212646, -3.186615467071533, -2.951272487640381, -2.7159295082092285, -2.480586528778076, -2.245243549346924, -2.0099005699157715, -1.77455735206604, -1.5392143726348877, -1.3038713932037354, -1.068528413772583, -0.8331853747367859, -0.5978423357009888, -0.3624993562698364, -0.12715637683868408, 0.10818672180175781, 0.34352970123291016, 0.5788726806640625, 0.8142156600952148, 1.0495586395263672, 1.284901738166809, 1.5202447175979614, 1.7555876970291138, 1.9909307956695557, 2.226273775100708, 2.4616167545318604]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 8.0, 12.0, 9.0, 20.0, 25.0, 47.0, 48.0, 74.0, 66.0, 82.0, 91.0, 79.0, 93.0, 89.0, 73.0, 56.0, 36.0, 35.0, 17.0, 15.0, 15.0, 8.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7142726182937622, -1.6294703483581543, -1.5446680784225464, -1.4598658084869385, -1.3750636577606201, -1.2902613878250122, -1.2054591178894043, -1.120656967163086, -1.0358545780181885, -0.9510523080825806, -0.8662500977516174, -0.7814478278160095, -0.6966456174850464, -0.6118433475494385, -0.5270410776138306, -0.44223886728286743, -0.3574366569519043, -0.2726344168186188, -0.18783216178417206, -0.10302990674972534, -0.01822766661643982, 0.0665745735168457, 0.1513768434524536, 0.23617905378341675, 0.32098132371902466, 0.4057835638523102, 0.4905858039855957, 0.5753880739212036, 0.6601903438568115, 0.7449925541877747, 0.8297948241233826, 0.9145970344543457, 0.9993991851806641, 1.084201455116272, 1.1690037250518799, 1.2538058757781982, 1.3386081457138062, 1.423410415649414, 1.508212685585022, 1.5930149555206299, 1.6778171062469482, 1.7626193761825562, 1.847421646118164, 1.9322237968444824, 2.01702618598938, 2.1018283367156982, 2.1866307258605957, 2.271432876586914, 2.3562350273132324, 2.441037178039551, 2.5258395671844482, 2.6106417179107666, 2.695444107055664, 2.7802462577819824, 2.865048408508301, 2.9498507976531982, 3.0346531867980957, 3.119455337524414, 3.2042577266693115, 3.28905987739563, 3.3738622665405273, 3.4586644172668457, 3.543466567993164, 3.6282689571380615, 3.71307110786438]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 4.0, 2.0, 6.0, 5.0, 8.0, 4.0, 6.0, 5.0, 14.0, 11.0, 30.0, 25.0, 35.0, 40.0, 53.0, 94.0, 378.0, 3842.0, 112494.0, 842063.0, 85596.0, 3142.0, 359.0, 94.0, 64.0, 44.0, 36.0, 21.0, 26.0, 10.0, 9.0, 10.0, 7.0, 5.0, 3.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.01953125, -4.8599853515625, -4.700439453125, -4.5408935546875, -4.38134765625, -4.2218017578125, -4.062255859375, -3.9027099609375, -3.7431640625, -3.5836181640625, -3.424072265625, -3.2645263671875, -3.10498046875, -2.9454345703125, -2.785888671875, -2.6263427734375, -2.466796875, -2.3072509765625, -2.147705078125, -1.9881591796875, -1.82861328125, -1.6690673828125, -1.509521484375, -1.3499755859375, -1.1904296875, -1.0308837890625, -0.871337890625, -0.7117919921875, -0.55224609375, -0.3927001953125, -0.233154296875, -0.0736083984375, 0.0859375, 0.2454833984375, 0.405029296875, 0.5645751953125, 0.72412109375, 0.8836669921875, 1.043212890625, 1.2027587890625, 1.3623046875, 1.5218505859375, 1.681396484375, 1.8409423828125, 2.00048828125, 2.1600341796875, 2.319580078125, 2.4791259765625, 2.638671875, 2.7982177734375, 2.957763671875, 3.1173095703125, 3.27685546875, 3.4364013671875, 3.595947265625, 3.7554931640625, 3.9150390625, 4.0745849609375, 4.234130859375, 4.3936767578125, 4.55322265625, 4.7127685546875, 4.872314453125, 5.0318603515625, 5.19140625]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 10.0, 24.0, 29.0, 94.0, 100.0, 163.0, 175.0, 145.0, 132.0, 70.0, 28.0, 27.0, 8.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.25390625, -2.94427490234375, -2.6346435546875, -2.32501220703125, -2.015380859375, -1.70574951171875, -1.3961181640625, -1.08648681640625, -0.77685546875, -0.46722412109375, -0.1575927734375, 0.15203857421875, 0.461669921875, 0.77130126953125, 1.0809326171875, 1.39056396484375, 1.7001953125, 2.00982666015625, 2.3194580078125, 2.62908935546875, 2.938720703125, 3.24835205078125, 3.5579833984375, 3.86761474609375, 4.17724609375, 4.48687744140625, 4.7965087890625, 5.10614013671875, 5.415771484375, 5.72540283203125, 6.0350341796875, 6.34466552734375, 6.654296875, 6.96392822265625, 7.2735595703125, 7.58319091796875, 7.892822265625, 8.20245361328125, 8.5120849609375, 8.82171630859375, 9.13134765625, 9.44097900390625, 9.7506103515625, 10.06024169921875, 10.369873046875, 10.67950439453125, 10.9891357421875, 11.29876708984375, 11.6083984375, 11.91802978515625, 12.2276611328125, 12.53729248046875, 12.846923828125, 13.15655517578125, 13.4661865234375, 13.77581787109375, 14.08544921875, 14.39508056640625, 14.7047119140625, 15.01434326171875, 15.323974609375, 15.63360595703125, 15.9432373046875, 16.25286865234375, 16.5625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 2.0, 1.0, 4.0, 2.0, 11.0, 16.0, 13.0, 20.0, 25.0, 39.0, 42.0, 44.0, 85.0, 93.0, 109.0, 155.0, 152.0, 276.0, 475.0, 1782.0, 38603.0, 780879.0, 217937.0, 5812.0, 709.0, 357.0, 225.0, 154.0, 128.0, 95.0, 73.0, 69.0, 46.0, 32.0, 22.0, 19.0, 9.0, 15.0, 10.0, 4.0, 5.0, 5.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.203125, -4.05682373046875, -3.9105224609375, -3.76422119140625, -3.617919921875, -3.47161865234375, -3.3253173828125, -3.17901611328125, -3.03271484375, -2.88641357421875, -2.7401123046875, -2.59381103515625, -2.447509765625, -2.30120849609375, -2.1549072265625, -2.00860595703125, -1.8623046875, -1.71600341796875, -1.5697021484375, -1.42340087890625, -1.277099609375, -1.13079833984375, -0.9844970703125, -0.83819580078125, -0.69189453125, -0.54559326171875, -0.3992919921875, -0.25299072265625, -0.106689453125, 0.03961181640625, 0.1859130859375, 0.33221435546875, 0.478515625, 0.62481689453125, 0.7711181640625, 0.91741943359375, 1.063720703125, 1.21002197265625, 1.3563232421875, 1.50262451171875, 1.64892578125, 1.79522705078125, 1.9415283203125, 2.08782958984375, 2.234130859375, 2.38043212890625, 2.5267333984375, 2.67303466796875, 2.8193359375, 2.96563720703125, 3.1119384765625, 3.25823974609375, 3.404541015625, 3.55084228515625, 3.6971435546875, 3.84344482421875, 3.98974609375, 4.13604736328125, 4.2823486328125, 4.42864990234375, 4.574951171875, 4.72125244140625, 4.8675537109375, 5.01385498046875, 5.16015625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 8.0, 2.0, 7.0, 5.0, 12.0, 9.0, 15.0, 22.0, 19.0, 27.0, 34.0, 25.0, 41.0, 43.0, 37.0, 38.0, 44.0, 51.0, 49.0, 42.0, 60.0, 40.0, 49.0, 44.0, 43.0, 34.0, 35.0, 28.0, 32.0, 12.0, 21.0, 24.0, 6.0, 9.0, 12.0, 6.0, 6.0, 3.0, 4.0, 9.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.634765625, -2.532318115234375, -2.42987060546875, -2.327423095703125, -2.2249755859375, -2.122528076171875, -2.02008056640625, -1.917633056640625, -1.815185546875, -1.712738037109375, -1.61029052734375, -1.507843017578125, -1.4053955078125, -1.302947998046875, -1.20050048828125, -1.098052978515625, -0.99560546875, -0.893157958984375, -0.79071044921875, -0.688262939453125, -0.5858154296875, -0.483367919921875, -0.38092041015625, -0.278472900390625, -0.176025390625, -0.073577880859375, 0.02886962890625, 0.131317138671875, 0.2337646484375, 0.336212158203125, 0.43865966796875, 0.541107177734375, 0.6435546875, 0.746002197265625, 0.84844970703125, 0.950897216796875, 1.0533447265625, 1.155792236328125, 1.25823974609375, 1.360687255859375, 1.463134765625, 1.565582275390625, 1.66802978515625, 1.770477294921875, 1.8729248046875, 1.975372314453125, 2.07781982421875, 2.180267333984375, 2.28271484375, 2.385162353515625, 2.48760986328125, 2.590057373046875, 2.6925048828125, 2.794952392578125, 2.89739990234375, 2.999847412109375, 3.102294921875, 3.204742431640625, 3.30718994140625, 3.409637451171875, 3.5120849609375, 3.614532470703125, 3.71697998046875, 3.819427490234375, 3.921875]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 5.0, 8.0, 17.0, 24.0, 39.0, 66.0, 136.0, 299.0, 794.0, 2453.0, 13037.0, 219223.0, 759638.0, 45386.0, 5205.0, 1372.0, 467.0, 184.0, 103.0, 25.0, 22.0, 18.0, 8.0, 5.0, 2.0, 4.0, 4.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.4765625, -1.420318603515625, -1.36407470703125, -1.307830810546875, -1.2515869140625, -1.195343017578125, -1.13909912109375, -1.082855224609375, -1.026611328125, -0.970367431640625, -0.91412353515625, -0.857879638671875, -0.8016357421875, -0.745391845703125, -0.68914794921875, -0.632904052734375, -0.57666015625, -0.520416259765625, -0.46417236328125, -0.407928466796875, -0.3516845703125, -0.295440673828125, -0.23919677734375, -0.182952880859375, -0.126708984375, -0.070465087890625, -0.01422119140625, 0.042022705078125, 0.0982666015625, 0.154510498046875, 0.21075439453125, 0.266998291015625, 0.3232421875, 0.379486083984375, 0.43572998046875, 0.491973876953125, 0.5482177734375, 0.604461669921875, 0.66070556640625, 0.716949462890625, 0.773193359375, 0.829437255859375, 0.88568115234375, 0.941925048828125, 0.9981689453125, 1.054412841796875, 1.11065673828125, 1.166900634765625, 1.22314453125, 1.279388427734375, 1.33563232421875, 1.391876220703125, 1.4481201171875, 1.504364013671875, 1.56060791015625, 1.616851806640625, 1.673095703125, 1.729339599609375, 1.78558349609375, 1.841827392578125, 1.8980712890625, 1.954315185546875, 2.01055908203125, 2.066802978515625, 2.123046875]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 2.0, 7.0, 18.0, 22.0, 28.0, 37.0, 74.0, 100.0, 116.0, 152.0, 129.0, 96.0, 85.0, 49.0, 29.0, 24.0, 11.0, 5.0, 5.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002601146697998047, -0.00025320425629615784, -0.000246293842792511, -0.00023938342928886414, -0.00023247301578521729, -0.00022556260228157043, -0.00021865218877792358, -0.00021174177527427673, -0.00020483136177062988, -0.00019792094826698303, -0.00019101053476333618, -0.00018410012125968933, -0.00017718970775604248, -0.00017027929425239563, -0.00016336888074874878, -0.00015645846724510193, -0.00014954805374145508, -0.00014263764023780823, -0.00013572722673416138, -0.00012881681323051453, -0.00012190639972686768, -0.00011499598622322083, -0.00010808557271957397, -0.00010117515921592712, -9.426474571228027e-05, -8.735433220863342e-05, -8.044391870498657e-05, -7.353350520133972e-05, -6.662309169769287e-05, -5.971267819404602e-05, -5.280226469039917e-05, -4.589185118675232e-05, -3.898143768310547e-05, -3.207102417945862e-05, -2.5160610675811768e-05, -1.8250197172164917e-05, -1.1339783668518066e-05, -4.429370164871216e-06, 2.4810433387756348e-06, 9.391456842422485e-06, 1.6301870346069336e-05, 2.3212283849716187e-05, 3.0122697353363037e-05, 3.703311085700989e-05, 4.394352436065674e-05, 5.085393786430359e-05, 5.776435136795044e-05, 6.467476487159729e-05, 7.158517837524414e-05, 7.849559187889099e-05, 8.540600538253784e-05, 9.231641888618469e-05, 9.922683238983154e-05, 0.0001061372458934784, 0.00011304765939712524, 0.0001199580729007721, 0.00012686848640441895, 0.0001337788999080658, 0.00014068931341171265, 0.0001475997269153595, 0.00015451014041900635, 0.0001614205539226532, 0.00016833096742630005, 0.0001752413809299469, 0.00018215179443359375]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 4.0, 3.0, 9.0, 8.0, 11.0, 20.0, 31.0, 34.0, 52.0, 100.0, 231.0, 582.0, 2171.0, 17840.0, 514320.0, 492619.0, 17284.0, 2143.0, 562.0, 231.0, 124.0, 66.0, 26.0, 29.0, 19.0, 14.0, 7.0, 8.0, 6.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.357421875, -2.2900543212890625, -2.222686767578125, -2.1553192138671875, -2.08795166015625, -2.0205841064453125, -1.953216552734375, -1.8858489990234375, -1.8184814453125, -1.7511138916015625, -1.683746337890625, -1.6163787841796875, -1.54901123046875, -1.4816436767578125, -1.414276123046875, -1.3469085693359375, -1.279541015625, -1.2121734619140625, -1.144805908203125, -1.0774383544921875, -1.01007080078125, -0.9427032470703125, -0.875335693359375, -0.8079681396484375, -0.7406005859375, -0.6732330322265625, -0.605865478515625, -0.5384979248046875, -0.47113037109375, -0.4037628173828125, -0.336395263671875, -0.2690277099609375, -0.20166015625, -0.1342926025390625, -0.066925048828125, 0.0004425048828125, 0.06781005859375, 0.1351776123046875, 0.202545166015625, 0.2699127197265625, 0.3372802734375, 0.4046478271484375, 0.472015380859375, 0.5393829345703125, 0.60675048828125, 0.6741180419921875, 0.741485595703125, 0.8088531494140625, 0.876220703125, 0.9435882568359375, 1.010955810546875, 1.0783233642578125, 1.14569091796875, 1.2130584716796875, 1.280426025390625, 1.3477935791015625, 1.4151611328125, 1.4825286865234375, 1.549896240234375, 1.6172637939453125, 1.68463134765625, 1.7519989013671875, 1.819366455078125, 1.8867340087890625, 1.9541015625]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 7.0, 6.0, 9.0, 6.0, 15.0, 18.0, 26.0, 36.0, 56.0, 69.0, 116.0, 126.0, 120.0, 104.0, 87.0, 61.0, 39.0, 21.0, 25.0, 18.0, 10.0, 7.0, 9.0, 6.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.472412109375, -0.4544334411621094, -0.43645477294921875, -0.4184761047363281, -0.4004974365234375, -0.3825187683105469, -0.36454010009765625, -0.3465614318847656, -0.328582763671875, -0.3106040954589844, -0.29262542724609375, -0.2746467590332031, -0.2566680908203125, -0.23868942260742188, -0.22071075439453125, -0.20273208618164062, -0.18475341796875, -0.16677474975585938, -0.14879608154296875, -0.13081741333007812, -0.1128387451171875, -0.09486007690429688, -0.07688140869140625, -0.058902740478515625, -0.040924072265625, -0.022945404052734375, -0.00496673583984375, 0.013011932373046875, 0.0309906005859375, 0.048969268798828125, 0.06694793701171875, 0.08492660522460938, 0.1029052734375, 0.12088394165039062, 0.13886260986328125, 0.15684127807617188, 0.1748199462890625, 0.19279861450195312, 0.21077728271484375, 0.22875595092773438, 0.246734619140625, 0.2647132873535156, 0.28269195556640625, 0.3006706237792969, 0.3186492919921875, 0.3366279602050781, 0.35460662841796875, 0.3725852966308594, 0.39056396484375, 0.4085426330566406, 0.42652130126953125, 0.4444999694824219, 0.4624786376953125, 0.4804573059082031, 0.49843597412109375, 0.5164146423339844, 0.534393310546875, 0.5523719787597656, 0.5703506469726562, 0.5883293151855469, 0.6063079833984375, 0.6242866516113281, 0.6422653198242188, 0.6602439880371094, 0.67822265625]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 2.0, 10.0, 7.0, 20.0, 26.0, 42.0, 51.0, 71.0, 105.0, 115.0, 125.0, 118.0, 91.0, 61.0, 46.0, 40.0, 28.0, 10.0, 8.0, 7.0, 5.0, 7.0, 0.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.005093097686768, -5.8308210372924805, -5.656548500061035, -5.482276439666748, -5.308004379272461, -5.133732318878174, -4.9594597816467285, -4.785187721252441, -4.610915660858154, -4.436643600463867, -4.262371063232422, -4.088099002838135, -3.9138269424438477, -3.7395546436309814, -3.5652823448181152, -3.391010284423828, -3.216737985610962, -3.0424656867980957, -2.8681936264038086, -2.6939213275909424, -2.5196492671966553, -2.345376968383789, -2.171104907989502, -1.9968326091766357, -1.822560429573059, -1.6482882499694824, -1.4740160703659058, -1.299743890762329, -1.125471591949463, -0.951199471950531, -0.7769272327423096, -0.6026550531387329, -0.42838287353515625, -0.2541106939315796, -0.07983848452568054, 0.0944337248802185, 0.26870590448379517, 0.4429780840873718, 0.6172503232955933, 0.7915225028991699, 0.9657946825027466, 1.1400668621063232, 1.3143390417099, 1.4886112213134766, 1.6628835201263428, 1.8371555805206299, 2.011427879333496, 2.185699939727783, 2.3599722385406494, 2.5342445373535156, 2.7085165977478027, 2.882788896560669, 3.057060956954956, 3.2313332557678223, 3.4056053161621094, 3.5798776149749756, 3.754149913787842, 3.928422212600708, 4.102694511413574, 4.276966571807861, 4.451238632202148, 4.6255106925964355, 4.799783229827881, 4.974055290222168, 5.148327350616455]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [8.0, 9.0, 5.0, 13.0, 24.0, 34.0, 41.0, 47.0, 61.0, 71.0, 82.0, 76.0, 90.0, 91.0, 81.0, 80.0, 66.0, 46.0, 41.0, 24.0, 11.0, 9.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.012876033782959, -3.6836705207824707, -3.3544647693634033, -3.025259017944336, -2.6960535049438477, -2.3668479919433594, -2.037642240524292, -1.7084364891052246, -1.3792309761047363, -1.0500253438949585, -0.7208197116851807, -0.39161407947540283, -0.062408447265625, 0.26679718494415283, 0.5960028171539307, 0.925208568572998, 1.2544140815734863, 1.5836197137832642, 1.912825345993042, 2.2420310974121094, 2.5712366104125977, 2.900442123413086, 3.2296478748321533, 3.5588536262512207, 3.888059139251709, 4.217264652252197, 4.546470642089844, 4.875676155090332, 5.20488166809082, 5.534087181091309, 5.863292694091797, 6.192498683929443, 6.521703720092773, 6.850909233093262, 7.18011474609375, 7.5093207359313965, 7.838526248931885, 8.167732238769531, 8.49693775177002, 8.826143264770508, 9.155348777770996, 9.484554290771484, 9.813759803771973, 10.142965316772461, 10.472171783447266, 10.801377296447754, 11.130582809448242, 11.45978832244873, 11.788993835449219, 12.118199348449707, 12.447404861450195, 12.776610374450684, 13.105815887451172, 13.435022354125977, 13.764227867126465, 14.093433380126953, 14.422638893127441, 14.75184440612793, 15.081049919128418, 15.410255432128906, 15.739461898803711, 16.068666458129883, 16.397872924804688, 16.72707748413086, 17.056283950805664]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 4.0, 10.0, 8.0, 20.0, 13.0, 22.0, 33.0, 45.0, 57.0, 85.0, 111.0, 197.0, 338.0, 969.0, 5015.0, 114857.0, 3382080.0, 670911.0, 16019.0, 1943.0, 631.0, 353.0, 195.0, 114.0, 74.0, 51.0, 30.0, 18.0, 15.0, 15.0, 12.0, 5.0, 9.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 6.0, 2.0, 0.0, 0.0, 3.0], "bins": [-7.5546875, -7.348876953125, -7.14306640625, -6.937255859375, -6.7314453125, -6.525634765625, -6.31982421875, -6.114013671875, -5.908203125, -5.702392578125, -5.49658203125, -5.290771484375, -5.0849609375, -4.879150390625, -4.67333984375, -4.467529296875, -4.26171875, -4.055908203125, -3.85009765625, -3.644287109375, -3.4384765625, -3.232666015625, -3.02685546875, -2.821044921875, -2.615234375, -2.409423828125, -2.20361328125, -1.997802734375, -1.7919921875, -1.586181640625, -1.38037109375, -1.174560546875, -0.96875, -0.762939453125, -0.55712890625, -0.351318359375, -0.1455078125, 0.060302734375, 0.26611328125, 0.471923828125, 0.677734375, 0.883544921875, 1.08935546875, 1.295166015625, 1.5009765625, 1.706787109375, 1.91259765625, 2.118408203125, 2.32421875, 2.530029296875, 2.73583984375, 2.941650390625, 3.1474609375, 3.353271484375, 3.55908203125, 3.764892578125, 3.970703125, 4.176513671875, 4.38232421875, 4.588134765625, 4.7939453125, 4.999755859375, 5.20556640625, 5.411376953125, 5.6171875]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 3.0, 7.0, 7.0, 4.0, 13.0, 8.0, 24.0, 21.0, 22.0, 31.0, 35.0, 37.0, 58.0, 43.0, 52.0, 50.0, 61.0, 60.0, 59.0, 44.0, 47.0, 48.0, 37.0, 49.0, 32.0, 33.0, 26.0, 19.0, 24.0, 14.0, 11.0, 9.0, 4.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.349609375, -2.27484130859375, -2.2000732421875, -2.12530517578125, -2.050537109375, -1.97576904296875, -1.9010009765625, -1.82623291015625, -1.75146484375, -1.67669677734375, -1.6019287109375, -1.52716064453125, -1.452392578125, -1.37762451171875, -1.3028564453125, -1.22808837890625, -1.1533203125, -1.07855224609375, -1.0037841796875, -0.92901611328125, -0.854248046875, -0.77947998046875, -0.7047119140625, -0.62994384765625, -0.55517578125, -0.48040771484375, -0.4056396484375, -0.33087158203125, -0.256103515625, -0.18133544921875, -0.1065673828125, -0.03179931640625, 0.04296875, 0.11773681640625, 0.1925048828125, 0.26727294921875, 0.342041015625, 0.41680908203125, 0.4915771484375, 0.56634521484375, 0.64111328125, 0.71588134765625, 0.7906494140625, 0.86541748046875, 0.940185546875, 1.01495361328125, 1.0897216796875, 1.16448974609375, 1.2392578125, 1.31402587890625, 1.3887939453125, 1.46356201171875, 1.538330078125, 1.61309814453125, 1.6878662109375, 1.76263427734375, 1.83740234375, 1.91217041015625, 1.9869384765625, 2.06170654296875, 2.136474609375, 2.21124267578125, 2.2860107421875, 2.36077880859375, 2.435546875]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 9.0, 7.0, 21.0, 38.0, 37.0, 67.0, 117.0, 202.0, 421.0, 1018.0, 4131.0, 104223.0, 3997500.0, 80603.0, 3971.0, 964.0, 426.0, 207.0, 121.0, 80.0, 49.0, 34.0, 15.0, 4.0, 8.0, 5.0, 0.0, 3.0, 4.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.203125, -6.958740234375, -6.71435546875, -6.469970703125, -6.2255859375, -5.981201171875, -5.73681640625, -5.492431640625, -5.248046875, -5.003662109375, -4.75927734375, -4.514892578125, -4.2705078125, -4.026123046875, -3.78173828125, -3.537353515625, -3.29296875, -3.048583984375, -2.80419921875, -2.559814453125, -2.3154296875, -2.071044921875, -1.82666015625, -1.582275390625, -1.337890625, -1.093505859375, -0.84912109375, -0.604736328125, -0.3603515625, -0.115966796875, 0.12841796875, 0.372802734375, 0.6171875, 0.861572265625, 1.10595703125, 1.350341796875, 1.5947265625, 1.839111328125, 2.08349609375, 2.327880859375, 2.572265625, 2.816650390625, 3.06103515625, 3.305419921875, 3.5498046875, 3.794189453125, 4.03857421875, 4.282958984375, 4.52734375, 4.771728515625, 5.01611328125, 5.260498046875, 5.5048828125, 5.749267578125, 5.99365234375, 6.238037109375, 6.482421875, 6.726806640625, 6.97119140625, 7.215576171875, 7.4599609375, 7.704345703125, 7.94873046875, 8.193115234375, 8.4375]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 4.0, 7.0, 6.0, 10.0, 12.0, 24.0, 24.0, 34.0, 37.0, 61.0, 100.0, 131.0, 165.0, 290.0, 369.0, 486.0, 536.0, 440.0, 417.0, 294.0, 192.0, 141.0, 84.0, 58.0, 41.0, 35.0, 24.0, 23.0, 12.0, 8.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0], "bins": [-1.0908203125, -1.0625, -1.0341796875, -1.005859375, -0.9775390625, -0.94921875, -0.9208984375, -0.892578125, -0.8642578125, -0.8359375, -0.8076171875, -0.779296875, -0.7509765625, -0.72265625, -0.6943359375, -0.666015625, -0.6376953125, -0.609375, -0.5810546875, -0.552734375, -0.5244140625, -0.49609375, -0.4677734375, -0.439453125, -0.4111328125, -0.3828125, -0.3544921875, -0.326171875, -0.2978515625, -0.26953125, -0.2412109375, -0.212890625, -0.1845703125, -0.15625, -0.1279296875, -0.099609375, -0.0712890625, -0.04296875, -0.0146484375, 0.013671875, 0.0419921875, 0.0703125, 0.0986328125, 0.126953125, 0.1552734375, 0.18359375, 0.2119140625, 0.240234375, 0.2685546875, 0.296875, 0.3251953125, 0.353515625, 0.3818359375, 0.41015625, 0.4384765625, 0.466796875, 0.4951171875, 0.5234375, 0.5517578125, 0.580078125, 0.6083984375, 0.63671875, 0.6650390625, 0.693359375, 0.7216796875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 1.0, 3.0, 3.0, 6.0, 5.0, 7.0, 8.0, 16.0, 16.0, 41.0, 59.0, 60.0, 80.0, 89.0, 100.0, 93.0, 102.0, 75.0, 57.0, 58.0, 37.0, 27.0, 21.0, 11.0, 7.0, 12.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.669475078582764, -4.544282913208008, -4.41909122467041, -4.293899059295654, -4.168706893920898, -4.043515205383301, -3.918323040008545, -3.793130874633789, -3.6679389476776123, -3.5427470207214355, -3.4175548553466797, -3.292362928390503, -3.167171001434326, -3.0419788360595703, -2.9167869091033936, -2.791594982147217, -2.666402816772461, -2.541210889816284, -2.4160187244415283, -2.2908267974853516, -2.1656346321105957, -2.040442705154419, -1.9152507781982422, -1.7900587320327759, -1.6648666858673096, -1.5396746397018433, -1.414482593536377, -1.2892906665802002, -1.1640986204147339, -1.0389065742492676, -0.913714587688446, -0.7885226011276245, -0.6633305549621582, -0.5381385087966919, -0.41294652223587036, -0.28775450587272644, -0.16256248950958252, -0.03737044334411621, 0.08782154321670532, 0.21301352977752686, 0.33820557594299316, 0.4633975923061371, 0.588589608669281, 0.7137815952301025, 0.8389736413955688, 0.9641656875610352, 1.089357614517212, 1.2145496606826782, 1.3397417068481445, 1.4649337530136108, 1.5901257991790771, 1.715317726135254, 1.8405097723007202, 1.9657018184661865, 2.0908937454223633, 2.216085910797119, 2.341277837753296, 2.4664697647094727, 2.5916619300842285, 2.7168538570404053, 2.842045783996582, 2.967237949371338, 3.0924298763275146, 3.2176218032836914, 3.3428139686584473]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 0.0, 6.0, 9.0, 6.0, 10.0, 18.0, 20.0, 18.0, 23.0, 26.0, 34.0, 34.0, 40.0, 30.0, 48.0, 51.0, 46.0, 43.0, 62.0, 63.0, 57.0, 46.0, 52.0, 42.0, 34.0, 36.0, 34.0, 23.0, 20.0, 18.0, 27.0, 12.0, 2.0, 8.0, 2.0, 2.0, 4.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.850348472595215, -2.765322685241699, -2.6802966594696045, -2.595270872116089, -2.510244846343994, -2.4252190589904785, -2.340193033218384, -2.255167245864868, -2.1701412200927734, -2.085115432739258, -2.000089406967163, -1.915063500404358, -1.8300375938415527, -1.7450116872787476, -1.6599857807159424, -1.5749599933624268, -1.4899340867996216, -1.4049081802368164, -1.3198822736740112, -1.234856367111206, -1.1498304605484009, -1.0648045539855957, -0.9797787070274353, -0.8947528004646301, -0.809726893901825, -0.7247009873390198, -0.6396750807762146, -0.5546492338180542, -0.46962329745292664, -0.38459739089012146, -0.29957151412963867, -0.2145456075668335, -0.12951970100402832, -0.04449380189180374, 0.04053209722042084, 0.12555798888206482, 0.21058389544487, 0.29560980200767517, 0.38063567876815796, 0.46566158533096313, 0.5506874918937683, 0.6357133984565735, 0.7207393050193787, 0.8057651519775391, 0.8907910585403442, 0.9758169651031494, 1.0608428716659546, 1.1458687782287598, 1.230894684791565, 1.3159205913543701, 1.4009464979171753, 1.4859724044799805, 1.5709983110427856, 1.6560242176055908, 1.7410500049591064, 1.8260760307312012, 1.9111018180847168, 1.996127724647522, 2.081153631210327, 2.1661794185638428, 2.2512054443359375, 2.336231231689453, 2.421257257461548, 2.5062830448150635, 2.591309070587158]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 13.0, 9.0, 5.0, 15.0, 17.0, 30.0, 31.0, 31.0, 54.0, 67.0, 129.0, 180.0, 323.0, 674.0, 1527.0, 4739.0, 16002.0, 58244.0, 193148.0, 386565.0, 265306.0, 86507.0, 23757.0, 6981.0, 2295.0, 873.0, 372.0, 200.0, 125.0, 88.0, 58.0, 41.0, 35.0, 21.0, 22.0, 15.0, 13.0, 9.0, 8.0, 8.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.484619140625, -0.4670982360839844, -0.44957733154296875, -0.4320564270019531, -0.4145355224609375, -0.3970146179199219, -0.37949371337890625, -0.3619728088378906, -0.344451904296875, -0.3269309997558594, -0.30941009521484375, -0.2918891906738281, -0.2743682861328125, -0.2568473815917969, -0.23932647705078125, -0.22180557250976562, -0.20428466796875, -0.18676376342773438, -0.16924285888671875, -0.15172195434570312, -0.1342010498046875, -0.11668014526367188, -0.09915924072265625, -0.08163833618164062, -0.064117431640625, -0.046596527099609375, -0.02907562255859375, -0.011554718017578125, 0.0059661865234375, 0.023487091064453125, 0.04100799560546875, 0.058528900146484375, 0.0760498046875, 0.09357070922851562, 0.11109161376953125, 0.12861251831054688, 0.1461334228515625, 0.16365432739257812, 0.18117523193359375, 0.19869613647460938, 0.216217041015625, 0.23373794555664062, 0.25125885009765625, 0.2687797546386719, 0.2863006591796875, 0.3038215637207031, 0.32134246826171875, 0.3388633728027344, 0.35638427734375, 0.3739051818847656, 0.39142608642578125, 0.4089469909667969, 0.4264678955078125, 0.4439888000488281, 0.46150970458984375, 0.4790306091308594, 0.496551513671875, 0.5140724182128906, 0.5315933227539062, 0.5491142272949219, 0.5666351318359375, 0.5841560363769531, 0.6016769409179688, 0.6191978454589844, 0.63671875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 8.0, 12.0, 24.0, 22.0, 30.0, 34.0, 43.0, 62.0, 65.0, 83.0, 80.0, 87.0, 82.0, 79.0, 79.0, 51.0, 41.0, 48.0, 29.0, 16.0, 11.0, 5.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.33984375, -3.2501220703125, -3.160400390625, -3.0706787109375, -2.98095703125, -2.8912353515625, -2.801513671875, -2.7117919921875, -2.6220703125, -2.5323486328125, -2.442626953125, -2.3529052734375, -2.26318359375, -2.1734619140625, -2.083740234375, -1.9940185546875, -1.904296875, -1.8145751953125, -1.724853515625, -1.6351318359375, -1.54541015625, -1.4556884765625, -1.365966796875, -1.2762451171875, -1.1865234375, -1.0968017578125, -1.007080078125, -0.9173583984375, -0.82763671875, -0.7379150390625, -0.648193359375, -0.5584716796875, -0.46875, -0.3790283203125, -0.289306640625, -0.1995849609375, -0.10986328125, -0.0201416015625, 0.069580078125, 0.1593017578125, 0.2490234375, 0.3387451171875, 0.428466796875, 0.5181884765625, 0.60791015625, 0.6976318359375, 0.787353515625, 0.8770751953125, 0.966796875, 1.0565185546875, 1.146240234375, 1.2359619140625, 1.32568359375, 1.4154052734375, 1.505126953125, 1.5948486328125, 1.6845703125, 1.7742919921875, 1.864013671875, 1.9537353515625, 2.04345703125, 2.1331787109375, 2.222900390625, 2.3126220703125, 2.40234375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 5.0, 4.0, 8.0, 18.0, 26.0, 42.0, 61.0, 100.0, 190.0, 290.0, 573.0, 1192.0, 2119.0, 4220.0, 8364.0, 16177.0, 30866.0, 57897.0, 102361.0, 160959.0, 202803.0, 182842.0, 123763.0, 72646.0, 39002.0, 20692.0, 10340.0, 5290.0, 2672.0, 1453.0, 703.0, 383.0, 197.0, 115.0, 57.0, 46.0, 30.0, 24.0, 9.0, 8.0, 5.0, 7.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26513671875, -0.2572669982910156, -0.24939727783203125, -0.24152755737304688, -0.2336578369140625, -0.22578811645507812, -0.21791839599609375, -0.21004867553710938, -0.202178955078125, -0.19430923461914062, -0.18643951416015625, -0.17856979370117188, -0.1707000732421875, -0.16283035278320312, -0.15496063232421875, -0.14709091186523438, -0.13922119140625, -0.13135147094726562, -0.12348175048828125, -0.11561203002929688, -0.1077423095703125, -0.09987258911132812, -0.09200286865234375, -0.08413314819335938, -0.076263427734375, -0.06839370727539062, -0.06052398681640625, -0.052654266357421875, -0.0447845458984375, -0.036914825439453125, -0.02904510498046875, -0.021175384521484375, -0.0133056640625, -0.005435943603515625, 0.00243377685546875, 0.010303497314453125, 0.0181732177734375, 0.026042938232421875, 0.03391265869140625, 0.041782379150390625, 0.049652099609375, 0.057521820068359375, 0.06539154052734375, 0.07326126098632812, 0.0811309814453125, 0.08900070190429688, 0.09687042236328125, 0.10474014282226562, 0.11260986328125, 0.12047958374023438, 0.12834930419921875, 0.13621902465820312, 0.1440887451171875, 0.15195846557617188, 0.15982818603515625, 0.16769790649414062, 0.175567626953125, 0.18343734741210938, 0.19130706787109375, 0.19917678833007812, 0.2070465087890625, 0.21491622924804688, 0.22278594970703125, 0.23065567016601562, 0.238525390625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 3.0, 2.0, 3.0, 6.0, 5.0, 8.0, 15.0, 12.0, 16.0, 12.0, 26.0, 18.0, 33.0, 22.0, 27.0, 31.0, 41.0, 44.0, 42.0, 53.0, 65.0, 48.0, 52.0, 49.0, 52.0, 33.0, 39.0, 42.0, 34.0, 29.0, 22.0, 18.0, 20.0, 16.0, 10.0, 14.0, 15.0, 10.0, 5.0, 6.0, 4.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.67578125, -3.569549560546875, -3.46331787109375, -3.357086181640625, -3.2508544921875, -3.144622802734375, -3.03839111328125, -2.932159423828125, -2.825927734375, -2.719696044921875, -2.61346435546875, -2.507232666015625, -2.4010009765625, -2.294769287109375, -2.18853759765625, -2.082305908203125, -1.97607421875, -1.869842529296875, -1.76361083984375, -1.657379150390625, -1.5511474609375, -1.444915771484375, -1.33868408203125, -1.232452392578125, -1.126220703125, -1.019989013671875, -0.91375732421875, -0.807525634765625, -0.7012939453125, -0.595062255859375, -0.48883056640625, -0.382598876953125, -0.2763671875, -0.170135498046875, -0.06390380859375, 0.042327880859375, 0.1485595703125, 0.254791259765625, 0.36102294921875, 0.467254638671875, 0.573486328125, 0.679718017578125, 0.78594970703125, 0.892181396484375, 0.9984130859375, 1.104644775390625, 1.21087646484375, 1.317108154296875, 1.42333984375, 1.529571533203125, 1.63580322265625, 1.742034912109375, 1.8482666015625, 1.954498291015625, 2.06072998046875, 2.166961669921875, 2.273193359375, 2.379425048828125, 2.48565673828125, 2.591888427734375, 2.6981201171875, 2.804351806640625, 2.91058349609375, 3.016815185546875, 3.123046875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 5.0, 5.0, 2.0, 17.0, 19.0, 17.0, 38.0, 71.0, 124.0, 163.0, 397.0, 641.0, 1338.0, 3221.0, 8989.0, 34595.0, 183290.0, 586044.0, 180449.0, 34184.0, 8977.0, 3147.0, 1370.0, 632.0, 334.0, 178.0, 108.0, 69.0, 45.0, 35.0, 18.0, 10.0, 9.0, 6.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11895751953125, -0.11492443084716797, -0.11089134216308594, -0.1068582534790039, -0.10282516479492188, -0.09879207611083984, -0.09475898742675781, -0.09072589874267578, -0.08669281005859375, -0.08265972137451172, -0.07862663269042969, -0.07459354400634766, -0.07056045532226562, -0.0665273666381836, -0.06249427795410156, -0.05846118927001953, -0.0544281005859375, -0.05039501190185547, -0.04636192321777344, -0.042328834533691406, -0.038295745849609375, -0.034262657165527344, -0.030229568481445312, -0.02619647979736328, -0.02216339111328125, -0.01813030242919922, -0.014097213745117188, -0.010064125061035156, -0.006031036376953125, -0.0019979476928710938, 0.0020351409912109375, 0.006068229675292969, 0.010101318359375, 0.014134407043457031, 0.018167495727539062, 0.022200584411621094, 0.026233673095703125, 0.030266761779785156, 0.03429985046386719, 0.03833293914794922, 0.04236602783203125, 0.04639911651611328, 0.05043220520019531, 0.054465293884277344, 0.058498382568359375, 0.0625314712524414, 0.06656455993652344, 0.07059764862060547, 0.0746307373046875, 0.07866382598876953, 0.08269691467285156, 0.0867300033569336, 0.09076309204101562, 0.09479618072509766, 0.09882926940917969, 0.10286235809326172, 0.10689544677734375, 0.11092853546142578, 0.11496162414550781, 0.11899471282958984, 0.12302780151367188, 0.1270608901977539, 0.13109397888183594, 0.13512706756591797, 0.13916015625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 7.0, 11.0, 27.0, 27.0, 56.0, 74.0, 100.0, 147.0, 166.0, 109.0, 94.0, 66.0, 39.0, 28.0, 19.0, 6.0, 15.0, 4.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0001207590103149414, -0.00011767912656068802, -0.00011459924280643463, -0.00011151935905218124, -0.00010843947529792786, -0.00010535959154367447, -0.00010227970778942108, -9.91998240351677e-05, -9.61199402809143e-05, -9.304005652666092e-05, -8.996017277240753e-05, -8.688028901815414e-05, -8.380040526390076e-05, -8.072052150964737e-05, -7.764063775539398e-05, -7.45607540011406e-05, -7.148087024688721e-05, -6.840098649263382e-05, -6.532110273838043e-05, -6.224121898412704e-05, -5.916133522987366e-05, -5.608145147562027e-05, -5.300156772136688e-05, -4.9921683967113495e-05, -4.684180021286011e-05, -4.376191645860672e-05, -4.068203270435333e-05, -3.7602148950099945e-05, -3.452226519584656e-05, -3.144238144159317e-05, -2.8362497687339783e-05, -2.5282613933086395e-05, -2.2202730178833008e-05, -1.912284642457962e-05, -1.6042962670326233e-05, -1.2963078916072845e-05, -9.883195161819458e-06, -6.8033114075660706e-06, -3.723427653312683e-06, -6.435438990592957e-07, 2.436339855194092e-06, 5.516223609447479e-06, 8.596107363700867e-06, 1.1675991117954254e-05, 1.4755874872207642e-05, 1.783575862646103e-05, 2.0915642380714417e-05, 2.3995526134967804e-05, 2.707540988922119e-05, 3.015529364347458e-05, 3.3235177397727966e-05, 3.6315061151981354e-05, 3.939494490623474e-05, 4.247482866048813e-05, 4.5554712414741516e-05, 4.8634596168994904e-05, 5.171447992324829e-05, 5.479436367750168e-05, 5.7874247431755066e-05, 6.095413118600845e-05, 6.403401494026184e-05, 6.711389869451523e-05, 7.019378244876862e-05, 7.3273666203022e-05, 7.635354995727539e-05]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 6.0, 8.0, 6.0, 15.0, 29.0, 52.0, 85.0, 130.0, 285.0, 493.0, 1275.0, 3352.0, 11626.0, 52013.0, 300529.0, 541060.0, 107772.0, 21049.0, 5454.0, 1775.0, 724.0, 340.0, 171.0, 112.0, 53.0, 39.0, 30.0, 21.0, 13.0, 9.0, 6.0, 1.0, 3.0, 4.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1270751953125, -0.12286949157714844, -0.11866378784179688, -0.11445808410644531, -0.11025238037109375, -0.10604667663574219, -0.10184097290039062, -0.09763526916503906, -0.0934295654296875, -0.08922386169433594, -0.08501815795898438, -0.08081245422363281, -0.07660675048828125, -0.07240104675292969, -0.06819534301757812, -0.06398963928222656, -0.059783935546875, -0.05557823181152344, -0.051372528076171875, -0.04716682434082031, -0.04296112060546875, -0.03875541687011719, -0.034549713134765625, -0.030344009399414062, -0.0261383056640625, -0.021932601928710938, -0.017726898193359375, -0.013521194458007812, -0.00931549072265625, -0.0051097869873046875, -0.000904083251953125, 0.0033016204833984375, 0.00750732421875, 0.011713027954101562, 0.015918731689453125, 0.020124435424804688, 0.02433013916015625, 0.028535842895507812, 0.032741546630859375, 0.03694725036621094, 0.0411529541015625, 0.04535865783691406, 0.049564361572265625, 0.05377006530761719, 0.05797576904296875, 0.06218147277832031, 0.06638717651367188, 0.07059288024902344, 0.074798583984375, 0.07900428771972656, 0.08320999145507812, 0.08741569519042969, 0.09162139892578125, 0.09582710266113281, 0.10003280639648438, 0.10423851013183594, 0.1084442138671875, 0.11264991760253906, 0.11685562133789062, 0.12106132507324219, 0.12526702880859375, 0.1294727325439453, 0.13367843627929688, 0.13788414001464844, 0.14208984375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 5.0, 11.0, 9.0, 16.0, 14.0, 14.0, 23.0, 20.0, 49.0, 43.0, 54.0, 68.0, 71.0, 77.0, 83.0, 88.0, 74.0, 59.0, 50.0, 40.0, 34.0, 26.0, 13.0, 18.0, 20.0, 8.0, 3.0, 2.0, 2.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.033355712890625, -0.03240847587585449, -0.031461238861083984, -0.030514001846313477, -0.02956676483154297, -0.02861952781677246, -0.027672290802001953, -0.026725053787231445, -0.025777816772460938, -0.02483057975769043, -0.023883342742919922, -0.022936105728149414, -0.021988868713378906, -0.0210416316986084, -0.02009439468383789, -0.019147157669067383, -0.018199920654296875, -0.017252683639526367, -0.01630544662475586, -0.015358209609985352, -0.014410972595214844, -0.013463735580444336, -0.012516498565673828, -0.01156926155090332, -0.010622024536132812, -0.009674787521362305, -0.008727550506591797, -0.007780313491821289, -0.006833076477050781, -0.0058858394622802734, -0.004938602447509766, -0.003991365432739258, -0.00304412841796875, -0.002096891403198242, -0.0011496543884277344, -0.00020241737365722656, 0.0007448196411132812, 0.001692056655883789, 0.002639293670654297, 0.0035865306854248047, 0.0045337677001953125, 0.00548100471496582, 0.006428241729736328, 0.007375478744506836, 0.008322715759277344, 0.009269952774047852, 0.01021718978881836, 0.011164426803588867, 0.012111663818359375, 0.013058900833129883, 0.01400613784790039, 0.014953374862670898, 0.015900611877441406, 0.016847848892211914, 0.017795085906982422, 0.01874232292175293, 0.019689559936523438, 0.020636796951293945, 0.021584033966064453, 0.02253127098083496, 0.02347850799560547, 0.024425745010375977, 0.025372982025146484, 0.026320219039916992, 0.0272674560546875]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 7.0, 11.0, 33.0, 122.0, 272.0, 285.0, 186.0, 64.0, 14.0, 10.0, 5.0, 3.0, 0.0, 1.0, 3.0], "bins": [-13.121729850769043, -12.879738807678223, -12.637748718261719, -12.395757675170898, -12.153766632080078, -11.911775588989258, -11.669785499572754, -11.427794456481934, -11.18580436706543, -10.94381332397461, -10.701823234558105, -10.459832191467285, -10.217841148376465, -9.975851058959961, -9.73386001586914, -9.49186897277832, -9.2498779296875, -9.00788688659668, -8.765896797180176, -8.523905754089355, -8.281914710998535, -8.039924621582031, -7.797933578491211, -7.555942535400391, -7.3139519691467285, -7.071961402893066, -6.829970359802246, -6.587979793548584, -6.345989227294922, -6.103998184204102, -5.8620076179504395, -5.620017051696777, -5.378025531768799, -5.136034965515137, -4.894043922424316, -4.652053356170654, -4.410062789916992, -4.168071746826172, -3.9260811805725098, -3.6840903759002686, -3.4420995712280273, -3.200108766555786, -2.958117961883545, -2.716127395629883, -2.4741365909576416, -2.2321457862854004, -1.9901551008224487, -1.748164415359497, -1.5061736106872559, -1.2641828060150146, -1.022192120552063, -0.7802013754844666, -0.5382106304168701, -0.2962198257446289, -0.054229140281677246, 0.18776154518127441, 0.4297523498535156, 0.6717430949211121, 0.9137338399887085, 1.1557245254516602, 1.3977153301239014, 1.6397061347961426, 1.8816968202590942, 2.123687505722046, 2.365678310394287]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 3.0, 11.0, 17.0, 20.0, 20.0, 27.0, 36.0, 47.0, 46.0, 45.0, 57.0, 68.0, 55.0, 77.0, 79.0, 67.0, 68.0, 48.0, 44.0, 46.0, 39.0, 21.0, 26.0, 12.0, 7.0, 4.0, 7.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.558716297149658, -2.4864108562469482, -2.4141054153442383, -2.3417999744415283, -2.2694945335388184, -2.1971893310546875, -2.1248836517333984, -2.0525784492492676, -1.9802730083465576, -1.9079675674438477, -1.8356621265411377, -1.7633566856384277, -1.6910513639450073, -1.6187459230422974, -1.5464404821395874, -1.474135160446167, -1.4018296003341675, -1.3295241594314575, -1.2572187185287476, -1.1849133968353271, -1.1126079559326172, -1.0403025150299072, -0.9679970741271973, -0.8956916928291321, -0.8233862519264221, -0.7510808110237122, -0.678775429725647, -0.606469988822937, -0.534164547920227, -0.46185916662216187, -0.3895537257194519, -0.3172483444213867, -0.24494290351867676, -0.17263749241828918, -0.10033206641674042, -0.02802664041519165, 0.04427877068519592, 0.1165841817855835, 0.18888962268829346, 0.26119500398635864, 0.3335004448890686, 0.4058058559894562, 0.47811126708984375, 0.5504167079925537, 0.6227221488952637, 0.6950275301933289, 0.7673329710960388, 0.839638352394104, 0.911943793296814, 0.9842492341995239, 1.0565546751022339, 1.1288599967956543, 1.2011654376983643, 1.2734708786010742, 1.3457763195037842, 1.4180817604064941, 1.490387201309204, 1.562692642211914, 1.634998083114624, 1.707303524017334, 1.7796088457107544, 1.8519142866134644, 1.9242197275161743, 1.9965250492095947, 2.0688304901123047]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 2.0, 3.0, 7.0, 14.0, 17.0, 16.0, 29.0, 51.0, 73.0, 216.0, 812.0, 8443.0, 399239.0, 624537.0, 13535.0, 1063.0, 255.0, 80.0, 46.0, 27.0, 35.0, 17.0, 12.0, 2.0, 6.0, 6.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.48828125, -5.29949951171875, -5.1107177734375, -4.92193603515625, -4.733154296875, -4.54437255859375, -4.3555908203125, -4.16680908203125, -3.97802734375, -3.78924560546875, -3.6004638671875, -3.41168212890625, -3.222900390625, -3.03411865234375, -2.8453369140625, -2.65655517578125, -2.4677734375, -2.27899169921875, -2.0902099609375, -1.90142822265625, -1.712646484375, -1.52386474609375, -1.3350830078125, -1.14630126953125, -0.95751953125, -0.76873779296875, -0.5799560546875, -0.39117431640625, -0.202392578125, -0.01361083984375, 0.1751708984375, 0.36395263671875, 0.552734375, 0.74151611328125, 0.9302978515625, 1.11907958984375, 1.307861328125, 1.49664306640625, 1.6854248046875, 1.87420654296875, 2.06298828125, 2.25177001953125, 2.4405517578125, 2.62933349609375, 2.818115234375, 3.00689697265625, 3.1956787109375, 3.38446044921875, 3.5732421875, 3.76202392578125, 3.9508056640625, 4.13958740234375, 4.328369140625, 4.51715087890625, 4.7059326171875, 4.89471435546875, 5.08349609375, 5.27227783203125, 5.4610595703125, 5.64984130859375, 5.838623046875, 6.02740478515625, 6.2161865234375, 6.40496826171875, 6.59375]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 8.0, 12.0, 23.0, 35.0, 75.0, 91.0, 133.0, 130.0, 171.0, 116.0, 89.0, 72.0, 34.0, 11.0, 6.0, 6.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.45703125, -3.16595458984375, -2.8748779296875, -2.58380126953125, -2.292724609375, -2.00164794921875, -1.7105712890625, -1.41949462890625, -1.12841796875, -0.83734130859375, -0.5462646484375, -0.25518798828125, 0.035888671875, 0.32696533203125, 0.6180419921875, 0.90911865234375, 1.2001953125, 1.49127197265625, 1.7823486328125, 2.07342529296875, 2.364501953125, 2.65557861328125, 2.9466552734375, 3.23773193359375, 3.52880859375, 3.81988525390625, 4.1109619140625, 4.40203857421875, 4.693115234375, 4.98419189453125, 5.2752685546875, 5.56634521484375, 5.857421875, 6.14849853515625, 6.4395751953125, 6.73065185546875, 7.021728515625, 7.31280517578125, 7.6038818359375, 7.89495849609375, 8.18603515625, 8.47711181640625, 8.7681884765625, 9.05926513671875, 9.350341796875, 9.64141845703125, 9.9324951171875, 10.22357177734375, 10.5146484375, 10.80572509765625, 11.0968017578125, 11.38787841796875, 11.678955078125, 11.97003173828125, 12.2611083984375, 12.55218505859375, 12.84326171875, 13.13433837890625, 13.4254150390625, 13.71649169921875, 14.007568359375, 14.29864501953125, 14.5897216796875, 14.88079833984375, 15.171875]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 4.0, 12.0, 6.0, 8.0, 15.0, 33.0, 33.0, 48.0, 59.0, 70.0, 87.0, 156.0, 211.0, 330.0, 663.0, 2139.0, 16609.0, 427171.0, 572939.0, 23281.0, 2779.0, 764.0, 356.0, 224.0, 162.0, 94.0, 64.0, 66.0, 50.0, 30.0, 27.0, 17.0, 11.0, 9.0, 9.0, 3.0, 4.0, 4.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-4.72265625, -4.583984375, -4.4453125, -4.306640625, -4.16796875, -4.029296875, -3.890625, -3.751953125, -3.61328125, -3.474609375, -3.3359375, -3.197265625, -3.05859375, -2.919921875, -2.78125, -2.642578125, -2.50390625, -2.365234375, -2.2265625, -2.087890625, -1.94921875, -1.810546875, -1.671875, -1.533203125, -1.39453125, -1.255859375, -1.1171875, -0.978515625, -0.83984375, -0.701171875, -0.5625, -0.423828125, -0.28515625, -0.146484375, -0.0078125, 0.130859375, 0.26953125, 0.408203125, 0.546875, 0.685546875, 0.82421875, 0.962890625, 1.1015625, 1.240234375, 1.37890625, 1.517578125, 1.65625, 1.794921875, 1.93359375, 2.072265625, 2.2109375, 2.349609375, 2.48828125, 2.626953125, 2.765625, 2.904296875, 3.04296875, 3.181640625, 3.3203125, 3.458984375, 3.59765625, 3.736328125, 3.875, 4.013671875, 4.15234375]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 3.0, 7.0, 10.0, 15.0, 20.0, 13.0, 12.0, 16.0, 24.0, 22.0, 34.0, 49.0, 35.0, 40.0, 41.0, 33.0, 47.0, 45.0, 49.0, 44.0, 55.0, 38.0, 41.0, 46.0, 31.0, 33.0, 25.0, 23.0, 24.0, 26.0, 18.0, 12.0, 13.0, 9.0, 5.0, 14.0, 11.0, 4.0, 6.0, 3.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.529296875, -3.409027099609375, -3.28875732421875, -3.168487548828125, -3.0482177734375, -2.927947998046875, -2.80767822265625, -2.687408447265625, -2.567138671875, -2.446868896484375, -2.32659912109375, -2.206329345703125, -2.0860595703125, -1.965789794921875, -1.84552001953125, -1.725250244140625, -1.60498046875, -1.484710693359375, -1.36444091796875, -1.244171142578125, -1.1239013671875, -1.003631591796875, -0.88336181640625, -0.763092041015625, -0.642822265625, -0.522552490234375, -0.40228271484375, -0.282012939453125, -0.1617431640625, -0.041473388671875, 0.07879638671875, 0.199066162109375, 0.3193359375, 0.439605712890625, 0.55987548828125, 0.680145263671875, 0.8004150390625, 0.920684814453125, 1.04095458984375, 1.161224365234375, 1.281494140625, 1.401763916015625, 1.52203369140625, 1.642303466796875, 1.7625732421875, 1.882843017578125, 2.00311279296875, 2.123382568359375, 2.24365234375, 2.363922119140625, 2.48419189453125, 2.604461669921875, 2.7247314453125, 2.845001220703125, 2.96527099609375, 3.085540771484375, 3.205810546875, 3.326080322265625, 3.44635009765625, 3.566619873046875, 3.6868896484375, 3.807159423828125, 3.92742919921875, 4.047698974609375, 4.16796875]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 7.0, 6.0, 14.0, 24.0, 47.0, 104.0, 279.0, 958.0, 4745.0, 89766.0, 924640.0, 24377.0, 2557.0, 626.0, 220.0, 88.0, 47.0, 19.0, 12.0, 4.0, 1.0, 7.0, 1.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.185546875, -2.095733642578125, -2.00592041015625, -1.916107177734375, -1.8262939453125, -1.736480712890625, -1.64666748046875, -1.556854248046875, -1.467041015625, -1.377227783203125, -1.28741455078125, -1.197601318359375, -1.1077880859375, -1.017974853515625, -0.92816162109375, -0.838348388671875, -0.74853515625, -0.658721923828125, -0.56890869140625, -0.479095458984375, -0.3892822265625, -0.299468994140625, -0.20965576171875, -0.119842529296875, -0.030029296875, 0.059783935546875, 0.14959716796875, 0.239410400390625, 0.3292236328125, 0.419036865234375, 0.50885009765625, 0.598663330078125, 0.6884765625, 0.778289794921875, 0.86810302734375, 0.957916259765625, 1.0477294921875, 1.137542724609375, 1.22735595703125, 1.317169189453125, 1.406982421875, 1.496795654296875, 1.58660888671875, 1.676422119140625, 1.7662353515625, 1.856048583984375, 1.94586181640625, 2.035675048828125, 2.12548828125, 2.215301513671875, 2.30511474609375, 2.394927978515625, 2.4847412109375, 2.574554443359375, 2.66436767578125, 2.754180908203125, 2.843994140625, 2.933807373046875, 3.02362060546875, 3.113433837890625, 3.2032470703125, 3.293060302734375, 3.38287353515625, 3.472686767578125, 3.5625]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 4.0, 7.0, 8.0, 22.0, 41.0, 38.0, 94.0, 160.0, 188.0, 171.0, 106.0, 71.0, 36.0, 24.0, 11.0, 13.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00037097930908203125, -0.0003620833158493042, -0.00035318732261657715, -0.0003442913293838501, -0.00033539533615112305, -0.000326499342918396, -0.00031760334968566895, -0.0003087073564529419, -0.00029981136322021484, -0.0002909153699874878, -0.00028201937675476074, -0.0002731233835220337, -0.00026422739028930664, -0.0002553313970565796, -0.00024643540382385254, -0.0002375394105911255, -0.00022864341735839844, -0.0002197474241256714, -0.00021085143089294434, -0.00020195543766021729, -0.00019305944442749023, -0.00018416345119476318, -0.00017526745796203613, -0.00016637146472930908, -0.00015747547149658203, -0.00014857947826385498, -0.00013968348503112793, -0.00013078749179840088, -0.00012189149856567383, -0.00011299550533294678, -0.00010409951210021973, -9.520351886749268e-05, -8.630752563476562e-05, -7.741153240203857e-05, -6.851553916931152e-05, -5.961954593658447e-05, -5.072355270385742e-05, -4.182755947113037e-05, -3.293156623840332e-05, -2.403557300567627e-05, -1.5139579772949219e-05, -6.243586540222168e-06, 2.652406692504883e-06, 1.1548399925231934e-05, 2.0444393157958984e-05, 2.9340386390686035e-05, 3.8236379623413086e-05, 4.713237285614014e-05, 5.602836608886719e-05, 6.492435932159424e-05, 7.382035255432129e-05, 8.271634578704834e-05, 9.161233901977539e-05, 0.00010050833225250244, 0.00010940432548522949, 0.00011830031871795654, 0.0001271963119506836, 0.00013609230518341064, 0.0001449882984161377, 0.00015388429164886475, 0.0001627802848815918, 0.00017167627811431885, 0.0001805722713470459, 0.00018946826457977295, 0.0001983642578125]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 9.0, 9.0, 21.0, 20.0, 63.0, 113.0, 322.0, 1547.0, 29447.0, 990938.0, 23975.0, 1533.0, 311.0, 113.0, 49.0, 32.0, 18.0, 6.0, 7.0, 4.0, 5.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.28515625, -5.16632080078125, -5.0474853515625, -4.92864990234375, -4.809814453125, -4.69097900390625, -4.5721435546875, -4.45330810546875, -4.33447265625, -4.21563720703125, -4.0968017578125, -3.97796630859375, -3.859130859375, -3.74029541015625, -3.6214599609375, -3.50262451171875, -3.3837890625, -3.26495361328125, -3.1461181640625, -3.02728271484375, -2.908447265625, -2.78961181640625, -2.6707763671875, -2.55194091796875, -2.43310546875, -2.31427001953125, -2.1954345703125, -2.07659912109375, -1.957763671875, -1.83892822265625, -1.7200927734375, -1.60125732421875, -1.482421875, -1.36358642578125, -1.2447509765625, -1.12591552734375, -1.007080078125, -0.88824462890625, -0.7694091796875, -0.65057373046875, -0.53173828125, -0.41290283203125, -0.2940673828125, -0.17523193359375, -0.056396484375, 0.06243896484375, 0.1812744140625, 0.30010986328125, 0.4189453125, 0.53778076171875, 0.6566162109375, 0.77545166015625, 0.894287109375, 1.01312255859375, 1.1319580078125, 1.25079345703125, 1.36962890625, 1.48846435546875, 1.6072998046875, 1.72613525390625, 1.844970703125, 1.96380615234375, 2.0826416015625, 2.20147705078125, 2.3203125]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 5.0, 6.0, 8.0, 7.0, 28.0, 41.0, 71.0, 115.0, 148.0, 221.0, 115.0, 113.0, 49.0, 34.0, 20.0, 7.0, 7.0, 7.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.642578125, -0.6137237548828125, -0.584869384765625, -0.5560150146484375, -0.52716064453125, -0.4983062744140625, -0.469451904296875, -0.4405975341796875, -0.4117431640625, -0.3828887939453125, -0.354034423828125, -0.3251800537109375, -0.29632568359375, -0.2674713134765625, -0.238616943359375, -0.2097625732421875, -0.180908203125, -0.1520538330078125, -0.123199462890625, -0.0943450927734375, -0.06549072265625, -0.0366363525390625, -0.007781982421875, 0.0210723876953125, 0.0499267578125, 0.0787811279296875, 0.107635498046875, 0.1364898681640625, 0.16534423828125, 0.1941986083984375, 0.223052978515625, 0.2519073486328125, 0.28076171875, 0.3096160888671875, 0.338470458984375, 0.3673248291015625, 0.39617919921875, 0.4250335693359375, 0.453887939453125, 0.4827423095703125, 0.5115966796875, 0.5404510498046875, 0.569305419921875, 0.5981597900390625, 0.62701416015625, 0.6558685302734375, 0.684722900390625, 0.7135772705078125, 0.742431640625, 0.7712860107421875, 0.800140380859375, 0.8289947509765625, 0.85784912109375, 0.8867034912109375, 0.915557861328125, 0.9444122314453125, 0.9732666015625, 1.0021209716796875, 1.030975341796875, 1.0598297119140625, 1.08868408203125, 1.1175384521484375, 1.146392822265625, 1.1752471923828125, 1.2041015625]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 15.0, 15.0, 42.0, 78.0, 122.0, 179.0, 205.0, 161.0, 91.0, 35.0, 29.0, 13.0, 6.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8226189613342285, -4.524514198303223, -4.226409912109375, -3.928305149078369, -3.6302008628845215, -3.3320960998535156, -3.033991575241089, -2.735887050628662, -2.4377825260162354, -2.1396780014038086, -1.8415734767913818, -1.5434688329696655, -1.2453643083572388, -0.947259783744812, -0.6491551399230957, -0.35105061531066895, -0.05294609069824219, 0.24515846371650696, 0.5432630181312561, 0.8413676023483276, 1.1394721269607544, 1.4375766515731812, 1.7356812953948975, 2.033785820007324, 2.331890344619751, 2.6299948692321777, 2.9280993938446045, 3.2262039184570312, 3.524308681488037, 3.8224129676818848, 4.120517730712891, 4.418622016906738, 4.716726303100586, 5.014831066131592, 5.3129353523254395, 5.611040115356445, 5.909144401550293, 6.207249164581299, 6.505353927612305, 6.803458213806152, 7.1015625, 7.399667263031006, 7.6977715492248535, 7.995876312255859, 8.293980598449707, 8.592084884643555, 8.890190124511719, 9.188294410705566, 9.486398696899414, 9.784502983093262, 10.082608222961426, 10.380712509155273, 10.678816795349121, 10.976921081542969, 11.275026321411133, 11.57313060760498, 11.871235847473145, 12.169340133666992, 12.467445373535156, 12.765549659729004, 13.063653945922852, 13.3617582321167, 13.659863471984863, 13.957967758178711, 14.256072044372559]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 3.0, 5.0, 8.0, 14.0, 13.0, 13.0, 15.0, 19.0, 26.0, 27.0, 29.0, 38.0, 36.0, 45.0, 35.0, 52.0, 45.0, 43.0, 60.0, 54.0, 51.0, 46.0, 42.0, 49.0, 39.0, 36.0, 30.0, 31.0, 28.0, 21.0, 10.0, 12.0, 7.0, 9.0, 5.0, 3.0, 5.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.0236945152282715, -5.784102439880371, -5.5445098876953125, -5.304917335510254, -5.0653252601623535, -4.825733184814453, -4.5861406326293945, -4.346548080444336, -4.1069560050964355, -3.867363691329956, -3.6277713775634766, -3.388179063796997, -3.1485867500305176, -2.908994436264038, -2.6694021224975586, -2.429809808731079, -2.1902174949645996, -1.9506251811981201, -1.7110328674316406, -1.4714405536651611, -1.2318482398986816, -0.9922559261322021, -0.7526636123657227, -0.5130712985992432, -0.27347898483276367, -0.03388667106628418, 0.2057056427001953, 0.4452979564666748, 0.6848902702331543, 0.9244825839996338, 1.1640748977661133, 1.4036672115325928, 1.643259048461914, 1.8828513622283936, 2.122443675994873, 2.3620359897613525, 2.601628303527832, 2.8412206172943115, 3.080812931060791, 3.3204052448272705, 3.55999755859375, 3.7995898723602295, 4.039182186126709, 4.278774261474609, 4.518366813659668, 4.757959365844727, 4.997551441192627, 5.237143516540527, 5.476736068725586, 5.7163286209106445, 5.955920696258545, 6.195512771606445, 6.435105323791504, 6.6746978759765625, 6.914289951324463, 7.153882026672363, 7.393474578857422, 7.6330671310424805, 7.872659206390381, 8.112251281738281, 8.35184383392334, 8.591436386108398, 8.83102798461914, 9.0706205368042, 9.310213088989258]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 11.0, 13.0, 12.0, 19.0, 29.0, 24.0, 53.0, 95.0, 171.0, 384.0, 1391.0, 12923.0, 1377667.0, 2772416.0, 25602.0, 2164.0, 670.0, 302.0, 126.0, 63.0, 44.0, 39.0, 16.0, 17.0, 7.0, 4.0, 6.0, 3.0, 5.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.7890625, -8.53125, -8.2734375, -8.015625, -7.7578125, -7.5, -7.2421875, -6.984375, -6.7265625, -6.46875, -6.2109375, -5.953125, -5.6953125, -5.4375, -5.1796875, -4.921875, -4.6640625, -4.40625, -4.1484375, -3.890625, -3.6328125, -3.375, -3.1171875, -2.859375, -2.6015625, -2.34375, -2.0859375, -1.828125, -1.5703125, -1.3125, -1.0546875, -0.796875, -0.5390625, -0.28125, -0.0234375, 0.234375, 0.4921875, 0.75, 1.0078125, 1.265625, 1.5234375, 1.78125, 2.0390625, 2.296875, 2.5546875, 2.8125, 3.0703125, 3.328125, 3.5859375, 3.84375, 4.1015625, 4.359375, 4.6171875, 4.875, 5.1328125, 5.390625, 5.6484375, 5.90625, 6.1640625, 6.421875, 6.6796875, 6.9375, 7.1953125, 7.453125, 7.7109375]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 7.0, 3.0, 4.0, 9.0, 9.0, 14.0, 9.0, 27.0, 24.0, 26.0, 37.0, 33.0, 39.0, 47.0, 49.0, 50.0, 65.0, 46.0, 77.0, 68.0, 59.0, 59.0, 43.0, 43.0, 41.0, 27.0, 21.0, 16.0, 20.0, 10.0, 12.0, 7.0, 5.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.779296875, -2.696685791015625, -2.61407470703125, -2.531463623046875, -2.4488525390625, -2.366241455078125, -2.28363037109375, -2.201019287109375, -2.118408203125, -2.035797119140625, -1.95318603515625, -1.870574951171875, -1.7879638671875, -1.705352783203125, -1.62274169921875, -1.540130615234375, -1.45751953125, -1.374908447265625, -1.29229736328125, -1.209686279296875, -1.1270751953125, -1.044464111328125, -0.96185302734375, -0.879241943359375, -0.796630859375, -0.714019775390625, -0.63140869140625, -0.548797607421875, -0.4661865234375, -0.383575439453125, -0.30096435546875, -0.218353271484375, -0.1357421875, -0.053131103515625, 0.02947998046875, 0.112091064453125, 0.1947021484375, 0.277313232421875, 0.35992431640625, 0.442535400390625, 0.525146484375, 0.607757568359375, 0.69036865234375, 0.772979736328125, 0.8555908203125, 0.938201904296875, 1.02081298828125, 1.103424072265625, 1.18603515625, 1.268646240234375, 1.35125732421875, 1.433868408203125, 1.5164794921875, 1.599090576171875, 1.68170166015625, 1.764312744140625, 1.846923828125, 1.929534912109375, 2.01214599609375, 2.094757080078125, 2.1773681640625, 2.259979248046875, 2.34259033203125, 2.425201416015625, 2.5078125]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 3.0, 2.0, 6.0, 4.0, 3.0, 9.0, 11.0, 14.0, 14.0, 18.0, 26.0, 49.0, 60.0, 74.0, 132.0, 135.0, 328.0, 565.0, 1081.0, 2499.0, 7162.0, 32419.0, 354073.0, 3282733.0, 461776.0, 38070.0, 7740.0, 2697.0, 1131.0, 574.0, 307.0, 204.0, 119.0, 83.0, 47.0, 38.0, 16.0, 13.0, 8.0, 7.0, 10.0, 11.0, 6.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.69921875, -3.592132568359375, -3.48504638671875, -3.377960205078125, -3.2708740234375, -3.163787841796875, -3.05670166015625, -2.949615478515625, -2.842529296875, -2.735443115234375, -2.62835693359375, -2.521270751953125, -2.4141845703125, -2.307098388671875, -2.20001220703125, -2.092926025390625, -1.98583984375, -1.878753662109375, -1.77166748046875, -1.664581298828125, -1.5574951171875, -1.450408935546875, -1.34332275390625, -1.236236572265625, -1.129150390625, -1.022064208984375, -0.91497802734375, -0.807891845703125, -0.7008056640625, -0.593719482421875, -0.48663330078125, -0.379547119140625, -0.2724609375, -0.165374755859375, -0.05828857421875, 0.048797607421875, 0.1558837890625, 0.262969970703125, 0.37005615234375, 0.477142333984375, 0.584228515625, 0.691314697265625, 0.79840087890625, 0.905487060546875, 1.0125732421875, 1.119659423828125, 1.22674560546875, 1.333831787109375, 1.44091796875, 1.548004150390625, 1.65509033203125, 1.762176513671875, 1.8692626953125, 1.976348876953125, 2.08343505859375, 2.190521240234375, 2.297607421875, 2.404693603515625, 2.51177978515625, 2.618865966796875, 2.7259521484375, 2.833038330078125, 2.94012451171875, 3.047210693359375, 3.154296875]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 1.0, 5.0, 7.0, 9.0, 7.0, 15.0, 22.0, 36.0, 50.0, 74.0, 102.0, 134.0, 180.0, 278.0, 360.0, 449.0, 491.0, 509.0, 380.0, 268.0, 192.0, 147.0, 106.0, 78.0, 45.0, 35.0, 21.0, 21.0, 13.0, 11.0, 8.0, 4.0, 4.0, 2.0, 5.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.81005859375, -0.7826156616210938, -0.7551727294921875, -0.7277297973632812, -0.700286865234375, -0.6728439331054688, -0.6454010009765625, -0.6179580688476562, -0.59051513671875, -0.5630722045898438, -0.5356292724609375, -0.5081863403320312, -0.480743408203125, -0.45330047607421875, -0.4258575439453125, -0.39841461181640625, -0.3709716796875, -0.34352874755859375, -0.3160858154296875, -0.28864288330078125, -0.261199951171875, -0.23375701904296875, -0.2063140869140625, -0.17887115478515625, -0.15142822265625, -0.12398529052734375, -0.0965423583984375, -0.06909942626953125, -0.041656494140625, -0.01421356201171875, 0.0132293701171875, 0.04067230224609375, 0.068115234375, 0.09555816650390625, 0.1230010986328125, 0.15044403076171875, 0.177886962890625, 0.20532989501953125, 0.2327728271484375, 0.26021575927734375, 0.28765869140625, 0.31510162353515625, 0.3425445556640625, 0.36998748779296875, 0.397430419921875, 0.42487335205078125, 0.4523162841796875, 0.47975921630859375, 0.5072021484375, 0.5346450805664062, 0.5620880126953125, 0.5895309448242188, 0.616973876953125, 0.6444168090820312, 0.6718597412109375, 0.6993026733398438, 0.72674560546875, 0.7541885375976562, 0.7816314697265625, 0.8090744018554688, 0.836517333984375, 0.8639602661132812, 0.8914031982421875, 0.9188461303710938, 0.9462890625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 8.0, 7.0, 21.0, 28.0, 44.0, 66.0, 111.0, 118.0, 129.0, 139.0, 92.0, 81.0, 61.0, 42.0, 20.0, 12.0, 10.0, 3.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.902558326721191, -5.737022876739502, -5.571487903594971, -5.405952453613281, -5.24041748046875, -5.0748820304870605, -4.909347057342529, -4.74381160736084, -4.578276634216309, -4.412741184234619, -4.247206211090088, -4.081670761108398, -3.916135787963867, -3.7506003379821777, -3.5850651264190674, -3.419529914855957, -3.2539944648742676, -3.0884592533111572, -2.922924041748047, -2.7573888301849365, -2.591853618621826, -2.4263181686401367, -2.2607829570770264, -2.095247745513916, -1.9297125339508057, -1.7641773223876953, -1.598642110824585, -1.433106780052185, -1.2675715684890747, -1.1020363569259644, -0.9365010857582092, -0.7709658145904541, -0.605431079864502, -0.4398958384990692, -0.2743605971336365, -0.10882535576820374, 0.056709885597229004, 0.22224509716033936, 0.3877803683280945, 0.5533156394958496, 0.71885085105896, 0.8843860626220703, 1.0499212741851807, 1.2154566049575806, 1.380991816520691, 1.5465270280838013, 1.7120623588562012, 1.8775975704193115, 2.043132781982422, 2.2086679935455322, 2.3742032051086426, 2.539738416671753, 2.7052736282348633, 2.8708090782165527, 3.036344289779663, 3.2018795013427734, 3.367414712905884, 3.532949924468994, 3.6984851360321045, 3.864020347595215, 4.029555797576904, 4.1950907707214355, 4.360626220703125, 4.526161193847656, 4.691696643829346]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 8.0, 7.0, 11.0, 10.0, 18.0, 9.0, 18.0, 19.0, 17.0, 20.0, 28.0, 30.0, 43.0, 25.0, 52.0, 41.0, 38.0, 43.0, 51.0, 47.0, 47.0, 54.0, 49.0, 44.0, 42.0, 36.0, 22.0, 37.0, 28.0, 27.0, 18.0, 12.0, 17.0, 13.0, 5.0, 8.0, 1.0, 6.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.434231758117676, -2.35748553276062, -2.2807395458221436, -2.203993320465088, -2.1272473335266113, -2.0505011081695557, -1.973755121231079, -1.8970088958740234, -1.8202629089355469, -1.7435168027877808, -1.6667706966400146, -1.5900245904922485, -1.5132784843444824, -1.4365323781967163, -1.3597862720489502, -1.2830400466918945, -1.2062939405441284, -1.1295478343963623, -1.0528017282485962, -0.9760556221008301, -0.899309515953064, -0.8225634098052979, -0.745817244052887, -0.6690711379051208, -0.5923250317573547, -0.5155789256095886, -0.4388328194618225, -0.362086683511734, -0.2853405773639679, -0.20859447121620178, -0.13184833526611328, -0.05510222911834717, 0.021643877029418945, 0.09838999062776566, 0.17513610422611237, 0.2518822252750397, 0.3286283314228058, 0.4053744375705719, 0.4821205735206604, 0.5588666796684265, 0.6356127858161926, 0.7123588919639587, 0.7891049981117249, 0.8658511638641357, 0.9425972700119019, 1.019343376159668, 1.096089482307434, 1.1728355884552002, 1.2495816946029663, 1.3263278007507324, 1.4030739068984985, 1.4798200130462646, 1.5565661191940308, 1.6333122253417969, 1.7100584506988525, 1.786804437637329, 1.8635506629943848, 1.9402967691421509, 2.017042875289917, 2.0937891006469727, 2.170535087585449, 2.247281312942505, 2.3240272998809814, 2.400773525238037, 2.4775195121765137]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 1.0, 2.0, 2.0, 7.0, 10.0, 11.0, 16.0, 11.0, 28.0, 34.0, 59.0, 52.0, 104.0, 166.0, 271.0, 585.0, 1269.0, 3030.0, 8375.0, 24699.0, 73319.0, 196340.0, 334731.0, 248851.0, 102312.0, 35070.0, 11734.0, 4162.0, 1650.0, 705.0, 370.0, 184.0, 102.0, 80.0, 54.0, 41.0, 26.0, 23.0, 19.0, 15.0, 7.0, 8.0, 9.0, 3.0, 1.0, 1.0, 4.0, 0.0, 1.0, 3.0, 1.0, 1.0], "bins": [-0.448974609375, -0.4360198974609375, -0.423065185546875, -0.4101104736328125, -0.39715576171875, -0.3842010498046875, -0.371246337890625, -0.3582916259765625, -0.3453369140625, -0.3323822021484375, -0.319427490234375, -0.3064727783203125, -0.29351806640625, -0.2805633544921875, -0.267608642578125, -0.2546539306640625, -0.24169921875, -0.2287445068359375, -0.215789794921875, -0.2028350830078125, -0.18988037109375, -0.1769256591796875, -0.163970947265625, -0.1510162353515625, -0.1380615234375, -0.1251068115234375, -0.112152099609375, -0.0991973876953125, -0.08624267578125, -0.0732879638671875, -0.060333251953125, -0.0473785400390625, -0.034423828125, -0.0214691162109375, -0.008514404296875, 0.0044403076171875, 0.01739501953125, 0.0303497314453125, 0.043304443359375, 0.0562591552734375, 0.0692138671875, 0.0821685791015625, 0.095123291015625, 0.1080780029296875, 0.12103271484375, 0.1339874267578125, 0.146942138671875, 0.1598968505859375, 0.1728515625, 0.1858062744140625, 0.198760986328125, 0.2117156982421875, 0.22467041015625, 0.2376251220703125, 0.250579833984375, 0.2635345458984375, 0.2764892578125, 0.2894439697265625, 0.302398681640625, 0.3153533935546875, 0.32830810546875, 0.3412628173828125, 0.354217529296875, 0.3671722412109375, 0.380126953125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 8.0, 11.0, 23.0, 34.0, 36.0, 49.0, 58.0, 77.0, 72.0, 90.0, 74.0, 112.0, 89.0, 69.0, 54.0, 43.0, 45.0, 25.0, 13.0, 8.0, 3.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.50390625, -3.412506103515625, -3.32110595703125, -3.229705810546875, -3.1383056640625, -3.046905517578125, -2.95550537109375, -2.864105224609375, -2.772705078125, -2.681304931640625, -2.58990478515625, -2.498504638671875, -2.4071044921875, -2.315704345703125, -2.22430419921875, -2.132904052734375, -2.04150390625, -1.950103759765625, -1.85870361328125, -1.767303466796875, -1.6759033203125, -1.584503173828125, -1.49310302734375, -1.401702880859375, -1.310302734375, -1.218902587890625, -1.12750244140625, -1.036102294921875, -0.9447021484375, -0.853302001953125, -0.76190185546875, -0.670501708984375, -0.5791015625, -0.487701416015625, -0.39630126953125, -0.304901123046875, -0.2135009765625, -0.122100830078125, -0.03070068359375, 0.060699462890625, 0.152099609375, 0.243499755859375, 0.33489990234375, 0.426300048828125, 0.5177001953125, 0.609100341796875, 0.70050048828125, 0.791900634765625, 0.88330078125, 0.974700927734375, 1.06610107421875, 1.157501220703125, 1.2489013671875, 1.340301513671875, 1.43170166015625, 1.523101806640625, 1.614501953125, 1.705902099609375, 1.79730224609375, 1.888702392578125, 1.9801025390625, 2.071502685546875, 2.16290283203125, 2.254302978515625, 2.345703125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 3.0, 1.0, 5.0, 9.0, 11.0, 17.0, 19.0, 38.0, 57.0, 91.0, 186.0, 262.0, 462.0, 747.0, 1292.0, 2233.0, 3896.0, 6940.0, 11720.0, 20580.0, 35000.0, 58773.0, 95152.0, 140208.0, 174152.0, 167440.0, 125782.0, 82469.0, 50239.0, 29896.0, 17283.0, 9902.0, 5730.0, 3284.0, 1895.0, 1106.0, 606.0, 413.0, 227.0, 154.0, 101.0, 69.0, 36.0, 24.0, 13.0, 16.0, 9.0, 6.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1925048828125, -0.1864604949951172, -0.18041610717773438, -0.17437171936035156, -0.16832733154296875, -0.16228294372558594, -0.15623855590820312, -0.1501941680908203, -0.1441497802734375, -0.1381053924560547, -0.13206100463867188, -0.12601661682128906, -0.11997222900390625, -0.11392784118652344, -0.10788345336914062, -0.10183906555175781, -0.095794677734375, -0.08975028991699219, -0.08370590209960938, -0.07766151428222656, -0.07161712646484375, -0.06557273864746094, -0.059528350830078125, -0.05348396301269531, -0.0474395751953125, -0.04139518737792969, -0.035350799560546875, -0.029306411743164062, -0.02326202392578125, -0.017217636108398438, -0.011173248291015625, -0.0051288604736328125, 0.00091552734375, 0.0069599151611328125, 0.013004302978515625, 0.019048690795898438, 0.02509307861328125, 0.031137466430664062, 0.037181854248046875, 0.04322624206542969, 0.0492706298828125, 0.05531501770019531, 0.061359405517578125, 0.06740379333496094, 0.07344818115234375, 0.07949256896972656, 0.08553695678710938, 0.09158134460449219, 0.097625732421875, 0.10367012023925781, 0.10971450805664062, 0.11575889587402344, 0.12180328369140625, 0.12784767150878906, 0.13389205932617188, 0.1399364471435547, 0.1459808349609375, 0.1520252227783203, 0.15806961059570312, 0.16411399841308594, 0.17015838623046875, 0.17620277404785156, 0.18224716186523438, 0.1882915496826172, 0.1943359375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 4.0, 3.0, 9.0, 7.0, 15.0, 20.0, 20.0, 19.0, 40.0, 33.0, 33.0, 60.0, 46.0, 57.0, 51.0, 57.0, 59.0, 57.0, 52.0, 47.0, 40.0, 50.0, 37.0, 34.0, 28.0, 27.0, 22.0, 12.0, 19.0, 6.0, 17.0, 5.0, 5.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5703125, -3.4571533203125, -3.343994140625, -3.2308349609375, -3.11767578125, -3.0045166015625, -2.891357421875, -2.7781982421875, -2.6650390625, -2.5518798828125, -2.438720703125, -2.3255615234375, -2.21240234375, -2.0992431640625, -1.986083984375, -1.8729248046875, -1.759765625, -1.6466064453125, -1.533447265625, -1.4202880859375, -1.30712890625, -1.1939697265625, -1.080810546875, -0.9676513671875, -0.8544921875, -0.7413330078125, -0.628173828125, -0.5150146484375, -0.40185546875, -0.2886962890625, -0.175537109375, -0.0623779296875, 0.05078125, 0.1639404296875, 0.277099609375, 0.3902587890625, 0.50341796875, 0.6165771484375, 0.729736328125, 0.8428955078125, 0.9560546875, 1.0692138671875, 1.182373046875, 1.2955322265625, 1.40869140625, 1.5218505859375, 1.635009765625, 1.7481689453125, 1.861328125, 1.9744873046875, 2.087646484375, 2.2008056640625, 2.31396484375, 2.4271240234375, 2.540283203125, 2.6534423828125, 2.7666015625, 2.8797607421875, 2.992919921875, 3.1060791015625, 3.21923828125, 3.3323974609375, 3.445556640625, 3.5587158203125, 3.671875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 10.0, 18.0, 28.0, 58.0, 98.0, 207.0, 361.0, 736.0, 1608.0, 4144.0, 14087.0, 76188.0, 543410.0, 345977.0, 46160.0, 9756.0, 3201.0, 1291.0, 605.0, 298.0, 144.0, 76.0, 36.0, 34.0, 13.0, 6.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12139892578125, -0.11810588836669922, -0.11481285095214844, -0.11151981353759766, -0.10822677612304688, -0.1049337387084961, -0.10164070129394531, -0.09834766387939453, -0.09505462646484375, -0.09176158905029297, -0.08846855163574219, -0.0851755142211914, -0.08188247680664062, -0.07858943939208984, -0.07529640197753906, -0.07200336456298828, -0.0687103271484375, -0.06541728973388672, -0.06212425231933594, -0.058831214904785156, -0.055538177490234375, -0.052245140075683594, -0.04895210266113281, -0.04565906524658203, -0.04236602783203125, -0.03907299041748047, -0.03577995300292969, -0.032486915588378906, -0.029193878173828125, -0.025900840759277344, -0.022607803344726562, -0.01931476593017578, -0.016021728515625, -0.012728691101074219, -0.009435653686523438, -0.006142616271972656, -0.002849578857421875, 0.00044345855712890625, 0.0037364959716796875, 0.007029533386230469, 0.01032257080078125, 0.013615608215332031, 0.016908645629882812, 0.020201683044433594, 0.023494720458984375, 0.026787757873535156, 0.030080795288085938, 0.03337383270263672, 0.0366668701171875, 0.03995990753173828, 0.04325294494628906, 0.046545982360839844, 0.049839019775390625, 0.053132057189941406, 0.05642509460449219, 0.05971813201904297, 0.06301116943359375, 0.06630420684814453, 0.06959724426269531, 0.0728902816772461, 0.07618331909179688, 0.07947635650634766, 0.08276939392089844, 0.08606243133544922, 0.08935546875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 9.0, 9.0, 14.0, 17.0, 35.0, 42.0, 49.0, 94.0, 153.0, 160.0, 110.0, 116.0, 72.0, 43.0, 30.0, 17.0, 8.0, 11.0, 5.0, 8.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.276369094848633e-05, -6.077531725168228e-05, -5.8786943554878235e-05, -5.679856985807419e-05, -5.481019616127014e-05, -5.2821822464466095e-05, -5.083344876766205e-05, -4.8845075070858e-05, -4.6856701374053955e-05, -4.486832767724991e-05, -4.287995398044586e-05, -4.0891580283641815e-05, -3.890320658683777e-05, -3.691483289003372e-05, -3.4926459193229675e-05, -3.293808549642563e-05, -3.094971179962158e-05, -2.8961338102817535e-05, -2.697296440601349e-05, -2.4984590709209442e-05, -2.2996217012405396e-05, -2.100784331560135e-05, -1.9019469618797302e-05, -1.7031095921993256e-05, -1.5042722225189209e-05, -1.3054348528385162e-05, -1.1065974831581116e-05, -9.077601134777069e-06, -7.0892274379730225e-06, -5.100853741168976e-06, -3.112480044364929e-06, -1.1241063475608826e-06, 8.642673492431641e-07, 2.8526410460472107e-06, 4.841014742851257e-06, 6.829388439655304e-06, 8.81776213645935e-06, 1.0806135833263397e-05, 1.2794509530067444e-05, 1.478288322687149e-05, 1.6771256923675537e-05, 1.8759630620479584e-05, 2.074800431728363e-05, 2.2736378014087677e-05, 2.4724751710891724e-05, 2.671312540769577e-05, 2.8701499104499817e-05, 3.0689872801303864e-05, 3.267824649810791e-05, 3.466662019491196e-05, 3.6654993891716003e-05, 3.864336758852005e-05, 4.06317412853241e-05, 4.262011498212814e-05, 4.460848867893219e-05, 4.6596862375736237e-05, 4.858523607254028e-05, 5.057360976934433e-05, 5.2561983466148376e-05, 5.455035716295242e-05, 5.653873085975647e-05, 5.8527104556560516e-05, 6.051547825336456e-05, 6.250385195016861e-05, 6.449222564697266e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 1.0, 6.0, 3.0, 6.0, 3.0, 8.0, 7.0, 15.0, 18.0, 19.0, 40.0, 38.0, 77.0, 108.0, 184.0, 311.0, 696.0, 1481.0, 3676.0, 11263.0, 39403.0, 172276.0, 532571.0, 216455.0, 49051.0, 13056.0, 4397.0, 1683.0, 765.0, 378.0, 200.0, 117.0, 73.0, 43.0, 37.0, 25.0, 18.0, 11.0, 7.0, 10.0, 5.0, 8.0, 2.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.088623046875, -0.0859832763671875, -0.083343505859375, -0.0807037353515625, -0.07806396484375, -0.0754241943359375, -0.072784423828125, -0.0701446533203125, -0.0675048828125, -0.0648651123046875, -0.062225341796875, -0.0595855712890625, -0.05694580078125, -0.0543060302734375, -0.051666259765625, -0.0490264892578125, -0.04638671875, -0.0437469482421875, -0.041107177734375, -0.0384674072265625, -0.03582763671875, -0.0331878662109375, -0.030548095703125, -0.0279083251953125, -0.0252685546875, -0.0226287841796875, -0.019989013671875, -0.0173492431640625, -0.01470947265625, -0.0120697021484375, -0.009429931640625, -0.0067901611328125, -0.004150390625, -0.0015106201171875, 0.001129150390625, 0.0037689208984375, 0.00640869140625, 0.0090484619140625, 0.011688232421875, 0.0143280029296875, 0.0169677734375, 0.0196075439453125, 0.022247314453125, 0.0248870849609375, 0.02752685546875, 0.0301666259765625, 0.032806396484375, 0.0354461669921875, 0.0380859375, 0.0407257080078125, 0.043365478515625, 0.0460052490234375, 0.04864501953125, 0.0512847900390625, 0.053924560546875, 0.0565643310546875, 0.0592041015625, 0.0618438720703125, 0.064483642578125, 0.0671234130859375, 0.06976318359375, 0.0724029541015625, 0.075042724609375, 0.0776824951171875, 0.080322265625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 4.0, 4.0, 8.0, 6.0, 3.0, 14.0, 14.0, 19.0, 27.0, 32.0, 41.0, 49.0, 50.0, 63.0, 100.0, 98.0, 89.0, 80.0, 65.0, 62.0, 42.0, 30.0, 28.0, 17.0, 17.0, 13.0, 5.0, 6.0, 4.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0203399658203125, -0.019622802734375, -0.0189056396484375, -0.0181884765625, -0.0174713134765625, -0.016754150390625, -0.0160369873046875, -0.01531982421875, -0.0146026611328125, -0.013885498046875, -0.0131683349609375, -0.012451171875, -0.0117340087890625, -0.011016845703125, -0.0102996826171875, -0.00958251953125, -0.0088653564453125, -0.008148193359375, -0.0074310302734375, -0.0067138671875, -0.0059967041015625, -0.005279541015625, -0.0045623779296875, -0.00384521484375, -0.0031280517578125, -0.002410888671875, -0.0016937255859375, -0.0009765625, -0.0002593994140625, 0.000457763671875, 0.0011749267578125, 0.00189208984375, 0.0026092529296875, 0.003326416015625, 0.0040435791015625, 0.0047607421875, 0.0054779052734375, 0.006195068359375, 0.0069122314453125, 0.00762939453125, 0.0083465576171875, 0.009063720703125, 0.0097808837890625, 0.010498046875, 0.0112152099609375, 0.011932373046875, 0.0126495361328125, 0.01336669921875, 0.0140838623046875, 0.014801025390625, 0.0155181884765625, 0.0162353515625, 0.0169525146484375, 0.017669677734375, 0.0183868408203125, 0.01910400390625, 0.0198211669921875, 0.020538330078125, 0.0212554931640625, 0.02197265625, 0.0226898193359375, 0.023406982421875, 0.0241241455078125, 0.02484130859375, 0.0255584716796875]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 13.0, 52.0, 213.0, 396.0, 251.0, 62.0, 18.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.11353874206543, -14.814570426940918, -14.51560115814209, -14.216632843017578, -13.91766357421875, -13.618695259094238, -13.319726943969727, -13.020757675170898, -12.721789360046387, -12.422821044921875, -12.123851776123047, -11.824883460998535, -11.525915145874023, -11.226945877075195, -10.927977561950684, -10.629009246826172, -10.330039978027344, -10.031071662902832, -9.732102394104004, -9.433134078979492, -9.134164810180664, -8.835196495056152, -8.53622817993164, -8.237258911132812, -7.938290596008301, -7.639321804046631, -7.340353012084961, -7.041384696960449, -6.742415904998779, -6.443447113037109, -6.144478797912598, -5.845510005950928, -5.546541213989258, -5.247572422027588, -4.948603630065918, -4.649635314941406, -4.350666522979736, -4.051697731018066, -3.7527291774749756, -3.4537606239318848, -3.154791831970215, -2.855823040008545, -2.556854486465454, -2.2578859329223633, -1.9589171409606934, -1.659948468208313, -1.3609797954559326, -1.0620112419128418, -0.7630424499511719, -0.4640737771987915, -0.16510510444641113, 0.13386356830596924, 0.4328322410583496, 0.73180091381073, 1.0307695865631104, 1.3297381401062012, 1.628706932067871, 1.9276756048202515, 2.226644277572632, 2.5256128311157227, 2.8245816230773926, 3.1235504150390625, 3.4225189685821533, 3.721487522125244, 4.020456314086914]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 4.0, 6.0, 11.0, 8.0, 16.0, 23.0, 12.0, 26.0, 38.0, 30.0, 42.0, 56.0, 62.0, 55.0, 63.0, 72.0, 66.0, 70.0, 60.0, 54.0, 51.0, 40.0, 33.0, 36.0, 20.0, 17.0, 14.0, 8.0, 8.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.947766900062561, -1.8817667961120605, -1.8157665729522705, -1.74976646900177, -1.6837663650512695, -1.617766261100769, -1.5517661571502686, -1.4857659339904785, -1.419765830039978, -1.3537657260894775, -1.2877655029296875, -1.221765398979187, -1.1557652950286865, -1.089765191078186, -1.0237650871276855, -0.9577648639678955, -0.891764760017395, -0.8257646560668945, -0.7597644925117493, -0.693764328956604, -0.6277642250061035, -0.561764121055603, -0.49576395750045776, -0.4297638237476349, -0.363763689994812, -0.29776355624198914, -0.23176342248916626, -0.16576328873634338, -0.09976315498352051, -0.03376302123069763, 0.032237112522125244, 0.09823724627494812, 0.16423749923706055, 0.23023763298988342, 0.2962377667427063, 0.3622379004955292, 0.42823803424835205, 0.4942381680011749, 0.5602383017539978, 0.6262384653091431, 0.6922385692596436, 0.758238673210144, 0.8242388367652893, 0.8902390003204346, 0.9562391042709351, 1.0222392082214355, 1.0882394313812256, 1.154239535331726, 1.2202396392822266, 1.286239743232727, 1.3522398471832275, 1.4182400703430176, 1.484240174293518, 1.5502402782440186, 1.6162405014038086, 1.682240605354309, 1.7482407093048096, 1.81424081325531, 1.8802409172058105, 1.9462411403656006, 2.0122413635253906, 2.0782413482666016, 2.1442415714263916, 2.2102415561676025, 2.2762417793273926]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 9.0, 4.0, 12.0, 10.0, 14.0, 20.0, 26.0, 45.0, 53.0, 111.0, 228.0, 553.0, 1468.0, 4478.0, 14568.0, 56854.0, 284416.0, 528824.0, 117884.0, 27340.0, 7569.0, 2400.0, 845.0, 381.0, 173.0, 100.0, 36.0, 32.0, 29.0, 14.0, 14.0, 8.0, 11.0, 4.0, 6.0, 4.0, 5.0, 3.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.009765625, -1.94329833984375, -1.8768310546875, -1.81036376953125, -1.743896484375, -1.67742919921875, -1.6109619140625, -1.54449462890625, -1.47802734375, -1.41156005859375, -1.3450927734375, -1.27862548828125, -1.212158203125, -1.14569091796875, -1.0792236328125, -1.01275634765625, -0.9462890625, -0.87982177734375, -0.8133544921875, -0.74688720703125, -0.680419921875, -0.61395263671875, -0.5474853515625, -0.48101806640625, -0.41455078125, -0.34808349609375, -0.2816162109375, -0.21514892578125, -0.148681640625, -0.08221435546875, -0.0157470703125, 0.05072021484375, 0.1171875, 0.18365478515625, 0.2501220703125, 0.31658935546875, 0.383056640625, 0.44952392578125, 0.5159912109375, 0.58245849609375, 0.64892578125, 0.71539306640625, 0.7818603515625, 0.84832763671875, 0.914794921875, 0.98126220703125, 1.0477294921875, 1.11419677734375, 1.1806640625, 1.24713134765625, 1.3135986328125, 1.38006591796875, 1.446533203125, 1.51300048828125, 1.5794677734375, 1.64593505859375, 1.71240234375, 1.77886962890625, 1.8453369140625, 1.91180419921875, 1.978271484375, 2.04473876953125, 2.1112060546875, 2.17767333984375, 2.244140625]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 1.0, 4.0, 5.0, 13.0, 14.0, 17.0, 12.0, 20.0, 24.0, 30.0, 33.0, 41.0, 54.0, 46.0, 47.0, 63.0, 64.0, 56.0, 69.0, 55.0, 52.0, 45.0, 29.0, 52.0, 30.0, 36.0, 23.0, 17.0, 22.0, 10.0, 7.0, 8.0, 4.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.33984375, -4.220245361328125, -4.10064697265625, -3.981048583984375, -3.8614501953125, -3.741851806640625, -3.62225341796875, -3.502655029296875, -3.383056640625, -3.263458251953125, -3.14385986328125, -3.024261474609375, -2.9046630859375, -2.785064697265625, -2.66546630859375, -2.545867919921875, -2.42626953125, -2.306671142578125, -2.18707275390625, -2.067474365234375, -1.9478759765625, -1.828277587890625, -1.70867919921875, -1.589080810546875, -1.469482421875, -1.349884033203125, -1.23028564453125, -1.110687255859375, -0.9910888671875, -0.871490478515625, -0.75189208984375, -0.632293701171875, -0.5126953125, -0.393096923828125, -0.27349853515625, -0.153900146484375, -0.0343017578125, 0.085296630859375, 0.20489501953125, 0.324493408203125, 0.444091796875, 0.563690185546875, 0.68328857421875, 0.802886962890625, 0.9224853515625, 1.042083740234375, 1.16168212890625, 1.281280517578125, 1.40087890625, 1.520477294921875, 1.64007568359375, 1.759674072265625, 1.8792724609375, 1.998870849609375, 2.11846923828125, 2.238067626953125, 2.357666015625, 2.477264404296875, 2.59686279296875, 2.716461181640625, 2.8360595703125, 2.955657958984375, 3.07525634765625, 3.194854736328125, 3.314453125]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 6.0, 8.0, 14.0, 15.0, 13.0, 16.0, 34.0, 46.0, 63.0, 90.0, 138.0, 210.0, 293.0, 609.0, 2241.0, 21958.0, 515015.0, 483094.0, 20812.0, 2229.0, 634.0, 336.0, 205.0, 140.0, 114.0, 53.0, 53.0, 29.0, 17.0, 25.0, 10.0, 11.0, 4.0, 2.0, 3.0, 8.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.203125, -4.0794677734375, -3.955810546875, -3.8321533203125, -3.70849609375, -3.5848388671875, -3.461181640625, -3.3375244140625, -3.2138671875, -3.0902099609375, -2.966552734375, -2.8428955078125, -2.71923828125, -2.5955810546875, -2.471923828125, -2.3482666015625, -2.224609375, -2.1009521484375, -1.977294921875, -1.8536376953125, -1.72998046875, -1.6063232421875, -1.482666015625, -1.3590087890625, -1.2353515625, -1.1116943359375, -0.988037109375, -0.8643798828125, -0.74072265625, -0.6170654296875, -0.493408203125, -0.3697509765625, -0.24609375, -0.1224365234375, 0.001220703125, 0.1248779296875, 0.24853515625, 0.3721923828125, 0.495849609375, 0.6195068359375, 0.7431640625, 0.8668212890625, 0.990478515625, 1.1141357421875, 1.23779296875, 1.3614501953125, 1.485107421875, 1.6087646484375, 1.732421875, 1.8560791015625, 1.979736328125, 2.1033935546875, 2.22705078125, 2.3507080078125, 2.474365234375, 2.5980224609375, 2.7216796875, 2.8453369140625, 2.968994140625, 3.0926513671875, 3.21630859375, 3.3399658203125, 3.463623046875, 3.5872802734375, 3.7109375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 2.0, 7.0, 8.0, 5.0, 9.0, 11.0, 15.0, 18.0, 17.0, 21.0, 32.0, 33.0, 34.0, 29.0, 48.0, 27.0, 55.0, 51.0, 55.0, 46.0, 44.0, 44.0, 39.0, 35.0, 41.0, 43.0, 31.0, 39.0, 22.0, 30.0, 13.0, 26.0, 9.0, 11.0, 8.0, 14.0, 3.0, 6.0, 6.0, 5.0, 4.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.10546875, -3.9813232421875, -3.857177734375, -3.7330322265625, -3.60888671875, -3.4847412109375, -3.360595703125, -3.2364501953125, -3.1123046875, -2.9881591796875, -2.864013671875, -2.7398681640625, -2.61572265625, -2.4915771484375, -2.367431640625, -2.2432861328125, -2.119140625, -1.9949951171875, -1.870849609375, -1.7467041015625, -1.62255859375, -1.4984130859375, -1.374267578125, -1.2501220703125, -1.1259765625, -1.0018310546875, -0.877685546875, -0.7535400390625, -0.62939453125, -0.5052490234375, -0.381103515625, -0.2569580078125, -0.1328125, -0.0086669921875, 0.115478515625, 0.2396240234375, 0.36376953125, 0.4879150390625, 0.612060546875, 0.7362060546875, 0.8603515625, 0.9844970703125, 1.108642578125, 1.2327880859375, 1.35693359375, 1.4810791015625, 1.605224609375, 1.7293701171875, 1.853515625, 1.9776611328125, 2.101806640625, 2.2259521484375, 2.35009765625, 2.4742431640625, 2.598388671875, 2.7225341796875, 2.8466796875, 2.9708251953125, 3.094970703125, 3.2191162109375, 3.34326171875, 3.4674072265625, 3.591552734375, 3.7156982421875, 3.83984375]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 1.0, 3.0, 3.0, 2.0, 11.0, 11.0, 5.0, 25.0, 27.0, 36.0, 57.0, 102.0, 210.0, 374.0, 922.0, 2576.0, 12232.0, 394740.0, 615705.0, 16590.0, 2947.0, 1072.0, 456.0, 202.0, 108.0, 58.0, 31.0, 13.0, 11.0, 7.0, 5.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.029296875, -1.9679107666015625, -1.906524658203125, -1.8451385498046875, -1.78375244140625, -1.7223663330078125, -1.660980224609375, -1.5995941162109375, -1.5382080078125, -1.4768218994140625, -1.415435791015625, -1.3540496826171875, -1.29266357421875, -1.2312774658203125, -1.169891357421875, -1.1085052490234375, -1.047119140625, -0.9857330322265625, -0.924346923828125, -0.8629608154296875, -0.80157470703125, -0.7401885986328125, -0.678802490234375, -0.6174163818359375, -0.5560302734375, -0.4946441650390625, -0.433258056640625, -0.3718719482421875, -0.31048583984375, -0.2490997314453125, -0.187713623046875, -0.1263275146484375, -0.06494140625, -0.0035552978515625, 0.057830810546875, 0.1192169189453125, 0.18060302734375, 0.2419891357421875, 0.303375244140625, 0.3647613525390625, 0.4261474609375, 0.4875335693359375, 0.548919677734375, 0.6103057861328125, 0.67169189453125, 0.7330780029296875, 0.794464111328125, 0.8558502197265625, 0.917236328125, 0.9786224365234375, 1.040008544921875, 1.1013946533203125, 1.16278076171875, 1.2241668701171875, 1.285552978515625, 1.3469390869140625, 1.4083251953125, 1.4697113037109375, 1.531097412109375, 1.5924835205078125, 1.65386962890625, 1.7152557373046875, 1.776641845703125, 1.8380279541015625, 1.8994140625]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 10.0, 4.0, 9.0, 10.0, 12.0, 15.0, 36.0, 47.0, 67.0, 79.0, 110.0, 160.0, 125.0, 93.0, 68.0, 43.0, 36.0, 21.0, 15.0, 11.0, 15.0, 3.0, 4.0, 2.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00018906593322753906, -0.0001828894019126892, -0.00017671287059783936, -0.0001705363392829895, -0.00016435980796813965, -0.0001581832766532898, -0.00015200674533843994, -0.0001458302140235901, -0.00013965368270874023, -0.00013347715139389038, -0.00012730062007904053, -0.00012112408876419067, -0.00011494755744934082, -0.00010877102613449097, -0.00010259449481964111, -9.641796350479126e-05, -9.02414321899414e-05, -8.406490087509155e-05, -7.78883695602417e-05, -7.171183824539185e-05, -6.553530693054199e-05, -5.935877561569214e-05, -5.3182244300842285e-05, -4.700571298599243e-05, -4.082918167114258e-05, -3.4652650356292725e-05, -2.847611904144287e-05, -2.2299587726593018e-05, -1.6123056411743164e-05, -9.94652509689331e-06, -3.769993782043457e-06, 2.4065375328063965e-06, 8.58306884765625e-06, 1.4759600162506104e-05, 2.0936131477355957e-05, 2.711266279220581e-05, 3.3289194107055664e-05, 3.946572542190552e-05, 4.564225673675537e-05, 5.1818788051605225e-05, 5.799531936645508e-05, 6.417185068130493e-05, 7.034838199615479e-05, 7.652491331100464e-05, 8.270144462585449e-05, 8.887797594070435e-05, 9.50545072555542e-05, 0.00010123103857040405, 0.0001074075698852539, 0.00011358410120010376, 0.00011976063251495361, 0.00012593716382980347, 0.00013211369514465332, 0.00013829022645950317, 0.00014446675777435303, 0.00015064328908920288, 0.00015681982040405273, 0.0001629963517189026, 0.00016917288303375244, 0.0001753494143486023, 0.00018152594566345215, 0.000187702476978302, 0.00019387900829315186, 0.0002000555396080017, 0.00020623207092285156]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 5.0, 9.0, 16.0, 19.0, 18.0, 44.0, 76.0, 151.0, 314.0, 1005.0, 3377.0, 26536.0, 882205.0, 125752.0, 6447.0, 1561.0, 550.0, 216.0, 102.0, 55.0, 26.0, 14.0, 13.0, 11.0, 8.0, 10.0, 1.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.583984375, -2.509521484375, -2.43505859375, -2.360595703125, -2.2861328125, -2.211669921875, -2.13720703125, -2.062744140625, -1.98828125, -1.913818359375, -1.83935546875, -1.764892578125, -1.6904296875, -1.615966796875, -1.54150390625, -1.467041015625, -1.392578125, -1.318115234375, -1.24365234375, -1.169189453125, -1.0947265625, -1.020263671875, -0.94580078125, -0.871337890625, -0.796875, -0.722412109375, -0.64794921875, -0.573486328125, -0.4990234375, -0.424560546875, -0.35009765625, -0.275634765625, -0.201171875, -0.126708984375, -0.05224609375, 0.022216796875, 0.0966796875, 0.171142578125, 0.24560546875, 0.320068359375, 0.39453125, 0.468994140625, 0.54345703125, 0.617919921875, 0.6923828125, 0.766845703125, 0.84130859375, 0.915771484375, 0.990234375, 1.064697265625, 1.13916015625, 1.213623046875, 1.2880859375, 1.362548828125, 1.43701171875, 1.511474609375, 1.5859375, 1.660400390625, 1.73486328125, 1.809326171875, 1.8837890625, 1.958251953125, 2.03271484375, 2.107177734375, 2.181640625]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 9.0, 4.0, 8.0, 11.0, 12.0, 20.0, 33.0, 28.0, 59.0, 84.0, 110.0, 141.0, 154.0, 97.0, 64.0, 52.0, 34.0, 23.0, 18.0, 13.0, 10.0, 7.0, 6.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.64599609375, -0.62847900390625, -0.6109619140625, -0.59344482421875, -0.575927734375, -0.55841064453125, -0.5408935546875, -0.52337646484375, -0.505859375, -0.48834228515625, -0.4708251953125, -0.45330810546875, -0.435791015625, -0.41827392578125, -0.4007568359375, -0.38323974609375, -0.36572265625, -0.34820556640625, -0.3306884765625, -0.31317138671875, -0.295654296875, -0.27813720703125, -0.2606201171875, -0.24310302734375, -0.2255859375, -0.20806884765625, -0.1905517578125, -0.17303466796875, -0.155517578125, -0.13800048828125, -0.1204833984375, -0.10296630859375, -0.08544921875, -0.06793212890625, -0.0504150390625, -0.03289794921875, -0.015380859375, 0.00213623046875, 0.0196533203125, 0.03717041015625, 0.0546875, 0.07220458984375, 0.0897216796875, 0.10723876953125, 0.124755859375, 0.14227294921875, 0.1597900390625, 0.17730712890625, 0.19482421875, 0.21234130859375, 0.2298583984375, 0.24737548828125, 0.264892578125, 0.28240966796875, 0.2999267578125, 0.31744384765625, 0.3349609375, 0.35247802734375, 0.3699951171875, 0.38751220703125, 0.405029296875, 0.42254638671875, 0.4400634765625, 0.45758056640625, 0.47509765625]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 5.0, 5.0, 8.0, 13.0, 29.0, 62.0, 106.0, 130.0, 157.0, 188.0, 129.0, 69.0, 46.0, 19.0, 16.0, 9.0, 6.0, 4.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.693497657775879, -10.44906234741211, -10.20462703704834, -9.96019172668457, -9.7157564163208, -9.471321105957031, -9.226886749267578, -8.982451438903809, -8.738016128540039, -8.49358081817627, -8.2491455078125, -8.00471019744873, -7.760275363922119, -7.51584005355835, -7.27140474319458, -7.0269694328308105, -6.782534122467041, -6.5380988121032715, -6.293663501739502, -6.049228668212891, -5.804793357849121, -5.560358047485352, -5.315922737121582, -5.0714874267578125, -4.827052116394043, -4.582616806030273, -4.338181495666504, -4.093746185302734, -3.849311351776123, -3.6048760414123535, -3.360440731048584, -3.1160054206848145, -2.8715710639953613, -2.627135753631592, -2.3827006816864014, -2.138265371322632, -1.8938301801681519, -1.6493949890136719, -1.4049596786499023, -1.1605244874954224, -0.9160892963409424, -0.6716541051864624, -0.42721885442733765, -0.1827836036682129, 0.06165158748626709, 0.30608677864074707, 0.5505220890045166, 0.7949572801589966, 1.0393924713134766, 1.2838276624679565, 1.5282628536224365, 1.772698163986206, 2.0171332359313965, 2.261568546295166, 2.5060038566589355, 2.750439167022705, 2.9948742389678955, 3.239309549331665, 3.4837446212768555, 3.728179931640625, 3.9726152420043945, 4.217050552368164, 4.461485862731934, 4.705920696258545, 4.9503560066223145]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 5.0, 10.0, 11.0, 7.0, 12.0, 15.0, 15.0, 24.0, 13.0, 23.0, 42.0, 30.0, 32.0, 27.0, 36.0, 49.0, 52.0, 31.0, 37.0, 38.0, 42.0, 46.0, 48.0, 59.0, 36.0, 33.0, 36.0, 26.0, 35.0, 13.0, 23.0, 15.0, 13.0, 15.0, 17.0, 9.0, 7.0, 8.0, 3.0, 2.0, 5.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.585938930511475, -6.369170188903809, -6.152400970458984, -5.935632228851318, -5.718863010406494, -5.502094268798828, -5.285325050354004, -5.068556308746338, -4.851787567138672, -4.635018825531006, -4.418249607086182, -4.201480865478516, -3.9847116470336914, -3.7679429054260254, -3.5511739253997803, -3.334404945373535, -3.117635726928711, -2.900866746902466, -2.6840977668762207, -2.4673290252685547, -2.2505598068237305, -2.0337910652160645, -1.8170220851898193, -1.6002531051635742, -1.383484125137329, -1.166715145111084, -0.9499462246894836, -0.7331773042678833, -0.5164083242416382, -0.29963934421539307, -0.0828704833984375, 0.13389849662780762, 0.35066795349121094, 0.567436933517456, 0.7842058539390564, 1.0009747743606567, 1.2177437543869019, 1.434512734413147, 1.6512815952301025, 1.8680505752563477, 2.0848195552825928, 2.301588535308838, 2.518357515335083, 2.735126495361328, 2.951895236968994, 3.1686644554138184, 3.3854331970214844, 3.6022021770477295, 3.8189711570739746, 4.035739898681641, 4.252509117126465, 4.469277858734131, 4.686047077178955, 4.902815818786621, 5.119585037231445, 5.336353778839111, 5.553122520446777, 5.769891262054443, 5.986660480499268, 6.203429222106934, 6.420198440551758, 6.636967182159424, 6.85373592376709, 7.070505142211914, 7.287274360656738]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 5.0, 1.0, 4.0, 3.0, 7.0, 3.0, 11.0, 22.0, 26.0, 47.0, 78.0, 175.0, 503.0, 2517.0, 42982.0, 3356278.0, 778979.0, 10563.0, 1303.0, 390.0, 161.0, 90.0, 51.0, 32.0, 18.0, 13.0, 8.0, 5.0, 7.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.234375, -8.99005126953125, -8.7457275390625, -8.50140380859375, -8.257080078125, -8.01275634765625, -7.7684326171875, -7.52410888671875, -7.27978515625, -7.03546142578125, -6.7911376953125, -6.54681396484375, -6.302490234375, -6.05816650390625, -5.8138427734375, -5.56951904296875, -5.3251953125, -5.08087158203125, -4.8365478515625, -4.59222412109375, -4.347900390625, -4.10357666015625, -3.8592529296875, -3.61492919921875, -3.37060546875, -3.12628173828125, -2.8819580078125, -2.63763427734375, -2.393310546875, -2.14898681640625, -1.9046630859375, -1.66033935546875, -1.416015625, -1.17169189453125, -0.9273681640625, -0.68304443359375, -0.438720703125, -0.19439697265625, 0.0499267578125, 0.29425048828125, 0.53857421875, 0.78289794921875, 1.0272216796875, 1.27154541015625, 1.515869140625, 1.76019287109375, 2.0045166015625, 2.24884033203125, 2.4931640625, 2.73748779296875, 2.9818115234375, 3.22613525390625, 3.470458984375, 3.71478271484375, 3.9591064453125, 4.20343017578125, 4.44775390625, 4.69207763671875, 4.9364013671875, 5.18072509765625, 5.425048828125, 5.66937255859375, 5.9136962890625, 6.15802001953125, 6.40234375]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 8.0, 1.0, 4.0, 9.0, 9.0, 17.0, 22.0, 36.0, 33.0, 37.0, 51.0, 47.0, 41.0, 68.0, 55.0, 64.0, 67.0, 69.0, 69.0, 59.0, 45.0, 46.0, 34.0, 36.0, 26.0, 11.0, 15.0, 9.0, 6.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.38671875, -2.30035400390625, -2.2139892578125, -2.12762451171875, -2.041259765625, -1.95489501953125, -1.8685302734375, -1.78216552734375, -1.69580078125, -1.60943603515625, -1.5230712890625, -1.43670654296875, -1.350341796875, -1.26397705078125, -1.1776123046875, -1.09124755859375, -1.0048828125, -0.91851806640625, -0.8321533203125, -0.74578857421875, -0.659423828125, -0.57305908203125, -0.4866943359375, -0.40032958984375, -0.31396484375, -0.22760009765625, -0.1412353515625, -0.05487060546875, 0.031494140625, 0.11785888671875, 0.2042236328125, 0.29058837890625, 0.376953125, 0.46331787109375, 0.5496826171875, 0.63604736328125, 0.722412109375, 0.80877685546875, 0.8951416015625, 0.98150634765625, 1.06787109375, 1.15423583984375, 1.2406005859375, 1.32696533203125, 1.413330078125, 1.49969482421875, 1.5860595703125, 1.67242431640625, 1.7587890625, 1.84515380859375, 1.9315185546875, 2.01788330078125, 2.104248046875, 2.19061279296875, 2.2769775390625, 2.36334228515625, 2.44970703125, 2.53607177734375, 2.6224365234375, 2.70880126953125, 2.795166015625, 2.88153076171875, 2.9678955078125, 3.05426025390625, 3.140625]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 2.0, 4.0, 5.0, 7.0, 8.0, 18.0, 19.0, 36.0, 55.0, 74.0, 148.0, 287.0, 624.0, 1537.0, 5668.0, 46928.0, 2489336.0, 1607546.0, 34492.0, 4861.0, 1412.0, 531.0, 288.0, 143.0, 79.0, 68.0, 34.0, 22.0, 13.0, 17.0, 7.0, 5.0, 6.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6171875, -3.45953369140625, -3.3018798828125, -3.14422607421875, -2.986572265625, -2.82891845703125, -2.6712646484375, -2.51361083984375, -2.35595703125, -2.19830322265625, -2.0406494140625, -1.88299560546875, -1.725341796875, -1.56768798828125, -1.4100341796875, -1.25238037109375, -1.0947265625, -0.93707275390625, -0.7794189453125, -0.62176513671875, -0.464111328125, -0.30645751953125, -0.1488037109375, 0.00885009765625, 0.16650390625, 0.32415771484375, 0.4818115234375, 0.63946533203125, 0.797119140625, 0.95477294921875, 1.1124267578125, 1.27008056640625, 1.427734375, 1.58538818359375, 1.7430419921875, 1.90069580078125, 2.058349609375, 2.21600341796875, 2.3736572265625, 2.53131103515625, 2.68896484375, 2.84661865234375, 3.0042724609375, 3.16192626953125, 3.319580078125, 3.47723388671875, 3.6348876953125, 3.79254150390625, 3.9501953125, 4.10784912109375, 4.2655029296875, 4.42315673828125, 4.580810546875, 4.73846435546875, 4.8961181640625, 5.05377197265625, 5.21142578125, 5.36907958984375, 5.5267333984375, 5.68438720703125, 5.842041015625, 5.99969482421875, 6.1573486328125, 6.31500244140625, 6.47265625]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 10.0, 13.0, 16.0, 12.0, 25.0, 50.0, 49.0, 82.0, 158.0, 178.0, 315.0, 477.0, 656.0, 628.0, 485.0, 304.0, 206.0, 165.0, 63.0, 59.0, 43.0, 28.0, 20.0, 8.0, 9.0, 5.0, 3.0, 5.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.275390625, -1.2418060302734375, -1.208221435546875, -1.1746368408203125, -1.14105224609375, -1.1074676513671875, -1.073883056640625, -1.0402984619140625, -1.0067138671875, -0.9731292724609375, -0.939544677734375, -0.9059600830078125, -0.87237548828125, -0.8387908935546875, -0.805206298828125, -0.7716217041015625, -0.738037109375, -0.7044525146484375, -0.670867919921875, -0.6372833251953125, -0.60369873046875, -0.5701141357421875, -0.536529541015625, -0.5029449462890625, -0.4693603515625, -0.4357757568359375, -0.402191162109375, -0.3686065673828125, -0.33502197265625, -0.3014373779296875, -0.267852783203125, -0.2342681884765625, -0.20068359375, -0.1670989990234375, -0.133514404296875, -0.0999298095703125, -0.06634521484375, -0.0327606201171875, 0.000823974609375, 0.0344085693359375, 0.0679931640625, 0.1015777587890625, 0.135162353515625, 0.1687469482421875, 0.20233154296875, 0.2359161376953125, 0.269500732421875, 0.3030853271484375, 0.336669921875, 0.3702545166015625, 0.403839111328125, 0.4374237060546875, 0.47100830078125, 0.5045928955078125, 0.538177490234375, 0.5717620849609375, 0.6053466796875, 0.6389312744140625, 0.672515869140625, 0.7061004638671875, 0.73968505859375, 0.7732696533203125, 0.806854248046875, 0.8404388427734375, 0.8740234375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 7.0, 12.0, 18.0, 24.0, 43.0, 59.0, 79.0, 115.0, 125.0, 111.0, 113.0, 108.0, 55.0, 39.0, 29.0, 22.0, 14.0, 8.0, 8.0, 2.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.257492542266846, -4.1158342361450195, -3.9741759300231934, -3.832517623901367, -3.690859317779541, -3.549201011657715, -3.4075429439544678, -3.2658846378326416, -3.1242263317108154, -2.9825680255889893, -2.840909719467163, -2.699251413345337, -2.55759334564209, -2.4159350395202637, -2.2742767333984375, -2.1326184272766113, -1.9909601211547852, -1.849301815032959, -1.7076435089111328, -1.5659853219985962, -1.42432701587677, -1.2826687097549438, -1.1410105228424072, -0.999352216720581, -0.8576939105987549, -0.7160356044769287, -0.5743773579597473, -0.43271908164024353, -0.29106080532073975, -0.14940249919891357, -0.007744252681732178, 0.13391399383544922, 0.2755727767944336, 0.4172310531139374, 0.5588893294334412, 0.7005475759506226, 0.8422058820724487, 0.9838641881942749, 1.1255223751068115, 1.2671806812286377, 1.4088389873504639, 1.55049729347229, 1.6921555995941162, 1.8338137865066528, 1.975472092628479, 2.1171302795410156, 2.258788585662842, 2.400446891784668, 2.542105197906494, 2.6837635040283203, 2.8254218101501465, 2.9670801162719727, 3.108738422393799, 3.250396728515625, 3.392054796218872, 3.5337131023406982, 3.6753714084625244, 3.8170297145843506, 3.9586880207061768, 4.100346088409424, 4.24200439453125, 4.383662700653076, 4.525321006774902, 4.6669793128967285, 4.808637619018555]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 4.0, 4.0, 9.0, 8.0, 9.0, 9.0, 11.0, 22.0, 17.0, 18.0, 23.0, 27.0, 31.0, 38.0, 31.0, 35.0, 66.0, 52.0, 51.0, 50.0, 48.0, 54.0, 35.0, 52.0, 47.0, 45.0, 34.0, 39.0, 27.0, 28.0, 21.0, 8.0, 10.0, 11.0, 8.0, 3.0, 8.0, 6.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.4210946559906006, -2.3459179401397705, -2.2707412242889404, -2.1955645084381104, -2.1203877925872803, -2.04521107673645, -1.9700344800949097, -1.8948577642440796, -1.8196810483932495, -1.7445043325424194, -1.6693276166915894, -1.5941509008407593, -1.5189743041992188, -1.4437975883483887, -1.3686208724975586, -1.2934441566467285, -1.2182674407958984, -1.1430907249450684, -1.0679140090942383, -0.992737352848053, -0.9175606369972229, -0.8423839211463928, -0.7672072649002075, -0.6920305490493774, -0.6168538331985474, -0.5416771173477173, -0.4665004312992096, -0.3913237452507019, -0.3161470293998718, -0.24097031354904175, -0.16579362750053406, -0.09061694145202637, -0.015440225601196289, 0.059736475348472595, 0.13491317629814148, 0.21008987724781036, 0.28526657819747925, 0.3604432940483093, 0.435619980096817, 0.5107966661453247, 0.5859733819961548, 0.6611500978469849, 0.7363268136978149, 0.8115034699440002, 0.8866801857948303, 0.9618569016456604, 1.0370335578918457, 1.1122102737426758, 1.1873869895935059, 1.262563705444336, 1.337740421295166, 1.412917137145996, 1.4880938529968262, 1.5632705688476562, 1.6384471654891968, 1.7136238813400269, 1.788800597190857, 1.863977313041687, 1.939154028892517, 2.0143306255340576, 2.0895073413848877, 2.1646840572357178, 2.239860773086548, 2.315037488937378, 2.390214204788208]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 12.0, 11.0, 17.0, 24.0, 52.0, 80.0, 138.0, 215.0, 449.0, 1135.0, 4213.0, 20002.0, 108517.0, 408125.0, 385244.0, 96786.0, 17576.0, 3897.0, 1098.0, 443.0, 217.0, 116.0, 75.0, 46.0, 32.0, 15.0, 7.0, 6.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.66650390625, -0.6456527709960938, -0.6248016357421875, -0.6039505004882812, -0.583099365234375, -0.5622482299804688, -0.5413970947265625, -0.5205459594726562, -0.49969482421875, -0.47884368896484375, -0.4579925537109375, -0.43714141845703125, -0.416290283203125, -0.39543914794921875, -0.3745880126953125, -0.35373687744140625, -0.3328857421875, -0.31203460693359375, -0.2911834716796875, -0.27033233642578125, -0.249481201171875, -0.22863006591796875, -0.2077789306640625, -0.18692779541015625, -0.16607666015625, -0.14522552490234375, -0.1243743896484375, -0.10352325439453125, -0.082672119140625, -0.06182098388671875, -0.0409698486328125, -0.02011871337890625, 0.000732421875, 0.02158355712890625, 0.0424346923828125, 0.06328582763671875, 0.084136962890625, 0.10498809814453125, 0.1258392333984375, 0.14669036865234375, 0.16754150390625, 0.18839263916015625, 0.2092437744140625, 0.23009490966796875, 0.250946044921875, 0.27179718017578125, 0.2926483154296875, 0.31349945068359375, 0.3343505859375, 0.35520172119140625, 0.3760528564453125, 0.39690399169921875, 0.417755126953125, 0.43860626220703125, 0.4594573974609375, 0.48030853271484375, 0.50115966796875, 0.5220108032226562, 0.5428619384765625, 0.5637130737304688, 0.584564208984375, 0.6054153442382812, 0.6262664794921875, 0.6471176147460938, 0.66796875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 7.0, 13.0, 12.0, 18.0, 16.0, 23.0, 41.0, 49.0, 45.0, 72.0, 84.0, 86.0, 69.0, 86.0, 82.0, 72.0, 68.0, 49.0, 36.0, 26.0, 22.0, 13.0, 7.0, 6.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.12890625, -2.045013427734375, -1.96112060546875, -1.877227783203125, -1.7933349609375, -1.709442138671875, -1.62554931640625, -1.541656494140625, -1.457763671875, -1.373870849609375, -1.28997802734375, -1.206085205078125, -1.1221923828125, -1.038299560546875, -0.95440673828125, -0.870513916015625, -0.78662109375, -0.702728271484375, -0.61883544921875, -0.534942626953125, -0.4510498046875, -0.367156982421875, -0.28326416015625, -0.199371337890625, -0.115478515625, -0.031585693359375, 0.05230712890625, 0.136199951171875, 0.2200927734375, 0.303985595703125, 0.38787841796875, 0.471771240234375, 0.5556640625, 0.639556884765625, 0.72344970703125, 0.807342529296875, 0.8912353515625, 0.975128173828125, 1.05902099609375, 1.142913818359375, 1.226806640625, 1.310699462890625, 1.39459228515625, 1.478485107421875, 1.5623779296875, 1.646270751953125, 1.73016357421875, 1.814056396484375, 1.89794921875, 1.981842041015625, 2.06573486328125, 2.149627685546875, 2.2335205078125, 2.317413330078125, 2.40130615234375, 2.485198974609375, 2.569091796875, 2.652984619140625, 2.73687744140625, 2.820770263671875, 2.9046630859375, 2.988555908203125, 3.07244873046875, 3.156341552734375, 3.240234375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 8.0, 5.0, 14.0, 20.0, 35.0, 69.0, 90.0, 132.0, 246.0, 422.0, 730.0, 1255.0, 2244.0, 4311.0, 7661.0, 13609.0, 24297.0, 42005.0, 69195.0, 106321.0, 145224.0, 166091.0, 154292.0, 117191.0, 79059.0, 48542.0, 28550.0, 16406.0, 8961.0, 5105.0, 2824.0, 1541.0, 814.0, 534.0, 285.0, 172.0, 108.0, 61.0, 41.0, 27.0, 19.0, 10.0, 13.0, 6.0, 7.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.179931640625, -0.17386245727539062, -0.16779327392578125, -0.16172409057617188, -0.1556549072265625, -0.14958572387695312, -0.14351654052734375, -0.13744735717773438, -0.131378173828125, -0.12530899047851562, -0.11923980712890625, -0.11317062377929688, -0.1071014404296875, -0.10103225708007812, -0.09496307373046875, -0.08889389038085938, -0.08282470703125, -0.07675552368164062, -0.07068634033203125, -0.06461715698242188, -0.0585479736328125, -0.052478790283203125, -0.04640960693359375, -0.040340423583984375, -0.034271240234375, -0.028202056884765625, -0.02213287353515625, -0.016063690185546875, -0.0099945068359375, -0.003925323486328125, 0.00214385986328125, 0.008213043212890625, 0.0142822265625, 0.020351409912109375, 0.02642059326171875, 0.032489776611328125, 0.0385589599609375, 0.044628143310546875, 0.05069732666015625, 0.056766510009765625, 0.062835693359375, 0.06890487670898438, 0.07497406005859375, 0.08104324340820312, 0.0871124267578125, 0.09318161010742188, 0.09925079345703125, 0.10531997680664062, 0.11138916015625, 0.11745834350585938, 0.12352752685546875, 0.12959671020507812, 0.1356658935546875, 0.14173507690429688, 0.14780426025390625, 0.15387344360351562, 0.159942626953125, 0.16601181030273438, 0.17208099365234375, 0.17815017700195312, 0.1842193603515625, 0.19028854370117188, 0.19635772705078125, 0.20242691040039062, 0.20849609375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 2.0, 6.0, 6.0, 9.0, 8.0, 14.0, 13.0, 12.0, 16.0, 16.0, 23.0, 20.0, 26.0, 25.0, 29.0, 36.0, 45.0, 31.0, 40.0, 51.0, 43.0, 43.0, 43.0, 35.0, 40.0, 32.0, 49.0, 39.0, 29.0, 28.0, 26.0, 28.0, 17.0, 17.0, 22.0, 20.0, 14.0, 13.0, 7.0, 9.0, 5.0, 4.0, 0.0, 3.0, 2.0, 1.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0], "bins": [-3.09375, -3.002777099609375, -2.91180419921875, -2.820831298828125, -2.7298583984375, -2.638885498046875, -2.54791259765625, -2.456939697265625, -2.365966796875, -2.274993896484375, -2.18402099609375, -2.093048095703125, -2.0020751953125, -1.911102294921875, -1.82012939453125, -1.729156494140625, -1.63818359375, -1.547210693359375, -1.45623779296875, -1.365264892578125, -1.2742919921875, -1.183319091796875, -1.09234619140625, -1.001373291015625, -0.910400390625, -0.819427490234375, -0.72845458984375, -0.637481689453125, -0.5465087890625, -0.455535888671875, -0.36456298828125, -0.273590087890625, -0.1826171875, -0.091644287109375, -0.00067138671875, 0.090301513671875, 0.1812744140625, 0.272247314453125, 0.36322021484375, 0.454193115234375, 0.545166015625, 0.636138916015625, 0.72711181640625, 0.818084716796875, 0.9090576171875, 1.000030517578125, 1.09100341796875, 1.181976318359375, 1.27294921875, 1.363922119140625, 1.45489501953125, 1.545867919921875, 1.6368408203125, 1.727813720703125, 1.81878662109375, 1.909759521484375, 2.000732421875, 2.091705322265625, 2.18267822265625, 2.273651123046875, 2.3646240234375, 2.455596923828125, 2.54656982421875, 2.637542724609375, 2.728515625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 5.0, 8.0, 11.0, 13.0, 24.0, 39.0, 70.0, 128.0, 193.0, 399.0, 1019.0, 3138.0, 15881.0, 192261.0, 747952.0, 75371.0, 8637.0, 2040.0, 691.0, 309.0, 156.0, 90.0, 39.0, 29.0, 16.0, 14.0, 7.0, 6.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.18359375, -0.17839813232421875, -0.1732025146484375, -0.16800689697265625, -0.162811279296875, -0.15761566162109375, -0.1524200439453125, -0.14722442626953125, -0.14202880859375, -0.13683319091796875, -0.1316375732421875, -0.12644195556640625, -0.121246337890625, -0.11605072021484375, -0.1108551025390625, -0.10565948486328125, -0.1004638671875, -0.09526824951171875, -0.0900726318359375, -0.08487701416015625, -0.079681396484375, -0.07448577880859375, -0.0692901611328125, -0.06409454345703125, -0.05889892578125, -0.05370330810546875, -0.0485076904296875, -0.04331207275390625, -0.038116455078125, -0.03292083740234375, -0.0277252197265625, -0.02252960205078125, -0.017333984375, -0.01213836669921875, -0.0069427490234375, -0.00174713134765625, 0.003448486328125, 0.00864410400390625, 0.0138397216796875, 0.01903533935546875, 0.02423095703125, 0.02942657470703125, 0.0346221923828125, 0.03981781005859375, 0.045013427734375, 0.05020904541015625, 0.0554046630859375, 0.06060028076171875, 0.0657958984375, 0.07099151611328125, 0.0761871337890625, 0.08138275146484375, 0.086578369140625, 0.09177398681640625, 0.0969696044921875, 0.10216522216796875, 0.10736083984375, 0.11255645751953125, 0.1177520751953125, 0.12294769287109375, 0.128143310546875, 0.13333892822265625, 0.1385345458984375, 0.14373016357421875, 0.14892578125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 0.0, 1.0, 2.0, 3.0, 1.0, 10.0, 2.0, 5.0, 4.0, 12.0, 21.0, 14.0, 19.0, 36.0, 46.0, 56.0, 57.0, 95.0, 76.0, 76.0, 87.0, 81.0, 64.0, 57.0, 30.0, 36.0, 34.0, 19.0, 15.0, 14.0, 8.0, 6.0, 3.0, 4.0, 6.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.4405460357666016e-05, -4.319101572036743e-05, -4.197657108306885e-05, -4.0762126445770264e-05, -3.954768180847168e-05, -3.8333237171173096e-05, -3.711879253387451e-05, -3.590434789657593e-05, -3.4689903259277344e-05, -3.347545862197876e-05, -3.2261013984680176e-05, -3.104656934738159e-05, -2.9832124710083008e-05, -2.8617680072784424e-05, -2.740323543548584e-05, -2.6188790798187256e-05, -2.4974346160888672e-05, -2.3759901523590088e-05, -2.2545456886291504e-05, -2.133101224899292e-05, -2.0116567611694336e-05, -1.8902122974395752e-05, -1.7687678337097168e-05, -1.6473233699798584e-05, -1.52587890625e-05, -1.4044344425201416e-05, -1.2829899787902832e-05, -1.1615455150604248e-05, -1.0401010513305664e-05, -9.18656587600708e-06, -7.972121238708496e-06, -6.757676601409912e-06, -5.543231964111328e-06, -4.328787326812744e-06, -3.11434268951416e-06, -1.8998980522155762e-06, -6.854534149169922e-07, 5.289912223815918e-07, 1.7434358596801758e-06, 2.9578804969787598e-06, 4.172325134277344e-06, 5.386769771575928e-06, 6.601214408874512e-06, 7.815659046173096e-06, 9.03010368347168e-06, 1.0244548320770264e-05, 1.1458992958068848e-05, 1.2673437595367432e-05, 1.3887882232666016e-05, 1.51023268699646e-05, 1.6316771507263184e-05, 1.7531216144561768e-05, 1.874566078186035e-05, 1.9960105419158936e-05, 2.117455005645752e-05, 2.2388994693756104e-05, 2.3603439331054688e-05, 2.481788396835327e-05, 2.6032328605651855e-05, 2.724677324295044e-05, 2.8461217880249023e-05, 2.9675662517547607e-05, 3.089010715484619e-05, 3.2104551792144775e-05, 3.331899642944336e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 5.0, 3.0, 7.0, 12.0, 19.0, 21.0, 43.0, 56.0, 104.0, 190.0, 368.0, 839.0, 2227.0, 7610.0, 32956.0, 201838.0, 598470.0, 165256.0, 28233.0, 6656.0, 2041.0, 768.0, 371.0, 172.0, 97.0, 62.0, 37.0, 32.0, 15.0, 13.0, 19.0, 3.0, 3.0, 2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10150146484375, -0.09793376922607422, -0.09436607360839844, -0.09079837799072266, -0.08723068237304688, -0.0836629867553711, -0.08009529113769531, -0.07652759552001953, -0.07295989990234375, -0.06939220428466797, -0.06582450866699219, -0.062256813049316406, -0.058689117431640625, -0.055121421813964844, -0.05155372619628906, -0.04798603057861328, -0.0444183349609375, -0.04085063934326172, -0.03728294372558594, -0.033715248107910156, -0.030147552490234375, -0.026579856872558594, -0.023012161254882812, -0.01944446563720703, -0.01587677001953125, -0.012309074401855469, -0.008741378784179688, -0.005173683166503906, -0.001605987548828125, 0.0019617080688476562, 0.0055294036865234375, 0.009097099304199219, 0.012664794921875, 0.01623249053955078, 0.019800186157226562, 0.023367881774902344, 0.026935577392578125, 0.030503273010253906, 0.03407096862792969, 0.03763866424560547, 0.04120635986328125, 0.04477405548095703, 0.04834175109863281, 0.051909446716308594, 0.055477142333984375, 0.059044837951660156, 0.06261253356933594, 0.06618022918701172, 0.0697479248046875, 0.07331562042236328, 0.07688331604003906, 0.08045101165771484, 0.08401870727539062, 0.0875864028930664, 0.09115409851074219, 0.09472179412841797, 0.09828948974609375, 0.10185718536376953, 0.10542488098144531, 0.1089925765991211, 0.11256027221679688, 0.11612796783447266, 0.11969566345214844, 0.12326335906982422, 0.1268310546875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 7.0, 7.0, 15.0, 14.0, 22.0, 20.0, 21.0, 29.0, 36.0, 61.0, 84.0, 109.0, 110.0, 105.0, 79.0, 68.0, 52.0, 30.0, 29.0, 22.0, 14.0, 18.0, 10.0, 6.0, 11.0, 9.0, 6.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.03570556640625, -0.034679412841796875, -0.03365325927734375, -0.032627105712890625, -0.0316009521484375, -0.030574798583984375, -0.02954864501953125, -0.028522491455078125, -0.027496337890625, -0.026470184326171875, -0.02544403076171875, -0.024417877197265625, -0.0233917236328125, -0.022365570068359375, -0.02133941650390625, -0.020313262939453125, -0.019287109375, -0.018260955810546875, -0.01723480224609375, -0.016208648681640625, -0.0151824951171875, -0.014156341552734375, -0.01313018798828125, -0.012104034423828125, -0.011077880859375, -0.010051727294921875, -0.00902557373046875, -0.007999420166015625, -0.0069732666015625, -0.005947113037109375, -0.00492095947265625, -0.003894805908203125, -0.00286865234375, -0.001842498779296875, -0.00081634521484375, 0.000209808349609375, 0.0012359619140625, 0.002262115478515625, 0.00328826904296875, 0.004314422607421875, 0.005340576171875, 0.006366729736328125, 0.00739288330078125, 0.008419036865234375, 0.0094451904296875, 0.010471343994140625, 0.01149749755859375, 0.012523651123046875, 0.0135498046875, 0.014575958251953125, 0.01560211181640625, 0.016628265380859375, 0.0176544189453125, 0.018680572509765625, 0.01970672607421875, 0.020732879638671875, 0.021759033203125, 0.022785186767578125, 0.02381134033203125, 0.024837493896484375, 0.0258636474609375, 0.026889801025390625, 0.02791595458984375, 0.028942108154296875, 0.02996826171875]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 9.0, 10.0, 34.0, 105.0, 245.0, 303.0, 181.0, 75.0, 30.0, 10.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.61667537689209, -9.409029006958008, -9.20138168334961, -8.993735313415527, -8.786088943481445, -8.578441619873047, -8.370795249938965, -8.163148880004883, -7.955501556396484, -7.747854709625244, -7.540208339691162, -7.332561492919922, -7.124914646148682, -6.917267799377441, -6.709621429443359, -6.501974582672119, -6.294328212738037, -6.086681365966797, -5.879034996032715, -5.671388149261475, -5.463741302490234, -5.256094932556152, -5.048448085784912, -4.840801239013672, -4.63315486907959, -4.42550802230835, -4.217861652374268, -4.010214805603027, -3.802567958831787, -3.594921350479126, -3.387274742126465, -3.1796278953552246, -2.971980571746826, -2.764333963394165, -2.556687116622925, -2.3490405082702637, -2.1413936614990234, -1.9337470531463623, -1.7261004447937012, -1.5184537172317505, -1.3108069896697998, -1.1031602621078491, -0.8955135941505432, -0.6878669261932373, -0.4802201986312866, -0.27257347106933594, -0.0649268627166748, 0.14271986484527588, 0.35036659240722656, 0.5580133199691772, 0.7656599879264832, 0.9733066558837891, 1.1809533834457397, 1.3886001110076904, 1.5962467193603516, 1.8038934469223022, 2.011540174484253, 2.219186782836914, 2.4268336296081543, 2.6344802379608154, 2.8421268463134766, 3.049773693084717, 3.257420301437378, 3.465066909790039, 3.6727137565612793]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 3.0, 9.0, 4.0, 10.0, 13.0, 15.0, 18.0, 23.0, 34.0, 30.0, 46.0, 49.0, 47.0, 78.0, 71.0, 69.0, 73.0, 57.0, 58.0, 68.0, 50.0, 46.0, 42.0, 30.0, 11.0, 15.0, 12.0, 5.0, 10.0, 1.0, 9.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.057645797729492, -1.9905017614364624, -1.9233578443527222, -1.8562138080596924, -1.7890697717666626, -1.7219257354736328, -1.6547818183898926, -1.5876377820968628, -1.520493745803833, -1.4533497095108032, -1.386205792427063, -1.3190617561340332, -1.2519177198410034, -1.1847736835479736, -1.1176297664642334, -1.0504857301712036, -0.9833418130874634, -0.9161978363990784, -0.8490538001060486, -0.7819098234176636, -0.7147657871246338, -0.6476218104362488, -0.5804778337478638, -0.513333797454834, -0.446189820766449, -0.3790458142757416, -0.3119018077850342, -0.24475783109664917, -0.17761382460594177, -0.11046981811523438, -0.043325841426849365, 0.023818165063858032, 0.09096217155456543, 0.15810617804527283, 0.22525016963481903, 0.29239416122436523, 0.35953816771507263, 0.42668217420578003, 0.49382615089416504, 0.5609701871871948, 0.6281141638755798, 0.6952581405639648, 0.7624021768569946, 0.8295461535453796, 0.8966901302337646, 0.9638341665267944, 1.0309782028198242, 1.0981221199035645, 1.1652661561965942, 1.232410192489624, 1.2995541095733643, 1.366698145866394, 1.4338421821594238, 1.500986099243164, 1.5681301355361938, 1.6352741718292236, 1.7024180889129639, 1.7695621252059937, 1.8367060422897339, 1.9038500785827637, 1.9709941148757935, 2.0381381511688232, 2.1052820682525635, 2.1724259853363037, 2.239570140838623]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 2.0, 5.0, 8.0, 11.0, 8.0, 17.0, 28.0, 59.0, 103.0, 200.0, 450.0, 1307.0, 4054.0, 14871.0, 66205.0, 395905.0, 462219.0, 78939.0, 17000.0, 4740.0, 1459.0, 498.0, 221.0, 85.0, 52.0, 29.0, 29.0, 15.0, 13.0, 2.0, 4.0, 7.0, 3.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.421875, -2.348602294921875, -2.27532958984375, -2.202056884765625, -2.1287841796875, -2.055511474609375, -1.98223876953125, -1.908966064453125, -1.835693359375, -1.762420654296875, -1.68914794921875, -1.615875244140625, -1.5426025390625, -1.469329833984375, -1.39605712890625, -1.322784423828125, -1.24951171875, -1.176239013671875, -1.10296630859375, -1.029693603515625, -0.9564208984375, -0.883148193359375, -0.80987548828125, -0.736602783203125, -0.663330078125, -0.590057373046875, -0.51678466796875, -0.443511962890625, -0.3702392578125, -0.296966552734375, -0.22369384765625, -0.150421142578125, -0.0771484375, -0.003875732421875, 0.06939697265625, 0.142669677734375, 0.2159423828125, 0.289215087890625, 0.36248779296875, 0.435760498046875, 0.509033203125, 0.582305908203125, 0.65557861328125, 0.728851318359375, 0.8021240234375, 0.875396728515625, 0.94866943359375, 1.021942138671875, 1.09521484375, 1.168487548828125, 1.24176025390625, 1.315032958984375, 1.3883056640625, 1.461578369140625, 1.53485107421875, 1.608123779296875, 1.681396484375, 1.754669189453125, 1.82794189453125, 1.901214599609375, 1.9744873046875, 2.047760009765625, 2.12103271484375, 2.194305419921875, 2.267578125]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 3.0, 6.0, 5.0, 9.0, 12.0, 14.0, 20.0, 19.0, 26.0, 33.0, 42.0, 50.0, 46.0, 47.0, 77.0, 65.0, 68.0, 61.0, 63.0, 57.0, 50.0, 39.0, 48.0, 34.0, 35.0, 25.0, 11.0, 12.0, 8.0, 9.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.58203125, -4.459869384765625, -4.33770751953125, -4.215545654296875, -4.0933837890625, -3.971221923828125, -3.84906005859375, -3.726898193359375, -3.604736328125, -3.482574462890625, -3.36041259765625, -3.238250732421875, -3.1160888671875, -2.993927001953125, -2.87176513671875, -2.749603271484375, -2.62744140625, -2.505279541015625, -2.38311767578125, -2.260955810546875, -2.1387939453125, -2.016632080078125, -1.89447021484375, -1.772308349609375, -1.650146484375, -1.527984619140625, -1.40582275390625, -1.283660888671875, -1.1614990234375, -1.039337158203125, -0.91717529296875, -0.795013427734375, -0.6728515625, -0.550689697265625, -0.42852783203125, -0.306365966796875, -0.1842041015625, -0.062042236328125, 0.06011962890625, 0.182281494140625, 0.304443359375, 0.426605224609375, 0.54876708984375, 0.670928955078125, 0.7930908203125, 0.915252685546875, 1.03741455078125, 1.159576416015625, 1.28173828125, 1.403900146484375, 1.52606201171875, 1.648223876953125, 1.7703857421875, 1.892547607421875, 2.01470947265625, 2.136871337890625, 2.259033203125, 2.381195068359375, 2.50335693359375, 2.625518798828125, 2.7476806640625, 2.869842529296875, 2.99200439453125, 3.114166259765625, 3.236328125]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 2.0, 5.0, 9.0, 4.0, 12.0, 14.0, 13.0, 14.0, 14.0, 23.0, 44.0, 63.0, 93.0, 123.0, 164.0, 326.0, 807.0, 3038.0, 26922.0, 565489.0, 426447.0, 20696.0, 2674.0, 709.0, 299.0, 171.0, 107.0, 87.0, 50.0, 40.0, 23.0, 19.0, 17.0, 14.0, 3.0, 7.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.43359375, -4.3135986328125, -4.193603515625, -4.0736083984375, -3.95361328125, -3.8336181640625, -3.713623046875, -3.5936279296875, -3.4736328125, -3.3536376953125, -3.233642578125, -3.1136474609375, -2.99365234375, -2.8736572265625, -2.753662109375, -2.6336669921875, -2.513671875, -2.3936767578125, -2.273681640625, -2.1536865234375, -2.03369140625, -1.9136962890625, -1.793701171875, -1.6737060546875, -1.5537109375, -1.4337158203125, -1.313720703125, -1.1937255859375, -1.07373046875, -0.9537353515625, -0.833740234375, -0.7137451171875, -0.59375, -0.4737548828125, -0.353759765625, -0.2337646484375, -0.11376953125, 0.0062255859375, 0.126220703125, 0.2462158203125, 0.3662109375, 0.4862060546875, 0.606201171875, 0.7261962890625, 0.84619140625, 0.9661865234375, 1.086181640625, 1.2061767578125, 1.326171875, 1.4461669921875, 1.566162109375, 1.6861572265625, 1.80615234375, 1.9261474609375, 2.046142578125, 2.1661376953125, 2.2861328125, 2.4061279296875, 2.526123046875, 2.6461181640625, 2.76611328125, 2.8861083984375, 3.006103515625, 3.1260986328125, 3.24609375]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 4.0, 8.0, 6.0, 9.0, 20.0, 18.0, 17.0, 18.0, 25.0, 31.0, 31.0, 23.0, 37.0, 37.0, 35.0, 32.0, 51.0, 58.0, 49.0, 54.0, 59.0, 58.0, 40.0, 43.0, 36.0, 30.0, 29.0, 20.0, 27.0, 15.0, 15.0, 18.0, 10.0, 8.0, 13.0, 7.0, 6.0, 1.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0], "bins": [-4.6171875, -4.494049072265625, -4.37091064453125, -4.247772216796875, -4.1246337890625, -4.001495361328125, -3.87835693359375, -3.755218505859375, -3.632080078125, -3.508941650390625, -3.38580322265625, -3.262664794921875, -3.1395263671875, -3.016387939453125, -2.89324951171875, -2.770111083984375, -2.64697265625, -2.523834228515625, -2.40069580078125, -2.277557373046875, -2.1544189453125, -2.031280517578125, -1.90814208984375, -1.785003662109375, -1.661865234375, -1.538726806640625, -1.41558837890625, -1.292449951171875, -1.1693115234375, -1.046173095703125, -0.92303466796875, -0.799896240234375, -0.6767578125, -0.553619384765625, -0.43048095703125, -0.307342529296875, -0.1842041015625, -0.061065673828125, 0.06207275390625, 0.185211181640625, 0.308349609375, 0.431488037109375, 0.55462646484375, 0.677764892578125, 0.8009033203125, 0.924041748046875, 1.04718017578125, 1.170318603515625, 1.29345703125, 1.416595458984375, 1.53973388671875, 1.662872314453125, 1.7860107421875, 1.909149169921875, 2.03228759765625, 2.155426025390625, 2.278564453125, 2.401702880859375, 2.52484130859375, 2.647979736328125, 2.7711181640625, 2.894256591796875, 3.01739501953125, 3.140533447265625, 3.263671875]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 8.0, 3.0, 3.0, 15.0, 14.0, 33.0, 57.0, 146.0, 404.0, 1375.0, 7805.0, 635822.0, 394465.0, 6455.0, 1271.0, 403.0, 138.0, 61.0, 29.0, 15.0, 8.0, 8.0, 4.0, 2.0, 5.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.271484375, -3.17791748046875, -3.0843505859375, -2.99078369140625, -2.897216796875, -2.80364990234375, -2.7100830078125, -2.61651611328125, -2.52294921875, -2.42938232421875, -2.3358154296875, -2.24224853515625, -2.148681640625, -2.05511474609375, -1.9615478515625, -1.86798095703125, -1.7744140625, -1.68084716796875, -1.5872802734375, -1.49371337890625, -1.400146484375, -1.30657958984375, -1.2130126953125, -1.11944580078125, -1.02587890625, -0.93231201171875, -0.8387451171875, -0.74517822265625, -0.651611328125, -0.55804443359375, -0.4644775390625, -0.37091064453125, -0.27734375, -0.18377685546875, -0.0902099609375, 0.00335693359375, 0.096923828125, 0.19049072265625, 0.2840576171875, 0.37762451171875, 0.47119140625, 0.56475830078125, 0.6583251953125, 0.75189208984375, 0.845458984375, 0.93902587890625, 1.0325927734375, 1.12615966796875, 1.2197265625, 1.31329345703125, 1.4068603515625, 1.50042724609375, 1.593994140625, 1.68756103515625, 1.7811279296875, 1.87469482421875, 1.96826171875, 2.06182861328125, 2.1553955078125, 2.24896240234375, 2.342529296875, 2.43609619140625, 2.5296630859375, 2.62322998046875, 2.716796875]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 10.0, 18.0, 20.0, 56.0, 71.0, 167.0, 280.0, 149.0, 93.0, 54.0, 42.0, 16.0, 11.0, 3.0, 2.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003230571746826172, -0.0003124848008155823, -0.00030191242694854736, -0.00029134005308151245, -0.00028076767921447754, -0.0002701953053474426, -0.0002596229314804077, -0.0002490505576133728, -0.0002384781837463379, -0.00022790580987930298, -0.00021733343601226807, -0.00020676106214523315, -0.00019618868827819824, -0.00018561631441116333, -0.00017504394054412842, -0.0001644715666770935, -0.0001538991928100586, -0.00014332681894302368, -0.00013275444507598877, -0.00012218207120895386, -0.00011160969734191895, -0.00010103732347488403, -9.046494960784912e-05, -7.989257574081421e-05, -6.93202018737793e-05, -5.8747828006744385e-05, -4.817545413970947e-05, -3.760308027267456e-05, -2.703070640563965e-05, -1.6458332538604736e-05, -5.885958671569824e-06, 4.686415195465088e-06, 1.52587890625e-05, 2.5831162929534912e-05, 3.6403536796569824e-05, 4.6975910663604736e-05, 5.754828453063965e-05, 6.812065839767456e-05, 7.869303226470947e-05, 8.926540613174438e-05, 9.98377799987793e-05, 0.00011041015386581421, 0.00012098252773284912, 0.00013155490159988403, 0.00014212727546691895, 0.00015269964933395386, 0.00016327202320098877, 0.00017384439706802368, 0.0001844167709350586, 0.0001949891448020935, 0.00020556151866912842, 0.00021613389253616333, 0.00022670626640319824, 0.00023727864027023315, 0.00024785101413726807, 0.000258423388004303, 0.0002689957618713379, 0.0002795681357383728, 0.0002901405096054077, 0.0003007128834724426, 0.00031128525733947754, 0.00032185763120651245, 0.00033243000507354736, 0.0003430023789405823, 0.0003535747528076172]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 4.0, 3.0, 2.0, 7.0, 10.0, 15.0, 23.0, 46.0, 84.0, 166.0, 392.0, 1205.0, 5199.0, 100486.0, 909863.0, 26641.0, 3013.0, 737.0, 291.0, 153.0, 81.0, 40.0, 26.0, 23.0, 15.0, 9.0, 3.0, 5.0, 4.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9443359375, -1.8644256591796875, -1.784515380859375, -1.7046051025390625, -1.62469482421875, -1.5447845458984375, -1.464874267578125, -1.3849639892578125, -1.3050537109375, -1.2251434326171875, -1.145233154296875, -1.0653228759765625, -0.98541259765625, -0.9055023193359375, -0.825592041015625, -0.7456817626953125, -0.665771484375, -0.5858612060546875, -0.505950927734375, -0.4260406494140625, -0.34613037109375, -0.2662200927734375, -0.186309814453125, -0.1063995361328125, -0.0264892578125, 0.0534210205078125, 0.133331298828125, 0.2132415771484375, 0.29315185546875, 0.3730621337890625, 0.452972412109375, 0.5328826904296875, 0.61279296875, 0.6927032470703125, 0.772613525390625, 0.8525238037109375, 0.93243408203125, 1.0123443603515625, 1.092254638671875, 1.1721649169921875, 1.2520751953125, 1.3319854736328125, 1.411895751953125, 1.4918060302734375, 1.57171630859375, 1.6516265869140625, 1.731536865234375, 1.8114471435546875, 1.891357421875, 1.9712677001953125, 2.051177978515625, 2.1310882568359375, 2.21099853515625, 2.2909088134765625, 2.370819091796875, 2.4507293701171875, 2.5306396484375, 2.6105499267578125, 2.690460205078125, 2.7703704833984375, 2.85028076171875, 2.9301910400390625, 3.010101318359375, 3.0900115966796875, 3.169921875]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 3.0, 1.0, 5.0, 6.0, 7.0, 8.0, 14.0, 13.0, 28.0, 28.0, 41.0, 65.0, 102.0, 207.0, 182.0, 86.0, 58.0, 48.0, 33.0, 18.0, 18.0, 12.0, 10.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.76171875, -0.7416152954101562, -0.7215118408203125, -0.7014083862304688, -0.681304931640625, -0.6612014770507812, -0.6410980224609375, -0.6209945678710938, -0.60089111328125, -0.5807876586914062, -0.5606842041015625, -0.5405807495117188, -0.520477294921875, -0.5003738403320312, -0.4802703857421875, -0.46016693115234375, -0.4400634765625, -0.41996002197265625, -0.3998565673828125, -0.37975311279296875, -0.359649658203125, -0.33954620361328125, -0.3194427490234375, -0.29933929443359375, -0.27923583984375, -0.25913238525390625, -0.2390289306640625, -0.21892547607421875, -0.198822021484375, -0.17871856689453125, -0.1586151123046875, -0.13851165771484375, -0.118408203125, -0.09830474853515625, -0.0782012939453125, -0.05809783935546875, -0.037994384765625, -0.01789093017578125, 0.0022125244140625, 0.02231597900390625, 0.04241943359375, 0.06252288818359375, 0.0826263427734375, 0.10272979736328125, 0.122833251953125, 0.14293670654296875, 0.1630401611328125, 0.18314361572265625, 0.2032470703125, 0.22335052490234375, 0.2434539794921875, 0.26355743408203125, 0.283660888671875, 0.30376434326171875, 0.3238677978515625, 0.34397125244140625, 0.36407470703125, 0.38417816162109375, 0.4042816162109375, 0.42438507080078125, 0.444488525390625, 0.46459197998046875, 0.4846954345703125, 0.5047988891601562, 0.52490234375]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 13.0, 11.0, 24.0, 57.0, 128.0, 188.0, 216.0, 176.0, 109.0, 36.0, 23.0, 9.0, 10.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.872335910797119, -4.554630279541016, -4.236924171447754, -3.9192185401916504, -3.6015124320983887, -3.283806800842285, -2.9661009311676025, -2.64839506149292, -2.3306891918182373, -2.0129833221435547, -1.695277452468872, -1.377571702003479, -1.0598658323287964, -0.7421599626541138, -0.4244542121887207, -0.10674834251403809, 0.21095752716064453, 0.5286633968353271, 0.846369206905365, 1.1640750169754028, 1.4817808866500854, 1.799486756324768, 2.117192506790161, 2.4348983764648438, 2.7526042461395264, 3.070310115814209, 3.3880159854888916, 3.705721855163574, 4.023427486419678, 4.3411335945129395, 4.658839225769043, 4.976545333862305, 5.294251441955566, 5.61195707321167, 5.929663181304932, 6.247368812561035, 6.565074920654297, 6.8827805519104, 7.200486183166504, 7.518192291259766, 7.835898399353027, 8.153604507446289, 8.471309661865234, 8.789015769958496, 9.106721878051758, 9.42442798614502, 9.742133140563965, 10.059839248657227, 10.377544403076172, 10.695250511169434, 11.012955665588379, 11.33066177368164, 11.648367881774902, 11.966073989868164, 12.28377914428711, 12.601485252380371, 12.919191360473633, 13.236897468566895, 13.55460262298584, 13.872308731079102, 14.190014839172363, 14.507720947265625, 14.82542610168457, 15.143132209777832, 15.460838317871094]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 4.0, 7.0, 2.0, 7.0, 4.0, 6.0, 8.0, 9.0, 10.0, 14.0, 9.0, 22.0, 14.0, 25.0, 22.0, 23.0, 22.0, 22.0, 17.0, 24.0, 40.0, 28.0, 19.0, 31.0, 44.0, 34.0, 38.0, 42.0, 27.0, 28.0, 42.0, 24.0, 28.0, 42.0, 34.0, 29.0, 32.0, 32.0, 17.0, 23.0, 14.0, 16.0, 18.0, 14.0, 9.0, 9.0, 8.0, 6.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.496866226196289, -4.350981712341309, -4.20509672164917, -4.0592122077941895, -3.91332745552063, -3.7674427032470703, -3.62155818939209, -3.4756734371185303, -3.3297886848449707, -3.183903932571411, -3.0380194187164307, -2.892134666442871, -2.7462499141693115, -2.600365161895752, -2.4544806480407715, -2.308595895767212, -2.1627113819122314, -2.016826629638672, -1.8709419965744019, -1.7250573635101318, -1.5791726112365723, -1.4332879781723022, -1.2874033451080322, -1.1415185928344727, -0.9956339597702026, -0.8497492671012878, -0.703864574432373, -0.557979941368103, -0.41209524869918823, -0.26621055603027344, -0.12032592296600342, 0.025558829307556152, 0.17144346237182617, 0.31732815504074097, 0.4632128179073334, 0.6090974807739258, 0.7549821734428406, 0.9008668661117554, 1.0467514991760254, 1.192636251449585, 1.338520884513855, 1.484405517578125, 1.6302902698516846, 1.7761749029159546, 1.9220595359802246, 2.067944288253784, 2.2138290405273438, 2.359713554382324, 2.505598306655884, 2.6514830589294434, 2.797367572784424, 2.9432523250579834, 3.089137077331543, 3.2350215911865234, 3.380906343460083, 3.5267910957336426, 3.672675609588623, 3.8185603618621826, 3.964444875717163, 4.110329627990723, 4.256214141845703, 4.402099132537842, 4.547983646392822, 4.693868637084961, 4.839753150939941]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 7.0, 3.0, 8.0, 16.0, 19.0, 27.0, 59.0, 111.0, 258.0, 701.0, 2645.0, 54604.0, 3888712.0, 241818.0, 4208.0, 642.0, 220.0, 89.0, 53.0, 21.0, 23.0, 16.0, 10.0, 7.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.6484375, -7.3717041015625, -7.094970703125, -6.8182373046875, -6.54150390625, -6.2647705078125, -5.988037109375, -5.7113037109375, -5.4345703125, -5.1578369140625, -4.881103515625, -4.6043701171875, -4.32763671875, -4.0509033203125, -3.774169921875, -3.4974365234375, -3.220703125, -2.9439697265625, -2.667236328125, -2.3905029296875, -2.11376953125, -1.8370361328125, -1.560302734375, -1.2835693359375, -1.0068359375, -0.7301025390625, -0.453369140625, -0.1766357421875, 0.10009765625, 0.3768310546875, 0.653564453125, 0.9302978515625, 1.20703125, 1.4837646484375, 1.760498046875, 2.0372314453125, 2.31396484375, 2.5906982421875, 2.867431640625, 3.1441650390625, 3.4208984375, 3.6976318359375, 3.974365234375, 4.2510986328125, 4.52783203125, 4.8045654296875, 5.081298828125, 5.3580322265625, 5.634765625, 5.9114990234375, 6.188232421875, 6.4649658203125, 6.74169921875, 7.0184326171875, 7.295166015625, 7.5718994140625, 7.8486328125, 8.1253662109375, 8.402099609375, 8.6788330078125, 8.95556640625, 9.2322998046875, 9.509033203125, 9.7857666015625, 10.0625]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 2.0, 0.0, 4.0, 5.0, 10.0, 11.0, 16.0, 20.0, 16.0, 20.0, 22.0, 31.0, 41.0, 46.0, 43.0, 56.0, 44.0, 48.0, 58.0, 73.0, 51.0, 55.0, 60.0, 36.0, 43.0, 34.0, 28.0, 28.0, 25.0, 17.0, 18.0, 7.0, 7.0, 10.0, 6.0, 3.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.01953125, -1.951568603515625, -1.88360595703125, -1.815643310546875, -1.7476806640625, -1.679718017578125, -1.61175537109375, -1.543792724609375, -1.475830078125, -1.407867431640625, -1.33990478515625, -1.271942138671875, -1.2039794921875, -1.136016845703125, -1.06805419921875, -1.000091552734375, -0.93212890625, -0.864166259765625, -0.79620361328125, -0.728240966796875, -0.6602783203125, -0.592315673828125, -0.52435302734375, -0.456390380859375, -0.388427734375, -0.320465087890625, -0.25250244140625, -0.184539794921875, -0.1165771484375, -0.048614501953125, 0.01934814453125, 0.087310791015625, 0.1552734375, 0.223236083984375, 0.29119873046875, 0.359161376953125, 0.4271240234375, 0.495086669921875, 0.56304931640625, 0.631011962890625, 0.698974609375, 0.766937255859375, 0.83489990234375, 0.902862548828125, 0.9708251953125, 1.038787841796875, 1.10675048828125, 1.174713134765625, 1.24267578125, 1.310638427734375, 1.37860107421875, 1.446563720703125, 1.5145263671875, 1.582489013671875, 1.65045166015625, 1.718414306640625, 1.786376953125, 1.854339599609375, 1.92230224609375, 1.990264892578125, 2.0582275390625, 2.126190185546875, 2.19415283203125, 2.262115478515625, 2.330078125]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 6.0, 1.0, 2.0, 3.0, 5.0, 9.0, 10.0, 11.0, 18.0, 20.0, 30.0, 53.0, 75.0, 145.0, 279.0, 614.0, 1696.0, 6577.0, 60058.0, 3408273.0, 691211.0, 19806.0, 3469.0, 1018.0, 429.0, 195.0, 106.0, 54.0, 39.0, 19.0, 19.0, 15.0, 7.0, 8.0, 1.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4765625, -5.3043212890625, -5.132080078125, -4.9598388671875, -4.78759765625, -4.6153564453125, -4.443115234375, -4.2708740234375, -4.0986328125, -3.9263916015625, -3.754150390625, -3.5819091796875, -3.40966796875, -3.2374267578125, -3.065185546875, -2.8929443359375, -2.720703125, -2.5484619140625, -2.376220703125, -2.2039794921875, -2.03173828125, -1.8594970703125, -1.687255859375, -1.5150146484375, -1.3427734375, -1.1705322265625, -0.998291015625, -0.8260498046875, -0.65380859375, -0.4815673828125, -0.309326171875, -0.1370849609375, 0.03515625, 0.2073974609375, 0.379638671875, 0.5518798828125, 0.72412109375, 0.8963623046875, 1.068603515625, 1.2408447265625, 1.4130859375, 1.5853271484375, 1.757568359375, 1.9298095703125, 2.10205078125, 2.2742919921875, 2.446533203125, 2.6187744140625, 2.791015625, 2.9632568359375, 3.135498046875, 3.3077392578125, 3.47998046875, 3.6522216796875, 3.824462890625, 3.9967041015625, 4.1689453125, 4.3411865234375, 4.513427734375, 4.6856689453125, 4.85791015625, 5.0301513671875, 5.202392578125, 5.3746337890625, 5.546875]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 3.0, 2.0, 4.0, 6.0, 8.0, 24.0, 23.0, 58.0, 70.0, 110.0, 176.0, 257.0, 475.0, 675.0, 710.0, 520.0, 359.0, 217.0, 134.0, 88.0, 48.0, 36.0, 25.0, 12.0, 15.0, 5.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9892578125, -0.9541778564453125, -0.919097900390625, -0.8840179443359375, -0.84893798828125, -0.8138580322265625, -0.778778076171875, -0.7436981201171875, -0.7086181640625, -0.6735382080078125, -0.638458251953125, -0.6033782958984375, -0.56829833984375, -0.5332183837890625, -0.498138427734375, -0.4630584716796875, -0.427978515625, -0.3928985595703125, -0.357818603515625, -0.3227386474609375, -0.28765869140625, -0.2525787353515625, -0.217498779296875, -0.1824188232421875, -0.1473388671875, -0.1122589111328125, -0.077178955078125, -0.0420989990234375, -0.00701904296875, 0.0280609130859375, 0.063140869140625, 0.0982208251953125, 0.13330078125, 0.1683807373046875, 0.203460693359375, 0.2385406494140625, 0.27362060546875, 0.3087005615234375, 0.343780517578125, 0.3788604736328125, 0.4139404296875, 0.4490203857421875, 0.484100341796875, 0.5191802978515625, 0.55426025390625, 0.5893402099609375, 0.624420166015625, 0.6595001220703125, 0.694580078125, 0.7296600341796875, 0.764739990234375, 0.7998199462890625, 0.83489990234375, 0.8699798583984375, 0.905059814453125, 0.9401397705078125, 0.9752197265625, 1.0102996826171875, 1.045379638671875, 1.0804595947265625, 1.11553955078125, 1.1506195068359375, 1.185699462890625, 1.2207794189453125, 1.255859375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 7.0, 12.0, 12.0, 38.0, 63.0, 116.0, 147.0, 152.0, 171.0, 119.0, 95.0, 35.0, 19.0, 13.0, 6.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.59725284576416, -7.3842339515686035, -7.171214580535889, -6.958195686340332, -6.745176792144775, -6.532157897949219, -6.319138526916504, -6.106119632720947, -5.893100738525391, -5.680081844329834, -5.467062473297119, -5.2540435791015625, -5.041024684906006, -4.828005790710449, -4.614986419677734, -4.401967525482178, -4.188948154449463, -3.975929021835327, -3.7629101276397705, -3.5498909950256348, -3.336872100830078, -3.1238529682159424, -2.9108338356018066, -2.69781494140625, -2.4847958087921143, -2.2717766761779785, -2.058757781982422, -1.8457386493682861, -1.63271963596344, -1.4197006225585938, -1.206681489944458, -0.9936624765396118, -0.7806439399719238, -0.5676249265670776, -0.35460585355758667, -0.1415867805480957, 0.07143223285675049, 0.2844512462615967, 0.4974703788757324, 0.7104893922805786, 0.9235084056854248, 1.136527419090271, 1.3495464324951172, 1.562565565109253, 1.7755845785140991, 1.9886035919189453, 2.201622724533081, 2.414641857147217, 2.6276607513427734, 2.840679883956909, 3.053698778152466, 3.2667179107666016, 3.479736804962158, 3.692755937576294, 3.9057750701904297, 4.118793964385986, 4.331812858581543, 4.5448317527771, 4.7578511238098145, 4.970870018005371, 5.183888912200928, 5.396907806396484, 5.609927177429199, 5.822946071624756, 6.035965442657471]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 6.0, 6.0, 7.0, 9.0, 10.0, 12.0, 19.0, 15.0, 17.0, 17.0, 22.0, 26.0, 22.0, 42.0, 36.0, 45.0, 44.0, 48.0, 47.0, 44.0, 33.0, 46.0, 55.0, 59.0, 43.0, 42.0, 26.0, 31.0, 43.0, 22.0, 20.0, 20.0, 17.0, 14.0, 14.0, 11.0, 2.0, 6.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.1844964027404785, -2.1115779876708984, -2.0386595726013184, -1.9657411575317383, -1.8928228616714478, -1.8199044466018677, -1.7469860315322876, -1.674067735671997, -1.601149320602417, -1.528230905532837, -1.4553124904632568, -1.3823940753936768, -1.3094757795333862, -1.2365573644638062, -1.163638949394226, -1.0907206535339355, -1.017802119255066, -0.9448837041854858, -0.8719653487205505, -0.7990469336509705, -0.7261285781860352, -0.6532101631164551, -0.580291748046875, -0.5073733925819397, -0.4344549775123596, -0.36153659224510193, -0.28861820697784424, -0.21569979190826416, -0.14278140664100647, -0.06986302137374878, 0.003055393695831299, 0.0759737491607666, 0.14889216423034668, 0.22181054949760437, 0.29472893476486206, 0.36764734983444214, 0.44056573510169983, 0.5134841203689575, 0.5864025354385376, 0.6593208909034729, 0.732239305973053, 0.8051577210426331, 0.8780760765075684, 0.9509944915771484, 1.0239129066467285, 1.0968313217163086, 1.1697497367858887, 1.2426680326461792, 1.3155864477157593, 1.3885048627853394, 1.4614232778549194, 1.53434157371521, 1.60725998878479, 1.6801784038543701, 1.7530968189239502, 1.8260152339935303, 1.8989336490631104, 1.9718520641326904, 2.0447704792022705, 2.1176888942718506, 2.1906073093414307, 2.2635254859924316, 2.3364439010620117, 2.409362316131592, 2.482280731201172]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 5.0, 2.0, 5.0, 4.0, 4.0, 5.0, 17.0, 8.0, 17.0, 19.0, 29.0, 19.0, 45.0, 52.0, 66.0, 77.0, 149.0, 299.0, 618.0, 1695.0, 6270.0, 32495.0, 188357.0, 523129.0, 240724.0, 42842.0, 7954.0, 2017.0, 705.0, 349.0, 184.0, 97.0, 74.0, 49.0, 42.0, 30.0, 27.0, 18.0, 23.0, 10.0, 5.0, 10.0, 8.0, 1.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.7978515625, -0.7760391235351562, -0.7542266845703125, -0.7324142456054688, -0.710601806640625, -0.6887893676757812, -0.6669769287109375, -0.6451644897460938, -0.62335205078125, -0.6015396118164062, -0.5797271728515625, -0.5579147338867188, -0.536102294921875, -0.5142898559570312, -0.4924774169921875, -0.47066497802734375, -0.4488525390625, -0.42704010009765625, -0.4052276611328125, -0.38341522216796875, -0.361602783203125, -0.33979034423828125, -0.3179779052734375, -0.29616546630859375, -0.27435302734375, -0.25254058837890625, -0.2307281494140625, -0.20891571044921875, -0.187103271484375, -0.16529083251953125, -0.1434783935546875, -0.12166595458984375, -0.099853515625, -0.07804107666015625, -0.0562286376953125, -0.03441619873046875, -0.012603759765625, 0.00920867919921875, 0.0310211181640625, 0.05283355712890625, 0.07464599609375, 0.09645843505859375, 0.1182708740234375, 0.14008331298828125, 0.161895751953125, 0.18370819091796875, 0.2055206298828125, 0.22733306884765625, 0.2491455078125, 0.27095794677734375, 0.2927703857421875, 0.31458282470703125, 0.336395263671875, 0.35820770263671875, 0.3800201416015625, 0.40183258056640625, 0.42364501953125, 0.44545745849609375, 0.4672698974609375, 0.48908233642578125, 0.510894775390625, 0.5327072143554688, 0.5545196533203125, 0.5763320922851562, 0.59814453125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 7.0, 5.0, 11.0, 11.0, 18.0, 20.0, 34.0, 26.0, 39.0, 25.0, 60.0, 69.0, 63.0, 67.0, 65.0, 66.0, 72.0, 63.0, 66.0, 47.0, 49.0, 27.0, 22.0, 27.0, 18.0, 7.0, 9.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5947265625, -1.5268096923828125, -1.458892822265625, -1.3909759521484375, -1.32305908203125, -1.2551422119140625, -1.187225341796875, -1.1193084716796875, -1.0513916015625, -0.9834747314453125, -0.915557861328125, -0.8476409912109375, -0.77972412109375, -0.7118072509765625, -0.643890380859375, -0.5759735107421875, -0.508056640625, -0.4401397705078125, -0.372222900390625, -0.3043060302734375, -0.23638916015625, -0.1684722900390625, -0.100555419921875, -0.0326385498046875, 0.0352783203125, 0.1031951904296875, 0.171112060546875, 0.2390289306640625, 0.30694580078125, 0.3748626708984375, 0.442779541015625, 0.5106964111328125, 0.57861328125, 0.6465301513671875, 0.714447021484375, 0.7823638916015625, 0.85028076171875, 0.9181976318359375, 0.986114501953125, 1.0540313720703125, 1.1219482421875, 1.1898651123046875, 1.257781982421875, 1.3256988525390625, 1.39361572265625, 1.4615325927734375, 1.529449462890625, 1.5973663330078125, 1.665283203125, 1.7332000732421875, 1.801116943359375, 1.8690338134765625, 1.93695068359375, 2.0048675537109375, 2.072784423828125, 2.1407012939453125, 2.2086181640625, 2.2765350341796875, 2.344451904296875, 2.4123687744140625, 2.48028564453125, 2.5482025146484375, 2.616119384765625, 2.6840362548828125, 2.751953125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 3.0, 2.0, 9.0, 11.0, 12.0, 14.0, 26.0, 31.0, 48.0, 91.0, 161.0, 314.0, 565.0, 1134.0, 2336.0, 5127.0, 11168.0, 24393.0, 51781.0, 105090.0, 182666.0, 235330.0, 197296.0, 117918.0, 60015.0, 28227.0, 13111.0, 6053.0, 2758.0, 1358.0, 676.0, 335.0, 189.0, 104.0, 60.0, 48.0, 28.0, 21.0, 18.0, 10.0, 4.0, 3.0, 5.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.247314453125, -0.2394866943359375, -0.231658935546875, -0.2238311767578125, -0.21600341796875, -0.2081756591796875, -0.200347900390625, -0.1925201416015625, -0.1846923828125, -0.1768646240234375, -0.169036865234375, -0.1612091064453125, -0.15338134765625, -0.1455535888671875, -0.137725830078125, -0.1298980712890625, -0.1220703125, -0.1142425537109375, -0.106414794921875, -0.0985870361328125, -0.09075927734375, -0.0829315185546875, -0.075103759765625, -0.0672760009765625, -0.0594482421875, -0.0516204833984375, -0.043792724609375, -0.0359649658203125, -0.02813720703125, -0.0203094482421875, -0.012481689453125, -0.0046539306640625, 0.003173828125, 0.0110015869140625, 0.018829345703125, 0.0266571044921875, 0.03448486328125, 0.0423126220703125, 0.050140380859375, 0.0579681396484375, 0.0657958984375, 0.0736236572265625, 0.081451416015625, 0.0892791748046875, 0.09710693359375, 0.1049346923828125, 0.112762451171875, 0.1205902099609375, 0.12841796875, 0.1362457275390625, 0.144073486328125, 0.1519012451171875, 0.15972900390625, 0.1675567626953125, 0.175384521484375, 0.1832122802734375, 0.1910400390625, 0.1988677978515625, 0.206695556640625, 0.2145233154296875, 0.22235107421875, 0.2301788330078125, 0.238006591796875, 0.2458343505859375, 0.253662109375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 7.0, 9.0, 7.0, 4.0, 8.0, 7.0, 11.0, 17.0, 16.0, 25.0, 23.0, 30.0, 31.0, 37.0, 48.0, 48.0, 55.0, 45.0, 55.0, 49.0, 53.0, 54.0, 34.0, 50.0, 41.0, 39.0, 27.0, 32.0, 19.0, 21.0, 15.0, 16.0, 17.0, 11.0, 9.0, 6.0, 6.0, 7.0, 5.0, 4.0, 8.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.423828125, -2.331695556640625, -2.23956298828125, -2.147430419921875, -2.0552978515625, -1.963165283203125, -1.87103271484375, -1.778900146484375, -1.686767578125, -1.594635009765625, -1.50250244140625, -1.410369873046875, -1.3182373046875, -1.226104736328125, -1.13397216796875, -1.041839599609375, -0.94970703125, -0.857574462890625, -0.76544189453125, -0.673309326171875, -0.5811767578125, -0.489044189453125, -0.39691162109375, -0.304779052734375, -0.212646484375, -0.120513916015625, -0.02838134765625, 0.063751220703125, 0.1558837890625, 0.248016357421875, 0.34014892578125, 0.432281494140625, 0.5244140625, 0.616546630859375, 0.70867919921875, 0.800811767578125, 0.8929443359375, 0.985076904296875, 1.07720947265625, 1.169342041015625, 1.261474609375, 1.353607177734375, 1.44573974609375, 1.537872314453125, 1.6300048828125, 1.722137451171875, 1.81427001953125, 1.906402587890625, 1.99853515625, 2.090667724609375, 2.18280029296875, 2.274932861328125, 2.3670654296875, 2.459197998046875, 2.55133056640625, 2.643463134765625, 2.735595703125, 2.827728271484375, 2.91986083984375, 3.011993408203125, 3.1041259765625, 3.196258544921875, 3.28839111328125, 3.380523681640625, 3.47265625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 3.0, 6.0, 8.0, 9.0, 14.0, 21.0, 29.0, 60.0, 80.0, 138.0, 258.0, 478.0, 1022.0, 2388.0, 6116.0, 20297.0, 99339.0, 472576.0, 355560.0, 66514.0, 15114.0, 4743.0, 1851.0, 893.0, 414.0, 252.0, 143.0, 71.0, 51.0, 31.0, 29.0, 15.0, 10.0, 4.0, 8.0, 4.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.087158203125, -0.08403205871582031, -0.08090591430664062, -0.07777976989746094, -0.07465362548828125, -0.07152748107910156, -0.06840133666992188, -0.06527519226074219, -0.0621490478515625, -0.05902290344238281, -0.055896759033203125, -0.05277061462402344, -0.04964447021484375, -0.04651832580566406, -0.043392181396484375, -0.04026603698730469, -0.037139892578125, -0.03401374816894531, -0.030887603759765625, -0.027761459350585938, -0.02463531494140625, -0.021509170532226562, -0.018383026123046875, -0.015256881713867188, -0.0121307373046875, -0.009004592895507812, -0.005878448486328125, -0.0027523040771484375, 0.00037384033203125, 0.0034999847412109375, 0.006626129150390625, 0.009752273559570312, 0.01287841796875, 0.016004562377929688, 0.019130706787109375, 0.022256851196289062, 0.02538299560546875, 0.028509140014648438, 0.031635284423828125, 0.03476142883300781, 0.0378875732421875, 0.04101371765136719, 0.044139862060546875, 0.04726600646972656, 0.05039215087890625, 0.05351829528808594, 0.056644439697265625, 0.05977058410644531, 0.062896728515625, 0.06602287292480469, 0.06914901733398438, 0.07227516174316406, 0.07540130615234375, 0.07852745056152344, 0.08165359497070312, 0.08477973937988281, 0.0879058837890625, 0.09103202819824219, 0.09415817260742188, 0.09728431701660156, 0.10041046142578125, 0.10353660583496094, 0.10666275024414062, 0.10978889465332031, 0.1129150390625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 4.0, 3.0, 7.0, 22.0, 34.0, 41.0, 61.0, 51.0, 106.0, 106.0, 122.0, 129.0, 89.0, 68.0, 46.0, 44.0, 25.0, 11.0, 8.0, 14.0, 3.0, 6.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.61015510559082e-05, -6.422773003578186e-05, -6.235390901565552e-05, -6.0480087995529175e-05, -5.860626697540283e-05, -5.673244595527649e-05, -5.4858624935150146e-05, -5.2984803915023804e-05, -5.111098289489746e-05, -4.923716187477112e-05, -4.7363340854644775e-05, -4.548951983451843e-05, -4.361569881439209e-05, -4.174187779426575e-05, -3.9868056774139404e-05, -3.799423575401306e-05, -3.612041473388672e-05, -3.4246593713760376e-05, -3.237277269363403e-05, -3.049895167350769e-05, -2.8625130653381348e-05, -2.6751309633255005e-05, -2.4877488613128662e-05, -2.300366759300232e-05, -2.1129846572875977e-05, -1.9256025552749634e-05, -1.738220453262329e-05, -1.5508383512496948e-05, -1.3634562492370605e-05, -1.1760741472244263e-05, -9.88692045211792e-06, -8.013099431991577e-06, -6.139278411865234e-06, -4.265457391738892e-06, -2.391636371612549e-06, -5.178153514862061e-07, 1.3560056686401367e-06, 3.2298266887664795e-06, 5.103647708892822e-06, 6.977468729019165e-06, 8.851289749145508e-06, 1.072511076927185e-05, 1.2598931789398193e-05, 1.4472752809524536e-05, 1.634657382965088e-05, 1.822039484977722e-05, 2.0094215869903564e-05, 2.1968036890029907e-05, 2.384185791015625e-05, 2.5715678930282593e-05, 2.7589499950408936e-05, 2.946332097053528e-05, 3.133714199066162e-05, 3.3210963010787964e-05, 3.508478403091431e-05, 3.695860505104065e-05, 3.883242607116699e-05, 4.0706247091293335e-05, 4.258006811141968e-05, 4.445388913154602e-05, 4.632771015167236e-05, 4.8201531171798706e-05, 5.007535219192505e-05, 5.194917321205139e-05, 5.3822994232177734e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 6.0, 8.0, 7.0, 14.0, 12.0, 14.0, 36.0, 43.0, 70.0, 115.0, 189.0, 348.0, 661.0, 1298.0, 2875.0, 6995.0, 19104.0, 61791.0, 235982.0, 471297.0, 175271.0, 46766.0, 15293.0, 5560.0, 2341.0, 1140.0, 563.0, 311.0, 135.0, 92.0, 66.0, 44.0, 31.0, 23.0, 17.0, 11.0, 7.0, 8.0, 3.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09100341796875, -0.088104248046875, -0.085205078125, -0.082305908203125, -0.07940673828125, -0.076507568359375, -0.0736083984375, -0.070709228515625, -0.06781005859375, -0.064910888671875, -0.06201171875, -0.059112548828125, -0.05621337890625, -0.053314208984375, -0.0504150390625, -0.047515869140625, -0.04461669921875, -0.041717529296875, -0.038818359375, -0.035919189453125, -0.03302001953125, -0.030120849609375, -0.0272216796875, -0.024322509765625, -0.02142333984375, -0.018524169921875, -0.015625, -0.012725830078125, -0.00982666015625, -0.006927490234375, -0.0040283203125, -0.001129150390625, 0.00177001953125, 0.004669189453125, 0.007568359375, 0.010467529296875, 0.01336669921875, 0.016265869140625, 0.0191650390625, 0.022064208984375, 0.02496337890625, 0.027862548828125, 0.03076171875, 0.033660888671875, 0.03656005859375, 0.039459228515625, 0.0423583984375, 0.045257568359375, 0.04815673828125, 0.051055908203125, 0.053955078125, 0.056854248046875, 0.05975341796875, 0.062652587890625, 0.0655517578125, 0.068450927734375, 0.07135009765625, 0.074249267578125, 0.0771484375, 0.080047607421875, 0.08294677734375, 0.085845947265625, 0.0887451171875, 0.091644287109375, 0.09454345703125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 7.0, 5.0, 0.0, 1.0, 11.0, 9.0, 9.0, 16.0, 23.0, 36.0, 40.0, 45.0, 67.0, 94.0, 87.0, 78.0, 94.0, 80.0, 72.0, 53.0, 50.0, 32.0, 21.0, 22.0, 8.0, 13.0, 8.0, 4.0, 2.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.024688720703125, -0.023790359497070312, -0.022891998291015625, -0.021993637084960938, -0.02109527587890625, -0.020196914672851562, -0.019298553466796875, -0.018400192260742188, -0.0175018310546875, -0.016603469848632812, -0.015705108642578125, -0.014806747436523438, -0.01390838623046875, -0.013010025024414062, -0.012111663818359375, -0.011213302612304688, -0.01031494140625, -0.009416580200195312, -0.008518218994140625, -0.0076198577880859375, -0.00672149658203125, -0.0058231353759765625, -0.004924774169921875, -0.0040264129638671875, -0.0031280517578125, -0.0022296905517578125, -0.001331329345703125, -0.0004329681396484375, 0.00046539306640625, 0.0013637542724609375, 0.002262115478515625, 0.0031604766845703125, 0.004058837890625, 0.0049571990966796875, 0.005855560302734375, 0.0067539215087890625, 0.00765228271484375, 0.008550643920898438, 0.009449005126953125, 0.010347366333007812, 0.0112457275390625, 0.012144088745117188, 0.013042449951171875, 0.013940811157226562, 0.01483917236328125, 0.015737533569335938, 0.016635894775390625, 0.017534255981445312, 0.0184326171875, 0.019330978393554688, 0.020229339599609375, 0.021127700805664062, 0.02202606201171875, 0.022924423217773438, 0.023822784423828125, 0.024721145629882812, 0.0256195068359375, 0.026517868041992188, 0.027416229248046875, 0.028314590454101562, 0.02921295166015625, 0.030111312866210938, 0.031009674072265625, 0.03190803527832031, 0.032806396484375]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 4.0, 11.0, 28.0, 50.0, 96.0, 138.0, 168.0, 169.0, 149.0, 96.0, 43.0, 26.0, 12.0, 4.0, 4.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-4.926216125488281, -4.799779891967773, -4.673343658447266, -4.546907424926758, -4.42047119140625, -4.294034957885742, -4.167598724365234, -4.041162967681885, -3.914726734161377, -3.788290500640869, -3.6618542671203613, -3.5354180335998535, -3.408982038497925, -3.282545804977417, -3.156109571456909, -3.0296733379364014, -2.9032371044158936, -2.7768008708953857, -2.650364637374878, -2.523928642272949, -2.3974924087524414, -2.2710561752319336, -2.144619941711426, -2.018183708190918, -1.8917475938796997, -1.765311360359192, -1.6388752460479736, -1.5124390125274658, -1.386002779006958, -1.2595666646957397, -1.133130431175232, -1.0066943168640137, -0.8802578449249268, -0.7538216710090637, -0.6273854970932007, -0.5009492635726929, -0.37451308965682983, -0.2480769157409668, -0.12164068222045898, 0.004795491695404053, 0.1312316656112671, 0.2576678395271301, 0.38410404324531555, 0.510540246963501, 0.636976420879364, 0.763412594795227, 0.8898488283157349, 1.0162849426269531, 1.142721176147461, 1.2691574096679688, 1.395593523979187, 1.5220297574996948, 1.648465871810913, 1.774902105331421, 1.9013383388519287, 2.0277745723724365, 2.1542105674743652, 2.280646800994873, 2.407083034515381, 2.5335192680358887, 2.6599552631378174, 2.786391496658325, 2.912827730178833, 3.039263963699341, 3.1657001972198486]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 5.0, 6.0, 9.0, 12.0, 18.0, 22.0, 25.0, 34.0, 23.0, 47.0, 44.0, 60.0, 68.0, 84.0, 51.0, 61.0, 88.0, 65.0, 58.0, 43.0, 54.0, 33.0, 25.0, 27.0, 17.0, 13.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6342898607254028, -1.5679179430007935, -1.5015461444854736, -1.4351742267608643, -1.3688024282455444, -1.302430510520935, -1.2360587120056152, -1.1696867942810059, -1.1033148765563965, -1.036942958831787, -0.9705711603164673, -0.9041992425918579, -0.8378274440765381, -0.7714555263519287, -0.7050836682319641, -0.6387118101119995, -0.5723400115966797, -0.5059681534767151, -0.4395962953567505, -0.3732244074344635, -0.3068525493144989, -0.2404806911945343, -0.17410880327224731, -0.10773694515228271, -0.041365087032318115, 0.02500677853822708, 0.09137864410877228, 0.15775051712989807, 0.22412237524986267, 0.29049423336982727, 0.35686612129211426, 0.42323797941207886, 0.489609956741333, 0.5559818148612976, 0.6223536729812622, 0.6887255907058716, 0.7550973892211914, 0.8214693069458008, 0.8878411650657654, 0.95421302318573, 1.0205848217010498, 1.0869567394256592, 1.153328537940979, 1.2197004556655884, 1.2860722541809082, 1.3524441719055176, 1.418816089630127, 1.4851878881454468, 1.5515598058700562, 1.6179317235946655, 1.6843035221099854, 1.7506754398345947, 1.8170472383499146, 1.883419156074524, 1.9497909545898438, 2.016162872314453, 2.0825347900390625, 2.148906707763672, 2.2152786254882812, 2.2816503047943115, 2.348022222518921, 2.4143941402435303, 2.4807660579681396, 2.54713773727417, 2.6135096549987793]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 3.0, 3.0, 4.0, 9.0, 8.0, 13.0, 9.0, 16.0, 17.0, 20.0, 37.0, 66.0, 138.0, 289.0, 754.0, 2467.0, 11251.0, 75725.0, 753319.0, 177218.0, 21055.0, 4221.0, 1104.0, 380.0, 174.0, 85.0, 52.0, 33.0, 19.0, 14.0, 13.0, 9.0, 4.0, 6.0, 2.0, 4.0, 4.0, 3.0, 5.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.626953125, -2.53204345703125, -2.4371337890625, -2.34222412109375, -2.247314453125, -2.15240478515625, -2.0574951171875, -1.96258544921875, -1.86767578125, -1.77276611328125, -1.6778564453125, -1.58294677734375, -1.488037109375, -1.39312744140625, -1.2982177734375, -1.20330810546875, -1.1083984375, -1.01348876953125, -0.9185791015625, -0.82366943359375, -0.728759765625, -0.63385009765625, -0.5389404296875, -0.44403076171875, -0.34912109375, -0.25421142578125, -0.1593017578125, -0.06439208984375, 0.030517578125, 0.12542724609375, 0.2203369140625, 0.31524658203125, 0.41015625, 0.50506591796875, 0.5999755859375, 0.69488525390625, 0.789794921875, 0.88470458984375, 0.9796142578125, 1.07452392578125, 1.16943359375, 1.26434326171875, 1.3592529296875, 1.45416259765625, 1.549072265625, 1.64398193359375, 1.7388916015625, 1.83380126953125, 1.9287109375, 2.02362060546875, 2.1185302734375, 2.21343994140625, 2.308349609375, 2.40325927734375, 2.4981689453125, 2.59307861328125, 2.68798828125, 2.78289794921875, 2.8778076171875, 2.97271728515625, 3.067626953125, 3.16253662109375, 3.2574462890625, 3.35235595703125, 3.447265625]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 5.0, 6.0, 6.0, 7.0, 12.0, 21.0, 9.0, 19.0, 11.0, 19.0, 24.0, 35.0, 37.0, 39.0, 61.0, 62.0, 58.0, 55.0, 50.0, 53.0, 52.0, 47.0, 66.0, 42.0, 31.0, 42.0, 31.0, 16.0, 27.0, 12.0, 9.0, 10.0, 10.0, 12.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.208984375, -3.10614013671875, -3.0032958984375, -2.90045166015625, -2.797607421875, -2.69476318359375, -2.5919189453125, -2.48907470703125, -2.38623046875, -2.28338623046875, -2.1805419921875, -2.07769775390625, -1.974853515625, -1.87200927734375, -1.7691650390625, -1.66632080078125, -1.5634765625, -1.46063232421875, -1.3577880859375, -1.25494384765625, -1.152099609375, -1.04925537109375, -0.9464111328125, -0.84356689453125, -0.74072265625, -0.63787841796875, -0.5350341796875, -0.43218994140625, -0.329345703125, -0.22650146484375, -0.1236572265625, -0.02081298828125, 0.08203125, 0.18487548828125, 0.2877197265625, 0.39056396484375, 0.493408203125, 0.59625244140625, 0.6990966796875, 0.80194091796875, 0.90478515625, 1.00762939453125, 1.1104736328125, 1.21331787109375, 1.316162109375, 1.41900634765625, 1.5218505859375, 1.62469482421875, 1.7275390625, 1.83038330078125, 1.9332275390625, 2.03607177734375, 2.138916015625, 2.24176025390625, 2.3446044921875, 2.44744873046875, 2.55029296875, 2.65313720703125, 2.7559814453125, 2.85882568359375, 2.961669921875, 3.06451416015625, 3.1673583984375, 3.27020263671875, 3.373046875]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 3.0, 6.0, 12.0, 7.0, 11.0, 7.0, 7.0, 16.0, 21.0, 17.0, 26.0, 40.0, 53.0, 79.0, 117.0, 157.0, 275.0, 528.0, 1571.0, 14271.0, 746907.0, 273691.0, 8304.0, 1215.0, 460.0, 237.0, 154.0, 106.0, 70.0, 42.0, 29.0, 25.0, 27.0, 19.0, 13.0, 8.0, 8.0, 6.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-5.80859375, -5.64678955078125, -5.4849853515625, -5.32318115234375, -5.161376953125, -4.99957275390625, -4.8377685546875, -4.67596435546875, -4.51416015625, -4.35235595703125, -4.1905517578125, -4.02874755859375, -3.866943359375, -3.70513916015625, -3.5433349609375, -3.38153076171875, -3.2197265625, -3.05792236328125, -2.8961181640625, -2.73431396484375, -2.572509765625, -2.41070556640625, -2.2489013671875, -2.08709716796875, -1.92529296875, -1.76348876953125, -1.6016845703125, -1.43988037109375, -1.278076171875, -1.11627197265625, -0.9544677734375, -0.79266357421875, -0.630859375, -0.46905517578125, -0.3072509765625, -0.14544677734375, 0.016357421875, 0.17816162109375, 0.3399658203125, 0.50177001953125, 0.66357421875, 0.82537841796875, 0.9871826171875, 1.14898681640625, 1.310791015625, 1.47259521484375, 1.6343994140625, 1.79620361328125, 1.9580078125, 2.11981201171875, 2.2816162109375, 2.44342041015625, 2.605224609375, 2.76702880859375, 2.9288330078125, 3.09063720703125, 3.25244140625, 3.41424560546875, 3.5760498046875, 3.73785400390625, 3.899658203125, 4.06146240234375, 4.2232666015625, 4.38507080078125, 4.546875]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 8.0, 8.0, 6.0, 9.0, 13.0, 12.0, 13.0, 16.0, 10.0, 17.0, 21.0, 29.0, 39.0, 22.0, 33.0, 39.0, 32.0, 42.0, 34.0, 42.0, 51.0, 50.0, 45.0, 45.0, 48.0, 38.0, 30.0, 37.0, 34.0, 34.0, 30.0, 25.0, 9.0, 14.0, 20.0, 9.0, 9.0, 7.0, 3.0, 3.0, 4.0, 7.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.193359375, -3.09051513671875, -2.9876708984375, -2.88482666015625, -2.781982421875, -2.67913818359375, -2.5762939453125, -2.47344970703125, -2.37060546875, -2.26776123046875, -2.1649169921875, -2.06207275390625, -1.959228515625, -1.85638427734375, -1.7535400390625, -1.65069580078125, -1.5478515625, -1.44500732421875, -1.3421630859375, -1.23931884765625, -1.136474609375, -1.03363037109375, -0.9307861328125, -0.82794189453125, -0.72509765625, -0.62225341796875, -0.5194091796875, -0.41656494140625, -0.313720703125, -0.21087646484375, -0.1080322265625, -0.00518798828125, 0.09765625, 0.20050048828125, 0.3033447265625, 0.40618896484375, 0.509033203125, 0.61187744140625, 0.7147216796875, 0.81756591796875, 0.92041015625, 1.02325439453125, 1.1260986328125, 1.22894287109375, 1.331787109375, 1.43463134765625, 1.5374755859375, 1.64031982421875, 1.7431640625, 1.84600830078125, 1.9488525390625, 2.05169677734375, 2.154541015625, 2.25738525390625, 2.3602294921875, 2.46307373046875, 2.56591796875, 2.66876220703125, 2.7716064453125, 2.87445068359375, 2.977294921875, 3.08013916015625, 3.1829833984375, 3.28582763671875, 3.388671875]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 4.0, 3.0, 2.0, 9.0, 8.0, 14.0, 31.0, 94.0, 153.0, 376.0, 939.0, 5135.0, 229030.0, 802089.0, 8544.0, 1331.0, 444.0, 190.0, 77.0, 44.0, 19.0, 7.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.60546875, -3.5198211669921875, -3.434173583984375, -3.3485260009765625, -3.26287841796875, -3.1772308349609375, -3.091583251953125, -3.0059356689453125, -2.9202880859375, -2.8346405029296875, -2.748992919921875, -2.6633453369140625, -2.57769775390625, -2.4920501708984375, -2.406402587890625, -2.3207550048828125, -2.235107421875, -2.1494598388671875, -2.063812255859375, -1.9781646728515625, -1.89251708984375, -1.8068695068359375, -1.721221923828125, -1.6355743408203125, -1.5499267578125, -1.4642791748046875, -1.378631591796875, -1.2929840087890625, -1.20733642578125, -1.1216888427734375, -1.036041259765625, -0.9503936767578125, -0.86474609375, -0.7790985107421875, -0.693450927734375, -0.6078033447265625, -0.52215576171875, -0.4365081787109375, -0.350860595703125, -0.2652130126953125, -0.1795654296875, -0.0939178466796875, -0.008270263671875, 0.0773773193359375, 0.16302490234375, 0.2486724853515625, 0.334320068359375, 0.4199676513671875, 0.505615234375, 0.5912628173828125, 0.676910400390625, 0.7625579833984375, 0.84820556640625, 0.9338531494140625, 1.019500732421875, 1.1051483154296875, 1.1907958984375, 1.2764434814453125, 1.362091064453125, 1.4477386474609375, 1.53338623046875, 1.6190338134765625, 1.704681396484375, 1.7903289794921875, 1.8759765625]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 4.0, 3.0, 4.0, 6.0, 11.0, 6.0, 6.0, 9.0, 21.0, 30.0, 32.0, 43.0, 71.0, 108.0, 336.0, 78.0, 62.0, 39.0, 29.0, 21.0, 19.0, 18.0, 14.0, 10.0, 12.0, 2.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00018215179443359375, -0.00017573684453964233, -0.00016932189464569092, -0.0001629069447517395, -0.00015649199485778809, -0.00015007704496383667, -0.00014366209506988525, -0.00013724714517593384, -0.00013083219528198242, -0.000124417245388031, -0.00011800229549407959, -0.00011158734560012817, -0.00010517239570617676, -9.875744581222534e-05, -9.234249591827393e-05, -8.592754602432251e-05, -7.95125961303711e-05, -7.309764623641968e-05, -6.668269634246826e-05, -6.0267746448516846e-05, -5.385279655456543e-05, -4.7437846660614014e-05, -4.10228967666626e-05, -3.460794687271118e-05, -2.8192996978759766e-05, -2.177804708480835e-05, -1.5363097190856934e-05, -8.948147296905518e-06, -2.5331974029541016e-06, 3.8817524909973145e-06, 1.029670238494873e-05, 1.6711652278900146e-05, 2.3126602172851562e-05, 2.954155206680298e-05, 3.5956501960754395e-05, 4.237145185470581e-05, 4.8786401748657227e-05, 5.520135164260864e-05, 6.161630153656006e-05, 6.803125143051147e-05, 7.444620132446289e-05, 8.08611512184143e-05, 8.727610111236572e-05, 9.369105100631714e-05, 0.00010010600090026855, 0.00010652095079421997, 0.00011293590068817139, 0.0001193508505821228, 0.00012576580047607422, 0.00013218075037002563, 0.00013859570026397705, 0.00014501065015792847, 0.00015142560005187988, 0.0001578405499458313, 0.00016425549983978271, 0.00017067044973373413, 0.00017708539962768555, 0.00018350034952163696, 0.00018991529941558838, 0.0001963302493095398, 0.0002027451992034912, 0.00020916014909744263, 0.00021557509899139404, 0.00022199004888534546, 0.00022840499877929688]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 8.0, 8.0, 14.0, 21.0, 32.0, 48.0, 59.0, 115.0, 174.0, 306.0, 590.0, 1442.0, 7977.0, 229998.0, 789379.0, 14984.0, 1829.0, 686.0, 342.0, 193.0, 122.0, 75.0, 49.0, 38.0, 20.0, 14.0, 7.0, 6.0, 2.0, 2.0, 6.0, 3.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9052734375, -1.8262786865234375, -1.747283935546875, -1.6682891845703125, -1.58929443359375, -1.5102996826171875, -1.431304931640625, -1.3523101806640625, -1.2733154296875, -1.1943206787109375, -1.115325927734375, -1.0363311767578125, -0.95733642578125, -0.8783416748046875, -0.799346923828125, -0.7203521728515625, -0.641357421875, -0.5623626708984375, -0.483367919921875, -0.4043731689453125, -0.32537841796875, -0.2463836669921875, -0.167388916015625, -0.0883941650390625, -0.0093994140625, 0.0695953369140625, 0.148590087890625, 0.2275848388671875, 0.30657958984375, 0.3855743408203125, 0.464569091796875, 0.5435638427734375, 0.62255859375, 0.7015533447265625, 0.780548095703125, 0.8595428466796875, 0.93853759765625, 1.0175323486328125, 1.096527099609375, 1.1755218505859375, 1.2545166015625, 1.3335113525390625, 1.412506103515625, 1.4915008544921875, 1.57049560546875, 1.6494903564453125, 1.728485107421875, 1.8074798583984375, 1.886474609375, 1.9654693603515625, 2.044464111328125, 2.1234588623046875, 2.20245361328125, 2.2814483642578125, 2.360443115234375, 2.4394378662109375, 2.5184326171875, 2.5974273681640625, 2.676422119140625, 2.7554168701171875, 2.83441162109375, 2.9134063720703125, 2.992401123046875, 3.0713958740234375, 3.150390625]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 6.0, 11.0, 11.0, 11.0, 26.0, 32.0, 40.0, 48.0, 60.0, 177.0, 262.0, 94.0, 54.0, 42.0, 31.0, 29.0, 19.0, 18.0, 10.0, 4.0, 5.0, 3.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.72216796875, -0.7050247192382812, -0.6878814697265625, -0.6707382202148438, -0.653594970703125, -0.6364517211914062, -0.6193084716796875, -0.6021652221679688, -0.58502197265625, -0.5678787231445312, -0.5507354736328125, -0.5335922241210938, -0.516448974609375, -0.49930572509765625, -0.4821624755859375, -0.46501922607421875, -0.4478759765625, -0.43073272705078125, -0.4135894775390625, -0.39644622802734375, -0.379302978515625, -0.36215972900390625, -0.3450164794921875, -0.32787322998046875, -0.31072998046875, -0.29358673095703125, -0.2764434814453125, -0.25930023193359375, -0.242156982421875, -0.22501373291015625, -0.2078704833984375, -0.19072723388671875, -0.173583984375, -0.15644073486328125, -0.1392974853515625, -0.12215423583984375, -0.105010986328125, -0.08786773681640625, -0.0707244873046875, -0.05358123779296875, -0.03643798828125, -0.01929473876953125, -0.0021514892578125, 0.01499176025390625, 0.032135009765625, 0.04927825927734375, 0.0664215087890625, 0.08356475830078125, 0.1007080078125, 0.11785125732421875, 0.1349945068359375, 0.15213775634765625, 0.169281005859375, 0.18642425537109375, 0.2035675048828125, 0.22071075439453125, 0.23785400390625, 0.25499725341796875, 0.2721405029296875, 0.28928375244140625, 0.306427001953125, 0.32357025146484375, 0.3407135009765625, 0.35785675048828125, 0.375]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 13.0, 23.0, 52.0, 97.0, 152.0, 205.0, 217.0, 122.0, 65.0, 36.0, 9.0, 7.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-14.607107162475586, -14.273211479187012, -13.939315795898438, -13.605419158935547, -13.271523475646973, -12.937627792358398, -12.603732109069824, -12.26983642578125, -11.935940742492676, -11.602045059204102, -11.268149375915527, -10.934253692626953, -10.600357055664062, -10.266461372375488, -9.932565689086914, -9.59867000579834, -9.264774322509766, -8.930878639221191, -8.596982955932617, -8.263086318969727, -7.9291911125183105, -7.595294952392578, -7.261399269104004, -6.92750358581543, -6.593606948852539, -6.259711265563965, -5.925815105438232, -5.591919422149658, -5.258023738861084, -4.924127578735352, -4.590231895446777, -4.256336212158203, -3.922440528869629, -3.5885446071624756, -3.2546489238739014, -2.920753002166748, -2.586857318878174, -2.2529613971710205, -1.9190654754638672, -1.585169792175293, -1.2512738704681396, -0.9173780679702759, -0.5834822058677673, -0.2495863437652588, 0.08430945873260498, 0.41820526123046875, 0.7521011829376221, 1.0859968662261963, 1.4198927879333496, 1.7537885904312134, 2.087684392929077, 2.4215803146362305, 2.7554759979248047, 3.089371919631958, 3.4232678413391113, 3.7571635246276855, 4.091059684753418, 4.424955368041992, 4.758851528167725, 5.092747211456299, 5.426642894744873, 5.7605390548706055, 6.09443473815918, 6.428330421447754, 6.762226104736328]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 3.0, 2.0, 5.0, 9.0, 8.0, 10.0, 12.0, 20.0, 21.0, 22.0, 24.0, 26.0, 33.0, 45.0, 49.0, 41.0, 47.0, 49.0, 41.0, 38.0, 56.0, 66.0, 51.0, 42.0, 32.0, 33.0, 35.0, 34.0, 30.0, 19.0, 16.0, 21.0, 11.0, 16.0, 7.0, 4.0, 10.0, 3.0, 4.0, 3.0, 0.0, 6.0, 0.0, 1.0, 3.0, 1.0, 1.0], "bins": [-6.703184127807617, -6.517426490783691, -6.331668853759766, -6.145910739898682, -5.960153102874756, -5.77439546585083, -5.588637828826904, -5.40287971496582, -5.2171220779418945, -5.031364440917969, -4.845606803894043, -4.659848690032959, -4.474091053009033, -4.288333415985107, -4.102575778961182, -3.9168179035186768, -3.731060266494751, -3.545302629470825, -3.3595447540283203, -3.1737871170043945, -2.9880292415618896, -2.802271604537964, -2.616513729095459, -2.430756092071533, -2.2449984550476074, -2.0592408180236816, -1.8734829425811768, -1.687725305557251, -1.501967430114746, -1.3162097930908203, -1.130452036857605, -0.9446942806243896, -0.7589364051818848, -0.5731786489486694, -0.3874209225177765, -0.20166319608688354, -0.015905439853668213, 0.16985231637954712, 0.3556100130081177, 0.541367769241333, 0.7271255254745483, 0.9128832817077637, 1.098641037940979, 1.2843987941741943, 1.4701564311981201, 1.655914306640625, 1.8416719436645508, 2.0274295806884766, 2.2131874561309814, 2.3989450931549072, 2.584702968597412, 2.770460605621338, 2.9562184810638428, 3.1419761180877686, 3.3277339935302734, 3.513491630554199, 3.699249267578125, 3.885006904602051, 4.070764541625977, 4.2565226554870605, 4.442280292510986, 4.628037929534912, 4.813795566558838, 4.999553680419922, 5.185311317443848]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 4.0, 2.0, 4.0, 3.0, 8.0, 9.0, 16.0, 12.0, 15.0, 25.0, 29.0, 24.0, 44.0, 97.0, 127.0, 259.0, 693.0, 2734.0, 40990.0, 3653101.0, 487390.0, 7044.0, 892.0, 300.0, 130.0, 79.0, 50.0, 50.0, 38.0, 36.0, 18.0, 17.0, 16.0, 10.0, 6.0, 9.0, 2.0, 5.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.82421875, -5.56817626953125, -5.3121337890625, -5.05609130859375, -4.800048828125, -4.54400634765625, -4.2879638671875, -4.03192138671875, -3.77587890625, -3.51983642578125, -3.2637939453125, -3.00775146484375, -2.751708984375, -2.49566650390625, -2.2396240234375, -1.98358154296875, -1.7275390625, -1.47149658203125, -1.2154541015625, -0.95941162109375, -0.703369140625, -0.44732666015625, -0.1912841796875, 0.06475830078125, 0.32080078125, 0.57684326171875, 0.8328857421875, 1.08892822265625, 1.344970703125, 1.60101318359375, 1.8570556640625, 2.11309814453125, 2.369140625, 2.62518310546875, 2.8812255859375, 3.13726806640625, 3.393310546875, 3.64935302734375, 3.9053955078125, 4.16143798828125, 4.41748046875, 4.67352294921875, 4.9295654296875, 5.18560791015625, 5.441650390625, 5.69769287109375, 5.9537353515625, 6.20977783203125, 6.4658203125, 6.72186279296875, 6.9779052734375, 7.23394775390625, 7.489990234375, 7.74603271484375, 8.0020751953125, 8.25811767578125, 8.51416015625, 8.77020263671875, 9.0262451171875, 9.28228759765625, 9.538330078125, 9.79437255859375, 10.0504150390625, 10.30645751953125, 10.5625]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 1.0, 2.0, 8.0, 11.0, 11.0, 10.0, 15.0, 14.0, 20.0, 29.0, 31.0, 28.0, 47.0, 47.0, 55.0, 65.0, 80.0, 57.0, 65.0, 66.0, 41.0, 48.0, 53.0, 48.0, 37.0, 33.0, 18.0, 15.0, 15.0, 11.0, 7.0, 5.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.73828125, -1.667144775390625, -1.59600830078125, -1.524871826171875, -1.4537353515625, -1.382598876953125, -1.31146240234375, -1.240325927734375, -1.169189453125, -1.098052978515625, -1.02691650390625, -0.955780029296875, -0.8846435546875, -0.813507080078125, -0.74237060546875, -0.671234130859375, -0.60009765625, -0.528961181640625, -0.45782470703125, -0.386688232421875, -0.3155517578125, -0.244415283203125, -0.17327880859375, -0.102142333984375, -0.031005859375, 0.040130615234375, 0.11126708984375, 0.182403564453125, 0.2535400390625, 0.324676513671875, 0.39581298828125, 0.466949462890625, 0.5380859375, 0.609222412109375, 0.68035888671875, 0.751495361328125, 0.8226318359375, 0.893768310546875, 0.96490478515625, 1.036041259765625, 1.107177734375, 1.178314208984375, 1.24945068359375, 1.320587158203125, 1.3917236328125, 1.462860107421875, 1.53399658203125, 1.605133056640625, 1.67626953125, 1.747406005859375, 1.81854248046875, 1.889678955078125, 1.9608154296875, 2.031951904296875, 2.10308837890625, 2.174224853515625, 2.245361328125, 2.316497802734375, 2.38763427734375, 2.458770751953125, 2.5299072265625, 2.601043701171875, 2.67218017578125, 2.743316650390625, 2.814453125]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 8.0, 6.0, 7.0, 19.0, 24.0, 47.0, 78.0, 249.0, 705.0, 2633.0, 31259.0, 4003724.0, 149208.0, 4606.0, 1029.0, 365.0, 152.0, 67.0, 33.0, 24.0, 14.0, 8.0, 8.0, 3.0, 6.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.8359375, -9.543701171875, -9.25146484375, -8.959228515625, -8.6669921875, -8.374755859375, -8.08251953125, -7.790283203125, -7.498046875, -7.205810546875, -6.91357421875, -6.621337890625, -6.3291015625, -6.036865234375, -5.74462890625, -5.452392578125, -5.16015625, -4.867919921875, -4.57568359375, -4.283447265625, -3.9912109375, -3.698974609375, -3.40673828125, -3.114501953125, -2.822265625, -2.530029296875, -2.23779296875, -1.945556640625, -1.6533203125, -1.361083984375, -1.06884765625, -0.776611328125, -0.484375, -0.192138671875, 0.10009765625, 0.392333984375, 0.6845703125, 0.976806640625, 1.26904296875, 1.561279296875, 1.853515625, 2.145751953125, 2.43798828125, 2.730224609375, 3.0224609375, 3.314697265625, 3.60693359375, 3.899169921875, 4.19140625, 4.483642578125, 4.77587890625, 5.068115234375, 5.3603515625, 5.652587890625, 5.94482421875, 6.237060546875, 6.529296875, 6.821533203125, 7.11376953125, 7.406005859375, 7.6982421875, 7.990478515625, 8.28271484375, 8.574951171875, 8.8671875]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 8.0, 11.0, 8.0, 9.0, 13.0, 22.0, 47.0, 58.0, 83.0, 161.0, 252.0, 441.0, 698.0, 789.0, 576.0, 348.0, 220.0, 130.0, 69.0, 47.0, 33.0, 16.0, 19.0, 8.0, 2.0, 3.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.447265625, -1.408447265625, -1.36962890625, -1.330810546875, -1.2919921875, -1.253173828125, -1.21435546875, -1.175537109375, -1.13671875, -1.097900390625, -1.05908203125, -1.020263671875, -0.9814453125, -0.942626953125, -0.90380859375, -0.864990234375, -0.826171875, -0.787353515625, -0.74853515625, -0.709716796875, -0.6708984375, -0.632080078125, -0.59326171875, -0.554443359375, -0.515625, -0.476806640625, -0.43798828125, -0.399169921875, -0.3603515625, -0.321533203125, -0.28271484375, -0.243896484375, -0.205078125, -0.166259765625, -0.12744140625, -0.088623046875, -0.0498046875, -0.010986328125, 0.02783203125, 0.066650390625, 0.10546875, 0.144287109375, 0.18310546875, 0.221923828125, 0.2607421875, 0.299560546875, 0.33837890625, 0.377197265625, 0.416015625, 0.454833984375, 0.49365234375, 0.532470703125, 0.5712890625, 0.610107421875, 0.64892578125, 0.687744140625, 0.7265625, 0.765380859375, 0.80419921875, 0.843017578125, 0.8818359375, 0.920654296875, 0.95947265625, 0.998291015625, 1.037109375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 12.0, 14.0, 41.0, 63.0, 131.0, 156.0, 163.0, 166.0, 118.0, 62.0, 45.0, 19.0, 15.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.07180643081665, -6.849813461303711, -6.6278204917907715, -6.405827522277832, -6.183834075927734, -5.961841106414795, -5.7398481369018555, -5.517855167388916, -5.295862197875977, -5.073869228363037, -4.851876258850098, -4.6298828125, -4.4078898429870605, -4.185896873474121, -3.9639039039611816, -3.741910934448242, -3.5199174880981445, -3.297924518585205, -3.0759313106536865, -2.853938341140747, -2.6319451332092285, -2.409952163696289, -2.1879591941833496, -1.9659661054611206, -1.7439730167388916, -1.5219799280166626, -1.2999868392944336, -1.0779938697814941, -0.8560007810592651, -0.6340076923370361, -0.4120147228240967, -0.19002163410186768, 0.031970977783203125, 0.25396403670310974, 0.47595709562301636, 0.6979501247406006, 0.9199432134628296, 1.1419363021850586, 1.363929271697998, 1.585922360420227, 1.807915449142456, 2.0299084186553955, 2.251901626586914, 2.4738945960998535, 2.695887565612793, 2.9178807735443115, 3.139873743057251, 3.3618669509887695, 3.583859920501709, 3.8058528900146484, 4.027845859527588, 4.249838829040527, 4.471832275390625, 4.6938252449035645, 4.915818214416504, 5.137811183929443, 5.359804153442383, 5.581797122955322, 5.803790092468262, 6.025783538818359, 6.247776508331299, 6.469769477844238, 6.691762447357178, 6.913755416870117, 7.135748863220215]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 8.0, 4.0, 4.0, 8.0, 17.0, 15.0, 11.0, 15.0, 11.0, 16.0, 27.0, 31.0, 28.0, 31.0, 34.0, 44.0, 47.0, 45.0, 44.0, 49.0, 32.0, 60.0, 34.0, 42.0, 52.0, 42.0, 35.0, 33.0, 33.0, 30.0, 26.0, 17.0, 18.0, 16.0, 16.0, 7.0, 8.0, 7.0, 4.0, 4.0, 3.0, 0.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0989229679107666, -2.02917742729187, -1.9594320058822632, -1.8896865844726562, -1.8199410438537598, -1.7501956224441528, -1.680450201034546, -1.6107046604156494, -1.5409592390060425, -1.4712138175964355, -1.401468276977539, -1.3317228555679321, -1.2619774341583252, -1.1922318935394287, -1.1224864721298218, -1.0527410507202148, -0.9829955101013184, -0.9132500290870667, -0.8435045480728149, -0.773759126663208, -0.7040136456489563, -0.6342681646347046, -0.5645227432250977, -0.49477726221084595, -0.42503178119659424, -0.35528630018234253, -0.2855408489704132, -0.2157953828573227, -0.14604991674423218, -0.07630443572998047, -0.0065589845180511475, 0.06318646669387817, 0.13293194770812988, 0.2026774138212204, 0.2724228799343109, 0.34216833114624023, 0.41191381216049194, 0.48165929317474365, 0.5514047145843506, 0.6211501955986023, 0.690895676612854, 0.7606411576271057, 0.8303866386413574, 0.9001320600509644, 0.9698775410652161, 1.0396230220794678, 1.1093684434890747, 1.1791138648986816, 1.2488594055175781, 1.318604826927185, 1.3883503675460815, 1.4580957889556885, 1.527841329574585, 1.597586750984192, 1.6673321723937988, 1.7370777130126953, 1.8068231344223022, 1.8765685558319092, 1.9463140964508057, 2.016059637069702, 2.0858049392700195, 2.155550479888916, 2.2252960205078125, 2.29504132270813, 2.3647868633270264]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 6.0, 7.0, 2.0, 9.0, 9.0, 13.0, 21.0, 24.0, 31.0, 54.0, 75.0, 109.0, 144.0, 194.0, 288.0, 497.0, 921.0, 1814.0, 4717.0, 14988.0, 56853.0, 198186.0, 400246.0, 258025.0, 79286.0, 20923.0, 6191.0, 2215.0, 1061.0, 558.0, 344.0, 241.0, 158.0, 117.0, 64.0, 54.0, 38.0, 31.0, 13.0, 9.0, 8.0, 7.0, 3.0, 5.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59326171875, -0.5738906860351562, -0.5545196533203125, -0.5351486206054688, -0.515777587890625, -0.49640655517578125, -0.4770355224609375, -0.45766448974609375, -0.43829345703125, -0.41892242431640625, -0.3995513916015625, -0.38018035888671875, -0.360809326171875, -0.34143829345703125, -0.3220672607421875, -0.30269622802734375, -0.2833251953125, -0.26395416259765625, -0.2445831298828125, -0.22521209716796875, -0.205841064453125, -0.18647003173828125, -0.1670989990234375, -0.14772796630859375, -0.12835693359375, -0.10898590087890625, -0.0896148681640625, -0.07024383544921875, -0.050872802734375, -0.03150177001953125, -0.0121307373046875, 0.00724029541015625, 0.026611328125, 0.04598236083984375, 0.0653533935546875, 0.08472442626953125, 0.104095458984375, 0.12346649169921875, 0.1428375244140625, 0.16220855712890625, 0.18157958984375, 0.20095062255859375, 0.2203216552734375, 0.23969268798828125, 0.259063720703125, 0.27843475341796875, 0.2978057861328125, 0.31717681884765625, 0.3365478515625, 0.35591888427734375, 0.3752899169921875, 0.39466094970703125, 0.414031982421875, 0.43340301513671875, 0.4527740478515625, 0.47214508056640625, 0.49151611328125, 0.5108871459960938, 0.5302581787109375, 0.5496292114257812, 0.569000244140625, 0.5883712768554688, 0.6077423095703125, 0.6271133422851562, 0.646484375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 3.0, 4.0, 7.0, 10.0, 17.0, 17.0, 13.0, 19.0, 20.0, 30.0, 35.0, 29.0, 39.0, 40.0, 50.0, 41.0, 49.0, 59.0, 47.0, 49.0, 49.0, 48.0, 41.0, 42.0, 32.0, 33.0, 35.0, 20.0, 24.0, 24.0, 16.0, 15.0, 11.0, 10.0, 4.0, 6.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.4716796875, -1.4199066162109375, -1.368133544921875, -1.3163604736328125, -1.26458740234375, -1.2128143310546875, -1.161041259765625, -1.1092681884765625, -1.0574951171875, -1.0057220458984375, -0.953948974609375, -0.9021759033203125, -0.85040283203125, -0.7986297607421875, -0.746856689453125, -0.6950836181640625, -0.643310546875, -0.5915374755859375, -0.539764404296875, -0.4879913330078125, -0.43621826171875, -0.3844451904296875, -0.332672119140625, -0.2808990478515625, -0.2291259765625, -0.1773529052734375, -0.125579833984375, -0.0738067626953125, -0.02203369140625, 0.0297393798828125, 0.081512451171875, 0.1332855224609375, 0.18505859375, 0.2368316650390625, 0.288604736328125, 0.3403778076171875, 0.39215087890625, 0.4439239501953125, 0.495697021484375, 0.5474700927734375, 0.5992431640625, 0.6510162353515625, 0.702789306640625, 0.7545623779296875, 0.80633544921875, 0.8581085205078125, 0.909881591796875, 0.9616546630859375, 1.013427734375, 1.0652008056640625, 1.116973876953125, 1.1687469482421875, 1.22052001953125, 1.2722930908203125, 1.324066162109375, 1.3758392333984375, 1.4276123046875, 1.4793853759765625, 1.531158447265625, 1.5829315185546875, 1.63470458984375, 1.6864776611328125, 1.738250732421875, 1.7900238037109375, 1.841796875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 6.0, 5.0, 13.0, 13.0, 17.0, 24.0, 25.0, 43.0, 85.0, 139.0, 240.0, 493.0, 1045.0, 2234.0, 4822.0, 10551.0, 23048.0, 49849.0, 100632.0, 177470.0, 234105.0, 201616.0, 123750.0, 63378.0, 29517.0, 13577.0, 6203.0, 2865.0, 1376.0, 668.0, 296.0, 191.0, 90.0, 60.0, 31.0, 25.0, 18.0, 10.0, 12.0, 4.0, 3.0, 2.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2607421875, -0.2516441345214844, -0.24254608154296875, -0.23344802856445312, -0.2243499755859375, -0.21525192260742188, -0.20615386962890625, -0.19705581665039062, -0.187957763671875, -0.17885971069335938, -0.16976165771484375, -0.16066360473632812, -0.1515655517578125, -0.14246749877929688, -0.13336944580078125, -0.12427139282226562, -0.11517333984375, -0.10607528686523438, -0.09697723388671875, -0.08787918090820312, -0.0787811279296875, -0.06968307495117188, -0.06058502197265625, -0.051486968994140625, -0.042388916015625, -0.033290863037109375, -0.02419281005859375, -0.015094757080078125, -0.0059967041015625, 0.003101348876953125, 0.01219940185546875, 0.021297454833984375, 0.0303955078125, 0.039493560791015625, 0.04859161376953125, 0.057689666748046875, 0.0667877197265625, 0.07588577270507812, 0.08498382568359375, 0.09408187866210938, 0.103179931640625, 0.11227798461914062, 0.12137603759765625, 0.13047409057617188, 0.1395721435546875, 0.14867019653320312, 0.15776824951171875, 0.16686630249023438, 0.17596435546875, 0.18506240844726562, 0.19416046142578125, 0.20325851440429688, 0.2123565673828125, 0.22145462036132812, 0.23055267333984375, 0.23965072631835938, 0.248748779296875, 0.2578468322753906, 0.26694488525390625, 0.2760429382324219, 0.2851409912109375, 0.2942390441894531, 0.30333709716796875, 0.3124351501464844, 0.321533203125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 8.0, 7.0, 10.0, 17.0, 12.0, 16.0, 22.0, 30.0, 35.0, 41.0, 41.0, 55.0, 49.0, 40.0, 40.0, 49.0, 45.0, 50.0, 46.0, 57.0, 56.0, 29.0, 41.0, 31.0, 23.0, 30.0, 27.0, 26.0, 16.0, 18.0, 4.0, 5.0, 8.0, 3.0, 7.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1171875, -3.01123046875, -2.9052734375, -2.79931640625, -2.693359375, -2.58740234375, -2.4814453125, -2.37548828125, -2.26953125, -2.16357421875, -2.0576171875, -1.95166015625, -1.845703125, -1.73974609375, -1.6337890625, -1.52783203125, -1.421875, -1.31591796875, -1.2099609375, -1.10400390625, -0.998046875, -0.89208984375, -0.7861328125, -0.68017578125, -0.57421875, -0.46826171875, -0.3623046875, -0.25634765625, -0.150390625, -0.04443359375, 0.0615234375, 0.16748046875, 0.2734375, 0.37939453125, 0.4853515625, 0.59130859375, 0.697265625, 0.80322265625, 0.9091796875, 1.01513671875, 1.12109375, 1.22705078125, 1.3330078125, 1.43896484375, 1.544921875, 1.65087890625, 1.7568359375, 1.86279296875, 1.96875, 2.07470703125, 2.1806640625, 2.28662109375, 2.392578125, 2.49853515625, 2.6044921875, 2.71044921875, 2.81640625, 2.92236328125, 3.0283203125, 3.13427734375, 3.240234375, 3.34619140625, 3.4521484375, 3.55810546875, 3.6640625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 11.0, 19.0, 33.0, 45.0, 99.0, 227.0, 513.0, 1587.0, 8905.0, 124291.0, 809591.0, 93347.0, 7515.0, 1479.0, 448.0, 230.0, 86.0, 49.0, 33.0, 24.0, 7.0, 9.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1942138671875, -0.1868724822998047, -0.17953109741210938, -0.17218971252441406, -0.16484832763671875, -0.15750694274902344, -0.15016555786132812, -0.1428241729736328, -0.1354827880859375, -0.1281414031982422, -0.12080001831054688, -0.11345863342285156, -0.10611724853515625, -0.09877586364746094, -0.09143447875976562, -0.08409309387207031, -0.076751708984375, -0.06941032409667969, -0.062068939208984375, -0.05472755432128906, -0.04738616943359375, -0.04004478454589844, -0.032703399658203125, -0.025362014770507812, -0.0180206298828125, -0.010679244995117188, -0.003337860107421875, 0.0040035247802734375, 0.01134490966796875, 0.018686294555664062, 0.026027679443359375, 0.03336906433105469, 0.04071044921875, 0.04805183410644531, 0.055393218994140625, 0.06273460388183594, 0.07007598876953125, 0.07741737365722656, 0.08475875854492188, 0.09210014343261719, 0.0994415283203125, 0.10678291320800781, 0.11412429809570312, 0.12146568298339844, 0.12880706787109375, 0.13614845275878906, 0.14348983764648438, 0.1508312225341797, 0.158172607421875, 0.1655139923095703, 0.17285537719726562, 0.18019676208496094, 0.18753814697265625, 0.19487953186035156, 0.20222091674804688, 0.2095623016357422, 0.2169036865234375, 0.2242450714111328, 0.23158645629882812, 0.23892784118652344, 0.24626922607421875, 0.25361061096191406, 0.2609519958496094, 0.2682933807373047, 0.275634765625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 6.0, 1.0, 4.0, 14.0, 10.0, 17.0, 26.0, 35.0, 30.0, 45.0, 67.0, 71.0, 83.0, 98.0, 97.0, 82.0, 69.0, 63.0, 43.0, 36.0, 37.0, 15.0, 19.0, 14.0, 6.0, 6.0, 6.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5703182220458984e-05, -3.421306610107422e-05, -3.272294998168945e-05, -3.123283386230469e-05, -2.9742717742919922e-05, -2.8252601623535156e-05, -2.676248550415039e-05, -2.5272369384765625e-05, -2.378225326538086e-05, -2.2292137145996094e-05, -2.0802021026611328e-05, -1.9311904907226562e-05, -1.7821788787841797e-05, -1.633167266845703e-05, -1.4841556549072266e-05, -1.33514404296875e-05, -1.1861324310302734e-05, -1.0371208190917969e-05, -8.881092071533203e-06, -7.3909759521484375e-06, -5.900859832763672e-06, -4.410743713378906e-06, -2.9206275939941406e-06, -1.430511474609375e-06, 5.960464477539063e-08, 1.5497207641601562e-06, 3.039836883544922e-06, 4.5299530029296875e-06, 6.020069122314453e-06, 7.510185241699219e-06, 9.000301361083984e-06, 1.049041748046875e-05, 1.1980533599853516e-05, 1.3470649719238281e-05, 1.4960765838623047e-05, 1.6450881958007812e-05, 1.7940998077392578e-05, 1.9431114196777344e-05, 2.092123031616211e-05, 2.2411346435546875e-05, 2.390146255493164e-05, 2.5391578674316406e-05, 2.6881694793701172e-05, 2.8371810913085938e-05, 2.9861927032470703e-05, 3.135204315185547e-05, 3.2842159271240234e-05, 3.4332275390625e-05, 3.5822391510009766e-05, 3.731250762939453e-05, 3.88026237487793e-05, 4.029273986816406e-05, 4.178285598754883e-05, 4.3272972106933594e-05, 4.476308822631836e-05, 4.6253204345703125e-05, 4.774332046508789e-05, 4.9233436584472656e-05, 5.072355270385742e-05, 5.221366882324219e-05, 5.370378494262695e-05, 5.519390106201172e-05, 5.6684017181396484e-05, 5.817413330078125e-05, 5.9664249420166016e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 5.0, 5.0, 4.0, 6.0, 8.0, 6.0, 10.0, 12.0, 30.0, 46.0, 69.0, 89.0, 178.0, 282.0, 638.0, 1740.0, 5530.0, 23917.0, 155030.0, 663783.0, 163447.0, 24762.0, 5722.0, 1770.0, 706.0, 321.0, 174.0, 96.0, 48.0, 35.0, 27.0, 16.0, 13.0, 7.0, 6.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.1671142578125, -0.1612529754638672, -0.15539169311523438, -0.14953041076660156, -0.14366912841796875, -0.13780784606933594, -0.13194656372070312, -0.1260852813720703, -0.1202239990234375, -0.11436271667480469, -0.10850143432617188, -0.10264015197753906, -0.09677886962890625, -0.09091758728027344, -0.08505630493164062, -0.07919502258300781, -0.073333740234375, -0.06747245788574219, -0.061611175537109375, -0.05574989318847656, -0.04988861083984375, -0.04402732849121094, -0.038166046142578125, -0.03230476379394531, -0.0264434814453125, -0.020582199096679688, -0.014720916748046875, -0.008859634399414062, -0.00299835205078125, 0.0028629302978515625, 0.008724212646484375, 0.014585494995117188, 0.02044677734375, 0.026308059692382812, 0.032169342041015625, 0.03803062438964844, 0.04389190673828125, 0.04975318908691406, 0.055614471435546875, 0.06147575378417969, 0.0673370361328125, 0.07319831848144531, 0.07905960083007812, 0.08492088317871094, 0.09078216552734375, 0.09664344787597656, 0.10250473022460938, 0.10836601257324219, 0.114227294921875, 0.12008857727050781, 0.12594985961914062, 0.13181114196777344, 0.13767242431640625, 0.14353370666503906, 0.14939498901367188, 0.1552562713623047, 0.1611175537109375, 0.1669788360595703, 0.17284011840820312, 0.17870140075683594, 0.18456268310546875, 0.19042396545410156, 0.19628524780273438, 0.2021465301513672, 0.2080078125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 7.0, 9.0, 6.0, 23.0, 22.0, 26.0, 36.0, 67.0, 97.0, 107.0, 133.0, 136.0, 112.0, 68.0, 45.0, 30.0, 26.0, 11.0, 7.0, 11.0, 7.0, 6.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07000732421875, -0.06804323196411133, -0.06607913970947266, -0.06411504745483398, -0.06215095520019531, -0.06018686294555664, -0.05822277069091797, -0.0562586784362793, -0.054294586181640625, -0.05233049392700195, -0.05036640167236328, -0.04840230941772461, -0.04643821716308594, -0.044474124908447266, -0.042510032653808594, -0.04054594039916992, -0.03858184814453125, -0.03661775588989258, -0.034653663635253906, -0.032689571380615234, -0.030725479125976562, -0.02876138687133789, -0.02679729461669922, -0.024833202362060547, -0.022869110107421875, -0.020905017852783203, -0.01894092559814453, -0.01697683334350586, -0.015012741088867188, -0.013048648834228516, -0.011084556579589844, -0.009120464324951172, -0.0071563720703125, -0.005192279815673828, -0.0032281875610351562, -0.0012640953063964844, 0.0006999969482421875, 0.0026640892028808594, 0.004628181457519531, 0.006592273712158203, 0.008556365966796875, 0.010520458221435547, 0.012484550476074219, 0.01444864273071289, 0.016412734985351562, 0.018376827239990234, 0.020340919494628906, 0.022305011749267578, 0.02426910400390625, 0.026233196258544922, 0.028197288513183594, 0.030161380767822266, 0.03212547302246094, 0.03408956527709961, 0.03605365753173828, 0.03801774978637695, 0.039981842041015625, 0.0419459342956543, 0.04391002655029297, 0.04587411880493164, 0.04783821105957031, 0.049802303314208984, 0.051766395568847656, 0.05373048782348633, 0.055694580078125]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 12.0, 19.0, 44.0, 85.0, 161.0, 164.0, 175.0, 160.0, 102.0, 45.0, 19.0, 12.0, 10.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4635112285614014, -3.307328701019287, -3.1511459350585938, -2.9949634075164795, -2.8387808799743652, -2.682598114013672, -2.5264155864715576, -2.3702330589294434, -2.21405029296875, -2.0578677654266357, -1.901685118675232, -1.7455024719238281, -1.5893199443817139, -1.43313729763031, -1.2769546508789062, -1.120772123336792, -0.9645895957946777, -0.8084070086479187, -0.6522244215011597, -0.49604177474975586, -0.3398591876029968, -0.1836766004562378, -0.027493953704833984, 0.12868857383728027, 0.2848712205886841, 0.4410538077354431, 0.5972363948822021, 0.753419041633606, 0.909601628780365, 1.065784215927124, 1.2219668626785278, 1.378149390220642, 1.5343317985534668, 1.6905144453048706, 1.8466969728469849, 2.0028796195983887, 2.159062147140503, 2.315244674682617, 2.4714274406433105, 2.627609968185425, 2.783792495727539, 2.9399750232696533, 3.0961577892303467, 3.252340316772461, 3.408522844314575, 3.5647053718566895, 3.720888137817383, 3.877070665359497, 4.0332536697387695, 4.189436435699463, 4.345618724822998, 4.501801490783691, 4.657984256744385, 4.81416654586792, 4.970349311828613, 5.126531600952148, 5.282714366912842, 5.438897132873535, 5.59507942199707, 5.751262187957764, 5.907444953918457, 6.063627243041992, 6.2198100090026855, 6.375992774963379, 6.532175064086914]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 6.0, 4.0, 12.0, 13.0, 17.0, 16.0, 10.0, 24.0, 34.0, 33.0, 34.0, 36.0, 41.0, 56.0, 54.0, 58.0, 43.0, 49.0, 57.0, 53.0, 58.0, 40.0, 51.0, 30.0, 34.0, 35.0, 21.0, 19.0, 24.0, 8.0, 9.0, 7.0, 4.0, 8.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6688393354415894, -1.6133403778076172, -1.5578415393829346, -1.5023425817489624, -1.4468437433242798, -1.3913447856903076, -1.335845947265625, -1.2803469896316528, -1.2248481512069702, -1.169349193572998, -1.1138503551483154, -1.0583513975143433, -1.0028525590896606, -0.9473536014556885, -0.8918547630310059, -0.8363558053970337, -0.7808569073677063, -0.7253580093383789, -0.6698591113090515, -0.6143602132797241, -0.5588613152503967, -0.5033624172210693, -0.44786348938941956, -0.39236459136009216, -0.33686569333076477, -0.2813667953014374, -0.22586789727210999, -0.1703689843416214, -0.114870086312294, -0.05937117338180542, -0.0038722753524780273, 0.051626622676849365, 0.10712552070617676, 0.16262441873550415, 0.21812331676483154, 0.27362221479415894, 0.32912111282348633, 0.3846200406551361, 0.4401189386844635, 0.4956178367137909, 0.5511167049407959, 0.6066156029701233, 0.6621145009994507, 0.7176133990287781, 0.7731122970581055, 0.8286112546920776, 0.8841100931167603, 0.9396090507507324, 0.9951079487800598, 1.0506068468093872, 1.1061058044433594, 1.161604642868042, 1.2171036005020142, 1.2726024389266968, 1.328101396560669, 1.3836002349853516, 1.4390991926193237, 1.494598150253296, 1.5500969886779785, 1.6055959463119507, 1.6610947847366333, 1.7165937423706055, 1.772092580795288, 1.8275915384292603, 1.8830903768539429]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 1.0, 4.0, 15.0, 9.0, 15.0, 30.0, 62.0, 88.0, 147.0, 287.0, 582.0, 1537.0, 5608.0, 26820.0, 209512.0, 702667.0, 82375.0, 13679.0, 3142.0, 1008.0, 438.0, 214.0, 120.0, 72.0, 36.0, 33.0, 11.0, 14.0, 8.0, 7.0, 4.0, 4.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.693359375, -2.586883544921875, -2.48040771484375, -2.373931884765625, -2.2674560546875, -2.160980224609375, -2.05450439453125, -1.948028564453125, -1.841552734375, -1.735076904296875, -1.62860107421875, -1.522125244140625, -1.4156494140625, -1.309173583984375, -1.20269775390625, -1.096221923828125, -0.98974609375, -0.883270263671875, -0.77679443359375, -0.670318603515625, -0.5638427734375, -0.457366943359375, -0.35089111328125, -0.244415283203125, -0.137939453125, -0.031463623046875, 0.07501220703125, 0.181488037109375, 0.2879638671875, 0.394439697265625, 0.50091552734375, 0.607391357421875, 0.7138671875, 0.820343017578125, 0.92681884765625, 1.033294677734375, 1.1397705078125, 1.246246337890625, 1.35272216796875, 1.459197998046875, 1.565673828125, 1.672149658203125, 1.77862548828125, 1.885101318359375, 1.9915771484375, 2.098052978515625, 2.20452880859375, 2.311004638671875, 2.41748046875, 2.523956298828125, 2.63043212890625, 2.736907958984375, 2.8433837890625, 2.949859619140625, 3.05633544921875, 3.162811279296875, 3.269287109375, 3.375762939453125, 3.48223876953125, 3.588714599609375, 3.6951904296875, 3.801666259765625, 3.90814208984375, 4.014617919921875, 4.12109375]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 6.0, 0.0, 6.0, 16.0, 19.0, 29.0, 33.0, 43.0, 49.0, 55.0, 84.0, 72.0, 88.0, 76.0, 83.0, 93.0, 67.0, 46.0, 51.0, 37.0, 16.0, 17.0, 11.0, 4.0, 2.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.162109375, -3.004058837890625, -2.84600830078125, -2.687957763671875, -2.5299072265625, -2.371856689453125, -2.21380615234375, -2.055755615234375, -1.897705078125, -1.739654541015625, -1.58160400390625, -1.423553466796875, -1.2655029296875, -1.107452392578125, -0.94940185546875, -0.791351318359375, -0.63330078125, -0.475250244140625, -0.31719970703125, -0.159149169921875, -0.0010986328125, 0.156951904296875, 0.31500244140625, 0.473052978515625, 0.631103515625, 0.789154052734375, 0.94720458984375, 1.105255126953125, 1.2633056640625, 1.421356201171875, 1.57940673828125, 1.737457275390625, 1.8955078125, 2.053558349609375, 2.21160888671875, 2.369659423828125, 2.5277099609375, 2.685760498046875, 2.84381103515625, 3.001861572265625, 3.159912109375, 3.317962646484375, 3.47601318359375, 3.634063720703125, 3.7921142578125, 3.950164794921875, 4.10821533203125, 4.266265869140625, 4.42431640625, 4.582366943359375, 4.74041748046875, 4.898468017578125, 5.0565185546875, 5.214569091796875, 5.37261962890625, 5.530670166015625, 5.688720703125, 5.846771240234375, 6.00482177734375, 6.162872314453125, 6.3209228515625, 6.478973388671875, 6.63702392578125, 6.795074462890625, 6.953125]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 5.0, 7.0, 2.0, 7.0, 7.0, 11.0, 7.0, 14.0, 20.0, 24.0, 25.0, 33.0, 60.0, 69.0, 91.0, 165.0, 308.0, 568.0, 2287.0, 25183.0, 857308.0, 153762.0, 6575.0, 1065.0, 329.0, 215.0, 112.0, 64.0, 46.0, 38.0, 31.0, 27.0, 16.0, 19.0, 10.0, 7.0, 6.0, 10.0, 7.0, 3.0, 1.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-6.55859375, -6.3642578125, -6.169921875, -5.9755859375, -5.78125, -5.5869140625, -5.392578125, -5.1982421875, -5.00390625, -4.8095703125, -4.615234375, -4.4208984375, -4.2265625, -4.0322265625, -3.837890625, -3.6435546875, -3.44921875, -3.2548828125, -3.060546875, -2.8662109375, -2.671875, -2.4775390625, -2.283203125, -2.0888671875, -1.89453125, -1.7001953125, -1.505859375, -1.3115234375, -1.1171875, -0.9228515625, -0.728515625, -0.5341796875, -0.33984375, -0.1455078125, 0.048828125, 0.2431640625, 0.4375, 0.6318359375, 0.826171875, 1.0205078125, 1.21484375, 1.4091796875, 1.603515625, 1.7978515625, 1.9921875, 2.1865234375, 2.380859375, 2.5751953125, 2.76953125, 2.9638671875, 3.158203125, 3.3525390625, 3.546875, 3.7412109375, 3.935546875, 4.1298828125, 4.32421875, 4.5185546875, 4.712890625, 4.9072265625, 5.1015625, 5.2958984375, 5.490234375, 5.6845703125, 5.87890625]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 5.0, 6.0, 10.0, 10.0, 11.0, 11.0, 9.0, 23.0, 20.0, 22.0, 29.0, 24.0, 23.0, 37.0, 34.0, 52.0, 42.0, 43.0, 49.0, 58.0, 45.0, 50.0, 51.0, 46.0, 43.0, 30.0, 28.0, 34.0, 26.0, 27.0, 14.0, 17.0, 11.0, 11.0, 10.0, 6.0, 4.0, 9.0, 5.0, 2.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.54296875, -3.433990478515625, -3.32501220703125, -3.216033935546875, -3.1070556640625, -2.998077392578125, -2.88909912109375, -2.780120849609375, -2.671142578125, -2.562164306640625, -2.45318603515625, -2.344207763671875, -2.2352294921875, -2.126251220703125, -2.01727294921875, -1.908294677734375, -1.79931640625, -1.690338134765625, -1.58135986328125, -1.472381591796875, -1.3634033203125, -1.254425048828125, -1.14544677734375, -1.036468505859375, -0.927490234375, -0.818511962890625, -0.70953369140625, -0.600555419921875, -0.4915771484375, -0.382598876953125, -0.27362060546875, -0.164642333984375, -0.0556640625, 0.053314208984375, 0.16229248046875, 0.271270751953125, 0.3802490234375, 0.489227294921875, 0.59820556640625, 0.707183837890625, 0.816162109375, 0.925140380859375, 1.03411865234375, 1.143096923828125, 1.2520751953125, 1.361053466796875, 1.47003173828125, 1.579010009765625, 1.68798828125, 1.796966552734375, 1.90594482421875, 2.014923095703125, 2.1239013671875, 2.232879638671875, 2.34185791015625, 2.450836181640625, 2.559814453125, 2.668792724609375, 2.77777099609375, 2.886749267578125, 2.9957275390625, 3.104705810546875, 3.21368408203125, 3.322662353515625, 3.431640625]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 11.0, 5.0, 4.0, 8.0, 13.0, 9.0, 14.0, 15.0, 20.0, 17.0, 42.0, 44.0, 69.0, 108.0, 277.0, 577.0, 1792.0, 7330.0, 61805.0, 798681.0, 159135.0, 14229.0, 2732.0, 847.0, 337.0, 165.0, 87.0, 43.0, 42.0, 28.0, 10.0, 19.0, 12.0, 5.0, 5.0, 5.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3212890625, -1.271759033203125, -1.22222900390625, -1.172698974609375, -1.1231689453125, -1.073638916015625, -1.02410888671875, -0.974578857421875, -0.925048828125, -0.875518798828125, -0.82598876953125, -0.776458740234375, -0.7269287109375, -0.677398681640625, -0.62786865234375, -0.578338623046875, -0.52880859375, -0.479278564453125, -0.42974853515625, -0.380218505859375, -0.3306884765625, -0.281158447265625, -0.23162841796875, -0.182098388671875, -0.132568359375, -0.083038330078125, -0.03350830078125, 0.016021728515625, 0.0655517578125, 0.115081787109375, 0.16461181640625, 0.214141845703125, 0.263671875, 0.313201904296875, 0.36273193359375, 0.412261962890625, 0.4617919921875, 0.511322021484375, 0.56085205078125, 0.610382080078125, 0.659912109375, 0.709442138671875, 0.75897216796875, 0.808502197265625, 0.8580322265625, 0.907562255859375, 0.95709228515625, 1.006622314453125, 1.05615234375, 1.105682373046875, 1.15521240234375, 1.204742431640625, 1.2542724609375, 1.303802490234375, 1.35333251953125, 1.402862548828125, 1.452392578125, 1.501922607421875, 1.55145263671875, 1.600982666015625, 1.6505126953125, 1.700042724609375, 1.74957275390625, 1.799102783203125, 1.8486328125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 7.0, 2.0, 3.0, 3.0, 3.0, 3.0, 14.0, 14.0, 42.0, 43.0, 56.0, 116.0, 198.0, 222.0, 87.0, 60.0, 51.0, 21.0, 19.0, 9.0, 5.0, 12.0, 5.0, 2.0, 1.0, 3.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00023627281188964844, -0.0002284012734889984, -0.0002205297350883484, -0.00021265819668769836, -0.00020478665828704834, -0.00019691511988639832, -0.0001890435814857483, -0.00018117204308509827, -0.00017330050468444824, -0.00016542896628379822, -0.0001575574278831482, -0.00014968588948249817, -0.00014181435108184814, -0.00013394281268119812, -0.0001260712742805481, -0.00011819973587989807, -0.00011032819747924805, -0.00010245665907859802, -9.4585120677948e-05, -8.671358227729797e-05, -7.884204387664795e-05, -7.097050547599792e-05, -6.30989670753479e-05, -5.5227428674697876e-05, -4.735589027404785e-05, -3.948435187339783e-05, -3.16128134727478e-05, -2.374127507209778e-05, -1.5869736671447754e-05, -7.99819827079773e-06, -1.2665987014770508e-07, 7.74487853050232e-06, 1.5616416931152344e-05, 2.3487955331802368e-05, 3.135949373245239e-05, 3.923103213310242e-05, 4.710257053375244e-05, 5.4974108934402466e-05, 6.284564733505249e-05, 7.071718573570251e-05, 7.858872413635254e-05, 8.646026253700256e-05, 9.433180093765259e-05, 0.00010220333933830261, 0.00011007487773895264, 0.00011794641613960266, 0.00012581795454025269, 0.0001336894929409027, 0.00014156103134155273, 0.00014943256974220276, 0.00015730410814285278, 0.0001651756465435028, 0.00017304718494415283, 0.00018091872334480286, 0.00018879026174545288, 0.0001966618001461029, 0.00020453333854675293, 0.00021240487694740295, 0.00022027641534805298, 0.000228147953748703, 0.00023601949214935303, 0.00024389103055000305, 0.0002517625689506531, 0.0002596341073513031, 0.0002675056457519531]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 6.0, 8.0, 13.0, 23.0, 48.0, 135.0, 350.0, 985.0, 6291.0, 838940.0, 197064.0, 3487.0, 771.0, 242.0, 95.0, 48.0, 19.0, 17.0, 7.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.203125, -4.082611083984375, -3.96209716796875, -3.841583251953125, -3.7210693359375, -3.600555419921875, -3.48004150390625, -3.359527587890625, -3.239013671875, -3.118499755859375, -2.99798583984375, -2.877471923828125, -2.7569580078125, -2.636444091796875, -2.51593017578125, -2.395416259765625, -2.27490234375, -2.154388427734375, -2.03387451171875, -1.913360595703125, -1.7928466796875, -1.672332763671875, -1.55181884765625, -1.431304931640625, -1.310791015625, -1.190277099609375, -1.06976318359375, -0.949249267578125, -0.8287353515625, -0.708221435546875, -0.58770751953125, -0.467193603515625, -0.3466796875, -0.226165771484375, -0.10565185546875, 0.014862060546875, 0.1353759765625, 0.255889892578125, 0.37640380859375, 0.496917724609375, 0.617431640625, 0.737945556640625, 0.85845947265625, 0.978973388671875, 1.0994873046875, 1.220001220703125, 1.34051513671875, 1.461029052734375, 1.58154296875, 1.702056884765625, 1.82257080078125, 1.943084716796875, 2.0635986328125, 2.184112548828125, 2.30462646484375, 2.425140380859375, 2.545654296875, 2.666168212890625, 2.78668212890625, 2.907196044921875, 3.0277099609375, 3.148223876953125, 3.26873779296875, 3.389251708984375, 3.509765625]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 3.0, 4.0, 12.0, 9.0, 25.0, 26.0, 81.0, 94.0, 275.0, 190.0, 111.0, 62.0, 44.0, 27.0, 17.0, 14.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.77099609375, -0.7412796020507812, -0.7115631103515625, -0.6818466186523438, -0.652130126953125, -0.6224136352539062, -0.5926971435546875, -0.5629806518554688, -0.53326416015625, -0.5035476684570312, -0.4738311767578125, -0.44411468505859375, -0.414398193359375, -0.38468170166015625, -0.3549652099609375, -0.32524871826171875, -0.2955322265625, -0.26581573486328125, -0.2360992431640625, -0.20638275146484375, -0.176666259765625, -0.14694976806640625, -0.1172332763671875, -0.08751678466796875, -0.05780029296875, -0.02808380126953125, 0.0016326904296875, 0.03134918212890625, 0.061065673828125, 0.09078216552734375, 0.1204986572265625, 0.15021514892578125, 0.179931640625, 0.20964813232421875, 0.2393646240234375, 0.26908111572265625, 0.298797607421875, 0.32851409912109375, 0.3582305908203125, 0.38794708251953125, 0.41766357421875, 0.44738006591796875, 0.4770965576171875, 0.5068130493164062, 0.536529541015625, 0.5662460327148438, 0.5959625244140625, 0.6256790161132812, 0.6553955078125, 0.6851119995117188, 0.7148284912109375, 0.7445449829101562, 0.774261474609375, 0.8039779663085938, 0.8336944580078125, 0.8634109497070312, 0.89312744140625, 0.9228439331054688, 0.9525604248046875, 0.9822769165039062, 1.011993408203125, 1.0417098999023438, 1.0714263916015625, 1.1011428833007812, 1.130859375]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 8.0, 36.0, 80.0, 134.0, 195.0, 209.0, 186.0, 84.0, 41.0, 23.0, 8.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.748982906341553, -6.381380558013916, -6.013778209686279, -5.646175861358643, -5.278573513031006, -4.910971164703369, -4.543368339538574, -4.1757659912109375, -3.80816388130188, -3.440561532974243, -3.0729591846466064, -2.7053565979003906, -2.337754249572754, -1.9701520204544067, -1.6025495529174805, -1.2349472045898438, -0.867344856262207, -0.4997424781322479, -0.13214010000228882, 0.23546230792999268, 0.6030646562576294, 0.9706670045852661, 1.3382694721221924, 1.705871820449829, 2.073474168777466, 2.4410765171051025, 2.8086788654327393, 3.176281452178955, 3.543883800506592, 3.9114861488342285, 4.279088497161865, 4.646690845489502, 5.0142927169799805, 5.381895065307617, 5.749497413635254, 6.117099761962891, 6.484702110290527, 6.852304458618164, 7.219906806945801, 7.5875091552734375, 7.955111503601074, 8.322713851928711, 8.690316200256348, 9.057918548583984, 9.425520896911621, 9.793123245239258, 10.160725593566895, 10.528327941894531, 10.895931243896484, 11.263533592224121, 11.631135940551758, 11.998738288879395, 12.366340637207031, 12.733942985534668, 13.101545333862305, 13.469147682189941, 13.836750030517578, 14.204352378845215, 14.571954727172852, 14.939557075500488, 15.307159423828125, 15.674761772155762, 16.0423641204834, 16.40996742248535, 16.777568817138672]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 2.0, 9.0, 7.0, 8.0, 7.0, 5.0, 10.0, 9.0, 27.0, 20.0, 19.0, 22.0, 32.0, 37.0, 32.0, 26.0, 36.0, 36.0, 32.0, 40.0, 47.0, 39.0, 51.0, 44.0, 41.0, 41.0, 38.0, 36.0, 32.0, 24.0, 30.0, 25.0, 31.0, 25.0, 21.0, 15.0, 6.0, 10.0, 9.0, 7.0, 4.0, 5.0, 10.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.386319160461426, -4.2209906578063965, -4.055662155151367, -3.890333890914917, -3.725005626678467, -3.5596771240234375, -3.394348621368408, -3.229020118713379, -3.0636918544769287, -2.8983633518218994, -2.733035087585449, -2.56770658493042, -2.4023780822753906, -2.2370498180389404, -2.071721315383911, -1.9063929319381714, -1.7410645484924316, -1.575736165046692, -1.4104077816009521, -1.2450792789459229, -1.079750895500183, -0.9144225120544434, -0.7490940690040588, -0.5837656259536743, -0.41843724250793457, -0.25310882925987244, -0.0877804160118103, 0.07754799723625183, 0.24287641048431396, 0.4082047939300537, 0.5735332369804382, 0.7388616800308228, 0.9041905403137207, 1.0695189237594604, 1.2348473072052002, 1.4001758098602295, 1.5655041933059692, 1.730832576751709, 1.8961610794067383, 2.0614895820617676, 2.2268178462982178, 2.392146348953247, 2.5574746131896973, 2.7228031158447266, 2.888131618499756, 3.053459882736206, 3.2187883853912354, 3.3841166496276855, 3.549445152282715, 3.714773654937744, 3.8801019191741943, 4.0454301834106445, 4.210758686065674, 4.376087188720703, 4.541415691375732, 4.706744194030762, 4.872072219848633, 5.037400722503662, 5.202729225158691, 5.3680572509765625, 5.533385753631592, 5.698714256286621, 5.86404275894165, 6.02937126159668, 6.194699764251709]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 3.0, 1.0, 6.0, 4.0, 6.0, 7.0, 23.0, 27.0, 38.0, 47.0, 66.0, 116.0, 180.0, 266.0, 568.0, 1227.0, 2896.0, 8321.0, 32656.0, 185561.0, 1486484.0, 2105224.0, 303450.0, 49072.0, 11621.0, 3551.0, 1345.0, 645.0, 343.0, 161.0, 118.0, 88.0, 56.0, 39.0, 22.0, 10.0, 10.0, 8.0, 5.0, 5.0, 3.0, 3.0, 5.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.865234375, -2.778717041015625, -2.69219970703125, -2.605682373046875, -2.5191650390625, -2.432647705078125, -2.34613037109375, -2.259613037109375, -2.173095703125, -2.086578369140625, -2.00006103515625, -1.913543701171875, -1.8270263671875, -1.740509033203125, -1.65399169921875, -1.567474365234375, -1.48095703125, -1.394439697265625, -1.30792236328125, -1.221405029296875, -1.1348876953125, -1.048370361328125, -0.96185302734375, -0.875335693359375, -0.788818359375, -0.702301025390625, -0.61578369140625, -0.529266357421875, -0.4427490234375, -0.356231689453125, -0.26971435546875, -0.183197021484375, -0.0966796875, -0.010162353515625, 0.07635498046875, 0.162872314453125, 0.2493896484375, 0.335906982421875, 0.42242431640625, 0.508941650390625, 0.595458984375, 0.681976318359375, 0.76849365234375, 0.855010986328125, 0.9415283203125, 1.028045654296875, 1.11456298828125, 1.201080322265625, 1.28759765625, 1.374114990234375, 1.46063232421875, 1.547149658203125, 1.6336669921875, 1.720184326171875, 1.80670166015625, 1.893218994140625, 1.979736328125, 2.066253662109375, 2.15277099609375, 2.239288330078125, 2.3258056640625, 2.412322998046875, 2.49884033203125, 2.585357666015625, 2.671875]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 4.0, 3.0, 9.0, 3.0, 8.0, 18.0, 16.0, 22.0, 31.0, 34.0, 38.0, 51.0, 44.0, 47.0, 49.0, 49.0, 58.0, 51.0, 61.0, 59.0, 45.0, 59.0, 38.0, 33.0, 49.0, 31.0, 18.0, 21.0, 13.0, 12.0, 11.0, 7.0, 5.0, 2.0, 3.0, 0.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.08984375, -2.02484130859375, -1.9598388671875, -1.89483642578125, -1.829833984375, -1.76483154296875, -1.6998291015625, -1.63482666015625, -1.56982421875, -1.50482177734375, -1.4398193359375, -1.37481689453125, -1.309814453125, -1.24481201171875, -1.1798095703125, -1.11480712890625, -1.0498046875, -0.98480224609375, -0.9197998046875, -0.85479736328125, -0.789794921875, -0.72479248046875, -0.6597900390625, -0.59478759765625, -0.52978515625, -0.46478271484375, -0.3997802734375, -0.33477783203125, -0.269775390625, -0.20477294921875, -0.1397705078125, -0.07476806640625, -0.009765625, 0.05523681640625, 0.1202392578125, 0.18524169921875, 0.250244140625, 0.31524658203125, 0.3802490234375, 0.44525146484375, 0.51025390625, 0.57525634765625, 0.6402587890625, 0.70526123046875, 0.770263671875, 0.83526611328125, 0.9002685546875, 0.96527099609375, 1.0302734375, 1.09527587890625, 1.1602783203125, 1.22528076171875, 1.290283203125, 1.35528564453125, 1.4202880859375, 1.48529052734375, 1.55029296875, 1.61529541015625, 1.6802978515625, 1.74530029296875, 1.810302734375, 1.87530517578125, 1.9403076171875, 2.00531005859375, 2.0703125]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 3.0, 4.0, 6.0, 6.0, 7.0, 11.0, 20.0, 26.0, 36.0, 70.0, 141.0, 290.0, 1018.0, 5987.0, 186730.0, 3947642.0, 47880.0, 3298.0, 644.0, 219.0, 97.0, 50.0, 31.0, 23.0, 16.0, 4.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-9.2109375, -8.94281005859375, -8.6746826171875, -8.40655517578125, -8.138427734375, -7.87030029296875, -7.6021728515625, -7.33404541015625, -7.06591796875, -6.79779052734375, -6.5296630859375, -6.26153564453125, -5.993408203125, -5.72528076171875, -5.4571533203125, -5.18902587890625, -4.9208984375, -4.65277099609375, -4.3846435546875, -4.11651611328125, -3.848388671875, -3.58026123046875, -3.3121337890625, -3.04400634765625, -2.77587890625, -2.50775146484375, -2.2396240234375, -1.97149658203125, -1.703369140625, -1.43524169921875, -1.1671142578125, -0.89898681640625, -0.630859375, -0.36273193359375, -0.0946044921875, 0.17352294921875, 0.441650390625, 0.70977783203125, 0.9779052734375, 1.24603271484375, 1.51416015625, 1.78228759765625, 2.0504150390625, 2.31854248046875, 2.586669921875, 2.85479736328125, 3.1229248046875, 3.39105224609375, 3.6591796875, 3.92730712890625, 4.1954345703125, 4.46356201171875, 4.731689453125, 4.99981689453125, 5.2679443359375, 5.53607177734375, 5.80419921875, 6.07232666015625, 6.3404541015625, 6.60858154296875, 6.876708984375, 7.14483642578125, 7.4129638671875, 7.68109130859375, 7.94921875]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 6.0, 7.0, 8.0, 7.0, 11.0, 22.0, 27.0, 45.0, 81.0, 123.0, 212.0, 289.0, 486.0, 722.0, 633.0, 510.0, 318.0, 198.0, 93.0, 79.0, 56.0, 41.0, 35.0, 15.0, 11.0, 5.0, 6.0, 9.0, 4.0, 3.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1630859375, -1.1267547607421875, -1.090423583984375, -1.0540924072265625, -1.01776123046875, -0.9814300537109375, -0.945098876953125, -0.9087677001953125, -0.8724365234375, -0.8361053466796875, -0.799774169921875, -0.7634429931640625, -0.72711181640625, -0.6907806396484375, -0.654449462890625, -0.6181182861328125, -0.581787109375, -0.5454559326171875, -0.509124755859375, -0.4727935791015625, -0.43646240234375, -0.4001312255859375, -0.363800048828125, -0.3274688720703125, -0.2911376953125, -0.2548065185546875, -0.218475341796875, -0.1821441650390625, -0.14581298828125, -0.1094818115234375, -0.073150634765625, -0.0368194580078125, -0.00048828125, 0.0358428955078125, 0.072174072265625, 0.1085052490234375, 0.14483642578125, 0.1811676025390625, 0.217498779296875, 0.2538299560546875, 0.2901611328125, 0.3264923095703125, 0.362823486328125, 0.3991546630859375, 0.43548583984375, 0.4718170166015625, 0.508148193359375, 0.5444793701171875, 0.580810546875, 0.6171417236328125, 0.653472900390625, 0.6898040771484375, 0.72613525390625, 0.7624664306640625, 0.798797607421875, 0.8351287841796875, 0.8714599609375, 0.9077911376953125, 0.944122314453125, 0.9804534912109375, 1.01678466796875, 1.0531158447265625, 1.089447021484375, 1.1257781982421875, 1.162109375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 8.0, 10.0, 19.0, 11.0, 21.0, 37.0, 38.0, 62.0, 64.0, 72.0, 94.0, 79.0, 91.0, 89.0, 65.0, 64.0, 50.0, 43.0, 36.0, 19.0, 16.0, 12.0, 2.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-5.423590183258057, -5.30781888961792, -5.192047595977783, -5.076275825500488, -4.960504531860352, -4.844733238220215, -4.728961944580078, -4.613190650939941, -4.497419357299805, -4.381648063659668, -4.265876770019531, -4.1501054763793945, -4.0343337059021, -3.918562412261963, -3.802791118621826, -3.6870198249816895, -3.5712482929229736, -3.455476999282837, -3.339705467224121, -3.2239341735839844, -3.1081628799438477, -2.992391586303711, -2.876620054244995, -2.7608487606048584, -2.6450772285461426, -2.529305934906006, -2.41353440284729, -2.2977631092071533, -2.1819918155670166, -2.066220283508301, -1.950448989868164, -1.8346776962280273, -1.7189065217971802, -1.603135108947754, -1.4873638153076172, -1.371592402458191, -1.2558209896087646, -1.140049695968628, -1.0242782831192017, -0.9085069298744202, -0.7927355766296387, -0.6769642233848572, -0.5611928701400757, -0.4454214572906494, -0.3296501040458679, -0.21387875080108643, -0.09810733795166016, 0.017664015293121338, 0.13343536853790283, 0.24920673668384552, 0.3649781048297882, 0.4807494878768921, 0.5965208411216736, 0.7122921943664551, 0.8280636072158813, 0.9438349604606628, 1.0596063137054443, 1.1753777265548706, 1.2911490201950073, 1.4069204330444336, 1.5226917266845703, 1.6384631395339966, 1.7542345523834229, 1.8700058460235596, 1.9857772588729858]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 6.0, 12.0, 7.0, 7.0, 15.0, 14.0, 19.0, 15.0, 17.0, 24.0, 19.0, 40.0, 31.0, 25.0, 56.0, 42.0, 44.0, 53.0, 35.0, 44.0, 37.0, 43.0, 38.0, 38.0, 38.0, 39.0, 35.0, 32.0, 30.0, 23.0, 23.0, 16.0, 17.0, 20.0, 12.0, 13.0, 5.0, 7.0, 2.0, 2.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.040525436401367, -1.977013349533081, -1.9135013818740845, -1.849989414215088, -1.7864773273468018, -1.7229652404785156, -1.659453272819519, -1.5959413051605225, -1.5324292182922363, -1.4689171314239502, -1.4054051637649536, -1.341893196105957, -1.278381109237671, -1.2148690223693848, -1.1513570547103882, -1.0878450870513916, -1.0243330001831055, -0.9608209729194641, -0.8973089456558228, -0.8337969183921814, -0.77028489112854, -0.7067728638648987, -0.6432608366012573, -0.579748809337616, -0.5162367820739746, -0.45272475481033325, -0.3892127275466919, -0.32570070028305054, -0.2621886730194092, -0.19867664575576782, -0.13516461849212646, -0.07165259122848511, -0.00814056396484375, 0.05537146329879761, 0.11888349056243896, 0.18239551782608032, 0.24590754508972168, 0.30941957235336304, 0.3729315996170044, 0.43644362688064575, 0.4999556541442871, 0.5634676814079285, 0.6269797086715698, 0.6904917359352112, 0.7540037631988525, 0.8175157904624939, 0.8810278177261353, 0.9445398449897766, 1.008051872253418, 1.071563959121704, 1.1350759267807007, 1.1985878944396973, 1.2620999813079834, 1.3256120681762695, 1.3891240358352661, 1.4526360034942627, 1.5161480903625488, 1.579660177230835, 1.6431721448898315, 1.7066841125488281, 1.7701961994171143, 1.8337082862854004, 1.897220253944397, 1.9607322216033936, 2.0242443084716797]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 0.0, 2.0, 7.0, 6.0, 5.0, 9.0, 14.0, 23.0, 33.0, 52.0, 68.0, 121.0, 143.0, 282.0, 594.0, 1190.0, 3126.0, 8625.0, 29007.0, 102518.0, 300760.0, 376551.0, 158284.0, 45782.0, 13447.0, 4431.0, 1794.0, 723.0, 371.0, 192.0, 147.0, 73.0, 59.0, 43.0, 21.0, 19.0, 14.0, 8.0, 4.0, 5.0, 0.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.455322265625, -0.4385719299316406, -0.42182159423828125, -0.4050712585449219, -0.3883209228515625, -0.3715705871582031, -0.35482025146484375, -0.3380699157714844, -0.321319580078125, -0.3045692443847656, -0.28781890869140625, -0.2710685729980469, -0.2543182373046875, -0.23756790161132812, -0.22081756591796875, -0.20406723022460938, -0.18731689453125, -0.17056655883789062, -0.15381622314453125, -0.13706588745117188, -0.1203155517578125, -0.10356521606445312, -0.08681488037109375, -0.07006454467773438, -0.053314208984375, -0.036563873291015625, -0.01981353759765625, -0.003063201904296875, 0.0136871337890625, 0.030437469482421875, 0.04718780517578125, 0.06393814086914062, 0.0806884765625, 0.09743881225585938, 0.11418914794921875, 0.13093948364257812, 0.1476898193359375, 0.16444015502929688, 0.18119049072265625, 0.19794082641601562, 0.214691162109375, 0.23144149780273438, 0.24819183349609375, 0.2649421691894531, 0.2816925048828125, 0.2984428405761719, 0.31519317626953125, 0.3319435119628906, 0.34869384765625, 0.3654441833496094, 0.38219451904296875, 0.3989448547363281, 0.4156951904296875, 0.4324455261230469, 0.44919586181640625, 0.4659461975097656, 0.482696533203125, 0.4994468688964844, 0.5161972045898438, 0.5329475402832031, 0.5496978759765625, 0.5664482116699219, 0.5831985473632812, 0.5999488830566406, 0.61669921875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 4.0, 3.0, 6.0, 10.0, 18.0, 16.0, 15.0, 22.0, 19.0, 32.0, 34.0, 47.0, 50.0, 41.0, 45.0, 66.0, 56.0, 48.0, 55.0, 52.0, 51.0, 47.0, 43.0, 37.0, 35.0, 26.0, 26.0, 17.0, 18.0, 20.0, 16.0, 8.0, 7.0, 2.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2578125, -1.2117919921875, -1.165771484375, -1.1197509765625, -1.07373046875, -1.0277099609375, -0.981689453125, -0.9356689453125, -0.8896484375, -0.8436279296875, -0.797607421875, -0.7515869140625, -0.70556640625, -0.6595458984375, -0.613525390625, -0.5675048828125, -0.521484375, -0.4754638671875, -0.429443359375, -0.3834228515625, -0.33740234375, -0.2913818359375, -0.245361328125, -0.1993408203125, -0.1533203125, -0.1072998046875, -0.061279296875, -0.0152587890625, 0.03076171875, 0.0767822265625, 0.122802734375, 0.1688232421875, 0.21484375, 0.2608642578125, 0.306884765625, 0.3529052734375, 0.39892578125, 0.4449462890625, 0.490966796875, 0.5369873046875, 0.5830078125, 0.6290283203125, 0.675048828125, 0.7210693359375, 0.76708984375, 0.8131103515625, 0.859130859375, 0.9051513671875, 0.951171875, 0.9971923828125, 1.043212890625, 1.0892333984375, 1.13525390625, 1.1812744140625, 1.227294921875, 1.2733154296875, 1.3193359375, 1.3653564453125, 1.411376953125, 1.4573974609375, 1.50341796875, 1.5494384765625, 1.595458984375, 1.6414794921875, 1.6875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 7.0, 7.0, 4.0, 10.0, 7.0, 17.0, 25.0, 55.0, 79.0, 143.0, 321.0, 621.0, 1369.0, 3162.0, 7242.0, 16803.0, 39330.0, 88686.0, 178670.0, 268726.0, 224052.0, 120951.0, 56029.0, 24308.0, 10087.0, 4269.0, 1859.0, 883.0, 409.0, 179.0, 95.0, 57.0, 32.0, 22.0, 18.0, 11.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.298828125, -0.2899627685546875, -0.281097412109375, -0.2722320556640625, -0.26336669921875, -0.2545013427734375, -0.245635986328125, -0.2367706298828125, -0.2279052734375, -0.2190399169921875, -0.210174560546875, -0.2013092041015625, -0.19244384765625, -0.1835784912109375, -0.174713134765625, -0.1658477783203125, -0.156982421875, -0.1481170654296875, -0.139251708984375, -0.1303863525390625, -0.12152099609375, -0.1126556396484375, -0.103790283203125, -0.0949249267578125, -0.0860595703125, -0.0771942138671875, -0.068328857421875, -0.0594635009765625, -0.05059814453125, -0.0417327880859375, -0.032867431640625, -0.0240020751953125, -0.01513671875, -0.0062713623046875, 0.002593994140625, 0.0114593505859375, 0.02032470703125, 0.0291900634765625, 0.038055419921875, 0.0469207763671875, 0.0557861328125, 0.0646514892578125, 0.073516845703125, 0.0823822021484375, 0.09124755859375, 0.1001129150390625, 0.108978271484375, 0.1178436279296875, 0.126708984375, 0.1355743408203125, 0.144439697265625, 0.1533050537109375, 0.16217041015625, 0.1710357666015625, 0.179901123046875, 0.1887664794921875, 0.1976318359375, 0.2064971923828125, 0.215362548828125, 0.2242279052734375, 0.23309326171875, 0.2419586181640625, 0.250823974609375, 0.2596893310546875, 0.2685546875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 6.0, 10.0, 6.0, 10.0, 10.0, 13.0, 9.0, 19.0, 21.0, 24.0, 45.0, 46.0, 50.0, 50.0, 52.0, 48.0, 50.0, 65.0, 57.0, 58.0, 46.0, 49.0, 38.0, 41.0, 44.0, 24.0, 18.0, 19.0, 16.0, 20.0, 6.0, 8.0, 7.0, 2.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.291015625, -3.200286865234375, -3.10955810546875, -3.018829345703125, -2.9281005859375, -2.837371826171875, -2.74664306640625, -2.655914306640625, -2.565185546875, -2.474456787109375, -2.38372802734375, -2.292999267578125, -2.2022705078125, -2.111541748046875, -2.02081298828125, -1.930084228515625, -1.83935546875, -1.748626708984375, -1.65789794921875, -1.567169189453125, -1.4764404296875, -1.385711669921875, -1.29498291015625, -1.204254150390625, -1.113525390625, -1.022796630859375, -0.93206787109375, -0.841339111328125, -0.7506103515625, -0.659881591796875, -0.56915283203125, -0.478424072265625, -0.3876953125, -0.296966552734375, -0.20623779296875, -0.115509033203125, -0.0247802734375, 0.065948486328125, 0.15667724609375, 0.247406005859375, 0.338134765625, 0.428863525390625, 0.51959228515625, 0.610321044921875, 0.7010498046875, 0.791778564453125, 0.88250732421875, 0.973236083984375, 1.06396484375, 1.154693603515625, 1.24542236328125, 1.336151123046875, 1.4268798828125, 1.517608642578125, 1.60833740234375, 1.699066162109375, 1.789794921875, 1.880523681640625, 1.97125244140625, 2.061981201171875, 2.1527099609375, 2.243438720703125, 2.33416748046875, 2.424896240234375, 2.515625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 5.0, 13.0, 17.0, 14.0, 35.0, 50.0, 69.0, 130.0, 279.0, 533.0, 1243.0, 3502.0, 13485.0, 83604.0, 588421.0, 307376.0, 38151.0, 7538.0, 2298.0, 903.0, 369.0, 207.0, 107.0, 96.0, 42.0, 16.0, 11.0, 11.0, 12.0, 5.0, 3.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.2020263671875, -0.19653701782226562, -0.19104766845703125, -0.18555831909179688, -0.1800689697265625, -0.17457962036132812, -0.16909027099609375, -0.16360092163085938, -0.158111572265625, -0.15262222290039062, -0.14713287353515625, -0.14164352416992188, -0.1361541748046875, -0.13066482543945312, -0.12517547607421875, -0.11968612670898438, -0.11419677734375, -0.10870742797851562, -0.10321807861328125, -0.09772872924804688, -0.0922393798828125, -0.08675003051757812, -0.08126068115234375, -0.07577133178710938, -0.070281982421875, -0.06479263305664062, -0.05930328369140625, -0.053813934326171875, -0.0483245849609375, -0.042835235595703125, -0.03734588623046875, -0.031856536865234375, -0.0263671875, -0.020877838134765625, -0.01538848876953125, -0.009899139404296875, -0.0044097900390625, 0.001079559326171875, 0.00656890869140625, 0.012058258056640625, 0.017547607421875, 0.023036956787109375, 0.02852630615234375, 0.034015655517578125, 0.0395050048828125, 0.044994354248046875, 0.05048370361328125, 0.055973052978515625, 0.06146240234375, 0.06695175170898438, 0.07244110107421875, 0.07793045043945312, 0.0834197998046875, 0.08890914916992188, 0.09439849853515625, 0.09988784790039062, 0.105377197265625, 0.11086654663085938, 0.11635589599609375, 0.12184524536132812, 0.1273345947265625, 0.13282394409179688, 0.13831329345703125, 0.14380264282226562, 0.1492919921875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 4.0, 4.0, 11.0, 9.0, 8.0, 16.0, 18.0, 24.0, 41.0, 35.0, 59.0, 52.0, 61.0, 61.0, 72.0, 88.0, 61.0, 79.0, 57.0, 49.0, 33.0, 22.0, 26.0, 31.0, 14.0, 20.0, 9.0, 7.0, 8.0, 2.0, 3.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.6253204345703125e-05, -4.474259912967682e-05, -4.323199391365051e-05, -4.1721388697624207e-05, -4.02107834815979e-05, -3.8700178265571594e-05, -3.718957304954529e-05, -3.567896783351898e-05, -3.4168362617492676e-05, -3.265775740146637e-05, -3.1147152185440063e-05, -2.9636546969413757e-05, -2.812594175338745e-05, -2.6615336537361145e-05, -2.510473132133484e-05, -2.3594126105308533e-05, -2.2083520889282227e-05, -2.057291567325592e-05, -1.9062310457229614e-05, -1.7551705241203308e-05, -1.6041100025177002e-05, -1.4530494809150696e-05, -1.301988959312439e-05, -1.1509284377098083e-05, -9.998679161071777e-06, -8.488073945045471e-06, -6.977468729019165e-06, -5.466863512992859e-06, -3.956258296966553e-06, -2.4456530809402466e-06, -9.350478649139404e-07, 5.755573511123657e-07, 2.086162567138672e-06, 3.596767783164978e-06, 5.107372999191284e-06, 6.61797821521759e-06, 8.128583431243896e-06, 9.639188647270203e-06, 1.1149793863296509e-05, 1.2660399079322815e-05, 1.4171004295349121e-05, 1.5681609511375427e-05, 1.7192214727401733e-05, 1.870281994342804e-05, 2.0213425159454346e-05, 2.1724030375480652e-05, 2.3234635591506958e-05, 2.4745240807533264e-05, 2.625584602355957e-05, 2.7766451239585876e-05, 2.9277056455612183e-05, 3.078766167163849e-05, 3.2298266887664795e-05, 3.38088721036911e-05, 3.531947731971741e-05, 3.683008253574371e-05, 3.834068775177002e-05, 3.9851292967796326e-05, 4.136189818382263e-05, 4.287250339984894e-05, 4.4383108615875244e-05, 4.589371383190155e-05, 4.7404319047927856e-05, 4.891492426395416e-05, 5.042552947998047e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 6.0, 10.0, 7.0, 14.0, 18.0, 26.0, 34.0, 58.0, 67.0, 131.0, 196.0, 319.0, 627.0, 1210.0, 2511.0, 5883.0, 15274.0, 45725.0, 174186.0, 514333.0, 206467.0, 52394.0, 16792.0, 6458.0, 2840.0, 1346.0, 666.0, 335.0, 209.0, 138.0, 68.0, 45.0, 43.0, 29.0, 31.0, 14.0, 7.0, 6.0, 7.0, 9.0, 5.0, 6.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.17236328125, -0.1676483154296875, -0.162933349609375, -0.1582183837890625, -0.15350341796875, -0.1487884521484375, -0.144073486328125, -0.1393585205078125, -0.1346435546875, -0.1299285888671875, -0.125213623046875, -0.1204986572265625, -0.11578369140625, -0.1110687255859375, -0.106353759765625, -0.1016387939453125, -0.096923828125, -0.0922088623046875, -0.087493896484375, -0.0827789306640625, -0.07806396484375, -0.0733489990234375, -0.068634033203125, -0.0639190673828125, -0.0592041015625, -0.0544891357421875, -0.049774169921875, -0.0450592041015625, -0.04034423828125, -0.0356292724609375, -0.030914306640625, -0.0261993408203125, -0.021484375, -0.0167694091796875, -0.012054443359375, -0.0073394775390625, -0.00262451171875, 0.0020904541015625, 0.006805419921875, 0.0115203857421875, 0.0162353515625, 0.0209503173828125, 0.025665283203125, 0.0303802490234375, 0.03509521484375, 0.0398101806640625, 0.044525146484375, 0.0492401123046875, 0.053955078125, 0.0586700439453125, 0.063385009765625, 0.0680999755859375, 0.07281494140625, 0.0775299072265625, 0.082244873046875, 0.0869598388671875, 0.0916748046875, 0.0963897705078125, 0.101104736328125, 0.1058197021484375, 0.11053466796875, 0.1152496337890625, 0.119964599609375, 0.1246795654296875, 0.12939453125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 1.0, 4.0, 9.0, 4.0, 8.0, 9.0, 10.0, 12.0, 26.0, 27.0, 29.0, 66.0, 102.0, 109.0, 127.0, 97.0, 105.0, 72.0, 50.0, 28.0, 24.0, 23.0, 18.0, 10.0, 8.0, 7.0, 6.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.036651611328125, -0.03532838821411133, -0.034005165100097656, -0.032681941986083984, -0.03135871887207031, -0.03003549575805664, -0.02871227264404297, -0.027389049530029297, -0.026065826416015625, -0.024742603302001953, -0.02341938018798828, -0.02209615707397461, -0.020772933959960938, -0.019449710845947266, -0.018126487731933594, -0.016803264617919922, -0.01548004150390625, -0.014156818389892578, -0.012833595275878906, -0.011510372161865234, -0.010187149047851562, -0.00886392593383789, -0.007540702819824219, -0.006217479705810547, -0.004894256591796875, -0.003571033477783203, -0.0022478103637695312, -0.0009245872497558594, 0.0003986358642578125, 0.0017218589782714844, 0.0030450820922851562, 0.004368305206298828, 0.0056915283203125, 0.007014751434326172, 0.008337974548339844, 0.009661197662353516, 0.010984420776367188, 0.01230764389038086, 0.013630867004394531, 0.014954090118408203, 0.016277313232421875, 0.017600536346435547, 0.01892375946044922, 0.02024698257446289, 0.021570205688476562, 0.022893428802490234, 0.024216651916503906, 0.025539875030517578, 0.02686309814453125, 0.028186321258544922, 0.029509544372558594, 0.030832767486572266, 0.03215599060058594, 0.03347921371459961, 0.03480243682861328, 0.03612565994262695, 0.037448883056640625, 0.0387721061706543, 0.04009532928466797, 0.04141855239868164, 0.04274177551269531, 0.044064998626708984, 0.045388221740722656, 0.04671144485473633, 0.04803466796875]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 11.0, 16.0, 21.0, 33.0, 48.0, 53.0, 68.0, 82.0, 99.0, 79.0, 119.0, 89.0, 82.0, 65.0, 55.0, 25.0, 22.0, 18.0, 8.0, 6.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.6389849185943604, -2.5651090145111084, -2.4912331104278564, -2.4173572063446045, -2.3434813022613525, -2.2696056365966797, -2.1957297325134277, -2.121853828430176, -2.047977924346924, -1.9741020202636719, -1.90022611618042, -1.826350212097168, -1.7524744272232056, -1.6785985231399536, -1.6047226190567017, -1.5308468341827393, -1.4569708108901978, -1.3830949068069458, -1.3092190027236938, -1.2353432178497314, -1.1614673137664795, -1.0875914096832275, -1.0137155055999756, -0.9398396611213684, -0.8659637570381165, -0.7920878529548645, -0.7182120084762573, -0.6443361043930054, -0.5704602003097534, -0.49658435583114624, -0.4227084517478943, -0.3488326072692871, -0.27495670318603516, -0.2010808289051056, -0.12720493972301483, -0.05332905054092407, 0.020546823740005493, 0.09442269802093506, 0.168298602104187, 0.2421744465827942, 0.31605035066604614, 0.3899262249469757, 0.4638020992279053, 0.5376780033111572, 0.6115539073944092, 0.6854297518730164, 0.7593056559562683, 0.8331815004348755, 0.9070574045181274, 0.9809333086013794, 1.0548092126846313, 1.1286849975585938, 1.2025609016418457, 1.2764368057250977, 1.3503127098083496, 1.4241886138916016, 1.4980645179748535, 1.5719404220581055, 1.6458163261413574, 1.7196922302246094, 1.7935680150985718, 1.8674439191818237, 1.9413198232650757, 2.015195608139038, 2.08907151222229]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 0.0, 1.0, 5.0, 1.0, 10.0, 8.0, 16.0, 8.0, 16.0, 19.0, 19.0, 19.0, 18.0, 32.0, 45.0, 37.0, 50.0, 46.0, 55.0, 51.0, 40.0, 56.0, 34.0, 50.0, 46.0, 45.0, 31.0, 44.0, 38.0, 30.0, 27.0, 20.0, 19.0, 17.0, 17.0, 9.0, 11.0, 3.0, 4.0, 2.0, 2.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.1370736360549927, -1.0966190099716187, -1.0561643838882446, -1.0157097578048706, -0.9752551317214966, -0.9348005056381226, -0.8943458199501038, -0.8538911938667297, -0.8134365677833557, -0.7729819416999817, -0.7325273156166077, -0.6920726895332336, -0.6516180038452148, -0.6111633777618408, -0.5707087516784668, -0.5302541255950928, -0.48979949951171875, -0.4493448734283447, -0.4088902473449707, -0.3684355914592743, -0.32798096537590027, -0.28752633929252625, -0.24707169830799103, -0.2066170573234558, -0.1661624312400818, -0.12570780515670776, -0.08525316417217255, -0.044798530638217926, -0.004343897104263306, 0.03611072897911072, 0.07656536996364594, 0.11702001094818115, 0.15747475624084473, 0.19792938232421875, 0.23838402330875397, 0.2788386642932892, 0.3192932903766632, 0.35974791646003723, 0.40020257234573364, 0.44065719842910767, 0.4811118245124817, 0.5215664505958557, 0.5620210766792297, 0.6024757027626038, 0.6429303884506226, 0.6833850145339966, 0.7238396406173706, 0.7642942667007446, 0.8047488927841187, 0.8452035188674927, 0.8856581449508667, 0.9261127710342407, 0.9665673971176147, 1.0070220232009888, 1.0474766492843628, 1.0879313945770264, 1.1283860206604004, 1.1688406467437744, 1.2092952728271484, 1.2497498989105225, 1.2902045249938965, 1.3306591510772705, 1.3711137771606445, 1.4115684032440186, 1.4520230293273926]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 4.0, 5.0, 13.0, 10.0, 14.0, 27.0, 44.0, 39.0, 52.0, 80.0, 139.0, 186.0, 291.0, 543.0, 978.0, 1823.0, 3865.0, 8047.0, 17563.0, 40214.0, 96479.0, 259826.0, 362289.0, 149591.0, 58670.0, 25368.0, 11291.0, 5376.0, 2560.0, 1270.0, 736.0, 424.0, 245.0, 144.0, 96.0, 73.0, 51.0, 32.0, 25.0, 16.0, 11.0, 11.0, 6.0, 6.0, 11.0, 5.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.49609375, -1.4449005126953125, -1.393707275390625, -1.3425140380859375, -1.29132080078125, -1.2401275634765625, -1.188934326171875, -1.1377410888671875, -1.0865478515625, -1.0353546142578125, -0.984161376953125, -0.9329681396484375, -0.88177490234375, -0.8305816650390625, -0.779388427734375, -0.7281951904296875, -0.677001953125, -0.6258087158203125, -0.574615478515625, -0.5234222412109375, -0.47222900390625, -0.4210357666015625, -0.369842529296875, -0.3186492919921875, -0.2674560546875, -0.2162628173828125, -0.165069580078125, -0.1138763427734375, -0.06268310546875, -0.0114898681640625, 0.039703369140625, 0.0908966064453125, 0.14208984375, 0.1932830810546875, 0.244476318359375, 0.2956695556640625, 0.34686279296875, 0.3980560302734375, 0.449249267578125, 0.5004425048828125, 0.5516357421875, 0.6028289794921875, 0.654022216796875, 0.7052154541015625, 0.75640869140625, 0.8076019287109375, 0.858795166015625, 0.9099884033203125, 0.961181640625, 1.0123748779296875, 1.063568115234375, 1.1147613525390625, 1.16595458984375, 1.2171478271484375, 1.268341064453125, 1.3195343017578125, 1.3707275390625, 1.4219207763671875, 1.473114013671875, 1.5243072509765625, 1.57550048828125, 1.6266937255859375, 1.677886962890625, 1.7290802001953125, 1.7802734375]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 5.0, 0.0, 1.0, 3.0, 3.0, 8.0, 17.0, 15.0, 14.0, 11.0, 19.0, 29.0, 26.0, 36.0, 38.0, 30.0, 52.0, 42.0, 46.0, 57.0, 41.0, 54.0, 55.0, 40.0, 48.0, 47.0, 39.0, 41.0, 36.0, 27.0, 19.0, 28.0, 25.0, 10.0, 9.0, 4.0, 9.0, 8.0, 5.0, 5.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3359375, -2.25286865234375, -2.1697998046875, -2.08673095703125, -2.003662109375, -1.92059326171875, -1.8375244140625, -1.75445556640625, -1.67138671875, -1.58831787109375, -1.5052490234375, -1.42218017578125, -1.339111328125, -1.25604248046875, -1.1729736328125, -1.08990478515625, -1.0068359375, -0.92376708984375, -0.8406982421875, -0.75762939453125, -0.674560546875, -0.59149169921875, -0.5084228515625, -0.42535400390625, -0.34228515625, -0.25921630859375, -0.1761474609375, -0.09307861328125, -0.010009765625, 0.07305908203125, 0.1561279296875, 0.23919677734375, 0.322265625, 0.40533447265625, 0.4884033203125, 0.57147216796875, 0.654541015625, 0.73760986328125, 0.8206787109375, 0.90374755859375, 0.98681640625, 1.06988525390625, 1.1529541015625, 1.23602294921875, 1.319091796875, 1.40216064453125, 1.4852294921875, 1.56829833984375, 1.6513671875, 1.73443603515625, 1.8175048828125, 1.90057373046875, 1.983642578125, 2.06671142578125, 2.1497802734375, 2.23284912109375, 2.31591796875, 2.39898681640625, 2.4820556640625, 2.56512451171875, 2.648193359375, 2.73126220703125, 2.8143310546875, 2.89739990234375, 2.98046875]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 8.0, 6.0, 7.0, 13.0, 14.0, 26.0, 19.0, 55.0, 72.0, 119.0, 202.0, 445.0, 1081.0, 3596.0, 21069.0, 207134.0, 710047.0, 90017.0, 10814.0, 2220.0, 772.0, 334.0, 173.0, 101.0, 73.0, 45.0, 23.0, 15.0, 11.0, 7.0, 8.0, 9.0, 4.0, 5.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.11328125, -3.9776611328125, -3.842041015625, -3.7064208984375, -3.57080078125, -3.4351806640625, -3.299560546875, -3.1639404296875, -3.0283203125, -2.8927001953125, -2.757080078125, -2.6214599609375, -2.48583984375, -2.3502197265625, -2.214599609375, -2.0789794921875, -1.943359375, -1.8077392578125, -1.672119140625, -1.5364990234375, -1.40087890625, -1.2652587890625, -1.129638671875, -0.9940185546875, -0.8583984375, -0.7227783203125, -0.587158203125, -0.4515380859375, -0.31591796875, -0.1802978515625, -0.044677734375, 0.0909423828125, 0.2265625, 0.3621826171875, 0.497802734375, 0.6334228515625, 0.76904296875, 0.9046630859375, 1.040283203125, 1.1759033203125, 1.3115234375, 1.4471435546875, 1.582763671875, 1.7183837890625, 1.85400390625, 1.9896240234375, 2.125244140625, 2.2608642578125, 2.396484375, 2.5321044921875, 2.667724609375, 2.8033447265625, 2.93896484375, 3.0745849609375, 3.210205078125, 3.3458251953125, 3.4814453125, 3.6170654296875, 3.752685546875, 3.8883056640625, 4.02392578125, 4.1595458984375, 4.295166015625, 4.4307861328125, 4.56640625]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 5.0, 7.0, 3.0, 8.0, 20.0, 14.0, 15.0, 28.0, 25.0, 43.0, 47.0, 48.0, 52.0, 62.0, 56.0, 71.0, 69.0, 68.0, 53.0, 48.0, 40.0, 48.0, 29.0, 30.0, 22.0, 19.0, 18.0, 15.0, 11.0, 13.0, 5.0, 6.0, 4.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.337890625, -3.222869873046875, -3.10784912109375, -2.992828369140625, -2.8778076171875, -2.762786865234375, -2.64776611328125, -2.532745361328125, -2.417724609375, -2.302703857421875, -2.18768310546875, -2.072662353515625, -1.9576416015625, -1.842620849609375, -1.72760009765625, -1.612579345703125, -1.49755859375, -1.382537841796875, -1.26751708984375, -1.152496337890625, -1.0374755859375, -0.922454833984375, -0.80743408203125, -0.692413330078125, -0.577392578125, -0.462371826171875, -0.34735107421875, -0.232330322265625, -0.1173095703125, -0.002288818359375, 0.11273193359375, 0.227752685546875, 0.3427734375, 0.457794189453125, 0.57281494140625, 0.687835693359375, 0.8028564453125, 0.917877197265625, 1.03289794921875, 1.147918701171875, 1.262939453125, 1.377960205078125, 1.49298095703125, 1.608001708984375, 1.7230224609375, 1.838043212890625, 1.95306396484375, 2.068084716796875, 2.18310546875, 2.298126220703125, 2.41314697265625, 2.528167724609375, 2.6431884765625, 2.758209228515625, 2.87322998046875, 2.988250732421875, 3.103271484375, 3.218292236328125, 3.33331298828125, 3.448333740234375, 3.5633544921875, 3.678375244140625, 3.79339599609375, 3.908416748046875, 4.0234375]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 4.0, 2.0, 5.0, 5.0, 11.0, 15.0, 29.0, 54.0, 104.0, 216.0, 544.0, 1404.0, 4249.0, 21788.0, 220218.0, 712976.0, 73006.0, 9796.0, 2548.0, 903.0, 365.0, 146.0, 69.0, 45.0, 19.0, 12.0, 8.0, 4.0, 6.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.521484375, -1.4743499755859375, -1.427215576171875, -1.3800811767578125, -1.33294677734375, -1.2858123779296875, -1.238677978515625, -1.1915435791015625, -1.1444091796875, -1.0972747802734375, -1.050140380859375, -1.0030059814453125, -0.95587158203125, -0.9087371826171875, -0.861602783203125, -0.8144683837890625, -0.767333984375, -0.7201995849609375, -0.673065185546875, -0.6259307861328125, -0.57879638671875, -0.5316619873046875, -0.484527587890625, -0.4373931884765625, -0.3902587890625, -0.3431243896484375, -0.295989990234375, -0.2488555908203125, -0.20172119140625, -0.1545867919921875, -0.107452392578125, -0.0603179931640625, -0.01318359375, 0.0339508056640625, 0.081085205078125, 0.1282196044921875, 0.17535400390625, 0.2224884033203125, 0.269622802734375, 0.3167572021484375, 0.3638916015625, 0.4110260009765625, 0.458160400390625, 0.5052947998046875, 0.55242919921875, 0.5995635986328125, 0.646697998046875, 0.6938323974609375, 0.740966796875, 0.7881011962890625, 0.835235595703125, 0.8823699951171875, 0.92950439453125, 0.9766387939453125, 1.023773193359375, 1.0709075927734375, 1.1180419921875, 1.1651763916015625, 1.212310791015625, 1.2594451904296875, 1.30657958984375, 1.3537139892578125, 1.400848388671875, 1.4479827880859375, 1.4951171875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 7.0, 8.0, 8.0, 15.0, 12.0, 21.0, 32.0, 44.0, 53.0, 74.0, 115.0, 140.0, 142.0, 98.0, 51.0, 54.0, 42.0, 27.0, 14.0, 14.0, 10.0, 2.0, 8.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0002415180206298828, -0.00023513101041316986, -0.0002287440001964569, -0.00022235698997974396, -0.000215969979763031, -0.00020958296954631805, -0.0002031959593296051, -0.00019680894911289215, -0.0001904219388961792, -0.00018403492867946625, -0.0001776479184627533, -0.00017126090824604034, -0.0001648738980293274, -0.00015848688781261444, -0.0001520998775959015, -0.00014571286737918854, -0.00013932585716247559, -0.00013293884694576263, -0.00012655183672904968, -0.00012016482651233673, -0.00011377781629562378, -0.00010739080607891083, -0.00010100379586219788, -9.461678564548492e-05, -8.822977542877197e-05, -8.184276521205902e-05, -7.545575499534607e-05, -6.906874477863312e-05, -6.268173456192017e-05, -5.6294724345207214e-05, -4.990771412849426e-05, -4.352070391178131e-05, -3.713369369506836e-05, -3.074668347835541e-05, -2.4359673261642456e-05, -1.7972663044929504e-05, -1.1585652828216553e-05, -5.198642611503601e-06, 1.1883676052093506e-06, 7.575377821922302e-06, 1.3962388038635254e-05, 2.0349398255348206e-05, 2.6736408472061157e-05, 3.312341868877411e-05, 3.951042890548706e-05, 4.589743912220001e-05, 5.2284449338912964e-05, 5.8671459555625916e-05, 6.505846977233887e-05, 7.144547998905182e-05, 7.783249020576477e-05, 8.421950042247772e-05, 9.060651063919067e-05, 9.699352085590363e-05, 0.00010338053107261658, 0.00010976754128932953, 0.00011615455150604248, 0.00012254156172275543, 0.00012892857193946838, 0.00013531558215618134, 0.0001417025923728943, 0.00014808960258960724, 0.0001544766128063202, 0.00016086362302303314, 0.0001672506332397461]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 9.0, 8.0, 4.0, 11.0, 15.0, 24.0, 34.0, 53.0, 125.0, 230.0, 534.0, 1162.0, 3042.0, 8827.0, 38550.0, 291922.0, 596845.0, 84103.0, 15326.0, 4516.0, 1751.0, 725.0, 339.0, 163.0, 94.0, 39.0, 23.0, 21.0, 15.0, 11.0, 6.0, 6.0, 4.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.265625, -1.2222900390625, -1.178955078125, -1.1356201171875, -1.09228515625, -1.0489501953125, -1.005615234375, -0.9622802734375, -0.9189453125, -0.8756103515625, -0.832275390625, -0.7889404296875, -0.74560546875, -0.7022705078125, -0.658935546875, -0.6156005859375, -0.572265625, -0.5289306640625, -0.485595703125, -0.4422607421875, -0.39892578125, -0.3555908203125, -0.312255859375, -0.2689208984375, -0.2255859375, -0.1822509765625, -0.138916015625, -0.0955810546875, -0.05224609375, -0.0089111328125, 0.034423828125, 0.0777587890625, 0.12109375, 0.1644287109375, 0.207763671875, 0.2510986328125, 0.29443359375, 0.3377685546875, 0.381103515625, 0.4244384765625, 0.4677734375, 0.5111083984375, 0.554443359375, 0.5977783203125, 0.64111328125, 0.6844482421875, 0.727783203125, 0.7711181640625, 0.814453125, 0.8577880859375, 0.901123046875, 0.9444580078125, 0.98779296875, 1.0311279296875, 1.074462890625, 1.1177978515625, 1.1611328125, 1.2044677734375, 1.247802734375, 1.2911376953125, 1.33447265625, 1.3778076171875, 1.421142578125, 1.4644775390625, 1.5078125]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 4.0, 4.0, 4.0, 9.0, 2.0, 4.0, 8.0, 12.0, 10.0, 13.0, 14.0, 17.0, 24.0, 42.0, 38.0, 55.0, 62.0, 70.0, 64.0, 85.0, 67.0, 79.0, 65.0, 55.0, 47.0, 24.0, 24.0, 22.0, 17.0, 13.0, 13.0, 9.0, 7.0, 6.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.469970703125, -0.4574317932128906, -0.44489288330078125, -0.4323539733886719, -0.4198150634765625, -0.4072761535644531, -0.39473724365234375, -0.3821983337402344, -0.369659423828125, -0.3571205139160156, -0.34458160400390625, -0.3320426940917969, -0.3195037841796875, -0.3069648742675781, -0.29442596435546875, -0.2818870544433594, -0.26934814453125, -0.2568092346191406, -0.24427032470703125, -0.23173141479492188, -0.2191925048828125, -0.20665359497070312, -0.19411468505859375, -0.18157577514648438, -0.169036865234375, -0.15649795532226562, -0.14395904541015625, -0.13142013549804688, -0.1188812255859375, -0.10634231567382812, -0.09380340576171875, -0.08126449584960938, -0.0687255859375, -0.056186676025390625, -0.04364776611328125, -0.031108856201171875, -0.0185699462890625, -0.006031036376953125, 0.00650787353515625, 0.019046783447265625, 0.031585693359375, 0.044124603271484375, 0.05666351318359375, 0.06920242309570312, 0.0817413330078125, 0.09428024291992188, 0.10681915283203125, 0.11935806274414062, 0.13189697265625, 0.14443588256835938, 0.15697479248046875, 0.16951370239257812, 0.1820526123046875, 0.19459152221679688, 0.20713043212890625, 0.21966934204101562, 0.232208251953125, 0.24474716186523438, 0.25728607177734375, 0.2698249816894531, 0.2823638916015625, 0.2949028015136719, 0.30744171142578125, 0.3199806213378906, 0.33251953125]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 16.0, 31.0, 91.0, 145.0, 213.0, 230.0, 155.0, 81.0, 26.0, 16.0, 4.0, 2.0, 0.0, 1.0, 1.0], "bins": [-20.0159912109375, -19.64496421813965, -19.273935317993164, -18.902908325195312, -18.53188133239746, -18.160852432250977, -17.789825439453125, -17.418798446655273, -17.047771453857422, -16.67674446105957, -16.305715560913086, -15.934688568115234, -15.563661575317383, -15.192633628845215, -14.821605682373047, -14.450578689575195, -14.079549789428711, -13.708521842956543, -13.337494850158691, -12.966466903686523, -12.595439910888672, -12.224411964416504, -11.853384017944336, -11.482357025146484, -11.111329078674316, -10.740301132202148, -10.369274139404297, -9.998246192932129, -9.627218246459961, -9.25619125366211, -8.885163307189941, -8.514135360717773, -8.143108367919922, -7.772080898284912, -7.401053428649902, -7.030025482177734, -6.658998012542725, -6.287970542907715, -5.916942596435547, -5.545915126800537, -5.174887657165527, -4.803860187530518, -4.432832717895508, -4.06180477142334, -3.69077730178833, -3.3197498321533203, -2.9487221240997314, -2.5776944160461426, -2.206666946411133, -1.8356393575668335, -1.4646117687225342, -1.0935841798782349, -0.7225565910339355, -0.35152900218963623, 0.019498586654663086, 0.39052629470825195, 0.7615537643432617, 1.132581353187561, 1.5036089420318604, 1.8746365308761597, 2.245664119720459, 2.6166915893554688, 2.9877192974090576, 3.3587470054626465, 3.7297744750976562]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 6.0, 6.0, 13.0, 17.0, 8.0, 24.0, 19.0, 26.0, 29.0, 28.0, 29.0, 34.0, 36.0, 43.0, 51.0, 50.0, 42.0, 61.0, 44.0, 41.0, 40.0, 49.0, 33.0, 33.0, 38.0, 41.0, 29.0, 12.0, 22.0, 30.0, 20.0, 12.0, 10.0, 8.0, 5.0, 1.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-5.846386909484863, -5.69079065322876, -5.5351948738098145, -5.379598617553711, -5.224002361297607, -5.068406105041504, -4.912810325622559, -4.757214069366455, -4.601617813110352, -4.446021556854248, -4.290425777435303, -4.134829521179199, -3.9792332649230957, -3.8236372470855713, -3.668041229248047, -3.5124449729919434, -3.356848955154419, -3.2012529373168945, -3.045656681060791, -2.8900606632232666, -2.734464406967163, -2.5788683891296387, -2.423272132873535, -2.2676761150360107, -2.1120800971984863, -1.9564839601516724, -1.8008878231048584, -1.645291805267334, -1.4896955490112305, -1.334099531173706, -1.178503394126892, -1.0229072570800781, -0.8673110008239746, -0.7117148637771606, -0.5561187267303467, -0.4005226492881775, -0.24492651224136353, -0.08933037519454956, 0.06626570224761963, 0.2218618392944336, 0.37745797634124756, 0.5330541133880615, 0.6886502504348755, 0.8442463278770447, 0.9998424649238586, 1.1554386615753174, 1.3110346794128418, 1.4666308164596558, 1.6222269535064697, 1.7778230905532837, 1.9334192276000977, 2.089015245437622, 2.2446115016937256, 2.40020751953125, 2.5558037757873535, 2.711399793624878, 2.8669958114624023, 3.0225918292999268, 3.1781880855560303, 3.3337841033935547, 3.489380359649658, 3.6449763774871826, 3.800572395324707, 3.9561686515808105, 4.111764907836914]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 2.0, 1.0, 2.0, 10.0, 13.0, 16.0, 17.0, 24.0, 29.0, 40.0, 74.0, 91.0, 152.0, 273.0, 576.0, 1469.0, 5580.0, 28837.0, 251990.0, 2618530.0, 1179338.0, 89945.0, 12849.0, 2643.0, 854.0, 381.0, 191.0, 103.0, 62.0, 42.0, 49.0, 24.0, 22.0, 15.0, 8.0, 10.0, 6.0, 8.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-3.791015625, -3.678802490234375, -3.56658935546875, -3.454376220703125, -3.3421630859375, -3.229949951171875, -3.11773681640625, -3.005523681640625, -2.893310546875, -2.781097412109375, -2.66888427734375, -2.556671142578125, -2.4444580078125, -2.332244873046875, -2.22003173828125, -2.107818603515625, -1.99560546875, -1.883392333984375, -1.77117919921875, -1.658966064453125, -1.5467529296875, -1.434539794921875, -1.32232666015625, -1.210113525390625, -1.097900390625, -0.985687255859375, -0.87347412109375, -0.761260986328125, -0.6490478515625, -0.536834716796875, -0.42462158203125, -0.312408447265625, -0.2001953125, -0.087982177734375, 0.02423095703125, 0.136444091796875, 0.2486572265625, 0.360870361328125, 0.47308349609375, 0.585296630859375, 0.697509765625, 0.809722900390625, 0.92193603515625, 1.034149169921875, 1.1463623046875, 1.258575439453125, 1.37078857421875, 1.483001708984375, 1.59521484375, 1.707427978515625, 1.81964111328125, 1.931854248046875, 2.0440673828125, 2.156280517578125, 2.26849365234375, 2.380706787109375, 2.492919921875, 2.605133056640625, 2.71734619140625, 2.829559326171875, 2.9417724609375, 3.053985595703125, 3.16619873046875, 3.278411865234375, 3.390625]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 5.0, 8.0, 11.0, 14.0, 13.0, 16.0, 30.0, 27.0, 39.0, 42.0, 42.0, 53.0, 63.0, 58.0, 46.0, 66.0, 67.0, 55.0, 52.0, 55.0, 41.0, 38.0, 30.0, 30.0, 26.0, 18.0, 15.0, 17.0, 9.0, 7.0, 5.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3916015625, -1.3347320556640625, -1.277862548828125, -1.2209930419921875, -1.16412353515625, -1.1072540283203125, -1.050384521484375, -0.9935150146484375, -0.9366455078125, -0.8797760009765625, -0.822906494140625, -0.7660369873046875, -0.70916748046875, -0.6522979736328125, -0.595428466796875, -0.5385589599609375, -0.481689453125, -0.4248199462890625, -0.367950439453125, -0.3110809326171875, -0.25421142578125, -0.1973419189453125, -0.140472412109375, -0.0836029052734375, -0.0267333984375, 0.0301361083984375, 0.087005615234375, 0.1438751220703125, 0.20074462890625, 0.2576141357421875, 0.314483642578125, 0.3713531494140625, 0.42822265625, 0.4850921630859375, 0.541961669921875, 0.5988311767578125, 0.65570068359375, 0.7125701904296875, 0.769439697265625, 0.8263092041015625, 0.8831787109375, 0.9400482177734375, 0.996917724609375, 1.0537872314453125, 1.11065673828125, 1.1675262451171875, 1.224395751953125, 1.2812652587890625, 1.338134765625, 1.3950042724609375, 1.451873779296875, 1.5087432861328125, 1.56561279296875, 1.6224822998046875, 1.679351806640625, 1.7362213134765625, 1.7930908203125, 1.8499603271484375, 1.906829833984375, 1.9636993408203125, 2.02056884765625, 2.0774383544921875, 2.134307861328125, 2.1911773681640625, 2.248046875]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 9.0, 7.0, 23.0, 55.0, 107.0, 417.0, 1608.0, 15174.0, 3969324.0, 202561.0, 3858.0, 787.0, 199.0, 72.0, 29.0, 19.0, 11.0, 5.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.8359375, -10.4945068359375, -10.153076171875, -9.8116455078125, -9.47021484375, -9.1287841796875, -8.787353515625, -8.4459228515625, -8.1044921875, -7.7630615234375, -7.421630859375, -7.0802001953125, -6.73876953125, -6.3973388671875, -6.055908203125, -5.7144775390625, -5.373046875, -5.0316162109375, -4.690185546875, -4.3487548828125, -4.00732421875, -3.6658935546875, -3.324462890625, -2.9830322265625, -2.6416015625, -2.3001708984375, -1.958740234375, -1.6173095703125, -1.27587890625, -0.9344482421875, -0.593017578125, -0.2515869140625, 0.08984375, 0.4312744140625, 0.772705078125, 1.1141357421875, 1.45556640625, 1.7969970703125, 2.138427734375, 2.4798583984375, 2.8212890625, 3.1627197265625, 3.504150390625, 3.8455810546875, 4.18701171875, 4.5284423828125, 4.869873046875, 5.2113037109375, 5.552734375, 5.8941650390625, 6.235595703125, 6.5770263671875, 6.91845703125, 7.2598876953125, 7.601318359375, 7.9427490234375, 8.2841796875, 8.6256103515625, 8.967041015625, 9.3084716796875, 9.64990234375, 9.9913330078125, 10.332763671875, 10.6741943359375, 11.015625]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 4.0, 5.0, 9.0, 11.0, 8.0, 28.0, 38.0, 94.0, 128.0, 201.0, 382.0, 558.0, 689.0, 709.0, 490.0, 288.0, 168.0, 101.0, 74.0, 26.0, 24.0, 15.0, 9.0, 6.0, 2.0, 2.0, 4.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3916015625, -1.3492279052734375, -1.306854248046875, -1.2644805908203125, -1.22210693359375, -1.1797332763671875, -1.137359619140625, -1.0949859619140625, -1.0526123046875, -1.0102386474609375, -0.967864990234375, -0.9254913330078125, -0.88311767578125, -0.8407440185546875, -0.798370361328125, -0.7559967041015625, -0.713623046875, -0.6712493896484375, -0.628875732421875, -0.5865020751953125, -0.54412841796875, -0.5017547607421875, -0.459381103515625, -0.4170074462890625, -0.3746337890625, -0.3322601318359375, -0.289886474609375, -0.2475128173828125, -0.20513916015625, -0.1627655029296875, -0.120391845703125, -0.0780181884765625, -0.03564453125, 0.0067291259765625, 0.049102783203125, 0.0914764404296875, 0.13385009765625, 0.1762237548828125, 0.218597412109375, 0.2609710693359375, 0.3033447265625, 0.3457183837890625, 0.388092041015625, 0.4304656982421875, 0.47283935546875, 0.5152130126953125, 0.557586669921875, 0.5999603271484375, 0.642333984375, 0.6847076416015625, 0.727081298828125, 0.7694549560546875, 0.81182861328125, 0.8542022705078125, 0.896575927734375, 0.9389495849609375, 0.9813232421875, 1.0236968994140625, 1.066070556640625, 1.1084442138671875, 1.15081787109375, 1.1931915283203125, 1.235565185546875, 1.2779388427734375, 1.3203125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 8.0, 9.0, 13.0, 14.0, 16.0, 28.0, 25.0, 34.0, 36.0, 41.0, 31.0, 44.0, 50.0, 51.0, 57.0, 66.0, 73.0, 56.0, 56.0, 43.0, 41.0, 36.0, 38.0, 23.0, 20.0, 21.0, 19.0, 13.0, 12.0, 8.0, 10.0, 4.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.906385064125061, -1.8349493741989136, -1.7635135650634766, -1.692077875137329, -1.6206421852111816, -1.5492063760757446, -1.4777706861495972, -1.4063348770141602, -1.3348991870880127, -1.2634634971618652, -1.1920276880264282, -1.1205919981002808, -1.0491561889648438, -0.9777204990386963, -0.9062848091125488, -0.8348490595817566, -0.7634133100509644, -0.6919775605201721, -0.6205418109893799, -0.5491061210632324, -0.4776703715324402, -0.40623462200164795, -0.3347989022731781, -0.26336318254470825, -0.19192743301391602, -0.12049169838428497, -0.04905596375465393, 0.022379770874977112, 0.09381550550460815, 0.1652512550354004, 0.23668697476387024, 0.3081226944923401, 0.3795585632324219, 0.4509943127632141, 0.5224300622940063, 0.5938657522201538, 0.665301501750946, 0.7367372512817383, 0.8081729412078857, 0.879608690738678, 0.9510444402694702, 1.0224801301956177, 1.0939159393310547, 1.1653516292572021, 1.2367873191833496, 1.3082231283187866, 1.379658818244934, 1.451094627380371, 1.5225303173065186, 1.593966007232666, 1.665401816368103, 1.7368375062942505, 1.8082733154296875, 1.879709005355835, 1.9511446952819824, 2.02258038520813, 2.0940160751342773, 2.165451765060425, 2.2368874549865723, 2.308323383331299, 2.3797590732574463, 2.4511947631835938, 2.522630453109741, 2.5940661430358887, 2.6655020713806152]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 7.0, 2.0, 9.0, 8.0, 15.0, 13.0, 16.0, 15.0, 25.0, 25.0, 27.0, 30.0, 33.0, 57.0, 51.0, 48.0, 55.0, 50.0, 50.0, 44.0, 39.0, 49.0, 27.0, 45.0, 36.0, 36.0, 34.0, 32.0, 25.0, 19.0, 14.0, 19.0, 10.0, 7.0, 9.0, 3.0, 7.0, 4.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9667867422103882, -1.9001915454864502, -1.8335963487625122, -1.7670011520385742, -1.7004058361053467, -1.6338107585906982, -1.5672154426574707, -1.5006202459335327, -1.4340250492095947, -1.3674298524856567, -1.3008346557617188, -1.2342394590377808, -1.1676442623138428, -1.1010489463806152, -1.0344537496566772, -0.9678585529327393, -0.9012633562088013, -0.8346681594848633, -0.7680729627609253, -0.7014777064323425, -0.6348825097084045, -0.5682873129844666, -0.5016920566558838, -0.4350968599319458, -0.3685016632080078, -0.3019064664840698, -0.23531123995780945, -0.16871602833271027, -0.10212081670761108, -0.035525619983673096, 0.03106960654258728, 0.09766483306884766, 0.1642601490020752, 0.23085536062717438, 0.29745057225227356, 0.36404579877853394, 0.4306409955024719, 0.4972361922264099, 0.5638314485549927, 0.6304266452789307, 0.6970218420028687, 0.7636170387268066, 0.8302122354507446, 0.8968074917793274, 0.9634026885032654, 1.0299978256225586, 1.0965931415557861, 1.1631883382797241, 1.229783535003662, 1.2963787317276, 1.362973928451538, 1.429569125175476, 1.496164321899414, 1.5627596378326416, 1.6293548345565796, 1.6959500312805176, 1.7625452280044556, 1.8291404247283936, 1.8957356214523315, 1.9623308181762695, 2.028926134109497, 2.0955212116241455, 2.162116527557373, 2.2287116050720215, 2.295306921005249]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 3.0, 8.0, 8.0, 12.0, 11.0, 20.0, 29.0, 30.0, 36.0, 67.0, 85.0, 115.0, 171.0, 226.0, 386.0, 715.0, 1910.0, 9943.0, 71602.0, 365747.0, 460142.0, 116285.0, 16042.0, 2762.0, 864.0, 435.0, 281.0, 161.0, 124.0, 72.0, 83.0, 46.0, 32.0, 29.0, 17.0, 14.0, 12.0, 14.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8046875, -0.7796401977539062, -0.7545928955078125, -0.7295455932617188, -0.704498291015625, -0.6794509887695312, -0.6544036865234375, -0.6293563842773438, -0.60430908203125, -0.5792617797851562, -0.5542144775390625, -0.5291671752929688, -0.504119873046875, -0.47907257080078125, -0.4540252685546875, -0.42897796630859375, -0.4039306640625, -0.37888336181640625, -0.3538360595703125, -0.32878875732421875, -0.303741455078125, -0.27869415283203125, -0.2536468505859375, -0.22859954833984375, -0.20355224609375, -0.17850494384765625, -0.1534576416015625, -0.12841033935546875, -0.103363037109375, -0.07831573486328125, -0.0532684326171875, -0.02822113037109375, -0.003173828125, 0.02187347412109375, 0.0469207763671875, 0.07196807861328125, 0.097015380859375, 0.12206268310546875, 0.1471099853515625, 0.17215728759765625, 0.19720458984375, 0.22225189208984375, 0.2472991943359375, 0.27234649658203125, 0.297393798828125, 0.32244110107421875, 0.3474884033203125, 0.37253570556640625, 0.3975830078125, 0.42263031005859375, 0.4476776123046875, 0.47272491455078125, 0.497772216796875, 0.5228195190429688, 0.5478668212890625, 0.5729141235351562, 0.59796142578125, 0.6230087280273438, 0.6480560302734375, 0.6731033325195312, 0.698150634765625, 0.7231979370117188, 0.7482452392578125, 0.7732925415039062, 0.79833984375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 3.0, 10.0, 9.0, 11.0, 15.0, 9.0, 20.0, 32.0, 21.0, 25.0, 28.0, 36.0, 45.0, 62.0, 40.0, 53.0, 52.0, 39.0, 53.0, 46.0, 42.0, 42.0, 39.0, 41.0, 32.0, 36.0, 22.0, 32.0, 23.0, 18.0, 8.0, 17.0, 12.0, 2.0, 8.0, 5.0, 3.0, 4.0, 6.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3330078125, -1.289947509765625, -1.24688720703125, -1.203826904296875, -1.1607666015625, -1.117706298828125, -1.07464599609375, -1.031585693359375, -0.988525390625, -0.945465087890625, -0.90240478515625, -0.859344482421875, -0.8162841796875, -0.773223876953125, -0.73016357421875, -0.687103271484375, -0.64404296875, -0.600982666015625, -0.55792236328125, -0.514862060546875, -0.4718017578125, -0.428741455078125, -0.38568115234375, -0.342620849609375, -0.299560546875, -0.256500244140625, -0.21343994140625, -0.170379638671875, -0.1273193359375, -0.084259033203125, -0.04119873046875, 0.001861572265625, 0.044921875, 0.087982177734375, 0.13104248046875, 0.174102783203125, 0.2171630859375, 0.260223388671875, 0.30328369140625, 0.346343994140625, 0.389404296875, 0.432464599609375, 0.47552490234375, 0.518585205078125, 0.5616455078125, 0.604705810546875, 0.64776611328125, 0.690826416015625, 0.73388671875, 0.776947021484375, 0.82000732421875, 0.863067626953125, 0.9061279296875, 0.949188232421875, 0.99224853515625, 1.035308837890625, 1.078369140625, 1.121429443359375, 1.16448974609375, 1.207550048828125, 1.2506103515625, 1.293670654296875, 1.33673095703125, 1.379791259765625, 1.4228515625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 8.0, 3.0, 11.0, 16.0, 15.0, 38.0, 58.0, 84.0, 141.0, 215.0, 350.0, 688.0, 1218.0, 2161.0, 4078.0, 7482.0, 14136.0, 25559.0, 45258.0, 76199.0, 119278.0, 160538.0, 175492.0, 151090.0, 108558.0, 67749.0, 39812.0, 22081.0, 12131.0, 6443.0, 3381.0, 1925.0, 1011.0, 564.0, 308.0, 197.0, 103.0, 62.0, 40.0, 23.0, 16.0, 13.0, 9.0, 9.0, 1.0, 6.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2398681640625, -0.23289108276367188, -0.22591400146484375, -0.21893692016601562, -0.2119598388671875, -0.20498275756835938, -0.19800567626953125, -0.19102859497070312, -0.184051513671875, -0.17707443237304688, -0.17009735107421875, -0.16312026977539062, -0.1561431884765625, -0.14916610717773438, -0.14218902587890625, -0.13521194458007812, -0.12823486328125, -0.12125778198242188, -0.11428070068359375, -0.10730361938476562, -0.1003265380859375, -0.09334945678710938, -0.08637237548828125, -0.07939529418945312, -0.072418212890625, -0.06544113159179688, -0.05846405029296875, -0.051486968994140625, -0.0445098876953125, -0.037532806396484375, -0.03055572509765625, -0.023578643798828125, -0.0166015625, -0.009624481201171875, -0.00264739990234375, 0.004329681396484375, 0.0113067626953125, 0.018283843994140625, 0.02526092529296875, 0.032238006591796875, 0.039215087890625, 0.046192169189453125, 0.05316925048828125, 0.060146331787109375, 0.0671234130859375, 0.07410049438476562, 0.08107757568359375, 0.08805465698242188, 0.09503173828125, 0.10200881958007812, 0.10898590087890625, 0.11596298217773438, 0.1229400634765625, 0.12991714477539062, 0.13689422607421875, 0.14387130737304688, 0.150848388671875, 0.15782546997070312, 0.16480255126953125, 0.17177963256835938, 0.1787567138671875, 0.18573379516601562, 0.19271087646484375, 0.19968795776367188, 0.2066650390625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 6.0, 2.0, 4.0, 2.0, 1.0, 9.0, 6.0, 9.0, 15.0, 18.0, 12.0, 25.0, 26.0, 27.0, 23.0, 23.0, 34.0, 31.0, 51.0, 44.0, 44.0, 47.0, 62.0, 44.0, 36.0, 54.0, 39.0, 49.0, 38.0, 22.0, 35.0, 20.0, 24.0, 18.0, 26.0, 16.0, 16.0, 18.0, 6.0, 8.0, 5.0, 5.0, 4.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 3.0], "bins": [-3.669921875, -3.570465087890625, -3.47100830078125, -3.371551513671875, -3.2720947265625, -3.172637939453125, -3.07318115234375, -2.973724365234375, -2.874267578125, -2.774810791015625, -2.67535400390625, -2.575897216796875, -2.4764404296875, -2.376983642578125, -2.27752685546875, -2.178070068359375, -2.07861328125, -1.979156494140625, -1.87969970703125, -1.780242919921875, -1.6807861328125, -1.581329345703125, -1.48187255859375, -1.382415771484375, -1.282958984375, -1.183502197265625, -1.08404541015625, -0.984588623046875, -0.8851318359375, -0.785675048828125, -0.68621826171875, -0.586761474609375, -0.4873046875, -0.387847900390625, -0.28839111328125, -0.188934326171875, -0.0894775390625, 0.009979248046875, 0.10943603515625, 0.208892822265625, 0.308349609375, 0.407806396484375, 0.50726318359375, 0.606719970703125, 0.7061767578125, 0.805633544921875, 0.90509033203125, 1.004547119140625, 1.10400390625, 1.203460693359375, 1.30291748046875, 1.402374267578125, 1.5018310546875, 1.601287841796875, 1.70074462890625, 1.800201416015625, 1.899658203125, 1.999114990234375, 2.09857177734375, 2.198028564453125, 2.2974853515625, 2.396942138671875, 2.49639892578125, 2.595855712890625, 2.6953125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 3.0, 6.0, 14.0, 14.0, 19.0, 32.0, 53.0, 125.0, 202.0, 321.0, 619.0, 1483.0, 4097.0, 21763.0, 285432.0, 662079.0, 60275.0, 7835.0, 2309.0, 934.0, 457.0, 222.0, 107.0, 54.0, 39.0, 23.0, 15.0, 6.0, 1.0, 7.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.3564453125, -0.3466033935546875, -0.336761474609375, -0.3269195556640625, -0.31707763671875, -0.3072357177734375, -0.297393798828125, -0.2875518798828125, -0.2777099609375, -0.2678680419921875, -0.258026123046875, -0.2481842041015625, -0.23834228515625, -0.2285003662109375, -0.218658447265625, -0.2088165283203125, -0.198974609375, -0.1891326904296875, -0.179290771484375, -0.1694488525390625, -0.15960693359375, -0.1497650146484375, -0.139923095703125, -0.1300811767578125, -0.1202392578125, -0.1103973388671875, -0.100555419921875, -0.0907135009765625, -0.08087158203125, -0.0710296630859375, -0.061187744140625, -0.0513458251953125, -0.04150390625, -0.0316619873046875, -0.021820068359375, -0.0119781494140625, -0.00213623046875, 0.0077056884765625, 0.017547607421875, 0.0273895263671875, 0.0372314453125, 0.0470733642578125, 0.056915283203125, 0.0667572021484375, 0.07659912109375, 0.0864410400390625, 0.096282958984375, 0.1061248779296875, 0.115966796875, 0.1258087158203125, 0.135650634765625, 0.1454925537109375, 0.15533447265625, 0.1651763916015625, 0.175018310546875, 0.1848602294921875, 0.1947021484375, 0.2045440673828125, 0.214385986328125, 0.2242279052734375, 0.23406982421875, 0.2439117431640625, 0.253753662109375, 0.2635955810546875, 0.2734375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 5.0, 5.0, 3.0, 3.0, 9.0, 16.0, 20.0, 28.0, 44.0, 63.0, 78.0, 81.0, 84.0, 86.0, 122.0, 93.0, 73.0, 63.0, 36.0, 36.0, 18.0, 16.0, 9.0, 4.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.0001289844512939453, -0.00012620538473129272, -0.00012342631816864014, -0.00012064725160598755, -0.00011786818504333496, -0.00011508911848068237, -0.00011231005191802979, -0.0001095309853553772, -0.00010675191879272461, -0.00010397285223007202, -0.00010119378566741943, -9.841471910476685e-05, -9.563565254211426e-05, -9.285658597946167e-05, -9.007751941680908e-05, -8.72984528541565e-05, -8.45193862915039e-05, -8.174031972885132e-05, -7.896125316619873e-05, -7.618218660354614e-05, -7.340312004089355e-05, -7.062405347824097e-05, -6.784498691558838e-05, -6.506592035293579e-05, -6.22868537902832e-05, -5.9507787227630615e-05, -5.672872066497803e-05, -5.394965410232544e-05, -5.117058753967285e-05, -4.8391520977020264e-05, -4.5612454414367676e-05, -4.283338785171509e-05, -4.00543212890625e-05, -3.727525472640991e-05, -3.4496188163757324e-05, -3.1717121601104736e-05, -2.893805503845215e-05, -2.615898847579956e-05, -2.3379921913146973e-05, -2.0600855350494385e-05, -1.7821788787841797e-05, -1.5042722225189209e-05, -1.2263655662536621e-05, -9.484589099884033e-06, -6.705522537231445e-06, -3.926455974578857e-06, -1.1473894119262695e-06, 1.6316771507263184e-06, 4.410743713378906e-06, 7.189810276031494e-06, 9.968876838684082e-06, 1.274794340133667e-05, 1.5527009963989258e-05, 1.8306076526641846e-05, 2.1085143089294434e-05, 2.386420965194702e-05, 2.664327621459961e-05, 2.9422342777252197e-05, 3.2201409339904785e-05, 3.498047590255737e-05, 3.775954246520996e-05, 4.053860902786255e-05, 4.331767559051514e-05, 4.6096742153167725e-05, 4.887580871582031e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 5.0, 3.0, 5.0, 12.0, 14.0, 26.0, 20.0, 30.0, 40.0, 51.0, 80.0, 127.0, 161.0, 272.0, 453.0, 728.0, 1314.0, 2554.0, 5177.0, 10612.0, 23390.0, 55728.0, 147592.0, 368378.0, 266296.0, 94650.0, 37809.0, 16354.0, 7731.0, 3858.0, 2016.0, 1112.0, 704.0, 413.0, 261.0, 175.0, 115.0, 91.0, 62.0, 38.0, 33.0, 16.0, 15.0, 13.0, 9.0, 4.0, 4.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.180419921875, -0.1752338409423828, -0.17004776000976562, -0.16486167907714844, -0.15967559814453125, -0.15448951721191406, -0.14930343627929688, -0.1441173553466797, -0.1389312744140625, -0.1337451934814453, -0.12855911254882812, -0.12337303161621094, -0.11818695068359375, -0.11300086975097656, -0.10781478881835938, -0.10262870788574219, -0.097442626953125, -0.09225654602050781, -0.08707046508789062, -0.08188438415527344, -0.07669830322265625, -0.07151222229003906, -0.06632614135742188, -0.06114006042480469, -0.0559539794921875, -0.05076789855957031, -0.045581817626953125, -0.04039573669433594, -0.03520965576171875, -0.030023574829101562, -0.024837493896484375, -0.019651412963867188, -0.01446533203125, -0.009279251098632812, -0.004093170166015625, 0.0010929107666015625, 0.00627899169921875, 0.011465072631835938, 0.016651153564453125, 0.021837234497070312, 0.0270233154296875, 0.03220939636230469, 0.037395477294921875, 0.04258155822753906, 0.04776763916015625, 0.05295372009277344, 0.058139801025390625, 0.06332588195800781, 0.068511962890625, 0.07369804382324219, 0.07888412475585938, 0.08407020568847656, 0.08925628662109375, 0.09444236755371094, 0.09962844848632812, 0.10481452941894531, 0.1100006103515625, 0.11518669128417969, 0.12037277221679688, 0.12555885314941406, 0.13074493408203125, 0.13593101501464844, 0.14111709594726562, 0.1463031768798828, 0.1514892578125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 6.0, 7.0, 6.0, 5.0, 5.0, 8.0, 10.0, 14.0, 20.0, 21.0, 19.0, 24.0, 25.0, 35.0, 50.0, 57.0, 81.0, 67.0, 84.0, 94.0, 71.0, 43.0, 44.0, 39.0, 20.0, 30.0, 21.0, 21.0, 13.0, 7.0, 13.0, 8.0, 13.0, 7.0, 5.0, 1.0, 3.0, 4.0, 1.0, 1.0, 6.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.05023193359375, -0.04827690124511719, -0.046321868896484375, -0.04436683654785156, -0.04241180419921875, -0.04045677185058594, -0.038501739501953125, -0.03654670715332031, -0.0345916748046875, -0.03263664245605469, -0.030681610107421875, -0.028726577758789062, -0.02677154541015625, -0.024816513061523438, -0.022861480712890625, -0.020906448364257812, -0.018951416015625, -0.016996383666992188, -0.015041351318359375, -0.013086318969726562, -0.01113128662109375, -0.009176254272460938, -0.007221221923828125, -0.0052661895751953125, -0.0033111572265625, -0.0013561248779296875, 0.000598907470703125, 0.0025539398193359375, 0.00450897216796875, 0.0064640045166015625, 0.008419036865234375, 0.010374069213867188, 0.0123291015625, 0.014284133911132812, 0.016239166259765625, 0.018194198608398438, 0.02014923095703125, 0.022104263305664062, 0.024059295654296875, 0.026014328002929688, 0.0279693603515625, 0.029924392700195312, 0.031879425048828125, 0.03383445739746094, 0.03578948974609375, 0.03774452209472656, 0.039699554443359375, 0.04165458679199219, 0.043609619140625, 0.04556465148925781, 0.047519683837890625, 0.04947471618652344, 0.05142974853515625, 0.05338478088378906, 0.055339813232421875, 0.05729484558105469, 0.0592498779296875, 0.06120491027832031, 0.06315994262695312, 0.06511497497558594, 0.06707000732421875, 0.06902503967285156, 0.07098007202148438, 0.07293510437011719, 0.07489013671875]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 10.0, 5.0, 17.0, 30.0, 40.0, 47.0, 49.0, 70.0, 77.0, 82.0, 102.0, 112.0, 89.0, 69.0, 61.0, 44.0, 31.0, 27.0, 16.0, 12.0, 9.0, 9.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.2007575035095215, -2.1314151287078857, -2.062072515487671, -1.9927300214767456, -1.9233875274658203, -1.8540451526641846, -1.7847026586532593, -1.715360164642334, -1.6460176706314087, -1.5766751766204834, -1.507332682609558, -1.4379901885986328, -1.368647813796997, -1.2993052005767822, -1.2299628257751465, -1.1606203317642212, -1.091277837753296, -1.0219353437423706, -0.9525928497314453, -0.8832504153251648, -0.8139079213142395, -0.7445654273033142, -0.6752229928970337, -0.6058804988861084, -0.5365380048751831, -0.4671955108642578, -0.3978530466556549, -0.328510582447052, -0.2591680884361267, -0.18982559442520142, -0.12048313021659851, -0.051140666007995605, 0.018201589584350586, 0.08754406869411469, 0.15688654780387878, 0.22622902691364288, 0.295571506023407, 0.3649140000343323, 0.4342564642429352, 0.5035989284515381, 0.5729414224624634, 0.6422839164733887, 0.711626410484314, 0.7809688448905945, 0.8503113389015198, 0.9196538329124451, 0.9889962673187256, 1.0583387613296509, 1.1276812553405762, 1.1970237493515015, 1.2663662433624268, 1.335708737373352, 1.4050512313842773, 1.474393606185913, 1.5437361001968384, 1.6130785942077637, 1.682421088218689, 1.7517635822296143, 1.8211060762405396, 1.8904485702514648, 1.9597909450531006, 2.0291335582733154, 2.098475933074951, 2.167818546295166, 2.2371609210968018]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 9.0, 8.0, 7.0, 8.0, 13.0, 10.0, 21.0, 20.0, 28.0, 25.0, 35.0, 37.0, 31.0, 47.0, 43.0, 51.0, 55.0, 64.0, 38.0, 46.0, 48.0, 41.0, 39.0, 40.0, 24.0, 45.0, 28.0, 35.0, 19.0, 20.0, 10.0, 17.0, 9.0, 6.0, 8.0, 2.0, 5.0, 3.0, 4.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2035744190216064, -1.1631237268447876, -1.1226730346679688, -1.0822222232818604, -1.0417715311050415, -1.0013208389282227, -0.9608701467514038, -0.9204193949699402, -0.8799686431884766, -0.8395179510116577, -0.7990671992301941, -0.7586165070533752, -0.7181657552719116, -0.6777150630950928, -0.6372643709182739, -0.5968136191368103, -0.5563629269599915, -0.5159122347831726, -0.475461483001709, -0.43501079082489014, -0.3945600390434265, -0.35410934686660767, -0.31365862488746643, -0.2732079029083252, -0.23275718092918396, -0.19230645895004272, -0.1518557369709015, -0.11140502989292145, -0.07095430791378021, -0.030503585934638977, 0.009947121143341064, 0.0503978431224823, 0.09084856510162354, 0.13129928708076477, 0.171750009059906, 0.21220071613788605, 0.2526514530181885, 0.2931021451950073, 0.33355286717414856, 0.3740035891532898, 0.41445431113243103, 0.45490503311157227, 0.4953557550907135, 0.5358064770698547, 0.5762571692466736, 0.6167079210281372, 0.657158613204956, 0.6976093053817749, 0.7380600571632385, 0.7785107493400574, 0.818961501121521, 0.8594121932983398, 0.8998629450798035, 0.9403136372566223, 0.9807643890380859, 1.0212150812149048, 1.0616657733917236, 1.1021164655685425, 1.1425671577453613, 1.1830179691314697, 1.2234686613082886, 1.2639193534851074, 1.3043700456619263, 1.3448207378387451, 1.3852715492248535]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 6.0, 5.0, 10.0, 14.0, 17.0, 26.0, 36.0, 34.0, 50.0, 88.0, 142.0, 178.0, 248.0, 432.0, 785.0, 1532.0, 2908.0, 6152.0, 13912.0, 31817.0, 74644.0, 157924.0, 257753.0, 243782.0, 140816.0, 64595.0, 27409.0, 12193.0, 5215.0, 2603.0, 1293.0, 698.0, 395.0, 291.0, 176.0, 98.0, 66.0, 60.0, 46.0, 22.0, 22.0, 15.0, 14.0, 9.0, 11.0, 5.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-1.7646484375, -1.7075653076171875, -1.650482177734375, -1.5933990478515625, -1.53631591796875, -1.4792327880859375, -1.422149658203125, -1.3650665283203125, -1.3079833984375, -1.2509002685546875, -1.193817138671875, -1.1367340087890625, -1.07965087890625, -1.0225677490234375, -0.965484619140625, -0.9084014892578125, -0.851318359375, -0.7942352294921875, -0.737152099609375, -0.6800689697265625, -0.62298583984375, -0.5659027099609375, -0.508819580078125, -0.4517364501953125, -0.3946533203125, -0.3375701904296875, -0.280487060546875, -0.2234039306640625, -0.16632080078125, -0.1092376708984375, -0.052154541015625, 0.0049285888671875, 0.06201171875, 0.1190948486328125, 0.176177978515625, 0.2332611083984375, 0.29034423828125, 0.3474273681640625, 0.404510498046875, 0.4615936279296875, 0.5186767578125, 0.5757598876953125, 0.632843017578125, 0.6899261474609375, 0.74700927734375, 0.8040924072265625, 0.861175537109375, 0.9182586669921875, 0.975341796875, 1.0324249267578125, 1.089508056640625, 1.1465911865234375, 1.20367431640625, 1.2607574462890625, 1.317840576171875, 1.3749237060546875, 1.4320068359375, 1.4890899658203125, 1.546173095703125, 1.6032562255859375, 1.66033935546875, 1.7174224853515625, 1.774505615234375, 1.8315887451171875, 1.888671875]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 4.0, 5.0, 8.0, 5.0, 4.0, 6.0, 9.0, 13.0, 19.0, 15.0, 16.0, 22.0, 23.0, 27.0, 28.0, 49.0, 40.0, 52.0, 45.0, 46.0, 45.0, 43.0, 44.0, 43.0, 44.0, 53.0, 36.0, 34.0, 33.0, 34.0, 34.0, 27.0, 18.0, 19.0, 12.0, 10.0, 10.0, 8.0, 6.0, 3.0, 5.0, 8.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.013671875, -1.94561767578125, -1.8775634765625, -1.80950927734375, -1.741455078125, -1.67340087890625, -1.6053466796875, -1.53729248046875, -1.46923828125, -1.40118408203125, -1.3331298828125, -1.26507568359375, -1.197021484375, -1.12896728515625, -1.0609130859375, -0.99285888671875, -0.9248046875, -0.85675048828125, -0.7886962890625, -0.72064208984375, -0.652587890625, -0.58453369140625, -0.5164794921875, -0.44842529296875, -0.38037109375, -0.31231689453125, -0.2442626953125, -0.17620849609375, -0.108154296875, -0.04010009765625, 0.0279541015625, 0.09600830078125, 0.1640625, 0.23211669921875, 0.3001708984375, 0.36822509765625, 0.436279296875, 0.50433349609375, 0.5723876953125, 0.64044189453125, 0.70849609375, 0.77655029296875, 0.8446044921875, 0.91265869140625, 0.980712890625, 1.04876708984375, 1.1168212890625, 1.18487548828125, 1.2529296875, 1.32098388671875, 1.3890380859375, 1.45709228515625, 1.525146484375, 1.59320068359375, 1.6612548828125, 1.72930908203125, 1.79736328125, 1.86541748046875, 1.9334716796875, 2.00152587890625, 2.069580078125, 2.13763427734375, 2.2056884765625, 2.27374267578125, 2.341796875]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 6.0, 3.0, 6.0, 13.0, 5.0, 8.0, 15.0, 22.0, 36.0, 39.0, 76.0, 101.0, 145.0, 170.0, 290.0, 469.0, 764.0, 1428.0, 2767.0, 6105.0, 15479.0, 41232.0, 113805.0, 270560.0, 326952.0, 166923.0, 61738.0, 22641.0, 8605.0, 3706.0, 1794.0, 995.0, 569.0, 362.0, 215.0, 140.0, 104.0, 79.0, 55.0, 37.0, 27.0, 16.0, 24.0, 11.0, 9.0, 4.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.544921875, -2.46588134765625, -2.3868408203125, -2.30780029296875, -2.228759765625, -2.14971923828125, -2.0706787109375, -1.99163818359375, -1.91259765625, -1.83355712890625, -1.7545166015625, -1.67547607421875, -1.596435546875, -1.51739501953125, -1.4383544921875, -1.35931396484375, -1.2802734375, -1.20123291015625, -1.1221923828125, -1.04315185546875, -0.964111328125, -0.88507080078125, -0.8060302734375, -0.72698974609375, -0.64794921875, -0.56890869140625, -0.4898681640625, -0.41082763671875, -0.331787109375, -0.25274658203125, -0.1737060546875, -0.09466552734375, -0.015625, 0.06341552734375, 0.1424560546875, 0.22149658203125, 0.300537109375, 0.37957763671875, 0.4586181640625, 0.53765869140625, 0.61669921875, 0.69573974609375, 0.7747802734375, 0.85382080078125, 0.932861328125, 1.01190185546875, 1.0909423828125, 1.16998291015625, 1.2490234375, 1.32806396484375, 1.4071044921875, 1.48614501953125, 1.565185546875, 1.64422607421875, 1.7232666015625, 1.80230712890625, 1.88134765625, 1.96038818359375, 2.0394287109375, 2.11846923828125, 2.197509765625, 2.27655029296875, 2.3555908203125, 2.43463134765625, 2.513671875]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 7.0, 4.0, 3.0, 2.0, 5.0, 1.0, 1.0, 8.0, 7.0, 12.0, 21.0, 24.0, 16.0, 22.0, 30.0, 27.0, 21.0, 35.0, 41.0, 35.0, 41.0, 44.0, 53.0, 69.0, 50.0, 43.0, 46.0, 35.0, 35.0, 39.0, 31.0, 27.0, 26.0, 29.0, 15.0, 18.0, 16.0, 14.0, 11.0, 7.0, 13.0, 6.0, 7.0, 7.0, 5.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-2.576171875, -2.49822998046875, -2.4202880859375, -2.34234619140625, -2.264404296875, -2.18646240234375, -2.1085205078125, -2.03057861328125, -1.95263671875, -1.87469482421875, -1.7967529296875, -1.71881103515625, -1.640869140625, -1.56292724609375, -1.4849853515625, -1.40704345703125, -1.3291015625, -1.25115966796875, -1.1732177734375, -1.09527587890625, -1.017333984375, -0.93939208984375, -0.8614501953125, -0.78350830078125, -0.70556640625, -0.62762451171875, -0.5496826171875, -0.47174072265625, -0.393798828125, -0.31585693359375, -0.2379150390625, -0.15997314453125, -0.08203125, -0.00408935546875, 0.0738525390625, 0.15179443359375, 0.229736328125, 0.30767822265625, 0.3856201171875, 0.46356201171875, 0.54150390625, 0.61944580078125, 0.6973876953125, 0.77532958984375, 0.853271484375, 0.93121337890625, 1.0091552734375, 1.08709716796875, 1.1650390625, 1.24298095703125, 1.3209228515625, 1.39886474609375, 1.476806640625, 1.55474853515625, 1.6326904296875, 1.71063232421875, 1.78857421875, 1.86651611328125, 1.9444580078125, 2.02239990234375, 2.100341796875, 2.17828369140625, 2.2562255859375, 2.33416748046875, 2.412109375]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 4.0, 2.0, 4.0, 0.0, 5.0, 11.0, 18.0, 18.0, 32.0, 49.0, 53.0, 91.0, 142.0, 244.0, 367.0, 565.0, 927.0, 1509.0, 2603.0, 4828.0, 9381.0, 19168.0, 41420.0, 87205.0, 168266.0, 280173.0, 209335.0, 114369.0, 55321.0, 25878.0, 12256.0, 6031.0, 3435.0, 1872.0, 1099.0, 668.0, 439.0, 260.0, 171.0, 104.0, 73.0, 49.0, 37.0, 23.0, 17.0, 21.0, 8.0, 4.0, 4.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.40673828125, -0.3925628662109375, -0.378387451171875, -0.3642120361328125, -0.35003662109375, -0.3358612060546875, -0.321685791015625, -0.3075103759765625, -0.2933349609375, -0.2791595458984375, -0.264984130859375, -0.2508087158203125, -0.23663330078125, -0.2224578857421875, -0.208282470703125, -0.1941070556640625, -0.179931640625, -0.1657562255859375, -0.151580810546875, -0.1374053955078125, -0.12322998046875, -0.1090545654296875, -0.094879150390625, -0.0807037353515625, -0.0665283203125, -0.0523529052734375, -0.038177490234375, -0.0240020751953125, -0.00982666015625, 0.0043487548828125, 0.018524169921875, 0.0326995849609375, 0.046875, 0.0610504150390625, 0.075225830078125, 0.0894012451171875, 0.10357666015625, 0.1177520751953125, 0.131927490234375, 0.1461029052734375, 0.1602783203125, 0.1744537353515625, 0.188629150390625, 0.2028045654296875, 0.21697998046875, 0.2311553955078125, 0.245330810546875, 0.2595062255859375, 0.273681640625, 0.2878570556640625, 0.302032470703125, 0.3162078857421875, 0.33038330078125, 0.3445587158203125, 0.358734130859375, 0.3729095458984375, 0.3870849609375, 0.4012603759765625, 0.415435791015625, 0.4296112060546875, 0.44378662109375, 0.4579620361328125, 0.472137451171875, 0.4863128662109375, 0.50048828125]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 8.0, 6.0, 11.0, 9.0, 15.0, 23.0, 29.0, 34.0, 53.0, 54.0, 59.0, 82.0, 93.0, 95.0, 60.0, 67.0, 60.0, 46.0, 38.0, 37.0, 36.0, 22.0, 14.0, 13.0, 10.0, 6.0, 5.0, 2.0, 5.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0001385211944580078, -0.0001342184841632843, -0.0001299157738685608, -0.00012561306357383728, -0.00012131035327911377, -0.00011700764298439026, -0.00011270493268966675, -0.00010840222239494324, -0.00010409951210021973, -9.979680180549622e-05, -9.54940915107727e-05, -9.11913812160492e-05, -8.688867092132568e-05, -8.258596062660217e-05, -7.828325033187866e-05, -7.398054003715515e-05, -6.967782974243164e-05, -6.537511944770813e-05, -6.107240915298462e-05, -5.676969885826111e-05, -5.24669885635376e-05, -4.816427826881409e-05, -4.3861567974090576e-05, -3.9558857679367065e-05, -3.5256147384643555e-05, -3.0953437089920044e-05, -2.6650726795196533e-05, -2.2348016500473022e-05, -1.8045306205749512e-05, -1.3742595911026001e-05, -9.43988561630249e-06, -5.1371753215789795e-06, -8.344650268554688e-07, 3.468245267868042e-06, 7.770955562591553e-06, 1.2073665857315063e-05, 1.6376376152038574e-05, 2.0679086446762085e-05, 2.4981796741485596e-05, 2.9284507036209106e-05, 3.358721733093262e-05, 3.788992762565613e-05, 4.219263792037964e-05, 4.649534821510315e-05, 5.079805850982666e-05, 5.510076880455017e-05, 5.940347909927368e-05, 6.370618939399719e-05, 6.80088996887207e-05, 7.231160998344421e-05, 7.661432027816772e-05, 8.091703057289124e-05, 8.521974086761475e-05, 8.952245116233826e-05, 9.382516145706177e-05, 9.812787175178528e-05, 0.00010243058204650879, 0.0001067332923412323, 0.00011103600263595581, 0.00011533871293067932, 0.00011964142322540283, 0.00012394413352012634, 0.00012824684381484985, 0.00013254955410957336, 0.00013685226440429688]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 5.0, 1.0, 10.0, 9.0, 12.0, 7.0, 19.0, 26.0, 37.0, 70.0, 79.0, 122.0, 131.0, 241.0, 326.0, 448.0, 671.0, 935.0, 1332.0, 2002.0, 3383.0, 5713.0, 10462.0, 20945.0, 45634.0, 101756.0, 204778.0, 308229.0, 176868.0, 85111.0, 38010.0, 17991.0, 9030.0, 5045.0, 3098.0, 1937.0, 1217.0, 858.0, 625.0, 446.0, 253.0, 202.0, 119.0, 104.0, 65.0, 58.0, 36.0, 33.0, 20.0, 17.0, 16.0, 10.0, 12.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0], "bins": [-0.53369140625, -0.5161285400390625, -0.498565673828125, -0.4810028076171875, -0.46343994140625, -0.4458770751953125, -0.428314208984375, -0.4107513427734375, -0.3931884765625, -0.3756256103515625, -0.358062744140625, -0.3404998779296875, -0.32293701171875, -0.3053741455078125, -0.287811279296875, -0.2702484130859375, -0.252685546875, -0.2351226806640625, -0.217559814453125, -0.1999969482421875, -0.18243408203125, -0.1648712158203125, -0.147308349609375, -0.1297454833984375, -0.1121826171875, -0.0946197509765625, -0.077056884765625, -0.0594940185546875, -0.04193115234375, -0.0243682861328125, -0.006805419921875, 0.0107574462890625, 0.0283203125, 0.0458831787109375, 0.063446044921875, 0.0810089111328125, 0.09857177734375, 0.1161346435546875, 0.133697509765625, 0.1512603759765625, 0.1688232421875, 0.1863861083984375, 0.203948974609375, 0.2215118408203125, 0.23907470703125, 0.2566375732421875, 0.274200439453125, 0.2917633056640625, 0.309326171875, 0.3268890380859375, 0.344451904296875, 0.3620147705078125, 0.37957763671875, 0.3971405029296875, 0.414703369140625, 0.4322662353515625, 0.4498291015625, 0.4673919677734375, 0.484954833984375, 0.5025177001953125, 0.52008056640625, 0.5376434326171875, 0.555206298828125, 0.5727691650390625, 0.59033203125]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 4.0, 1.0, 8.0, 5.0, 9.0, 19.0, 20.0, 32.0, 55.0, 61.0, 87.0, 99.0, 120.0, 104.0, 103.0, 71.0, 59.0, 29.0, 35.0, 20.0, 16.0, 10.0, 5.0, 6.0, 5.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.6435546875, -0.6226577758789062, -0.6017608642578125, -0.5808639526367188, -0.559967041015625, -0.5390701293945312, -0.5181732177734375, -0.49727630615234375, -0.47637939453125, -0.45548248291015625, -0.4345855712890625, -0.41368865966796875, -0.392791748046875, -0.37189483642578125, -0.3509979248046875, -0.33010101318359375, -0.3092041015625, -0.28830718994140625, -0.2674102783203125, -0.24651336669921875, -0.225616455078125, -0.20471954345703125, -0.1838226318359375, -0.16292572021484375, -0.14202880859375, -0.12113189697265625, -0.1002349853515625, -0.07933807373046875, -0.058441162109375, -0.03754425048828125, -0.0166473388671875, 0.00424957275390625, 0.025146484375, 0.04604339599609375, 0.0669403076171875, 0.08783721923828125, 0.108734130859375, 0.12963104248046875, 0.1505279541015625, 0.17142486572265625, 0.19232177734375, 0.21321868896484375, 0.2341156005859375, 0.25501251220703125, 0.275909423828125, 0.29680633544921875, 0.3177032470703125, 0.33860015869140625, 0.3594970703125, 0.38039398193359375, 0.4012908935546875, 0.42218780517578125, 0.443084716796875, 0.46398162841796875, 0.4848785400390625, 0.5057754516601562, 0.52667236328125, 0.5475692749023438, 0.5684661865234375, 0.5893630981445312, 0.610260009765625, 0.6311569213867188, 0.6520538330078125, 0.6729507446289062, 0.69384765625]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 3.0, 3.0, 6.0, 21.0, 40.0, 81.0, 117.0, 126.0, 185.0, 148.0, 107.0, 78.0, 47.0, 20.0, 10.0, 7.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.285005569458008, -7.029697895050049, -6.774389743804932, -6.519082069396973, -6.2637739181518555, -6.0084662437438965, -5.7531585693359375, -5.49785041809082, -5.242542743682861, -4.987235069274902, -4.731926918029785, -4.476619243621826, -4.221311569213867, -3.96600341796875, -3.710695743560791, -3.455387830734253, -3.200079917907715, -2.9447720050811768, -2.6894640922546387, -2.4341564178466797, -2.1788485050201416, -1.9235405921936035, -1.668232798576355, -1.4129250049591064, -1.1576170921325684, -0.902309238910675, -0.6470013856887817, -0.3916935324668884, -0.13638567924499512, 0.11892223358154297, 0.3742300271987915, 0.62953782081604, 0.8848447799682617, 1.1401526927947998, 1.3954604864120483, 1.6507682800292969, 1.906076192855835, 2.161384105682373, 2.416691780090332, 2.67199969291687, 2.927307605743408, 3.1826155185699463, 3.4379234313964844, 3.6932311058044434, 3.9485390186309814, 4.2038469314575195, 4.4591546058654785, 4.7144622802734375, 4.969770431518555, 5.225078105926514, 5.480386257171631, 5.73569393157959, 5.991002082824707, 6.246309757232666, 6.501617431640625, 6.756925582885742, 7.012233257293701, 7.26754093170166, 7.522849082946777, 7.778156757354736, 8.033464431762695, 8.288772583007812, 8.54408073425293, 8.79938793182373, 9.054696083068848]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 6.0, 13.0, 5.0, 4.0, 13.0, 14.0, 12.0, 15.0, 24.0, 24.0, 16.0, 17.0, 33.0, 20.0, 27.0, 26.0, 44.0, 47.0, 41.0, 40.0, 37.0, 31.0, 35.0, 38.0, 46.0, 37.0, 37.0, 35.0, 27.0, 28.0, 20.0, 24.0, 26.0, 21.0, 14.0, 18.0, 13.0, 12.0, 11.0, 9.0, 11.0, 9.0, 6.0, 4.0, 3.0, 2.0, 1.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0], "bins": [-3.366345167160034, -3.260174512863159, -3.154003858566284, -3.047833204269409, -2.941662549972534, -2.835491895675659, -2.729321002960205, -2.62315034866333, -2.516979694366455, -2.41080904006958, -2.304638385772705, -2.19846773147583, -2.092297077178955, -1.98612642288208, -1.8799556493759155, -1.7737849950790405, -1.667614459991455, -1.56144380569458, -1.455273151397705, -1.34910249710083, -1.242931842803955, -1.13676118850708, -1.0305904150009155, -0.9244197607040405, -0.8182491064071655, -0.7120784521102905, -0.6059077978134155, -0.49973708391189575, -0.39356642961502075, -0.28739577531814575, -0.18122506141662598, -0.07505440711975098, 0.031116247177124023, 0.13728691637516022, 0.2434575855731964, 0.3496282696723938, 0.4557989239692688, 0.5619695782661438, 0.6681402921676636, 0.7743109464645386, 0.8804816007614136, 0.9866522550582886, 1.0928229093551636, 1.1989936828613281, 1.3051643371582031, 1.4113349914550781, 1.5175056457519531, 1.6236763000488281, 1.7298469543457031, 1.8360176086425781, 1.9421882629394531, 2.048358917236328, 2.154529571533203, 2.260700225830078, 2.366870880126953, 2.473041534423828, 2.579212188720703, 2.685382843017578, 2.791553497314453, 2.897724151611328, 3.003894805908203, 3.110065460205078, 3.216236114501953, 3.322406768798828, 3.4285776615142822]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 11.0, 10.0, 13.0, 14.0, 31.0, 38.0, 43.0, 64.0, 64.0, 114.0, 167.0, 229.0, 319.0, 431.0, 599.0, 917.0, 1168.0, 1654.0, 2193.0, 2835.0, 3676.0, 6302.0, 1011250.0, 5148.0, 3358.0, 2514.0, 2022.0, 1480.0, 1071.0, 770.0, 586.0, 400.0, 307.0, 243.0, 185.0, 113.0, 83.0, 51.0, 47.0, 25.0, 16.0, 11.0, 11.0, 4.0, 7.0, 3.0, 7.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.26330828666687, -3.1592674255371094, -3.0552265644073486, -2.951185703277588, -2.847144603729248, -2.7431039810180664, -2.6390628814697266, -2.535022020339966, -2.430981159210205, -2.3269402980804443, -2.2228994369506836, -2.118858575820923, -2.014817714691162, -1.9107767343521118, -1.8067357540130615, -1.7026948928833008, -1.59865403175354, -1.4946131706237793, -1.3905723094940186, -1.2865313291549683, -1.1824904680252075, -1.0784496068954468, -0.9744086861610413, -0.8703677654266357, -0.766326904296875, -0.6622860431671143, -0.5582451224327087, -0.4542042315006256, -0.3501633405685425, -0.24612247943878174, -0.14208155870437622, -0.0380406379699707, 0.06599998474121094, 0.17004087567329407, 0.2740817666053772, 0.3781226575374603, 0.48216354846954346, 0.5862044095993042, 0.6902453303337097, 0.7942862510681152, 0.898327112197876, 1.0023679733276367, 1.1064088344573975, 1.2104498147964478, 1.3144906759262085, 1.4185315370559692, 1.5225725173950195, 1.6266133785247803, 1.730654239654541, 1.8346951007843018, 1.9387359619140625, 2.0427768230438232, 2.146817684173584, 2.250858783721924, 2.3548996448516846, 2.4589405059814453, 2.562981367111206, 2.667022228240967, 2.7710630893707275, 2.8751039505004883, 2.979145050048828, 3.0831856727600098, 3.1872267723083496, 3.2912676334381104, 3.395308494567871]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 5.0, 5.0, 13.0, 23.0, 140.0, 170.0, 749.0, 8554.0, 51386280.0, 71409.0, 3279.0, 414.0, 154.0, 77.0, 36.0, 24.0, 14.0, 3.0, 6.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.0625, -32.083946228027344, -31.105396270751953, -30.12684440612793, -29.148292541503906, -28.16973876953125, -27.191186904907227, -26.212635040283203, -25.23408317565918, -24.255531311035156, -23.276979446411133, -22.29842758178711, -21.319873809814453, -20.341323852539062, -19.362770080566406, -18.384218215942383, -17.40566635131836, -16.427114486694336, -15.448562622070312, -14.470009803771973, -13.49145793914795, -12.512906074523926, -11.534353256225586, -10.555801391601562, -9.577249526977539, -8.598697662353516, -7.620145320892334, -6.641592979431152, -5.663041114807129, -4.6844892501831055, -3.705936908721924, -2.727384567260742, -1.7488346099853516, -0.770282506942749, 0.20826959609985352, 1.186821699142456, 2.1653738021850586, 3.143925666809082, 4.122478008270264, 5.101030349731445, 6.079582214355469, 7.058134078979492, 8.036685943603516, 9.015238761901855, 9.993790626525879, 10.972342491149902, 11.950895309448242, 12.929447174072266, 13.907999038696289, 14.886550903320312, 15.865102767944336, 16.84365463256836, 17.822208404541016, 18.800758361816406, 19.779312133789062, 20.757863998413086, 21.73641586303711, 22.714967727661133, 23.693519592285156, 24.67207145690918, 25.650623321533203, 26.62917709350586, 27.607728958129883, 28.586280822753906, 29.56483268737793]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [3.0, 8.0, 3.0, 7.0, 16.0, 16.0, 27.0, 34.0, 61.0, 85.0, 150.0, 226.0, 410.0, 622.0, 914.0, 1522.0, 2483.0, 4066.0, 6650.0, 10406.0, 16729.0, 26531.0, 41004.0, 62175.0, 94163.0, 134846.0, 185562.0, 241687.0, 295806.0, 459630.0, 3334492.0, 343414.0, 280776.0, 223590.0, 168171.0, 120737.0, 82970.0, 54733.0, 35771.0, 22803.0, 14297.0, 8963.0, 5612.0, 3498.0, 2114.0, 1365.0, 823.0, 549.0, 337.0, 217.0, 135.0, 86.0, 49.0, 33.0, 22.0, 20.0, 12.0, 9.0, 5.0, 3.0, 4.0, 2.0, 0.0, 2.0], "bins": [-0.7099609375, -0.6865692138671875, -0.663177490234375, -0.6397857666015625, -0.61639404296875, -0.5930023193359375, -0.569610595703125, -0.5462188720703125, -0.5228271484375, -0.4994354248046875, -0.476043701171875, -0.4526519775390625, -0.42926025390625, -0.4058685302734375, -0.382476806640625, -0.3590850830078125, -0.335693359375, -0.3123016357421875, -0.288909912109375, -0.2655181884765625, -0.24212646484375, -0.2187347412109375, -0.195343017578125, -0.1719512939453125, -0.1485595703125, -0.1251678466796875, -0.101776123046875, -0.0783843994140625, -0.05499267578125, -0.0316009521484375, -0.008209228515625, 0.0151824951171875, 0.03857421875, 0.0619659423828125, 0.085357666015625, 0.1087493896484375, 0.13214111328125, 0.1555328369140625, 0.178924560546875, 0.2023162841796875, 0.2257080078125, 0.2490997314453125, 0.272491455078125, 0.2958831787109375, 0.31927490234375, 0.3426666259765625, 0.366058349609375, 0.3894500732421875, 0.412841796875, 0.4362335205078125, 0.459625244140625, 0.4830169677734375, 0.50640869140625, 0.5298004150390625, 0.553192138671875, 0.5765838623046875, 0.5999755859375, 0.6233673095703125, 0.646759033203125, 0.6701507568359375, 0.69354248046875, 0.7169342041015625, 0.740325927734375, 0.7637176513671875, 0.787109375]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 1.0, 9.0, 10.0, 15.0, 20.0, 22.0, 20.0, 29.0, 35.0, 24.0, 33.0, 35.0, 30.0, 42.0, 50.0, 57.0, 66.0, 1033.0, 94.0, 43.0, 39.0, 36.0, 42.0, 35.0, 32.0, 24.0, 27.0, 23.0, 12.0, 27.0, 15.0, 11.0, 9.0, 6.0, 3.0, 5.0, 3.0, 1.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.390625, -18.8614501953125, -18.332275390625, -17.8031005859375, -17.27392578125, -16.7447509765625, -16.215576171875, -15.6864013671875, -15.1572265625, -14.6280517578125, -14.098876953125, -13.5697021484375, -13.04052734375, -12.5113525390625, -11.982177734375, -11.4530029296875, -10.923828125, -10.3946533203125, -9.865478515625, -9.3363037109375, -8.80712890625, -8.2779541015625, -7.748779296875, -7.2196044921875, -6.6904296875, -6.1612548828125, -5.632080078125, -5.1029052734375, -4.57373046875, -4.0445556640625, -3.515380859375, -2.9862060546875, -2.45703125, -1.9278564453125, -1.398681640625, -0.8695068359375, -0.34033203125, 0.1888427734375, 0.718017578125, 1.2471923828125, 1.7763671875, 2.3055419921875, 2.834716796875, 3.3638916015625, 3.89306640625, 4.4222412109375, 4.951416015625, 5.4805908203125, 6.009765625, 6.5389404296875, 7.068115234375, 7.5972900390625, 8.12646484375, 8.6556396484375, 9.184814453125, 9.7139892578125, 10.2431640625, 10.7723388671875, 11.301513671875, 11.8306884765625, 12.35986328125, 12.8890380859375, 13.418212890625, 13.9473876953125, 14.4765625]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [5.0, 4.0, 5.0, 16.0, 22.0, 34.0, 43.0, 53.0, 107.0, 147.0, 239.0, 339.0, 532.0, 878.0, 1371.0, 2234.0, 3434.0, 5259.0, 8410.0, 12714.0, 19250.0, 28754.0, 42415.0, 60073.0, 85048.0, 115853.0, 152440.0, 191797.0, 230935.0, 266041.0, 729750.0, 2976170.0, 285683.0, 245544.0, 210004.0, 169120.0, 130857.0, 97507.0, 70399.0, 49210.0, 33682.0, 23002.0, 15077.0, 9795.0, 6425.0, 4026.0, 2500.0, 1630.0, 989.0, 577.0, 413.0, 258.0, 161.0, 94.0, 56.0, 31.0, 17.0, 10.0, 7.0, 2.0, 5.0, 0.0, 2.0, 1.0], "bins": [-0.5390625, -0.5217971801757812, -0.5045318603515625, -0.48726654052734375, -0.470001220703125, -0.45273590087890625, -0.4354705810546875, -0.41820526123046875, -0.40093994140625, -0.38367462158203125, -0.3664093017578125, -0.34914398193359375, -0.331878662109375, -0.31461334228515625, -0.2973480224609375, -0.28008270263671875, -0.2628173828125, -0.24555206298828125, -0.2282867431640625, -0.21102142333984375, -0.193756103515625, -0.17649078369140625, -0.1592254638671875, -0.14196014404296875, -0.12469482421875, -0.10742950439453125, -0.0901641845703125, -0.07289886474609375, -0.055633544921875, -0.03836822509765625, -0.0211029052734375, -0.00383758544921875, 0.013427734375, 0.03069305419921875, 0.0479583740234375, 0.06522369384765625, 0.082489013671875, 0.09975433349609375, 0.1170196533203125, 0.13428497314453125, 0.15155029296875, 0.16881561279296875, 0.1860809326171875, 0.20334625244140625, 0.220611572265625, 0.23787689208984375, 0.2551422119140625, 0.27240753173828125, 0.2896728515625, 0.30693817138671875, 0.3242034912109375, 0.34146881103515625, 0.358734130859375, 0.37599945068359375, 0.3932647705078125, 0.41053009033203125, 0.42779541015625, 0.44506072998046875, 0.4623260498046875, 0.47959136962890625, 0.496856689453125, 0.5141220092773438, 0.5313873291015625, 0.5486526489257812, 0.56591796875]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 6.0, 6.0, 9.0, 11.0, 13.0, 17.0, 13.0, 20.0, 30.0, 26.0, 38.0, 25.0, 39.0, 40.0, 38.0, 39.0, 48.0, 53.0, 959.0, 157.0, 41.0, 46.0, 60.0, 30.0, 41.0, 32.0, 28.0, 29.0, 23.0, 23.0, 18.0, 18.0, 12.0, 10.0, 8.0, 2.0, 4.0, 3.0, 2.0, 8.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.7734375, -15.3448486328125, -14.916259765625, -14.4876708984375, -14.05908203125, -13.6304931640625, -13.201904296875, -12.7733154296875, -12.3447265625, -11.9161376953125, -11.487548828125, -11.0589599609375, -10.63037109375, -10.2017822265625, -9.773193359375, -9.3446044921875, -8.916015625, -8.4874267578125, -8.058837890625, -7.6302490234375, -7.20166015625, -6.7730712890625, -6.344482421875, -5.9158935546875, -5.4873046875, -5.0587158203125, -4.630126953125, -4.2015380859375, -3.77294921875, -3.3443603515625, -2.915771484375, -2.4871826171875, -2.05859375, -1.6300048828125, -1.201416015625, -0.7728271484375, -0.34423828125, 0.0843505859375, 0.512939453125, 0.9415283203125, 1.3701171875, 1.7987060546875, 2.227294921875, 2.6558837890625, 3.08447265625, 3.5130615234375, 3.941650390625, 4.3702392578125, 4.798828125, 5.2274169921875, 5.656005859375, 6.0845947265625, 6.51318359375, 6.9417724609375, 7.370361328125, 7.7989501953125, 8.2275390625, 8.6561279296875, 9.084716796875, 9.5133056640625, 9.94189453125, 10.3704833984375, 10.799072265625, 11.2276611328125, 11.65625]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 5.0, 5.0, 6.0, 5.0, 5.0, 12.0, 15.0, 17.0, 17.0, 30.0, 37.0, 40.0, 55.0, 68.0, 91.0, 110.0, 132.0, 208.0, 250.0, 365.0, 559.0, 1071.0, 2421.0, 5463.0, 12925.0, 29548.0, 64871.0, 137997.0, 5725529.0, 167886.0, 77461.0, 35559.0, 15577.0, 6629.0, 2945.0, 1327.0, 656.0, 385.0, 285.0, 186.0, 155.0, 107.0, 81.0, 89.0, 51.0, 55.0, 43.0, 27.0, 17.0, 17.0, 7.0, 8.0, 7.0, 8.0, 7.0, 1.0, 2.0, 3.0, 4.0, 3.0, 3.0], "bins": [-3.0390625, -2.94293212890625, -2.8468017578125, -2.75067138671875, -2.654541015625, -2.55841064453125, -2.4622802734375, -2.36614990234375, -2.27001953125, -2.17388916015625, -2.0777587890625, -1.98162841796875, -1.885498046875, -1.78936767578125, -1.6932373046875, -1.59710693359375, -1.5009765625, -1.40484619140625, -1.3087158203125, -1.21258544921875, -1.116455078125, -1.02032470703125, -0.9241943359375, -0.82806396484375, -0.73193359375, -0.63580322265625, -0.5396728515625, -0.44354248046875, -0.347412109375, -0.25128173828125, -0.1551513671875, -0.05902099609375, 0.037109375, 0.13323974609375, 0.2293701171875, 0.32550048828125, 0.421630859375, 0.51776123046875, 0.6138916015625, 0.71002197265625, 0.80615234375, 0.90228271484375, 0.9984130859375, 1.09454345703125, 1.190673828125, 1.28680419921875, 1.3829345703125, 1.47906494140625, 1.5751953125, 1.67132568359375, 1.7674560546875, 1.86358642578125, 1.959716796875, 2.05584716796875, 2.1519775390625, 2.24810791015625, 2.34423828125, 2.44036865234375, 2.5364990234375, 2.63262939453125, 2.728759765625, 2.82489013671875, 2.9210205078125, 3.01715087890625, 3.11328125]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 2.0, 4.0, 9.0, 7.0, 10.0, 15.0, 10.0, 13.0, 17.0, 16.0, 16.0, 31.0, 30.0, 31.0, 24.0, 38.0, 32.0, 30.0, 40.0, 27.0, 31.0, 87.0, 1001.0, 58.0, 35.0, 34.0, 33.0, 36.0, 32.0, 28.0, 22.0, 18.0, 28.0, 24.0, 17.0, 17.0, 15.0, 13.0, 14.0, 12.0, 9.0, 8.0, 5.0, 6.0, 10.0, 9.0, 5.0, 5.0, 4.0, 5.0, 6.0, 0.0, 1.0, 1.0], "bins": [-10.125, -9.8126220703125, -9.500244140625, -9.1878662109375, -8.87548828125, -8.5631103515625, -8.250732421875, -7.9383544921875, -7.6259765625, -7.3135986328125, -7.001220703125, -6.6888427734375, -6.37646484375, -6.0640869140625, -5.751708984375, -5.4393310546875, -5.126953125, -4.8145751953125, -4.502197265625, -4.1898193359375, -3.87744140625, -3.5650634765625, -3.252685546875, -2.9403076171875, -2.6279296875, -2.3155517578125, -2.003173828125, -1.6907958984375, -1.37841796875, -1.0660400390625, -0.753662109375, -0.4412841796875, -0.12890625, 0.1834716796875, 0.495849609375, 0.8082275390625, 1.12060546875, 1.4329833984375, 1.745361328125, 2.0577392578125, 2.3701171875, 2.6824951171875, 2.994873046875, 3.3072509765625, 3.61962890625, 3.9320068359375, 4.244384765625, 4.5567626953125, 4.869140625, 5.1815185546875, 5.493896484375, 5.8062744140625, 6.11865234375, 6.4310302734375, 6.743408203125, 7.0557861328125, 7.3681640625, 7.6805419921875, 7.992919921875, 8.3052978515625, 8.61767578125, 8.9300537109375, 9.242431640625, 9.5548095703125, 9.8671875]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 13.0, 37.0, 101.0, 298.0, 342.0, 122.0, 54.0, 20.0, 11.0, 5.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-133.92686462402344, -130.41455078125, -126.90223693847656, -123.38992309570312, -119.87760925292969, -116.36529541015625, -112.85298156738281, -109.34066009521484, -105.8283462524414, -102.31603240966797, -98.80371856689453, -95.2914047241211, -91.77909088134766, -88.26676940917969, -84.75445556640625, -81.24214172363281, -77.72982788085938, -74.21751403808594, -70.7052001953125, -67.19288635253906, -63.68056869506836, -60.16825485229492, -56.655941009521484, -53.14362335205078, -49.631317138671875, -46.11900329589844, -42.606689453125, -39.09437561035156, -35.58205795288086, -32.06974411010742, -28.557430267333984, -25.045114517211914, -21.532798767089844, -18.020484924316406, -14.508169174194336, -10.995855331420898, -7.4835405349731445, -3.9712257385253906, -0.4589118957519531, 3.053403854370117, 6.565717697143555, 10.078032493591309, 13.590347290039062, 17.1026611328125, 20.614974975585938, 24.127290725708008, 27.639604568481445, 31.151920318603516, 34.66423416137695, 38.17654800415039, 41.68886184692383, 45.20117950439453, 48.71349334716797, 52.225807189941406, 55.738121032714844, 59.25043487548828, 62.76274871826172, 66.27506256103516, 69.7873764038086, 73.29969024658203, 76.81200408935547, 80.32432556152344, 83.83663940429688, 87.34895324707031, 90.86126708984375]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 4.0, 1.0, 0.0, 6.0, 5.0, 7.0, 4.0, 3.0, 9.0, 16.0, 20.0, 16.0, 26.0, 36.0, 45.0, 67.0, 58.0, 73.0, 118.0, 89.0, 80.0, 75.0, 53.0, 49.0, 32.0, 27.0, 19.0, 11.0, 18.0, 8.0, 10.0, 5.0, 3.0, 5.0, 2.0, 3.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-158.6954345703125, -154.61233520507812, -150.5292205810547, -146.44610595703125, -142.36300659179688, -138.2799072265625, -134.19679260253906, -130.11367797851562, -126.03057861328125, -121.94747161865234, -117.86436462402344, -113.78125762939453, -109.69815063476562, -105.61504364013672, -101.53193664550781, -97.4488296508789, -93.36572265625, -89.2826156616211, -85.19950866699219, -81.11640167236328, -77.03329467773438, -72.95018768310547, -68.86708068847656, -64.78397369384766, -60.70086669921875, -56.617759704589844, -52.53465270996094, -48.45154571533203, -44.368438720703125, -40.28533172607422, -36.20222473144531, -32.119117736816406, -28.036026000976562, -23.952919006347656, -19.86981201171875, -15.786705017089844, -11.703598022460938, -7.620491027832031, -3.537384033203125, 0.5457229614257812, 4.6288299560546875, 8.711936950683594, 12.7950439453125, 16.878150939941406, 20.961257934570312, 25.04436492919922, 29.127471923828125, 33.21057891845703, 37.29368591308594, 41.376792907714844, 45.45989990234375, 49.543006896972656, 53.62611389160156, 57.70922088623047, 61.792327880859375, 65.87543487548828, 69.95854187011719, 74.0416488647461, 78.124755859375, 82.2078628540039, 86.29096984863281, 90.37407684326172, 94.45718383789062, 98.54029083251953, 102.62339782714844]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 4.0, 9.0, 7.0, 19.0, 11.0, 23.0, 39.0, 42.0, 56.0, 78.0, 90.0, 119.0, 213.0, 308.0, 448.0, 740.0, 1167.0, 1925.0, 3541.0, 7069.0, 18122.0, 82595.0, 3913789.0, 120008.0, 23635.0, 9148.0, 4489.0, 2370.0, 1391.0, 837.0, 591.0, 383.0, 293.0, 168.0, 153.0, 97.0, 79.0, 67.0, 57.0, 25.0, 14.0, 13.0, 12.0, 11.0, 10.0, 9.0, 3.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.140625, -0.13602638244628906, -0.13142776489257812, -0.1268291473388672, -0.12223052978515625, -0.11763191223144531, -0.11303329467773438, -0.10843467712402344, -0.1038360595703125, -0.09923744201660156, -0.09463882446289062, -0.09004020690917969, -0.08544158935546875, -0.08084297180175781, -0.07624435424804688, -0.07164573669433594, -0.067047119140625, -0.06244850158691406, -0.057849884033203125, -0.05325126647949219, -0.04865264892578125, -0.04405403137207031, -0.039455413818359375, -0.03485679626464844, -0.0302581787109375, -0.025659561157226562, -0.021060943603515625, -0.016462326049804688, -0.01186370849609375, -0.0072650909423828125, -0.002666473388671875, 0.0019321441650390625, 0.00653076171875, 0.011129379272460938, 0.015727996826171875, 0.020326614379882812, 0.02492523193359375, 0.029523849487304688, 0.034122467041015625, 0.03872108459472656, 0.0433197021484375, 0.04791831970214844, 0.052516937255859375, 0.05711555480957031, 0.06171417236328125, 0.06631278991699219, 0.07091140747070312, 0.07551002502441406, 0.080108642578125, 0.08470726013183594, 0.08930587768554688, 0.09390449523925781, 0.09850311279296875, 0.10310173034667969, 0.10770034790039062, 0.11229896545410156, 0.1168975830078125, 0.12149620056152344, 0.12609481811523438, 0.1306934356689453, 0.13529205322265625, 0.1398906707763672, 0.14448928833007812, 0.14908790588378906, 0.1536865234375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 8.0, 3.0, 2.0, 2.0, 4.0, 5.0, 5.0, 4.0, 6.0, 5.0, 5.0, 10.0, 8.0, 10.0, 22.0, 135.0, 625.0, 27.0, 14.0, 20.0, 12.0, 13.0, 5.0, 9.0, 5.0, 6.0, 4.0, 3.0, 1.0, 4.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.1231689453125, -0.11947822570800781, -0.11578750610351562, -0.11209678649902344, -0.10840606689453125, -0.10471534729003906, -0.10102462768554688, -0.09733390808105469, -0.0936431884765625, -0.08995246887207031, -0.08626174926757812, -0.08257102966308594, -0.07888031005859375, -0.07518959045410156, -0.07149887084960938, -0.06780815124511719, -0.064117431640625, -0.06042671203613281, -0.056735992431640625, -0.05304527282714844, -0.04935455322265625, -0.04566383361816406, -0.041973114013671875, -0.03828239440917969, -0.0345916748046875, -0.030900955200195312, -0.027210235595703125, -0.023519515991210938, -0.01982879638671875, -0.016138076782226562, -0.012447357177734375, -0.008756637573242188, -0.00506591796875, -0.0013751983642578125, 0.002315521240234375, 0.0060062408447265625, 0.00969696044921875, 0.013387680053710938, 0.017078399658203125, 0.020769119262695312, 0.0244598388671875, 0.028150558471679688, 0.031841278076171875, 0.03553199768066406, 0.03922271728515625, 0.04291343688964844, 0.046604156494140625, 0.05029487609863281, 0.053985595703125, 0.05767631530761719, 0.061367034912109375, 0.06505775451660156, 0.06874847412109375, 0.07243919372558594, 0.07612991333007812, 0.07982063293457031, 0.0835113525390625, 0.08720207214355469, 0.09089279174804688, 0.09458351135253906, 0.09827423095703125, 0.10196495056152344, 0.10565567016601562, 0.10934638977050781, 0.113037109375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 6.0, 5.0, 6.0, 11.0, 15.0, 21.0, 25.0, 30.0, 61.0, 68.0, 131.0, 175.0, 338.0, 627.0, 1438.0, 3565.0, 10267.0, 39697.0, 287368.0, 3442156.0, 345825.0, 44402.0, 11215.0, 3789.0, 1492.0, 666.0, 316.0, 212.0, 91.0, 90.0, 48.0, 36.0, 22.0, 15.0, 25.0, 9.0, 4.0, 8.0, 6.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1573486328125, -0.1525115966796875, -0.147674560546875, -0.1428375244140625, -0.13800048828125, -0.1331634521484375, -0.128326416015625, -0.1234893798828125, -0.11865234375, -0.1138153076171875, -0.108978271484375, -0.1041412353515625, -0.09930419921875, -0.0944671630859375, -0.089630126953125, -0.0847930908203125, -0.0799560546875, -0.0751190185546875, -0.070281982421875, -0.0654449462890625, -0.06060791015625, -0.0557708740234375, -0.050933837890625, -0.0460968017578125, -0.041259765625, -0.0364227294921875, -0.031585693359375, -0.0267486572265625, -0.02191162109375, -0.0170745849609375, -0.012237548828125, -0.0074005126953125, -0.0025634765625, 0.0022735595703125, 0.007110595703125, 0.0119476318359375, 0.01678466796875, 0.0216217041015625, 0.026458740234375, 0.0312957763671875, 0.0361328125, 0.0409698486328125, 0.045806884765625, 0.0506439208984375, 0.05548095703125, 0.0603179931640625, 0.065155029296875, 0.0699920654296875, 0.0748291015625, 0.0796661376953125, 0.084503173828125, 0.0893402099609375, 0.09417724609375, 0.0990142822265625, 0.103851318359375, 0.1086883544921875, 0.113525390625, 0.1183624267578125, 0.123199462890625, 0.1280364990234375, 0.13287353515625, 0.1377105712890625, 0.142547607421875, 0.1473846435546875, 0.1522216796875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 8.0, 5.0, 2.0, 4.0, 2.0, 9.0, 15.0, 18.0, 26.0, 24.0, 42.0, 43.0, 108.0, 164.0, 312.0, 784.0, 1344.0, 504.0, 229.0, 137.0, 86.0, 42.0, 46.0, 25.0, 20.0, 22.0, 10.0, 13.0, 7.0, 4.0, 1.0, 8.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.091796875, -0.08895301818847656, -0.08610916137695312, -0.08326530456542969, -0.08042144775390625, -0.07757759094238281, -0.07473373413085938, -0.07188987731933594, -0.0690460205078125, -0.06620216369628906, -0.06335830688476562, -0.06051445007324219, -0.05767059326171875, -0.05482673645019531, -0.051982879638671875, -0.04913902282714844, -0.046295166015625, -0.04345130920410156, -0.040607452392578125, -0.03776359558105469, -0.03491973876953125, -0.03207588195800781, -0.029232025146484375, -0.026388168334960938, -0.0235443115234375, -0.020700454711914062, -0.017856597900390625, -0.015012741088867188, -0.01216888427734375, -0.009325027465820312, -0.006481170654296875, -0.0036373138427734375, -0.00079345703125, 0.0020503997802734375, 0.004894256591796875, 0.0077381134033203125, 0.01058197021484375, 0.013425827026367188, 0.016269683837890625, 0.019113540649414062, 0.0219573974609375, 0.024801254272460938, 0.027645111083984375, 0.030488967895507812, 0.03333282470703125, 0.03617668151855469, 0.039020538330078125, 0.04186439514160156, 0.044708251953125, 0.04755210876464844, 0.050395965576171875, 0.05323982238769531, 0.05608367919921875, 0.05892753601074219, 0.061771392822265625, 0.06461524963378906, 0.0674591064453125, 0.07030296325683594, 0.07314682006835938, 0.07599067687988281, 0.07883453369140625, 0.08167839050292969, 0.08452224731445312, 0.08736610412597656, 0.0902099609375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 30.0, 156.0, 574.0, 209.0, 23.0, 4.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.0225844383239746, -0.9930246472358704, -0.9634647965431213, -0.9339050054550171, -0.9043452143669128, -0.8747854232788086, -0.8452255725860596, -0.8156657814979553, -0.7861059904098511, -0.7565461993217468, -0.7269863486289978, -0.6974265575408936, -0.6678667664527893, -0.6383069753646851, -0.608747124671936, -0.5791873335838318, -0.5496275424957275, -0.5200677514076233, -0.49050793051719666, -0.46094810962677, -0.43138831853866577, -0.40182849764823914, -0.3722686767578125, -0.34270888566970825, -0.31314903497695923, -0.2835892140865326, -0.25402942299842834, -0.2244696021080017, -0.19490981101989746, -0.16534999012947083, -0.13579018414020538, -0.10623037815093994, -0.0766705870628357, -0.04711078107357025, -0.01755097135901451, 0.01200883835554123, 0.04156864434480667, 0.07112845778465271, 0.10068826377391815, 0.1302480697631836, 0.15980787575244904, 0.18936768174171448, 0.21892748773097992, 0.24848729372024536, 0.278047114610672, 0.30760693550109863, 0.3371667265892029, 0.36672651767730713, 0.39628633856773376, 0.4258461594581604, 0.45540595054626465, 0.4849657714366913, 0.5145255923271179, 0.5440853834152222, 0.5736451745033264, 0.6032049655914307, 0.6327648162841797, 0.6623246073722839, 0.691884458065033, 0.7214442491531372, 0.7510040402412415, 0.7805638313293457, 0.8101236820220947, 0.839683473110199, 0.8692432641983032]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 10.0, 11.0, 11.0, 10.0, 16.0, 24.0, 33.0, 35.0, 46.0, 48.0, 57.0, 74.0, 61.0, 71.0, 82.0, 53.0, 61.0, 57.0, 42.0, 44.0, 40.0, 30.0, 26.0, 15.0, 9.0, 6.0, 9.0, 3.0, 2.0, 7.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34378623962402344, -0.33228981494903564, -0.32079336047172546, -0.3092969059944153, -0.2978004813194275, -0.2863040566444397, -0.2748076021671295, -0.26331114768981934, -0.25181472301483154, -0.24031828343868256, -0.22882184386253357, -0.21732540428638458, -0.2058289647102356, -0.1943325251340866, -0.18283608555793762, -0.17133964598178864, -0.15984320640563965, -0.14834676682949066, -0.13685032725334167, -0.1253538876771927, -0.1138574481010437, -0.10236100852489471, -0.09086456894874573, -0.07936812937259674, -0.06787168979644775, -0.05637525022029877, -0.04487881064414978, -0.03338237106800079, -0.021885931491851807, -0.01038949191570282, 0.001106947660446167, 0.012603387236595154, 0.02409982681274414, 0.03559626638889313, 0.047092705965042114, 0.0585891455411911, 0.07008558511734009, 0.08158202469348907, 0.09307846426963806, 0.10457490384578705, 0.11607134342193604, 0.12756778299808502, 0.139064222574234, 0.150560662150383, 0.16205710172653198, 0.17355354130268097, 0.18504998087882996, 0.19654642045497894, 0.20804286003112793, 0.21953929960727692, 0.2310357391834259, 0.2425321787595749, 0.2540286183357239, 0.26552504301071167, 0.27702149748802185, 0.28851795196533203, 0.3000143766403198, 0.3115108013153076, 0.3230072557926178, 0.334503710269928, 0.34600013494491577, 0.35749655961990356, 0.36899301409721375, 0.3804894685745239, 0.3919858932495117]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 4.0, 5.0, 8.0, 11.0, 14.0, 23.0, 29.0, 34.0, 43.0, 63.0, 93.0, 108.0, 150.0, 226.0, 291.0, 365.0, 512.0, 709.0, 988.0, 1295.0, 1854.0, 2637.0, 3790.0, 5719.0, 9156.0, 15429.0, 30174.0, 222880.0, 671474.0, 33854.0, 16934.0, 9614.0, 6141.0, 4060.0, 2721.0, 1942.0, 1373.0, 1048.0, 743.0, 526.0, 417.0, 316.0, 185.0, 163.0, 112.0, 77.0, 70.0, 57.0, 35.0, 26.0, 19.0, 19.0, 6.0, 8.0, 7.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.360107421875, -0.3481330871582031, -0.33615875244140625, -0.3241844177246094, -0.3122100830078125, -0.3002357482910156, -0.28826141357421875, -0.2762870788574219, -0.264312744140625, -0.2523384094238281, -0.24036407470703125, -0.22838973999023438, -0.2164154052734375, -0.20444107055664062, -0.19246673583984375, -0.18049240112304688, -0.16851806640625, -0.15654373168945312, -0.14456939697265625, -0.13259506225585938, -0.1206207275390625, -0.10864639282226562, -0.09667205810546875, -0.08469772338867188, -0.072723388671875, -0.060749053955078125, -0.04877471923828125, -0.036800384521484375, -0.0248260498046875, -0.012851715087890625, -0.00087738037109375, 0.011096954345703125, 0.0230712890625, 0.035045623779296875, 0.04701995849609375, 0.058994293212890625, 0.0709686279296875, 0.08294296264648438, 0.09491729736328125, 0.10689163208007812, 0.118865966796875, 0.13084030151367188, 0.14281463623046875, 0.15478897094726562, 0.1667633056640625, 0.17873764038085938, 0.19071197509765625, 0.20268630981445312, 0.21466064453125, 0.22663497924804688, 0.23860931396484375, 0.2505836486816406, 0.2625579833984375, 0.2745323181152344, 0.28650665283203125, 0.2984809875488281, 0.310455322265625, 0.3224296569824219, 0.33440399169921875, 0.3463783264160156, 0.3583526611328125, 0.3703269958496094, 0.38230133056640625, 0.3942756652832031, 0.40625]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 3.0, 1.0, 2.0, 5.0, 4.0, 4.0, 4.0, 5.0, 8.0, 5.0, 9.0, 9.0, 11.0, 34.0, 438.0, 313.0, 23.0, 15.0, 19.0, 17.0, 6.0, 7.0, 9.0, 7.0, 5.0, 1.0, 3.0, 3.0, 4.0, 4.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.12188720703125, -0.1182088851928711, -0.11453056335449219, -0.11085224151611328, -0.10717391967773438, -0.10349559783935547, -0.09981727600097656, -0.09613895416259766, -0.09246063232421875, -0.08878231048583984, -0.08510398864746094, -0.08142566680908203, -0.07774734497070312, -0.07406902313232422, -0.07039070129394531, -0.0667123794555664, -0.0630340576171875, -0.059355735778808594, -0.05567741394042969, -0.05199909210205078, -0.048320770263671875, -0.04464244842529297, -0.04096412658691406, -0.037285804748535156, -0.03360748291015625, -0.029929161071777344, -0.026250839233398438, -0.02257251739501953, -0.018894195556640625, -0.015215873718261719, -0.011537551879882812, -0.007859230041503906, -0.004180908203125, -0.0005025863647460938, 0.0031757354736328125, 0.006854057312011719, 0.010532379150390625, 0.014210700988769531, 0.017889022827148438, 0.021567344665527344, 0.02524566650390625, 0.028923988342285156, 0.03260231018066406, 0.03628063201904297, 0.039958953857421875, 0.04363727569580078, 0.04731559753417969, 0.050993919372558594, 0.0546722412109375, 0.058350563049316406, 0.06202888488769531, 0.06570720672607422, 0.06938552856445312, 0.07306385040283203, 0.07674217224121094, 0.08042049407958984, 0.08409881591796875, 0.08777713775634766, 0.09145545959472656, 0.09513378143310547, 0.09881210327148438, 0.10249042510986328, 0.10616874694824219, 0.1098470687866211, 0.113525390625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 7.0, 4.0, 8.0, 18.0, 14.0, 22.0, 43.0, 49.0, 61.0, 100.0, 126.0, 157.0, 235.0, 437.0, 696.0, 1402.0, 3123.0, 7631.0, 22706.0, 85057.0, 388808.0, 410027.0, 89256.0, 23657.0, 8164.0, 3218.0, 1435.0, 717.0, 452.0, 267.0, 180.0, 144.0, 93.0, 55.0, 59.0, 43.0, 30.0, 18.0, 10.0, 11.0, 5.0, 7.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.356689453125, -0.34588623046875, -0.3350830078125, -0.32427978515625, -0.3134765625, -0.30267333984375, -0.2918701171875, -0.28106689453125, -0.270263671875, -0.25946044921875, -0.2486572265625, -0.23785400390625, -0.22705078125, -0.21624755859375, -0.2054443359375, -0.19464111328125, -0.183837890625, -0.17303466796875, -0.1622314453125, -0.15142822265625, -0.140625, -0.12982177734375, -0.1190185546875, -0.10821533203125, -0.097412109375, -0.08660888671875, -0.0758056640625, -0.06500244140625, -0.05419921875, -0.04339599609375, -0.0325927734375, -0.02178955078125, -0.010986328125, -0.00018310546875, 0.0106201171875, 0.02142333984375, 0.0322265625, 0.04302978515625, 0.0538330078125, 0.06463623046875, 0.075439453125, 0.08624267578125, 0.0970458984375, 0.10784912109375, 0.11865234375, 0.12945556640625, 0.1402587890625, 0.15106201171875, 0.161865234375, 0.17266845703125, 0.1834716796875, 0.19427490234375, 0.205078125, 0.21588134765625, 0.2266845703125, 0.23748779296875, 0.248291015625, 0.25909423828125, 0.2698974609375, 0.28070068359375, 0.29150390625, 0.30230712890625, 0.3131103515625, 0.32391357421875, 0.334716796875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 8.0, 6.0, 15.0, 11.0, 15.0, 13.0, 21.0, 23.0, 27.0, 34.0, 30.0, 33.0, 21.0, 37.0, 53.0, 30.0, 43.0, 51.0, 45.0, 47.0, 47.0, 50.0, 42.0, 39.0, 27.0, 35.0, 26.0, 30.0, 37.0, 22.0, 16.0, 15.0, 13.0, 14.0, 5.0, 3.0, 7.0, 3.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4921875, -0.47589111328125, -0.4595947265625, -0.44329833984375, -0.427001953125, -0.41070556640625, -0.3944091796875, -0.37811279296875, -0.36181640625, -0.34552001953125, -0.3292236328125, -0.31292724609375, -0.296630859375, -0.28033447265625, -0.2640380859375, -0.24774169921875, -0.2314453125, -0.21514892578125, -0.1988525390625, -0.18255615234375, -0.166259765625, -0.14996337890625, -0.1336669921875, -0.11737060546875, -0.10107421875, -0.08477783203125, -0.0684814453125, -0.05218505859375, -0.035888671875, -0.01959228515625, -0.0032958984375, 0.01300048828125, 0.029296875, 0.04559326171875, 0.0618896484375, 0.07818603515625, 0.094482421875, 0.11077880859375, 0.1270751953125, 0.14337158203125, 0.15966796875, 0.17596435546875, 0.1922607421875, 0.20855712890625, 0.224853515625, 0.24114990234375, 0.2574462890625, 0.27374267578125, 0.2900390625, 0.30633544921875, 0.3226318359375, 0.33892822265625, 0.355224609375, 0.37152099609375, 0.3878173828125, 0.40411376953125, 0.42041015625, 0.43670654296875, 0.4530029296875, 0.46929931640625, 0.485595703125, 0.50189208984375, 0.5181884765625, 0.53448486328125, 0.55078125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 6.0, 6.0, 4.0, 5.0, 12.0, 13.0, 17.0, 19.0, 33.0, 37.0, 79.0, 131.0, 235.0, 504.0, 1300.0, 3837.0, 26158.0, 960750.0, 47496.0, 5168.0, 1509.0, 594.0, 249.0, 149.0, 87.0, 45.0, 33.0, 21.0, 16.0, 13.0, 9.0, 2.0, 5.0, 7.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4794921875, -1.435455322265625, -1.39141845703125, -1.347381591796875, -1.3033447265625, -1.259307861328125, -1.21527099609375, -1.171234130859375, -1.127197265625, -1.083160400390625, -1.03912353515625, -0.995086669921875, -0.9510498046875, -0.907012939453125, -0.86297607421875, -0.818939208984375, -0.77490234375, -0.730865478515625, -0.68682861328125, -0.642791748046875, -0.5987548828125, -0.554718017578125, -0.51068115234375, -0.466644287109375, -0.422607421875, -0.378570556640625, -0.33453369140625, -0.290496826171875, -0.2464599609375, -0.202423095703125, -0.15838623046875, -0.114349365234375, -0.0703125, -0.026275634765625, 0.01776123046875, 0.061798095703125, 0.1058349609375, 0.149871826171875, 0.19390869140625, 0.237945556640625, 0.281982421875, 0.326019287109375, 0.37005615234375, 0.414093017578125, 0.4581298828125, 0.502166748046875, 0.54620361328125, 0.590240478515625, 0.63427734375, 0.678314208984375, 0.72235107421875, 0.766387939453125, 0.8104248046875, 0.854461669921875, 0.89849853515625, 0.942535400390625, 0.986572265625, 1.030609130859375, 1.07464599609375, 1.118682861328125, 1.1627197265625, 1.206756591796875, 1.25079345703125, 1.294830322265625, 1.3388671875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 4.0, 7.0, 5.0, 4.0, 15.0, 14.0, 30.0, 37.0, 59.0, 79.0, 137.0, 168.0, 154.0, 88.0, 63.0, 56.0, 32.0, 10.0, 13.0, 7.0, 6.0, 5.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.412101745605469e-05, -5.2012503147125244e-05, -4.99039888381958e-05, -4.779547452926636e-05, -4.5686960220336914e-05, -4.357844591140747e-05, -4.146993160247803e-05, -3.9361417293548584e-05, -3.725290298461914e-05, -3.51443886756897e-05, -3.3035874366760254e-05, -3.092736005783081e-05, -2.8818845748901367e-05, -2.6710331439971924e-05, -2.460181713104248e-05, -2.2493302822113037e-05, -2.0384788513183594e-05, -1.827627420425415e-05, -1.6167759895324707e-05, -1.4059245586395264e-05, -1.195073127746582e-05, -9.842216968536377e-06, -7.733702659606934e-06, -5.62518835067749e-06, -3.516674041748047e-06, -1.4081597328186035e-06, 7.003545761108398e-07, 2.808868885040283e-06, 4.9173831939697266e-06, 7.02589750289917e-06, 9.134411811828613e-06, 1.1242926120758057e-05, 1.33514404296875e-05, 1.5459954738616943e-05, 1.7568469047546387e-05, 1.967698335647583e-05, 2.1785497665405273e-05, 2.3894011974334717e-05, 2.600252628326416e-05, 2.8111040592193604e-05, 3.0219554901123047e-05, 3.232806921005249e-05, 3.4436583518981934e-05, 3.654509782791138e-05, 3.865361213684082e-05, 4.0762126445770264e-05, 4.287064075469971e-05, 4.497915506362915e-05, 4.7087669372558594e-05, 4.919618368148804e-05, 5.130469799041748e-05, 5.3413212299346924e-05, 5.552172660827637e-05, 5.763024091720581e-05, 5.9738755226135254e-05, 6.18472695350647e-05, 6.395578384399414e-05, 6.606429815292358e-05, 6.817281246185303e-05, 7.028132677078247e-05, 7.238984107971191e-05, 7.449835538864136e-05, 7.66068696975708e-05, 7.871538400650024e-05, 8.082389831542969e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 7.0, 8.0, 16.0, 15.0, 31.0, 61.0, 117.0, 277.0, 747.0, 3315.0, 36645.0, 965318.0, 37241.0, 3424.0, 784.0, 286.0, 131.0, 51.0, 27.0, 12.0, 13.0, 6.0, 5.0, 9.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.3291015625, -1.2894287109375, -1.249755859375, -1.2100830078125, -1.17041015625, -1.1307373046875, -1.091064453125, -1.0513916015625, -1.01171875, -0.9720458984375, -0.932373046875, -0.8927001953125, -0.85302734375, -0.8133544921875, -0.773681640625, -0.7340087890625, -0.6943359375, -0.6546630859375, -0.614990234375, -0.5753173828125, -0.53564453125, -0.4959716796875, -0.456298828125, -0.4166259765625, -0.376953125, -0.3372802734375, -0.297607421875, -0.2579345703125, -0.21826171875, -0.1785888671875, -0.138916015625, -0.0992431640625, -0.0595703125, -0.0198974609375, 0.019775390625, 0.0594482421875, 0.09912109375, 0.1387939453125, 0.178466796875, 0.2181396484375, 0.2578125, 0.2974853515625, 0.337158203125, 0.3768310546875, 0.41650390625, 0.4561767578125, 0.495849609375, 0.5355224609375, 0.5751953125, 0.6148681640625, 0.654541015625, 0.6942138671875, 0.73388671875, 0.7735595703125, 0.813232421875, 0.8529052734375, 0.892578125, 0.9322509765625, 0.971923828125, 1.0115966796875, 1.05126953125, 1.0909423828125, 1.130615234375, 1.1702880859375, 1.2099609375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 3.0, 5.0, 8.0, 8.0, 11.0, 14.0, 18.0, 30.0, 27.0, 51.0, 82.0, 145.0, 161.0, 146.0, 73.0, 59.0, 46.0, 34.0, 17.0, 12.0, 6.0, 11.0, 4.0, 9.0, 8.0, 2.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.791015625, -0.765869140625, -0.74072265625, -0.715576171875, -0.6904296875, -0.665283203125, -0.64013671875, -0.614990234375, -0.58984375, -0.564697265625, -0.53955078125, -0.514404296875, -0.4892578125, -0.464111328125, -0.43896484375, -0.413818359375, -0.388671875, -0.363525390625, -0.33837890625, -0.313232421875, -0.2880859375, -0.262939453125, -0.23779296875, -0.212646484375, -0.1875, -0.162353515625, -0.13720703125, -0.112060546875, -0.0869140625, -0.061767578125, -0.03662109375, -0.011474609375, 0.013671875, 0.038818359375, 0.06396484375, 0.089111328125, 0.1142578125, 0.139404296875, 0.16455078125, 0.189697265625, 0.21484375, 0.239990234375, 0.26513671875, 0.290283203125, 0.3154296875, 0.340576171875, 0.36572265625, 0.390869140625, 0.416015625, 0.441162109375, 0.46630859375, 0.491455078125, 0.5166015625, 0.541748046875, 0.56689453125, 0.592041015625, 0.6171875, 0.642333984375, 0.66748046875, 0.692626953125, 0.7177734375, 0.742919921875, 0.76806640625, 0.793212890625, 0.818359375]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 12.0, 36.0, 346.0, 506.0, 79.0, 17.0, 4.0, 3.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.117149353027344, -19.61482810974121, -19.11250877380371, -18.610187530517578, -18.107868194580078, -17.605546951293945, -17.103227615356445, -16.600906372070312, -16.098587036132812, -15.596266746520996, -15.09394645690918, -14.591626167297363, -14.089305877685547, -13.58698558807373, -13.084665298461914, -12.582344055175781, -12.080023765563965, -11.577703475952148, -11.075383186340332, -10.573062896728516, -10.0707426071167, -9.568422317504883, -9.06610107421875, -8.56378173828125, -8.061460494995117, -7.559140205383301, -7.056819915771484, -6.554499626159668, -6.052179336547852, -5.549859046936035, -5.0475382804870605, -4.545217990875244, -4.042898178100586, -3.5405778884887695, -3.038257598876953, -2.5359370708465576, -2.033616781234741, -1.5312964916229248, -1.0289759635925293, -0.5266556739807129, -0.024335384368896484, 0.4779849648475647, 0.9803053140640259, 1.4826257228851318, 1.9849460124969482, 2.4872663021087646, 2.98958683013916, 3.4919071197509766, 3.994227409362793, 4.496547698974609, 4.998867988586426, 5.501188278198242, 6.003508567810059, 6.505828857421875, 7.00814962387085, 7.510469913482666, 8.01279067993164, 8.515110969543457, 9.017431259155273, 9.51975154876709, 10.022071838378906, 10.524392127990723, 11.026712417602539, 11.529033660888672, 12.031352996826172]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 4.0, 5.0, 2.0, 1.0, 3.0, 3.0, 2.0, 5.0, 5.0, 6.0, 7.0, 18.0, 13.0, 24.0, 44.0, 70.0, 125.0, 171.0, 144.0, 128.0, 80.0, 46.0, 32.0, 22.0, 10.0, 3.0, 7.0, 2.0, 4.0, 4.0, 3.0, 3.0, 3.0, 5.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.919219970703125, -9.588475227355957, -9.257730484008789, -8.926985740661621, -8.596240997314453, -8.265496253967285, -7.934751510620117, -7.604006767272949, -7.273262023925781, -6.942517280578613, -6.611772537231445, -6.281027793884277, -5.950283050537109, -5.619538307189941, -5.288793563842773, -4.9580488204956055, -4.627304553985596, -4.296559810638428, -3.9658150672912598, -3.635070323944092, -3.304325580596924, -2.973580837249756, -2.642836332321167, -2.312091588973999, -1.981346845626831, -1.650602102279663, -1.3198573589324951, -0.9891127347946167, -0.6583679914474487, -0.32762324810028076, 0.0031213760375976562, 0.3338661193847656, 0.6646108627319336, 0.9953556060791016, 1.3261003494262695, 1.656844973564148, 1.987589716911316, 2.3183345794677734, 2.6490790843963623, 2.9798238277435303, 3.3105685710906982, 3.641313314437866, 3.972058057785034, 4.302802562713623, 4.633547306060791, 4.964292049407959, 5.295036792755127, 5.625781536102295, 5.956526279449463, 6.287271022796631, 6.618015766143799, 6.948760509490967, 7.279505252838135, 7.610249996185303, 7.9409942626953125, 8.27173900604248, 8.602483749389648, 8.933228492736816, 9.263973236083984, 9.594717979431152, 9.92546272277832, 10.256207466125488, 10.586952209472656, 10.917696952819824, 11.248441696166992]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 2.0, 5.0, 4.0, 5.0, 11.0, 16.0, 15.0, 30.0, 30.0, 64.0, 66.0, 110.0, 165.0, 222.0, 348.0, 484.0, 796.0, 1290.0, 2146.0, 3692.0, 7497.0, 16859.0, 50524.0, 582868.0, 3408596.0, 77910.0, 21714.0, 8859.0, 4306.0, 2256.0, 1273.0, 784.0, 465.0, 284.0, 207.0, 130.0, 96.0, 56.0, 42.0, 13.0, 18.0, 13.0, 6.0, 4.0, 6.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.8486328125, -0.8263778686523438, -0.8041229248046875, -0.7818679809570312, -0.759613037109375, -0.7373580932617188, -0.7151031494140625, -0.6928482055664062, -0.67059326171875, -0.6483383178710938, -0.6260833740234375, -0.6038284301757812, -0.581573486328125, -0.5593185424804688, -0.5370635986328125, -0.5148086547851562, -0.4925537109375, -0.47029876708984375, -0.4480438232421875, -0.42578887939453125, -0.403533935546875, -0.38127899169921875, -0.3590240478515625, -0.33676910400390625, -0.31451416015625, -0.29225921630859375, -0.2700042724609375, -0.24774932861328125, -0.225494384765625, -0.20323944091796875, -0.1809844970703125, -0.15872955322265625, -0.136474609375, -0.11421966552734375, -0.0919647216796875, -0.06970977783203125, -0.047454833984375, -0.02519989013671875, -0.0029449462890625, 0.01930999755859375, 0.04156494140625, 0.06381988525390625, 0.0860748291015625, 0.10832977294921875, 0.130584716796875, 0.15283966064453125, 0.1750946044921875, 0.19734954833984375, 0.2196044921875, 0.24185943603515625, 0.2641143798828125, 0.28636932373046875, 0.308624267578125, 0.33087921142578125, 0.3531341552734375, 0.37538909912109375, 0.39764404296875, 0.41989898681640625, 0.4421539306640625, 0.46440887451171875, 0.486663818359375, 0.5089187622070312, 0.5311737060546875, 0.5534286499023438, 0.57568359375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 3.0, 5.0, 4.0, 6.0, 13.0, 4.0, 5.0, 12.0, 7.0, 9.0, 24.0, 60.0, 203.0, 299.0, 146.0, 64.0, 30.0, 15.0, 4.0, 14.0, 15.0, 10.0, 8.0, 6.0, 5.0, 5.0, 2.0, 1.0, 5.0, 5.0, 1.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10882568359375, -0.10584354400634766, -0.10286140441894531, -0.09987926483154297, -0.09689712524414062, -0.09391498565673828, -0.09093284606933594, -0.0879507064819336, -0.08496856689453125, -0.0819864273071289, -0.07900428771972656, -0.07602214813232422, -0.07304000854492188, -0.07005786895751953, -0.06707572937011719, -0.06409358978271484, -0.0611114501953125, -0.058129310607910156, -0.05514717102050781, -0.05216503143310547, -0.049182891845703125, -0.04620075225830078, -0.04321861267089844, -0.040236473083496094, -0.03725433349609375, -0.034272193908691406, -0.03129005432128906, -0.02830791473388672, -0.025325775146484375, -0.02234363555908203, -0.019361495971679688, -0.016379356384277344, -0.013397216796875, -0.010415077209472656, -0.0074329376220703125, -0.004450798034667969, -0.001468658447265625, 0.0015134811401367188, 0.0044956207275390625, 0.007477760314941406, 0.01045989990234375, 0.013442039489746094, 0.016424179077148438, 0.01940631866455078, 0.022388458251953125, 0.02537059783935547, 0.028352737426757812, 0.031334877014160156, 0.0343170166015625, 0.037299156188964844, 0.04028129577636719, 0.04326343536376953, 0.046245574951171875, 0.04922771453857422, 0.05220985412597656, 0.055191993713378906, 0.05817413330078125, 0.061156272888183594, 0.06413841247558594, 0.06712055206298828, 0.07010269165039062, 0.07308483123779297, 0.07606697082519531, 0.07904911041259766, 0.08203125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 3.0, 6.0, 6.0, 7.0, 10.0, 24.0, 29.0, 58.0, 67.0, 118.0, 200.0, 371.0, 672.0, 1369.0, 3443.0, 10994.0, 52197.0, 686389.0, 3264172.0, 142782.0, 21203.0, 5862.0, 2164.0, 974.0, 479.0, 237.0, 137.0, 98.0, 67.0, 50.0, 35.0, 22.0, 12.0, 11.0, 4.0, 6.0, 4.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53857421875, -0.522369384765625, -0.50616455078125, -0.489959716796875, -0.4737548828125, -0.457550048828125, -0.44134521484375, -0.425140380859375, -0.408935546875, -0.392730712890625, -0.37652587890625, -0.360321044921875, -0.3441162109375, -0.327911376953125, -0.31170654296875, -0.295501708984375, -0.279296875, -0.263092041015625, -0.24688720703125, -0.230682373046875, -0.2144775390625, -0.198272705078125, -0.18206787109375, -0.165863037109375, -0.149658203125, -0.133453369140625, -0.11724853515625, -0.101043701171875, -0.0848388671875, -0.068634033203125, -0.05242919921875, -0.036224365234375, -0.02001953125, -0.003814697265625, 0.01239013671875, 0.028594970703125, 0.0447998046875, 0.061004638671875, 0.07720947265625, 0.093414306640625, 0.109619140625, 0.125823974609375, 0.14202880859375, 0.158233642578125, 0.1744384765625, 0.190643310546875, 0.20684814453125, 0.223052978515625, 0.2392578125, 0.255462646484375, 0.27166748046875, 0.287872314453125, 0.3040771484375, 0.320281982421875, 0.33648681640625, 0.352691650390625, 0.368896484375, 0.385101318359375, 0.40130615234375, 0.417510986328125, 0.4337158203125, 0.449920654296875, 0.46612548828125, 0.482330322265625, 0.49853515625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 6.0, 6.0, 3.0, 10.0, 9.0, 14.0, 16.0, 29.0, 46.0, 86.0, 111.0, 220.0, 365.0, 1033.0, 1054.0, 477.0, 241.0, 105.0, 86.0, 54.0, 28.0, 19.0, 18.0, 7.0, 6.0, 6.0, 4.0, 6.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.14013671875, -0.13634967803955078, -0.13256263732910156, -0.12877559661865234, -0.12498855590820312, -0.1212015151977539, -0.11741447448730469, -0.11362743377685547, -0.10984039306640625, -0.10605335235595703, -0.10226631164550781, -0.0984792709350586, -0.09469223022460938, -0.09090518951416016, -0.08711814880371094, -0.08333110809326172, -0.0795440673828125, -0.07575702667236328, -0.07196998596191406, -0.06818294525146484, -0.06439590454101562, -0.060608863830566406, -0.05682182312011719, -0.05303478240966797, -0.04924774169921875, -0.04546070098876953, -0.04167366027832031, -0.037886619567871094, -0.034099578857421875, -0.030312538146972656, -0.026525497436523438, -0.02273845672607422, -0.018951416015625, -0.015164375305175781, -0.011377334594726562, -0.007590293884277344, -0.003803253173828125, -1.621246337890625e-05, 0.0037708282470703125, 0.007557868957519531, 0.01134490966796875, 0.015131950378417969, 0.018918991088867188, 0.022706031799316406, 0.026493072509765625, 0.030280113220214844, 0.03406715393066406, 0.03785419464111328, 0.0416412353515625, 0.04542827606201172, 0.04921531677246094, 0.053002357482910156, 0.056789398193359375, 0.060576438903808594, 0.06436347961425781, 0.06815052032470703, 0.07193756103515625, 0.07572460174560547, 0.07951164245605469, 0.0832986831665039, 0.08708572387695312, 0.09087276458740234, 0.09465980529785156, 0.09844684600830078, 0.10223388671875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [10.0, 196.0, 742.0, 45.0, 11.0, 6.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26927781105041504, -0.14243300259113312, -0.015588194131851196, 0.11125659942626953, 0.23810142278671265, 0.36494624614715576, 0.4917910099029541, 0.6186358332633972, 0.7454806566238403, 0.8723254799842834, 0.9991703033447266, 1.126015067100525, 1.2528598308563232, 1.3797047138214111, 1.5065494775772095, 1.6333942413330078, 1.7602391242980957, 1.887083888053894, 2.0139286518096924, 2.1407735347747803, 2.267618417739868, 2.394463062286377, 2.521307945251465, 2.6481528282165527, 2.7749977111816406, 2.9018425941467285, 3.0286872386932373, 3.155532121658325, 3.282377004623413, 3.409221649169922, 3.5360665321350098, 3.6629114151000977, 3.7897562980651855, 3.9166011810302734, 4.043446063995361, 4.170290946960449, 4.297135353088379, 4.423980236053467, 4.550825119018555, 4.677670001983643, 4.8045148849487305, 4.931359767913818, 5.058204650878906, 5.185049057006836, 5.311893939971924, 5.438738822937012, 5.5655837059021, 5.6924285888671875, 5.819272994995117, 5.946117877960205, 6.072962760925293, 6.199807167053223, 6.3266520500183105, 6.453496932983398, 6.580341815948486, 6.707186698913574, 6.834031581878662, 6.96087646484375, 7.087721347808838, 7.214566230773926, 7.3414106369018555, 7.468255519866943, 7.595100402832031, 7.721945285797119, 7.848790168762207]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 2.0, 10.0, 1.0, 10.0, 6.0, 16.0, 21.0, 24.0, 26.0, 24.0, 36.0, 52.0, 52.0, 76.0, 81.0, 70.0, 66.0, 72.0, 62.0, 75.0, 54.0, 38.0, 38.0, 21.0, 14.0, 12.0, 8.0, 9.0, 5.0, 6.0, 1.0, 6.0, 4.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8020894527435303, -0.7790535092353821, -0.7560175657272339, -0.7329816222190857, -0.7099456787109375, -0.6869097352027893, -0.6638737916946411, -0.6408379077911377, -0.6178019046783447, -0.5947659611701965, -0.5717300176620483, -0.5486940741539001, -0.525658130645752, -0.5026221871376038, -0.47958627343177795, -0.45655032992362976, -0.43351441621780396, -0.41047847270965576, -0.38744252920150757, -0.3644065856933594, -0.3413706421852112, -0.318334698677063, -0.2952987849712372, -0.272262841463089, -0.2492268979549408, -0.2261909544467926, -0.2031550109386444, -0.1801190823316574, -0.15708313882350922, -0.13404719531536102, -0.11101126670837402, -0.08797532320022583, -0.06493937969207764, -0.04190343990921974, -0.018867500126361847, 0.0041684359312057495, 0.027204379439353943, 0.050240322947502136, 0.07327625155448914, 0.09631219506263733, 0.11934813857078552, 0.14238408207893372, 0.1654200255870819, 0.1884559541940689, 0.2114918977022171, 0.2345278412103653, 0.2575637698173523, 0.2805997133255005, 0.3036356568336487, 0.3266716003417969, 0.34970754384994507, 0.37274348735809326, 0.39577943086624146, 0.41881537437438965, 0.44185128808021545, 0.46488723158836365, 0.48792317509651184, 0.5109590888023376, 0.5339950323104858, 0.557030975818634, 0.5800669193267822, 0.6031028628349304, 0.6261388063430786, 0.6491747498512268, 0.672210693359375]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 5.0, 9.0, 3.0, 8.0, 13.0, 21.0, 24.0, 36.0, 62.0, 85.0, 141.0, 177.0, 256.0, 458.0, 681.0, 1082.0, 1811.0, 3147.0, 5799.0, 10969.0, 23399.0, 73340.0, 624329.0, 229924.0, 38290.0, 15967.0, 7896.0, 4334.0, 2462.0, 1368.0, 844.0, 533.0, 350.0, 257.0, 154.0, 99.0, 70.0, 39.0, 37.0, 24.0, 16.0, 7.0, 9.0, 13.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4541015625, -0.43933868408203125, -0.4245758056640625, -0.40981292724609375, -0.395050048828125, -0.38028717041015625, -0.3655242919921875, -0.35076141357421875, -0.33599853515625, -0.32123565673828125, -0.3064727783203125, -0.29170989990234375, -0.276947021484375, -0.26218414306640625, -0.2474212646484375, -0.23265838623046875, -0.2178955078125, -0.20313262939453125, -0.1883697509765625, -0.17360687255859375, -0.158843994140625, -0.14408111572265625, -0.1293182373046875, -0.11455535888671875, -0.09979248046875, -0.08502960205078125, -0.0702667236328125, -0.05550384521484375, -0.040740966796875, -0.02597808837890625, -0.0112152099609375, 0.00354766845703125, 0.018310546875, 0.03307342529296875, 0.0478363037109375, 0.06259918212890625, 0.077362060546875, 0.09212493896484375, 0.1068878173828125, 0.12165069580078125, 0.13641357421875, 0.15117645263671875, 0.1659393310546875, 0.18070220947265625, 0.195465087890625, 0.21022796630859375, 0.2249908447265625, 0.23975372314453125, 0.2545166015625, 0.26927947998046875, 0.2840423583984375, 0.29880523681640625, 0.313568115234375, 0.32833099365234375, 0.3430938720703125, 0.35785675048828125, 0.37261962890625, 0.38738250732421875, 0.4021453857421875, 0.41690826416015625, 0.431671142578125, 0.44643402099609375, 0.4611968994140625, 0.47595977783203125, 0.49072265625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 7.0, 13.0, 5.0, 6.0, 7.0, 5.0, 11.0, 24.0, 51.0, 98.0, 200.0, 217.0, 134.0, 86.0, 35.0, 14.0, 18.0, 12.0, 11.0, 5.0, 8.0, 2.0, 10.0, 3.0, 3.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1082763671875, -0.10529422760009766, -0.10231208801269531, -0.09932994842529297, -0.09634780883789062, -0.09336566925048828, -0.09038352966308594, -0.0874013900756836, -0.08441925048828125, -0.0814371109008789, -0.07845497131347656, -0.07547283172607422, -0.07249069213867188, -0.06950855255126953, -0.06652641296386719, -0.06354427337646484, -0.0605621337890625, -0.057579994201660156, -0.05459785461425781, -0.05161571502685547, -0.048633575439453125, -0.04565143585205078, -0.04266929626464844, -0.039687156677246094, -0.03670501708984375, -0.033722877502441406, -0.030740737915039062, -0.02775859832763672, -0.024776458740234375, -0.02179431915283203, -0.018812179565429688, -0.015830039978027344, -0.012847900390625, -0.009865760803222656, -0.0068836212158203125, -0.0039014816284179688, -0.000919342041015625, 0.0020627975463867188, 0.0050449371337890625, 0.008027076721191406, 0.01100921630859375, 0.013991355895996094, 0.016973495483398438, 0.01995563507080078, 0.022937774658203125, 0.02591991424560547, 0.028902053833007812, 0.031884193420410156, 0.0348663330078125, 0.037848472595214844, 0.04083061218261719, 0.04381275177001953, 0.046794891357421875, 0.04977703094482422, 0.05275917053222656, 0.055741310119628906, 0.05872344970703125, 0.061705589294433594, 0.06468772888183594, 0.06766986846923828, 0.07065200805664062, 0.07363414764404297, 0.07661628723144531, 0.07959842681884766, 0.08258056640625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 2.0, 2.0, 6.0, 8.0, 6.0, 15.0, 22.0, 24.0, 36.0, 36.0, 57.0, 90.0, 133.0, 220.0, 312.0, 564.0, 1127.0, 2568.0, 6794.0, 20761.0, 78357.0, 344449.0, 443789.0, 107001.0, 27194.0, 8587.0, 3239.0, 1334.0, 686.0, 382.0, 230.0, 154.0, 100.0, 65.0, 52.0, 38.0, 29.0, 20.0, 16.0, 17.0, 11.0, 6.0, 3.0, 8.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2841796875, -0.27407073974609375, -0.2639617919921875, -0.25385284423828125, -0.243743896484375, -0.23363494873046875, -0.2235260009765625, -0.21341705322265625, -0.20330810546875, -0.19319915771484375, -0.1830902099609375, -0.17298126220703125, -0.162872314453125, -0.15276336669921875, -0.1426544189453125, -0.13254547119140625, -0.1224365234375, -0.11232757568359375, -0.1022186279296875, -0.09210968017578125, -0.082000732421875, -0.07189178466796875, -0.0617828369140625, -0.05167388916015625, -0.04156494140625, -0.03145599365234375, -0.0213470458984375, -0.01123809814453125, -0.001129150390625, 0.00897979736328125, 0.0190887451171875, 0.02919769287109375, 0.039306640625, 0.04941558837890625, 0.0595245361328125, 0.06963348388671875, 0.079742431640625, 0.08985137939453125, 0.0999603271484375, 0.11006927490234375, 0.12017822265625, 0.13028717041015625, 0.1403961181640625, 0.15050506591796875, 0.160614013671875, 0.17072296142578125, 0.1808319091796875, 0.19094085693359375, 0.2010498046875, 0.21115875244140625, 0.2212677001953125, 0.23137664794921875, 0.241485595703125, 0.25159454345703125, 0.2617034912109375, 0.27181243896484375, 0.28192138671875, 0.29203033447265625, 0.3021392822265625, 0.31224822998046875, 0.322357177734375, 0.33246612548828125, 0.3425750732421875, 0.35268402099609375, 0.36279296875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 2.0, 2.0, 8.0, 7.0, 5.0, 6.0, 8.0, 8.0, 15.0, 17.0, 17.0, 16.0, 25.0, 24.0, 34.0, 38.0, 38.0, 29.0, 39.0, 27.0, 46.0, 52.0, 36.0, 46.0, 47.0, 43.0, 39.0, 38.0, 38.0, 35.0, 27.0, 32.0, 16.0, 27.0, 20.0, 14.0, 17.0, 10.0, 12.0, 4.0, 8.0, 7.0, 8.0, 3.0, 7.0, 1.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.263916015625, -0.25514984130859375, -0.2463836669921875, -0.23761749267578125, -0.228851318359375, -0.22008514404296875, -0.2113189697265625, -0.20255279541015625, -0.19378662109375, -0.18502044677734375, -0.1762542724609375, -0.16748809814453125, -0.158721923828125, -0.14995574951171875, -0.1411895751953125, -0.13242340087890625, -0.1236572265625, -0.11489105224609375, -0.1061248779296875, -0.09735870361328125, -0.088592529296875, -0.07982635498046875, -0.0710601806640625, -0.06229400634765625, -0.05352783203125, -0.04476165771484375, -0.0359954833984375, -0.02722930908203125, -0.018463134765625, -0.00969696044921875, -0.0009307861328125, 0.00783538818359375, 0.0166015625, 0.02536773681640625, 0.0341339111328125, 0.04290008544921875, 0.051666259765625, 0.06043243408203125, 0.0691986083984375, 0.07796478271484375, 0.08673095703125, 0.09549713134765625, 0.1042633056640625, 0.11302947998046875, 0.121795654296875, 0.13056182861328125, 0.1393280029296875, 0.14809417724609375, 0.1568603515625, 0.16562652587890625, 0.1743927001953125, 0.18315887451171875, 0.191925048828125, 0.20069122314453125, 0.2094573974609375, 0.21822357177734375, 0.22698974609375, 0.23575592041015625, 0.2445220947265625, 0.25328826904296875, 0.262054443359375, 0.27082061767578125, 0.2795867919921875, 0.28835296630859375, 0.297119140625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 1.0, 3.0, 4.0, 2.0, 4.0, 5.0, 3.0, 10.0, 11.0, 14.0, 19.0, 33.0, 43.0, 52.0, 75.0, 126.0, 219.0, 374.0, 757.0, 1781.0, 5006.0, 29857.0, 794822.0, 196999.0, 12581.0, 3059.0, 1233.0, 616.0, 320.0, 179.0, 104.0, 69.0, 49.0, 34.0, 20.0, 23.0, 15.0, 10.0, 5.0, 4.0, 5.0, 6.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.89404296875, -0.8650131225585938, -0.8359832763671875, -0.8069534301757812, -0.777923583984375, -0.7488937377929688, -0.7198638916015625, -0.6908340454101562, -0.66180419921875, -0.6327743530273438, -0.6037445068359375, -0.5747146606445312, -0.545684814453125, -0.5166549682617188, -0.4876251220703125, -0.45859527587890625, -0.4295654296875, -0.40053558349609375, -0.3715057373046875, -0.34247589111328125, -0.313446044921875, -0.28441619873046875, -0.2553863525390625, -0.22635650634765625, -0.19732666015625, -0.16829681396484375, -0.1392669677734375, -0.11023712158203125, -0.081207275390625, -0.05217742919921875, -0.0231475830078125, 0.00588226318359375, 0.034912109375, 0.06394195556640625, 0.0929718017578125, 0.12200164794921875, 0.151031494140625, 0.18006134033203125, 0.2090911865234375, 0.23812103271484375, 0.26715087890625, 0.29618072509765625, 0.3252105712890625, 0.35424041748046875, 0.383270263671875, 0.41230010986328125, 0.4413299560546875, 0.47035980224609375, 0.4993896484375, 0.5284194946289062, 0.5574493408203125, 0.5864791870117188, 0.615509033203125, 0.6445388793945312, 0.6735687255859375, 0.7025985717773438, 0.73162841796875, 0.7606582641601562, 0.7896881103515625, 0.8187179565429688, 0.847747802734375, 0.8767776489257812, 0.9058074951171875, 0.9348373413085938, 0.9638671875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 7.0, 4.0, 1.0, 7.0, 8.0, 1.0, 11.0, 11.0, 19.0, 36.0, 63.0, 123.0, 201.0, 199.0, 151.0, 60.0, 37.0, 19.0, 9.0, 9.0, 8.0, 6.0, 5.0, 6.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.322166442871094e-05, -8.989870548248291e-05, -8.657574653625488e-05, -8.325278759002686e-05, -7.992982864379883e-05, -7.66068696975708e-05, -7.328391075134277e-05, -6.996095180511475e-05, -6.663799285888672e-05, -6.331503391265869e-05, -5.9992074966430664e-05, -5.666911602020264e-05, -5.334615707397461e-05, -5.002319812774658e-05, -4.6700239181518555e-05, -4.337728023529053e-05, -4.00543212890625e-05, -3.673136234283447e-05, -3.3408403396606445e-05, -3.0085444450378418e-05, -2.676248550415039e-05, -2.3439526557922363e-05, -2.0116567611694336e-05, -1.679360866546631e-05, -1.3470649719238281e-05, -1.0147690773010254e-05, -6.8247318267822266e-06, -3.5017728805541992e-06, -1.7881393432617188e-07, 3.1441450119018555e-06, 6.467103958129883e-06, 9.79006290435791e-06, 1.3113021850585938e-05, 1.6435980796813965e-05, 1.9758939743041992e-05, 2.308189868927002e-05, 2.6404857635498047e-05, 2.9727816581726074e-05, 3.30507755279541e-05, 3.637373447418213e-05, 3.9696693420410156e-05, 4.3019652366638184e-05, 4.634261131286621e-05, 4.966557025909424e-05, 5.2988529205322266e-05, 5.631148815155029e-05, 5.963444709777832e-05, 6.295740604400635e-05, 6.628036499023438e-05, 6.96033239364624e-05, 7.292628288269043e-05, 7.624924182891846e-05, 7.957220077514648e-05, 8.289515972137451e-05, 8.621811866760254e-05, 8.954107761383057e-05, 9.28640365600586e-05, 9.618699550628662e-05, 9.950995445251465e-05, 0.00010283291339874268, 0.0001061558723449707, 0.00010947883129119873, 0.00011280179023742676, 0.00011612474918365479, 0.00011944770812988281]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 2.0, 8.0, 6.0, 6.0, 14.0, 20.0, 32.0, 71.0, 97.0, 158.0, 283.0, 629.0, 1418.0, 4760.0, 25319.0, 375155.0, 594842.0, 35905.0, 6265.0, 1882.0, 780.0, 379.0, 204.0, 96.0, 76.0, 51.0, 25.0, 21.0, 7.0, 10.0, 3.0, 6.0, 6.0, 4.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.66650390625, -0.6463546752929688, -0.6262054443359375, -0.6060562133789062, -0.585906982421875, -0.5657577514648438, -0.5456085205078125, -0.5254592895507812, -0.50531005859375, -0.48516082763671875, -0.4650115966796875, -0.44486236572265625, -0.424713134765625, -0.40456390380859375, -0.3844146728515625, -0.36426544189453125, -0.3441162109375, -0.32396697998046875, -0.3038177490234375, -0.28366851806640625, -0.263519287109375, -0.24337005615234375, -0.2232208251953125, -0.20307159423828125, -0.18292236328125, -0.16277313232421875, -0.1426239013671875, -0.12247467041015625, -0.102325439453125, -0.08217620849609375, -0.0620269775390625, -0.04187774658203125, -0.021728515625, -0.00157928466796875, 0.0185699462890625, 0.03871917724609375, 0.058868408203125, 0.07901763916015625, 0.0991668701171875, 0.11931610107421875, 0.13946533203125, 0.15961456298828125, 0.1797637939453125, 0.19991302490234375, 0.220062255859375, 0.24021148681640625, 0.2603607177734375, 0.28050994873046875, 0.3006591796875, 0.32080841064453125, 0.3409576416015625, 0.36110687255859375, 0.381256103515625, 0.40140533447265625, 0.4215545654296875, 0.44170379638671875, 0.46185302734375, 0.48200225830078125, 0.5021514892578125, 0.5223007202148438, 0.542449951171875, 0.5625991821289062, 0.5827484130859375, 0.6028976440429688, 0.623046875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 3.0, 7.0, 14.0, 15.0, 12.0, 20.0, 19.0, 50.0, 72.0, 96.0, 191.0, 167.0, 115.0, 75.0, 41.0, 31.0, 21.0, 16.0, 16.0, 8.0, 3.0, 5.0, 7.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58251953125, -0.5648956298828125, -0.547271728515625, -0.5296478271484375, -0.51202392578125, -0.4944000244140625, -0.476776123046875, -0.4591522216796875, -0.4415283203125, -0.4239044189453125, -0.406280517578125, -0.3886566162109375, -0.37103271484375, -0.3534088134765625, -0.335784912109375, -0.3181610107421875, -0.300537109375, -0.2829132080078125, -0.265289306640625, -0.2476654052734375, -0.23004150390625, -0.2124176025390625, -0.194793701171875, -0.1771697998046875, -0.1595458984375, -0.1419219970703125, -0.124298095703125, -0.1066741943359375, -0.08905029296875, -0.0714263916015625, -0.053802490234375, -0.0361785888671875, -0.0185546875, -0.0009307861328125, 0.016693115234375, 0.0343170166015625, 0.05194091796875, 0.0695648193359375, 0.087188720703125, 0.1048126220703125, 0.1224365234375, 0.1400604248046875, 0.157684326171875, 0.1753082275390625, 0.19293212890625, 0.2105560302734375, 0.228179931640625, 0.2458038330078125, 0.263427734375, 0.2810516357421875, 0.298675537109375, 0.3162994384765625, 0.33392333984375, 0.3515472412109375, 0.369171142578125, 0.3867950439453125, 0.4044189453125, 0.4220428466796875, 0.439666748046875, 0.4572906494140625, 0.47491455078125, 0.4925384521484375, 0.510162353515625, 0.5277862548828125, 0.54541015625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 27.0, 161.0, 507.0, 251.0, 37.0, 12.0, 7.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.829008102416992, -9.59841251373291, -9.367816925048828, -9.137221336364746, -8.906625747680664, -8.676031112670898, -8.445435523986816, -8.214839935302734, -7.984244346618652, -7.75364875793457, -7.523053169250488, -7.2924580574035645, -7.061862468719482, -6.8312668800354, -6.600671291351318, -6.3700761795043945, -6.1394805908203125, -5.9088850021362305, -5.678289413452148, -5.447694301605225, -5.217098712921143, -4.9865031242370605, -4.7559075355529785, -4.525312423706055, -4.2947163581848145, -4.064120769500732, -3.8335254192352295, -3.6029298305511475, -3.3723344802856445, -3.1417388916015625, -2.9111433029174805, -2.6805479526519775, -2.4499526023864746, -2.2193570137023926, -1.9887616634368896, -1.7581660747528076, -1.5275707244873047, -1.2969751358032227, -1.0663796663284302, -0.8357841968536377, -0.6051887273788452, -0.37459325790405273, -0.14399775862693787, 0.086597740650177, 0.3171932101249695, 0.5477887392044067, 0.7783842086791992, 1.0089796781539917, 1.2395751476287842, 1.4701706171035767, 1.7007660865783691, 1.9313616752624512, 2.161957025527954, 2.392552614212036, 2.623147964477539, 2.853743553161621, 3.084339141845703, 3.314934730529785, 3.545530080795288, 3.77612566947937, 4.006721019744873, 4.237316608428955, 4.467912197113037, 4.698507308959961, 4.929102897644043]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 5.0, 6.0, 7.0, 15.0, 18.0, 21.0, 27.0, 40.0, 54.0, 58.0, 74.0, 82.0, 118.0, 78.0, 82.0, 67.0, 59.0, 43.0, 47.0, 27.0, 16.0, 15.0, 9.0, 5.0, 8.0, 5.0, 2.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.269229412078857, -4.146988868713379, -4.024747848510742, -3.9025070667266846, -3.780266284942627, -3.6580257415771484, -3.535784959793091, -3.413544178009033, -3.2913033962249756, -3.169062614440918, -3.0468218326568604, -2.9245810508728027, -2.802340507507324, -2.6800994873046875, -2.557858943939209, -2.4356181621551514, -2.3133773803710938, -2.191136598587036, -2.0688958168029785, -1.9466551542282104, -1.8244143724441528, -1.7021735906600952, -1.5799329280853271, -1.4576921463012695, -1.335451364517212, -1.2132105827331543, -1.0909698009490967, -0.9687291383743286, -0.846488356590271, -0.7242475748062134, -0.6020068526268005, -0.4797661304473877, -0.3575253486633301, -0.23528459668159485, -0.11304384469985962, 0.00919690728187561, 0.13143765926361084, 0.25367844104766846, 0.3759191632270813, 0.49815988540649414, 0.6204006671905518, 0.7426414489746094, 0.8648821711540222, 0.9871228933334351, 1.1093636751174927, 1.2316044569015503, 1.3538451194763184, 1.476085901260376, 1.5983266830444336, 1.7205674648284912, 1.8428082466125488, 1.965048909187317, 2.087289810180664, 2.2095303535461426, 2.3317711353302, 2.454011917114258, 2.5762526988983154, 2.698493480682373, 2.8207342624664307, 2.9429750442504883, 3.065215587615967, 3.1874566078186035, 3.309697151184082, 3.4319379329681396, 3.5541787147521973]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 11.0, 7.0, 11.0, 3.0, 11.0, 11.0, 13.0, 21.0, 29.0, 39.0, 30.0, 59.0, 58.0, 91.0, 130.0, 217.0, 324.0, 463.0, 671.0, 1053.0, 1996.0, 4381.0, 15669.0, 153986.0, 3943980.0, 54535.0, 9175.0, 3278.0, 1510.0, 928.0, 526.0, 375.0, 256.0, 157.0, 97.0, 68.0, 28.0, 27.0, 9.0, 11.0, 10.0, 12.0, 8.0, 1.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.5810546875, -1.5387115478515625, -1.496368408203125, -1.4540252685546875, -1.41168212890625, -1.3693389892578125, -1.326995849609375, -1.2846527099609375, -1.2423095703125, -1.1999664306640625, -1.157623291015625, -1.1152801513671875, -1.07293701171875, -1.0305938720703125, -0.988250732421875, -0.9459075927734375, -0.903564453125, -0.8612213134765625, -0.818878173828125, -0.7765350341796875, -0.73419189453125, -0.6918487548828125, -0.649505615234375, -0.6071624755859375, -0.5648193359375, -0.5224761962890625, -0.480133056640625, -0.4377899169921875, -0.39544677734375, -0.3531036376953125, -0.310760498046875, -0.2684173583984375, -0.22607421875, -0.1837310791015625, -0.141387939453125, -0.0990447998046875, -0.05670166015625, -0.0143585205078125, 0.027984619140625, 0.0703277587890625, 0.1126708984375, 0.1550140380859375, 0.197357177734375, 0.2397003173828125, 0.28204345703125, 0.3243865966796875, 0.366729736328125, 0.4090728759765625, 0.451416015625, 0.4937591552734375, 0.536102294921875, 0.5784454345703125, 0.62078857421875, 0.6631317138671875, 0.705474853515625, 0.7478179931640625, 0.7901611328125, 0.8325042724609375, 0.874847412109375, 0.9171905517578125, 0.95953369140625, 1.0018768310546875, 1.044219970703125, 1.0865631103515625, 1.12890625]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 6.0, 2.0, 7.0, 7.0, 7.0, 12.0, 14.0, 25.0, 60.0, 126.0, 185.0, 165.0, 164.0, 91.0, 43.0, 26.0, 17.0, 9.0, 6.0, 7.0, 8.0, 2.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1197509765625, -0.11653423309326172, -0.11331748962402344, -0.11010074615478516, -0.10688400268554688, -0.1036672592163086, -0.10045051574707031, -0.09723377227783203, -0.09401702880859375, -0.09080028533935547, -0.08758354187011719, -0.0843667984008789, -0.08115005493164062, -0.07793331146240234, -0.07471656799316406, -0.07149982452392578, -0.0682830810546875, -0.06506633758544922, -0.06184959411621094, -0.058632850646972656, -0.055416107177734375, -0.052199363708496094, -0.04898262023925781, -0.04576587677001953, -0.04254913330078125, -0.03933238983154297, -0.03611564636230469, -0.032898902893066406, -0.029682159423828125, -0.026465415954589844, -0.023248672485351562, -0.02003192901611328, -0.016815185546875, -0.013598442077636719, -0.010381698608398438, -0.007164955139160156, -0.003948211669921875, -0.0007314682006835938, 0.0024852752685546875, 0.005702018737792969, 0.00891876220703125, 0.012135505676269531, 0.015352249145507812, 0.018568992614746094, 0.021785736083984375, 0.025002479553222656, 0.028219223022460938, 0.03143596649169922, 0.0346527099609375, 0.03786945343017578, 0.04108619689941406, 0.044302940368652344, 0.047519683837890625, 0.050736427307128906, 0.05395317077636719, 0.05716991424560547, 0.06038665771484375, 0.06360340118408203, 0.06682014465332031, 0.0700368881225586, 0.07325363159179688, 0.07647037506103516, 0.07968711853027344, 0.08290386199951172, 0.08612060546875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 3.0, 2.0, 4.0, 8.0, 6.0, 15.0, 30.0, 38.0, 68.0, 151.0, 463.0, 3551.0, 132918.0, 4039292.0, 15871.0, 1288.0, 324.0, 102.0, 52.0, 29.0, 16.0, 12.0, 12.0, 6.0, 7.0, 1.0, 2.0, 1.0, 0.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.15234375, -2.0975341796875, -2.042724609375, -1.9879150390625, -1.93310546875, -1.8782958984375, -1.823486328125, -1.7686767578125, -1.7138671875, -1.6590576171875, -1.604248046875, -1.5494384765625, -1.49462890625, -1.4398193359375, -1.385009765625, -1.3302001953125, -1.275390625, -1.2205810546875, -1.165771484375, -1.1109619140625, -1.05615234375, -1.0013427734375, -0.946533203125, -0.8917236328125, -0.8369140625, -0.7821044921875, -0.727294921875, -0.6724853515625, -0.61767578125, -0.5628662109375, -0.508056640625, -0.4532470703125, -0.3984375, -0.3436279296875, -0.288818359375, -0.2340087890625, -0.17919921875, -0.1243896484375, -0.069580078125, -0.0147705078125, 0.0400390625, 0.0948486328125, 0.149658203125, 0.2044677734375, 0.25927734375, 0.3140869140625, 0.368896484375, 0.4237060546875, 0.478515625, 0.5333251953125, 0.588134765625, 0.6429443359375, 0.69775390625, 0.7525634765625, 0.807373046875, 0.8621826171875, 0.9169921875, 0.9718017578125, 1.026611328125, 1.0814208984375, 1.13623046875, 1.1910400390625, 1.245849609375, 1.3006591796875, 1.35546875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 2.0, 4.0, 9.0, 16.0, 20.0, 12.0, 35.0, 62.0, 115.0, 226.0, 491.0, 1346.0, 945.0, 381.0, 154.0, 83.0, 51.0, 41.0, 26.0, 13.0, 5.0, 8.0, 4.0, 3.0, 5.0, 5.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10430908203125, -0.10027217864990234, -0.09623527526855469, -0.09219837188720703, -0.08816146850585938, -0.08412456512451172, -0.08008766174316406, -0.0760507583618164, -0.07201385498046875, -0.0679769515991211, -0.06394004821777344, -0.05990314483642578, -0.055866241455078125, -0.05182933807373047, -0.04779243469238281, -0.043755531311035156, -0.0397186279296875, -0.035681724548339844, -0.03164482116699219, -0.02760791778564453, -0.023571014404296875, -0.01953411102294922, -0.015497207641601562, -0.011460304260253906, -0.00742340087890625, -0.0033864974975585938, 0.0006504058837890625, 0.004687309265136719, 0.008724212646484375, 0.012761116027832031, 0.016798019409179688, 0.020834922790527344, 0.024871826171875, 0.028908729553222656, 0.03294563293457031, 0.03698253631591797, 0.041019439697265625, 0.04505634307861328, 0.04909324645996094, 0.053130149841308594, 0.05716705322265625, 0.061203956604003906, 0.06524085998535156, 0.06927776336669922, 0.07331466674804688, 0.07735157012939453, 0.08138847351074219, 0.08542537689208984, 0.0894622802734375, 0.09349918365478516, 0.09753608703613281, 0.10157299041748047, 0.10560989379882812, 0.10964679718017578, 0.11368370056152344, 0.1177206039428711, 0.12175750732421875, 0.1257944107055664, 0.12983131408691406, 0.13386821746826172, 0.13790512084960938, 0.14194202423095703, 0.1459789276123047, 0.15001583099365234, 0.154052734375]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 7.0, 17.0, 67.0, 293.0, 462.0, 129.0, 29.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8766725659370422, -0.8288012742996216, -0.7809299230575562, -0.7330585718154907, -0.6851872801780701, -0.6373159885406494, -0.589444637298584, -0.5415732860565186, -0.4937019944190979, -0.44583067297935486, -0.3979593515396118, -0.3500880300998688, -0.30221670866012573, -0.2543453872203827, -0.20647406578063965, -0.1586027443408966, -0.11073142290115356, -0.06286010146141052, -0.01498878002166748, 0.03288254141807556, 0.0807538628578186, 0.12862518429756165, 0.1764965057373047, 0.22436782717704773, 0.27223914861679077, 0.3201104700565338, 0.36798179149627686, 0.4158531129360199, 0.46372443437576294, 0.5115957260131836, 0.559467077255249, 0.6073384284973145, 0.6552097797393799, 0.7030811309814453, 0.750952422618866, 0.7988237142562866, 0.846695065498352, 0.8945664167404175, 0.9424377083778381, 0.9903090000152588, 1.0381803512573242, 1.0860517024993896, 1.133923053741455, 1.181794285774231, 1.2296656370162964, 1.2775369882583618, 1.3254082202911377, 1.3732795715332031, 1.4211509227752686, 1.469022274017334, 1.5168936252593994, 1.5647648572921753, 1.6126362085342407, 1.6605075597763062, 1.708378791809082, 1.7562501430511475, 1.804121494293213, 1.8519928455352783, 1.8998641967773438, 1.9477354288101196, 1.995606780052185, 2.043478012084961, 2.0913493633270264, 2.139220714569092, 2.1870920658111572]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 7.0, 5.0, 7.0, 5.0, 14.0, 14.0, 27.0, 18.0, 30.0, 40.0, 40.0, 54.0, 56.0, 67.0, 73.0, 73.0, 65.0, 61.0, 64.0, 46.0, 41.0, 36.0, 23.0, 32.0, 22.0, 18.0, 14.0, 19.0, 11.0, 6.0, 7.0, 1.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.4359545111656189, -0.42113929986953735, -0.4063240587711334, -0.3915088474750519, -0.37669363617897034, -0.3618783950805664, -0.34706318378448486, -0.3322479724884033, -0.3174327313899994, -0.30261752009391785, -0.2878022789955139, -0.2729870676994324, -0.25817185640335083, -0.2433566153049469, -0.22854140400886536, -0.21372617781162262, -0.19891096651554108, -0.18409574031829834, -0.1692805290222168, -0.15446530282497406, -0.13965007662773132, -0.12483485788106918, -0.11001963913440704, -0.0952044129371643, -0.08038919419050217, -0.06557397544384003, -0.05075874924659729, -0.03594353049993515, -0.021128308027982712, -0.0063130855560302734, 0.008502133190631866, 0.023317359387874603, 0.03813257813453674, 0.05294780060648918, 0.06776302307844162, 0.08257824182510376, 0.0973934680223465, 0.11220868676900864, 0.12702390551567078, 0.1418391317129135, 0.15665435791015625, 0.171469584107399, 0.18628479540348053, 0.20110002160072327, 0.215915247797966, 0.23073047399520874, 0.24554568529129028, 0.2603608965873718, 0.27517610788345337, 0.2899913191795349, 0.30480656027793884, 0.3196217715740204, 0.33443698287010193, 0.34925222396850586, 0.3640674352645874, 0.37888264656066895, 0.3936978876590729, 0.4085130989551544, 0.42332834005355835, 0.4381435513496399, 0.45295876264572144, 0.46777400374412537, 0.4825892150402069, 0.49740445613861084, 0.5122196674346924]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 4.0, 3.0, 6.0, 7.0, 19.0, 15.0, 23.0, 43.0, 83.0, 110.0, 197.0, 363.0, 785.0, 1870.0, 5541.0, 26539.0, 475706.0, 500497.0, 27502.0, 5677.0, 1871.0, 752.0, 394.0, 199.0, 137.0, 76.0, 37.0, 38.0, 19.0, 12.0, 12.0, 4.0, 2.0, 6.0, 3.0, 0.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.70947265625, -0.6865921020507812, -0.6637115478515625, -0.6408309936523438, -0.617950439453125, -0.5950698852539062, -0.5721893310546875, -0.5493087768554688, -0.52642822265625, -0.5035476684570312, -0.4806671142578125, -0.45778656005859375, -0.434906005859375, -0.41202545166015625, -0.3891448974609375, -0.36626434326171875, -0.3433837890625, -0.32050323486328125, -0.2976226806640625, -0.27474212646484375, -0.251861572265625, -0.22898101806640625, -0.2061004638671875, -0.18321990966796875, -0.16033935546875, -0.13745880126953125, -0.1145782470703125, -0.09169769287109375, -0.068817138671875, -0.04593658447265625, -0.0230560302734375, -0.00017547607421875, 0.022705078125, 0.04558563232421875, 0.0684661865234375, 0.09134674072265625, 0.114227294921875, 0.13710784912109375, 0.1599884033203125, 0.18286895751953125, 0.20574951171875, 0.22863006591796875, 0.2515106201171875, 0.27439117431640625, 0.297271728515625, 0.32015228271484375, 0.3430328369140625, 0.36591339111328125, 0.3887939453125, 0.41167449951171875, 0.4345550537109375, 0.45743560791015625, 0.480316162109375, 0.5031967163085938, 0.5260772705078125, 0.5489578247070312, 0.57183837890625, 0.5947189331054688, 0.6175994873046875, 0.6404800415039062, 0.663360595703125, 0.6862411499023438, 0.7091217041015625, 0.7320022583007812, 0.7548828125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 7.0, 1.0, 2.0, 12.0, 6.0, 8.0, 8.0, 17.0, 30.0, 73.0, 134.0, 196.0, 195.0, 122.0, 88.0, 45.0, 23.0, 9.0, 8.0, 6.0, 8.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.115966796875, -0.1129159927368164, -0.10986518859863281, -0.10681438446044922, -0.10376358032226562, -0.10071277618408203, -0.09766197204589844, -0.09461116790771484, -0.09156036376953125, -0.08850955963134766, -0.08545875549316406, -0.08240795135498047, -0.07935714721679688, -0.07630634307861328, -0.07325553894042969, -0.0702047348022461, -0.0671539306640625, -0.0641031265258789, -0.06105232238769531, -0.05800151824951172, -0.054950714111328125, -0.05189990997314453, -0.04884910583496094, -0.045798301696777344, -0.04274749755859375, -0.039696693420410156, -0.03664588928222656, -0.03359508514404297, -0.030544281005859375, -0.02749347686767578, -0.024442672729492188, -0.021391868591308594, -0.018341064453125, -0.015290260314941406, -0.012239456176757812, -0.009188652038574219, -0.006137847900390625, -0.0030870437622070312, -3.62396240234375e-05, 0.0030145645141601562, 0.00606536865234375, 0.009116172790527344, 0.012166976928710938, 0.015217781066894531, 0.018268585205078125, 0.02131938934326172, 0.024370193481445312, 0.027420997619628906, 0.0304718017578125, 0.033522605895996094, 0.03657341003417969, 0.03962421417236328, 0.042675018310546875, 0.04572582244873047, 0.04877662658691406, 0.051827430725097656, 0.05487823486328125, 0.057929039001464844, 0.06097984313964844, 0.06403064727783203, 0.06708145141601562, 0.07013225555419922, 0.07318305969238281, 0.0762338638305664, 0.07928466796875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 4.0, 0.0, 5.0, 8.0, 7.0, 11.0, 13.0, 12.0, 16.0, 24.0, 30.0, 31.0, 73.0, 70.0, 127.0, 192.0, 258.0, 516.0, 1122.0, 2882.0, 10504.0, 56342.0, 395847.0, 487000.0, 74321.0, 12946.0, 3336.0, 1261.0, 603.0, 313.0, 202.0, 142.0, 88.0, 55.0, 51.0, 34.0, 25.0, 19.0, 20.0, 13.0, 10.0, 7.0, 4.0, 3.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3720703125, -0.3592720031738281, -0.34647369384765625, -0.3336753845214844, -0.3208770751953125, -0.3080787658691406, -0.29528045654296875, -0.2824821472167969, -0.269683837890625, -0.2568855285644531, -0.24408721923828125, -0.23128890991210938, -0.2184906005859375, -0.20569229125976562, -0.19289398193359375, -0.18009567260742188, -0.16729736328125, -0.15449905395507812, -0.14170074462890625, -0.12890243530273438, -0.1161041259765625, -0.10330581665039062, -0.09050750732421875, -0.07770919799804688, -0.064910888671875, -0.052112579345703125, -0.03931427001953125, -0.026515960693359375, -0.0137176513671875, -0.000919342041015625, 0.01187896728515625, 0.024677276611328125, 0.0374755859375, 0.050273895263671875, 0.06307220458984375, 0.07587051391601562, 0.0886688232421875, 0.10146713256835938, 0.11426544189453125, 0.12706375122070312, 0.139862060546875, 0.15266036987304688, 0.16545867919921875, 0.17825698852539062, 0.1910552978515625, 0.20385360717773438, 0.21665191650390625, 0.22945022583007812, 0.24224853515625, 0.2550468444824219, 0.26784515380859375, 0.2806434631347656, 0.2934417724609375, 0.3062400817871094, 0.31903839111328125, 0.3318367004394531, 0.344635009765625, 0.3574333190917969, 0.37023162841796875, 0.3830299377441406, 0.3958282470703125, 0.4086265563964844, 0.42142486572265625, 0.4342231750488281, 0.447021484375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 9.0, 3.0, 6.0, 7.0, 4.0, 10.0, 8.0, 16.0, 21.0, 16.0, 30.0, 37.0, 31.0, 42.0, 47.0, 43.0, 58.0, 56.0, 66.0, 51.0, 64.0, 51.0, 43.0, 43.0, 40.0, 26.0, 29.0, 27.0, 20.0, 16.0, 18.0, 16.0, 11.0, 15.0, 4.0, 5.0, 4.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25634765625, -0.2475433349609375, -0.238739013671875, -0.2299346923828125, -0.22113037109375, -0.2123260498046875, -0.203521728515625, -0.1947174072265625, -0.1859130859375, -0.1771087646484375, -0.168304443359375, -0.1595001220703125, -0.15069580078125, -0.1418914794921875, -0.133087158203125, -0.1242828369140625, -0.115478515625, -0.1066741943359375, -0.097869873046875, -0.0890655517578125, -0.08026123046875, -0.0714569091796875, -0.062652587890625, -0.0538482666015625, -0.0450439453125, -0.0362396240234375, -0.027435302734375, -0.0186309814453125, -0.00982666015625, -0.0010223388671875, 0.007781982421875, 0.0165863037109375, 0.025390625, 0.0341949462890625, 0.042999267578125, 0.0518035888671875, 0.06060791015625, 0.0694122314453125, 0.078216552734375, 0.0870208740234375, 0.0958251953125, 0.1046295166015625, 0.113433837890625, 0.1222381591796875, 0.13104248046875, 0.1398468017578125, 0.148651123046875, 0.1574554443359375, 0.166259765625, 0.1750640869140625, 0.183868408203125, 0.1926727294921875, 0.20147705078125, 0.2102813720703125, 0.219085693359375, 0.2278900146484375, 0.2366943359375, 0.2454986572265625, 0.254302978515625, 0.2631072998046875, 0.27191162109375, 0.2807159423828125, 0.289520263671875, 0.2983245849609375, 0.30712890625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 0.0, 4.0, 10.0, 16.0, 15.0, 26.0, 42.0, 76.0, 145.0, 282.0, 681.0, 2126.0, 11524.0, 100782.0, 760168.0, 152364.0, 15890.0, 2874.0, 837.0, 328.0, 166.0, 66.0, 37.0, 23.0, 17.0, 18.0, 12.0, 6.0, 8.0, 5.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29345703125, -0.2828178405761719, -0.27217864990234375, -0.2615394592285156, -0.2509002685546875, -0.24026107788085938, -0.22962188720703125, -0.21898269653320312, -0.208343505859375, -0.19770431518554688, -0.18706512451171875, -0.17642593383789062, -0.1657867431640625, -0.15514755249023438, -0.14450836181640625, -0.13386917114257812, -0.12322998046875, -0.11259078979492188, -0.10195159912109375, -0.09131240844726562, -0.0806732177734375, -0.07003402709960938, -0.05939483642578125, -0.048755645751953125, -0.038116455078125, -0.027477264404296875, -0.01683807373046875, -0.006198883056640625, 0.0044403076171875, 0.015079498291015625, 0.02571868896484375, 0.036357879638671875, 0.0469970703125, 0.057636260986328125, 0.06827545166015625, 0.07891464233398438, 0.0895538330078125, 0.10019302368164062, 0.11083221435546875, 0.12147140502929688, 0.132110595703125, 0.14274978637695312, 0.15338897705078125, 0.16402816772460938, 0.1746673583984375, 0.18530654907226562, 0.19594573974609375, 0.20658493041992188, 0.21722412109375, 0.22786331176757812, 0.23850250244140625, 0.24914169311523438, 0.2597808837890625, 0.2704200744628906, 0.28105926513671875, 0.2916984558105469, 0.302337646484375, 0.3129768371582031, 0.32361602783203125, 0.3342552185058594, 0.3448944091796875, 0.3555335998535156, 0.36617279052734375, 0.3768119812011719, 0.387451171875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 0.0, 3.0, 2.0, 4.0, 12.0, 10.0, 13.0, 20.0, 20.0, 41.0, 49.0, 39.0, 74.0, 115.0, 153.0, 133.0, 94.0, 47.0, 47.0, 39.0, 29.0, 15.0, 16.0, 8.0, 9.0, 8.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.747245788574219e-05, -6.365403532981873e-05, -5.9835612773895264e-05, -5.60171902179718e-05, -5.219876766204834e-05, -4.838034510612488e-05, -4.4561922550201416e-05, -4.0743499994277954e-05, -3.692507743835449e-05, -3.310665488243103e-05, -2.928823232650757e-05, -2.5469809770584106e-05, -2.1651387214660645e-05, -1.7832964658737183e-05, -1.401454210281372e-05, -1.0196119546890259e-05, -6.377696990966797e-06, -2.559274435043335e-06, 1.259148120880127e-06, 5.077570676803589e-06, 8.89599323272705e-06, 1.2714415788650513e-05, 1.6532838344573975e-05, 2.0351260900497437e-05, 2.41696834564209e-05, 2.798810601234436e-05, 3.180652856826782e-05, 3.5624951124191284e-05, 3.9443373680114746e-05, 4.326179623603821e-05, 4.708021879196167e-05, 5.089864134788513e-05, 5.4717063903808594e-05, 5.8535486459732056e-05, 6.235390901565552e-05, 6.617233157157898e-05, 6.999075412750244e-05, 7.38091766834259e-05, 7.762759923934937e-05, 8.144602179527283e-05, 8.526444435119629e-05, 8.908286690711975e-05, 9.290128946304321e-05, 9.671971201896667e-05, 0.00010053813457489014, 0.0001043565571308136, 0.00010817497968673706, 0.00011199340224266052, 0.00011581182479858398, 0.00011963024735450745, 0.0001234486699104309, 0.00012726709246635437, 0.00013108551502227783, 0.0001349039375782013, 0.00013872236013412476, 0.00014254078269004822, 0.00014635920524597168, 0.00015017762780189514, 0.0001539960503578186, 0.00015781447291374207, 0.00016163289546966553, 0.000165451318025589, 0.00016926974058151245, 0.0001730881631374359, 0.00017690658569335938]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 2.0, 12.0, 19.0, 21.0, 44.0, 74.0, 127.0, 288.0, 666.0, 1751.0, 10037.0, 103243.0, 807136.0, 111404.0, 10490.0, 1973.0, 651.0, 307.0, 112.0, 80.0, 43.0, 30.0, 18.0, 14.0, 1.0, 5.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50244140625, -0.4893951416015625, -0.476348876953125, -0.4633026123046875, -0.45025634765625, -0.4372100830078125, -0.424163818359375, -0.4111175537109375, -0.3980712890625, -0.3850250244140625, -0.371978759765625, -0.3589324951171875, -0.34588623046875, -0.3328399658203125, -0.319793701171875, -0.3067474365234375, -0.293701171875, -0.2806549072265625, -0.267608642578125, -0.2545623779296875, -0.24151611328125, -0.2284698486328125, -0.215423583984375, -0.2023773193359375, -0.1893310546875, -0.1762847900390625, -0.163238525390625, -0.1501922607421875, -0.13714599609375, -0.1240997314453125, -0.111053466796875, -0.0980072021484375, -0.0849609375, -0.0719146728515625, -0.058868408203125, -0.0458221435546875, -0.03277587890625, -0.0197296142578125, -0.006683349609375, 0.0063629150390625, 0.0194091796875, 0.0324554443359375, 0.045501708984375, 0.0585479736328125, 0.07159423828125, 0.0846405029296875, 0.097686767578125, 0.1107330322265625, 0.123779296875, 0.1368255615234375, 0.149871826171875, 0.1629180908203125, 0.17596435546875, 0.1890106201171875, 0.202056884765625, 0.2151031494140625, 0.2281494140625, 0.2411956787109375, 0.254241943359375, 0.2672882080078125, 0.28033447265625, 0.2933807373046875, 0.306427001953125, 0.3194732666015625, 0.33251953125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 11.0, 16.0, 17.0, 24.0, 36.0, 59.0, 88.0, 115.0, 157.0, 159.0, 103.0, 65.0, 42.0, 34.0, 26.0, 21.0, 12.0, 7.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2393798828125, -0.23268890380859375, -0.2259979248046875, -0.21930694580078125, -0.212615966796875, -0.20592498779296875, -0.1992340087890625, -0.19254302978515625, -0.18585205078125, -0.17916107177734375, -0.1724700927734375, -0.16577911376953125, -0.159088134765625, -0.15239715576171875, -0.1457061767578125, -0.13901519775390625, -0.13232421875, -0.12563323974609375, -0.1189422607421875, -0.11225128173828125, -0.105560302734375, -0.09886932373046875, -0.0921783447265625, -0.08548736572265625, -0.07879638671875, -0.07210540771484375, -0.0654144287109375, -0.05872344970703125, -0.052032470703125, -0.04534149169921875, -0.0386505126953125, -0.03195953369140625, -0.0252685546875, -0.01857757568359375, -0.0118865966796875, -0.00519561767578125, 0.001495361328125, 0.00818634033203125, 0.0148773193359375, 0.02156829833984375, 0.02825927734375, 0.03495025634765625, 0.0416412353515625, 0.04833221435546875, 0.055023193359375, 0.06171417236328125, 0.0684051513671875, 0.07509613037109375, 0.081787109375, 0.08847808837890625, 0.0951690673828125, 0.10186004638671875, 0.108551025390625, 0.11524200439453125, 0.1219329833984375, 0.12862396240234375, 0.13531494140625, 0.14200592041015625, 0.1486968994140625, 0.15538787841796875, 0.162078857421875, 0.16876983642578125, 0.1754608154296875, 0.18215179443359375, 0.1888427734375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 10.0, 24.0, 87.0, 255.0, 368.0, 172.0, 59.0, 12.0, 7.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.41822624206543, -4.277159690856934, -4.1360931396484375, -3.9950265884399414, -3.8539600372314453, -3.712893486022949, -3.571826934814453, -3.430760383605957, -3.289693832397461, -3.148627281188965, -3.0075607299804688, -2.8664941787719727, -2.7254276275634766, -2.5843610763549805, -2.4432945251464844, -2.3022279739379883, -2.161161422729492, -2.020094871520996, -1.8790283203125, -1.737961769104004, -1.5968952178955078, -1.4558286666870117, -1.3147621154785156, -1.1736955642700195, -1.0326290130615234, -0.8915624618530273, -0.7504959106445312, -0.6094293594360352, -0.46836280822753906, -0.32729625701904297, -0.18622970581054688, -0.04516315460205078, 0.09590339660644531, 0.2369699478149414, 0.3780364990234375, 0.5191030502319336, 0.6601696014404297, 0.8012361526489258, 0.9423027038574219, 1.083369255065918, 1.224435806274414, 1.3655023574829102, 1.5065689086914062, 1.6476354598999023, 1.7887020111083984, 1.9297685623168945, 2.0708351135253906, 2.2119016647338867, 2.352968215942383, 2.494034767150879, 2.635101318359375, 2.776167869567871, 2.917234420776367, 3.0583009719848633, 3.1993675231933594, 3.3404340744018555, 3.4815006256103516, 3.6225671768188477, 3.7636337280273438, 3.90470027923584, 4.045766830444336, 4.186833381652832, 4.327899932861328, 4.468966484069824, 4.61003303527832]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 6.0, 3.0, 8.0, 14.0, 15.0, 16.0, 13.0, 35.0, 28.0, 38.0, 48.0, 56.0, 59.0, 52.0, 66.0, 76.0, 60.0, 64.0, 48.0, 45.0, 46.0, 45.0, 40.0, 27.0, 25.0, 15.0, 15.0, 15.0, 9.0, 2.0, 5.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1233720779418945, -2.0433895587921143, -1.963407278060913, -1.8834248781204224, -1.8034424781799316, -1.7234599590301514, -1.6434775590896606, -1.56349515914917, -1.4835127592086792, -1.4035303592681885, -1.3235479593276978, -1.243565559387207, -1.1635830402374268, -1.0836007595062256, -1.0036182403564453, -0.9236358404159546, -0.8436534404754639, -0.7636710405349731, -0.6836886405944824, -0.6037061810493469, -0.5237237811088562, -0.4437413811683655, -0.36375895142555237, -0.28377652168273926, -0.20379412174224854, -0.12381170690059662, -0.0438292920589447, 0.036153122782707214, 0.11613553762435913, 0.19611793756484985, 0.27610036730766296, 0.3560827970504761, 0.4360651969909668, 0.5160475969314575, 0.5960299968719482, 0.6760124564170837, 0.7559948563575745, 0.8359772562980652, 0.9159597158432007, 0.9959421157836914, 1.0759245157241821, 1.1559069156646729, 1.2358893156051636, 1.3158717155456543, 1.3958542346954346, 1.4758365154266357, 1.555819034576416, 1.6358014345169067, 1.7157838344573975, 1.7957662343978882, 1.875748634338379, 1.9557310342788696, 2.0357134342193604, 2.1156959533691406, 2.195678234100342, 2.275660753250122, 2.3556432723999023, 2.4356257915496826, 2.515608072280884, 2.595590591430664, 2.6755728721618652, 2.7555553913116455, 2.8355376720428467, 2.915520191192627, 2.995502471923828]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 5.0, 10.0, 8.0, 14.0, 13.0, 30.0, 44.0, 67.0, 123.0, 303.0, 911.0, 4727.0, 3453818.0, 729406.0, 3737.0, 655.0, 199.0, 89.0, 55.0, 32.0, 12.0, 14.0, 7.0, 0.0, 1.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.615234375, -3.52001953125, -3.4248046875, -3.32958984375, -3.234375, -3.13916015625, -3.0439453125, -2.94873046875, -2.853515625, -2.75830078125, -2.6630859375, -2.56787109375, -2.47265625, -2.37744140625, -2.2822265625, -2.18701171875, -2.091796875, -1.99658203125, -1.9013671875, -1.80615234375, -1.7109375, -1.61572265625, -1.5205078125, -1.42529296875, -1.330078125, -1.23486328125, -1.1396484375, -1.04443359375, -0.94921875, -0.85400390625, -0.7587890625, -0.66357421875, -0.568359375, -0.47314453125, -0.3779296875, -0.28271484375, -0.1875, -0.09228515625, 0.0029296875, 0.09814453125, 0.193359375, 0.28857421875, 0.3837890625, 0.47900390625, 0.57421875, 0.66943359375, 0.7646484375, 0.85986328125, 0.955078125, 1.05029296875, 1.1455078125, 1.24072265625, 1.3359375, 1.43115234375, 1.5263671875, 1.62158203125, 1.716796875, 1.81201171875, 1.9072265625, 2.00244140625, 2.09765625, 2.19287109375, 2.2880859375, 2.38330078125, 2.478515625]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 3.0, 5.0, 5.0, 14.0, 18.0, 16.0, 51.0, 63.0, 113.0, 134.0, 159.0, 119.0, 99.0, 67.0, 46.0, 27.0, 26.0, 11.0, 9.0, 3.0, 4.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.12939453125, -0.12602615356445312, -0.12265777587890625, -0.11928939819335938, -0.1159210205078125, -0.11255264282226562, -0.10918426513671875, -0.10581588745117188, -0.102447509765625, -0.09907913208007812, -0.09571075439453125, -0.09234237670898438, -0.0889739990234375, -0.08560562133789062, -0.08223724365234375, -0.07886886596679688, -0.07550048828125, -0.07213211059570312, -0.06876373291015625, -0.06539535522460938, -0.0620269775390625, -0.058658599853515625, -0.05529022216796875, -0.051921844482421875, -0.048553466796875, -0.045185089111328125, -0.04181671142578125, -0.038448333740234375, -0.0350799560546875, -0.031711578369140625, -0.02834320068359375, -0.024974822998046875, -0.0216064453125, -0.018238067626953125, -0.01486968994140625, -0.011501312255859375, -0.0081329345703125, -0.004764556884765625, -0.00139617919921875, 0.001972198486328125, 0.005340576171875, 0.008708953857421875, 0.01207733154296875, 0.015445709228515625, 0.0188140869140625, 0.022182464599609375, 0.02555084228515625, 0.028919219970703125, 0.03228759765625, 0.035655975341796875, 0.03902435302734375, 0.042392730712890625, 0.0457611083984375, 0.049129486083984375, 0.05249786376953125, 0.055866241455078125, 0.059234619140625, 0.06260299682617188, 0.06597137451171875, 0.06933975219726562, 0.0727081298828125, 0.07607650756835938, 0.07944488525390625, 0.08281326293945312, 0.086181640625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 5.0, 4.0, 9.0, 11.0, 19.0, 30.0, 48.0, 60.0, 88.0, 173.0, 317.0, 698.0, 1612.0, 3963.0, 13022.0, 63875.0, 1028269.0, 2945906.0, 109376.0, 18116.0, 5144.0, 1869.0, 819.0, 381.0, 180.0, 107.0, 60.0, 45.0, 28.0, 15.0, 5.0, 8.0, 7.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.395263671875, -0.3806953430175781, -0.36612701416015625, -0.3515586853027344, -0.3369903564453125, -0.3224220275878906, -0.30785369873046875, -0.2932853698730469, -0.278717041015625, -0.2641487121582031, -0.24958038330078125, -0.23501205444335938, -0.2204437255859375, -0.20587539672851562, -0.19130706787109375, -0.17673873901367188, -0.16217041015625, -0.14760208129882812, -0.13303375244140625, -0.11846542358398438, -0.1038970947265625, -0.08932876586914062, -0.07476043701171875, -0.060192108154296875, -0.045623779296875, -0.031055450439453125, -0.01648712158203125, -0.001918792724609375, 0.0126495361328125, 0.027217864990234375, 0.04178619384765625, 0.056354522705078125, 0.0709228515625, 0.08549118041992188, 0.10005950927734375, 0.11462783813476562, 0.1291961669921875, 0.14376449584960938, 0.15833282470703125, 0.17290115356445312, 0.187469482421875, 0.20203781127929688, 0.21660614013671875, 0.23117446899414062, 0.2457427978515625, 0.2603111267089844, 0.27487945556640625, 0.2894477844238281, 0.30401611328125, 0.3185844421386719, 0.33315277099609375, 0.3477210998535156, 0.3622894287109375, 0.3768577575683594, 0.39142608642578125, 0.4059944152832031, 0.420562744140625, 0.4351310729980469, 0.44969940185546875, 0.4642677307128906, 0.4788360595703125, 0.4934043884277344, 0.5079727172851562, 0.5225410461425781, 0.537109375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 5.0, 11.0, 5.0, 12.0, 18.0, 16.0, 20.0, 24.0, 54.0, 99.0, 137.0, 258.0, 501.0, 1303.0, 796.0, 311.0, 182.0, 87.0, 79.0, 33.0, 34.0, 16.0, 11.0, 11.0, 8.0, 13.0, 5.0, 2.0, 4.0, 6.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.125, -0.12169170379638672, -0.11838340759277344, -0.11507511138916016, -0.11176681518554688, -0.1084585189819336, -0.10515022277832031, -0.10184192657470703, -0.09853363037109375, -0.09522533416748047, -0.09191703796386719, -0.0886087417602539, -0.08530044555664062, -0.08199214935302734, -0.07868385314941406, -0.07537555694580078, -0.0720672607421875, -0.06875896453857422, -0.06545066833496094, -0.062142372131347656, -0.058834075927734375, -0.055525779724121094, -0.05221748352050781, -0.04890918731689453, -0.04560089111328125, -0.04229259490966797, -0.03898429870605469, -0.035676002502441406, -0.032367706298828125, -0.029059410095214844, -0.025751113891601562, -0.02244281768798828, -0.019134521484375, -0.01582622528076172, -0.012517929077148438, -0.009209632873535156, -0.005901336669921875, -0.0025930404663085938, 0.0007152557373046875, 0.004023551940917969, 0.00733184814453125, 0.010640144348144531, 0.013948440551757812, 0.017256736755371094, 0.020565032958984375, 0.023873329162597656, 0.027181625366210938, 0.03048992156982422, 0.0337982177734375, 0.03710651397705078, 0.04041481018066406, 0.043723106384277344, 0.047031402587890625, 0.050339698791503906, 0.05364799499511719, 0.05695629119873047, 0.06026458740234375, 0.06357288360595703, 0.06688117980957031, 0.0701894760131836, 0.07349777221679688, 0.07680606842041016, 0.08011436462402344, 0.08342266082763672, 0.08673095703125]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 4.0, 12.0, 52.0, 244.0, 453.0, 199.0, 40.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9817826747894287, -0.9313123822212219, -0.8808420300483704, -0.8303717374801636, -0.779901385307312, -0.7294310927391052, -0.6789608001708984, -0.6284904479980469, -0.5780200958251953, -0.5275498032569885, -0.47707945108413696, -0.4266091585159302, -0.3761388063430786, -0.3256685137748718, -0.27519819140434265, -0.22472786903381348, -0.1742575764656067, -0.12378725409507751, -0.07331693917512894, -0.02284662425518036, 0.027623698115348816, 0.0780940055847168, 0.12856432795524597, 0.17903465032577515, 0.22950497269630432, 0.2799752950668335, 0.33044561743736267, 0.38091593980789185, 0.43138623237609863, 0.4818565547466278, 0.532326877117157, 0.5827971696853638, 0.6332675218582153, 0.6837378144264221, 0.7342081665992737, 0.7846784591674805, 0.835148811340332, 0.8856191039085388, 0.9360893964767456, 0.9865597486495972, 1.0370301008224487, 1.0875004529953003, 1.1379706859588623, 1.1884410381317139, 1.2389113903045654, 1.289381742477417, 1.339851975440979, 1.3903223276138306, 1.4407925605773926, 1.4912629127502441, 1.5417331457138062, 1.5922034978866577, 1.6426738500595093, 1.6931440830230713, 1.7436144351959229, 1.7940847873687744, 1.844555139541626, 1.8950254917144775, 1.9454957246780396, 1.9959660768508911, 2.046436309814453, 2.0969066619873047, 2.1473770141601562, 2.197847366333008, 2.2483177185058594]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 4.0, 4.0, 6.0, 7.0, 8.0, 10.0, 15.0, 7.0, 17.0, 17.0, 29.0, 27.0, 36.0, 30.0, 43.0, 35.0, 42.0, 49.0, 43.0, 46.0, 44.0, 46.0, 50.0, 53.0, 41.0, 37.0, 41.0, 35.0, 23.0, 27.0, 32.0, 17.0, 17.0, 15.0, 10.0, 13.0, 6.0, 10.0, 5.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35060304403305054, -0.3394174873828888, -0.32823196053504944, -0.3170464038848877, -0.30586087703704834, -0.2946753203868866, -0.28348976373672485, -0.2723042368888855, -0.26111871004104614, -0.2499331682920456, -0.23874762654304504, -0.2275620698928833, -0.21637654304504395, -0.2051909863948822, -0.19400544464588165, -0.1828199028968811, -0.17163434624671936, -0.1604488044977188, -0.14926326274871826, -0.13807770609855652, -0.12689217925071716, -0.11570663005113602, -0.10452108085155487, -0.09333553910255432, -0.08214999735355377, -0.07096445560455322, -0.059778910130262375, -0.04859336465597153, -0.03740782290697098, -0.02622228115797043, -0.015036731958389282, -0.003851190209388733, 0.007334351539611816, 0.018519895151257515, 0.029705438762903214, 0.04089098423719406, 0.05207652598619461, 0.06326206773519516, 0.0744476169347763, 0.08563315868377686, 0.0968187004327774, 0.10800424218177795, 0.1191897839307785, 0.13037532567977905, 0.1415608823299408, 0.15274640917778015, 0.1639319658279419, 0.17511750757694244, 0.186303049325943, 0.19748859107494354, 0.2086741328239441, 0.21985968947410583, 0.2310452163219452, 0.24223077297210693, 0.2534162998199463, 0.26460185647010803, 0.2757874131202698, 0.2869729697704315, 0.2981584966182709, 0.3093440532684326, 0.320529580116272, 0.3317151367664337, 0.34290069341659546, 0.3540862202644348, 0.36527174711227417]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 6.0, 6.0, 1.0, 3.0, 7.0, 5.0, 8.0, 25.0, 41.0, 53.0, 81.0, 132.0, 247.0, 519.0, 1131.0, 2864.0, 10720.0, 111481.0, 805033.0, 101050.0, 10165.0, 2777.0, 1092.0, 492.0, 255.0, 132.0, 87.0, 54.0, 31.0, 17.0, 10.0, 6.0, 5.0, 8.0, 3.0, 4.0, 1.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.6884765625, -0.6679153442382812, -0.6473541259765625, -0.6267929077148438, -0.606231689453125, -0.5856704711914062, -0.5651092529296875, -0.5445480346679688, -0.52398681640625, -0.5034255981445312, -0.4828643798828125, -0.46230316162109375, -0.441741943359375, -0.42118072509765625, -0.4006195068359375, -0.38005828857421875, -0.3594970703125, -0.33893585205078125, -0.3183746337890625, -0.29781341552734375, -0.277252197265625, -0.25669097900390625, -0.2361297607421875, -0.21556854248046875, -0.19500732421875, -0.17444610595703125, -0.1538848876953125, -0.13332366943359375, -0.112762451171875, -0.09220123291015625, -0.0716400146484375, -0.05107879638671875, -0.030517578125, -0.00995635986328125, 0.0106048583984375, 0.03116607666015625, 0.051727294921875, 0.07228851318359375, 0.0928497314453125, 0.11341094970703125, 0.13397216796875, 0.15453338623046875, 0.1750946044921875, 0.19565582275390625, 0.216217041015625, 0.23677825927734375, 0.2573394775390625, 0.27790069580078125, 0.2984619140625, 0.31902313232421875, 0.3395843505859375, 0.36014556884765625, 0.380706787109375, 0.40126800537109375, 0.4218292236328125, 0.44239044189453125, 0.46295166015625, 0.48351287841796875, 0.5040740966796875, 0.5246353149414062, 0.545196533203125, 0.5657577514648438, 0.5863189697265625, 0.6068801879882812, 0.62744140625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 6.0, 4.0, 7.0, 7.0, 14.0, 16.0, 31.0, 65.0, 102.0, 128.0, 163.0, 136.0, 119.0, 64.0, 53.0, 38.0, 19.0, 10.0, 5.0, 4.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.12322998046875, -0.12003898620605469, -0.11684799194335938, -0.11365699768066406, -0.11046600341796875, -0.10727500915527344, -0.10408401489257812, -0.10089302062988281, -0.0977020263671875, -0.09451103210449219, -0.09132003784179688, -0.08812904357910156, -0.08493804931640625, -0.08174705505371094, -0.07855606079101562, -0.07536506652832031, -0.072174072265625, -0.06898307800292969, -0.06579208374023438, -0.06260108947753906, -0.05941009521484375, -0.05621910095214844, -0.053028106689453125, -0.04983711242675781, -0.0466461181640625, -0.04345512390136719, -0.040264129638671875, -0.03707313537597656, -0.03388214111328125, -0.030691146850585938, -0.027500152587890625, -0.024309158325195312, -0.0211181640625, -0.017927169799804688, -0.014736175537109375, -0.011545181274414062, -0.00835418701171875, -0.0051631927490234375, -0.001972198486328125, 0.0012187957763671875, 0.0044097900390625, 0.0076007843017578125, 0.010791778564453125, 0.013982772827148438, 0.01717376708984375, 0.020364761352539062, 0.023555755615234375, 0.026746749877929688, 0.029937744140625, 0.03312873840332031, 0.036319732666015625, 0.03951072692871094, 0.04270172119140625, 0.04589271545410156, 0.049083709716796875, 0.05227470397949219, 0.0554656982421875, 0.05865669250488281, 0.061847686767578125, 0.06503868103027344, 0.06822967529296875, 0.07142066955566406, 0.07461166381835938, 0.07780265808105469, 0.08099365234375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 5.0, 6.0, 7.0, 14.0, 12.0, 24.0, 32.0, 42.0, 54.0, 66.0, 106.0, 159.0, 236.0, 421.0, 838.0, 1828.0, 5755.0, 22517.0, 108711.0, 450827.0, 358395.0, 74482.0, 16300.0, 4372.0, 1592.0, 671.0, 364.0, 214.0, 130.0, 112.0, 70.0, 46.0, 38.0, 28.0, 24.0, 13.0, 15.0, 9.0, 10.0, 3.0, 8.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3046875, -0.29376220703125, -0.2828369140625, -0.27191162109375, -0.260986328125, -0.25006103515625, -0.2391357421875, -0.22821044921875, -0.21728515625, -0.20635986328125, -0.1954345703125, -0.18450927734375, -0.173583984375, -0.16265869140625, -0.1517333984375, -0.14080810546875, -0.1298828125, -0.11895751953125, -0.1080322265625, -0.09710693359375, -0.086181640625, -0.07525634765625, -0.0643310546875, -0.05340576171875, -0.04248046875, -0.03155517578125, -0.0206298828125, -0.00970458984375, 0.001220703125, 0.01214599609375, 0.0230712890625, 0.03399658203125, 0.044921875, 0.05584716796875, 0.0667724609375, 0.07769775390625, 0.088623046875, 0.09954833984375, 0.1104736328125, 0.12139892578125, 0.13232421875, 0.14324951171875, 0.1541748046875, 0.16510009765625, 0.176025390625, 0.18695068359375, 0.1978759765625, 0.20880126953125, 0.2197265625, 0.23065185546875, 0.2415771484375, 0.25250244140625, 0.263427734375, 0.27435302734375, 0.2852783203125, 0.29620361328125, 0.30712890625, 0.31805419921875, 0.3289794921875, 0.33990478515625, 0.350830078125, 0.36175537109375, 0.3726806640625, 0.38360595703125, 0.39453125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 7.0, 5.0, 7.0, 11.0, 23.0, 19.0, 19.0, 18.0, 33.0, 32.0, 39.0, 37.0, 37.0, 37.0, 54.0, 49.0, 65.0, 52.0, 38.0, 54.0, 47.0, 41.0, 40.0, 44.0, 39.0, 19.0, 18.0, 19.0, 24.0, 15.0, 15.0, 12.0, 11.0, 11.0, 3.0, 7.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28369140625, -0.2737236022949219, -0.26375579833984375, -0.2537879943847656, -0.2438201904296875, -0.23385238647460938, -0.22388458251953125, -0.21391677856445312, -0.203948974609375, -0.19398117065429688, -0.18401336669921875, -0.17404556274414062, -0.1640777587890625, -0.15410995483398438, -0.14414215087890625, -0.13417434692382812, -0.12420654296875, -0.11423873901367188, -0.10427093505859375, -0.09430313110351562, -0.0843353271484375, -0.07436752319335938, -0.06439971923828125, -0.054431915283203125, -0.044464111328125, -0.034496307373046875, -0.02452850341796875, -0.014560699462890625, -0.0045928955078125, 0.005374908447265625, 0.01534271240234375, 0.025310516357421875, 0.0352783203125, 0.045246124267578125, 0.05521392822265625, 0.06518173217773438, 0.0751495361328125, 0.08511734008789062, 0.09508514404296875, 0.10505294799804688, 0.115020751953125, 0.12498855590820312, 0.13495635986328125, 0.14492416381835938, 0.1548919677734375, 0.16485977172851562, 0.17482757568359375, 0.18479537963867188, 0.19476318359375, 0.20473098754882812, 0.21469879150390625, 0.22466659545898438, 0.2346343994140625, 0.24460220336914062, 0.25457000732421875, 0.2645378112792969, 0.274505615234375, 0.2844734191894531, 0.29444122314453125, 0.3044090270996094, 0.3143768310546875, 0.3243446350097656, 0.33431243896484375, 0.3442802429199219, 0.354248046875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 11.0, 6.0, 13.0, 23.0, 49.0, 66.0, 141.0, 326.0, 936.0, 3898.0, 27676.0, 244591.0, 662489.0, 94067.0, 11067.0, 2069.0, 612.0, 274.0, 108.0, 58.0, 28.0, 18.0, 12.0, 11.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.302490234375, -0.29415321350097656, -0.2858161926269531, -0.2774791717529297, -0.26914215087890625, -0.2608051300048828, -0.2524681091308594, -0.24413108825683594, -0.2357940673828125, -0.22745704650878906, -0.21912002563476562, -0.2107830047607422, -0.20244598388671875, -0.1941089630126953, -0.18577194213867188, -0.17743492126464844, -0.169097900390625, -0.16076087951660156, -0.15242385864257812, -0.1440868377685547, -0.13574981689453125, -0.1274127960205078, -0.11907577514648438, -0.11073875427246094, -0.1024017333984375, -0.09406471252441406, -0.08572769165039062, -0.07739067077636719, -0.06905364990234375, -0.06071662902832031, -0.052379608154296875, -0.04404258728027344, -0.03570556640625, -0.027368545532226562, -0.019031524658203125, -0.010694503784179688, -0.00235748291015625, 0.0059795379638671875, 0.014316558837890625, 0.022653579711914062, 0.0309906005859375, 0.03932762145996094, 0.047664642333984375, 0.05600166320800781, 0.06433868408203125, 0.07267570495605469, 0.08101272583007812, 0.08934974670410156, 0.097686767578125, 0.10602378845214844, 0.11436080932617188, 0.12269783020019531, 0.13103485107421875, 0.1393718719482422, 0.14770889282226562, 0.15604591369628906, 0.1643829345703125, 0.17271995544433594, 0.18105697631835938, 0.1893939971923828, 0.19773101806640625, 0.2060680389404297, 0.21440505981445312, 0.22274208068847656, 0.2310791015625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 2.0, 2.0, 7.0, 8.0, 8.0, 18.0, 21.0, 27.0, 32.0, 41.0, 48.0, 78.0, 163.0, 163.0, 122.0, 71.0, 38.0, 30.0, 23.0, 28.0, 24.0, 16.0, 7.0, 6.0, 6.0, 6.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.255243301391602e-05, -7.902737706899643e-05, -7.550232112407684e-05, -7.197726517915726e-05, -6.845220923423767e-05, -6.492715328931808e-05, -6.14020973443985e-05, -5.787704139947891e-05, -5.4351985454559326e-05, -5.082692950963974e-05, -4.7301873564720154e-05, -4.377681761980057e-05, -4.025176167488098e-05, -3.6726705729961395e-05, -3.320164978504181e-05, -2.9676593840122223e-05, -2.6151537895202637e-05, -2.262648195028305e-05, -1.9101426005363464e-05, -1.5576370060443878e-05, -1.2051314115524292e-05, -8.526258170604706e-06, -5.00120222568512e-06, -1.4761462807655334e-06, 2.0489096641540527e-06, 5.573965609073639e-06, 9.099021553993225e-06, 1.2624077498912811e-05, 1.6149133443832397e-05, 1.9674189388751984e-05, 2.319924533367157e-05, 2.6724301278591156e-05, 3.0249357223510742e-05, 3.377441316843033e-05, 3.7299469113349915e-05, 4.08245250582695e-05, 4.434958100318909e-05, 4.787463694810867e-05, 5.139969289302826e-05, 5.4924748837947845e-05, 5.844980478286743e-05, 6.197486072778702e-05, 6.54999166727066e-05, 6.902497261762619e-05, 7.255002856254578e-05, 7.607508450746536e-05, 7.960014045238495e-05, 8.312519639730453e-05, 8.665025234222412e-05, 9.017530828714371e-05, 9.37003642320633e-05, 9.722542017698288e-05, 0.00010075047612190247, 0.00010427553206682205, 0.00010780058801174164, 0.00011132564395666122, 0.00011485069990158081, 0.0001183757558465004, 0.00012190081179141998, 0.00012542586773633957, 0.00012895092368125916, 0.00013247597962617874, 0.00013600103557109833, 0.00013952609151601791, 0.0001430511474609375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 3.0, 11.0, 18.0, 28.0, 27.0, 60.0, 59.0, 145.0, 311.0, 593.0, 1664.0, 6569.0, 41228.0, 322749.0, 587047.0, 73523.0, 10701.0, 2227.0, 801.0, 359.0, 175.0, 95.0, 57.0, 38.0, 20.0, 14.0, 9.0, 11.0, 6.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.39501953125, -0.3856468200683594, -0.37627410888671875, -0.3669013977050781, -0.3575286865234375, -0.3481559753417969, -0.33878326416015625, -0.3294105529785156, -0.320037841796875, -0.3106651306152344, -0.30129241943359375, -0.2919197082519531, -0.2825469970703125, -0.2731742858886719, -0.26380157470703125, -0.2544288635253906, -0.24505615234375, -0.23568344116210938, -0.22631072998046875, -0.21693801879882812, -0.2075653076171875, -0.19819259643554688, -0.18881988525390625, -0.17944717407226562, -0.170074462890625, -0.16070175170898438, -0.15132904052734375, -0.14195632934570312, -0.1325836181640625, -0.12321090698242188, -0.11383819580078125, -0.10446548461914062, -0.0950927734375, -0.08572006225585938, -0.07634735107421875, -0.06697463989257812, -0.0576019287109375, -0.048229217529296875, -0.03885650634765625, -0.029483795166015625, -0.020111083984375, -0.010738372802734375, -0.00136566162109375, 0.008007049560546875, 0.0173797607421875, 0.026752471923828125, 0.03612518310546875, 0.045497894287109375, 0.05487060546875, 0.06424331665039062, 0.07361602783203125, 0.08298873901367188, 0.0923614501953125, 0.10173416137695312, 0.11110687255859375, 0.12047958374023438, 0.129852294921875, 0.13922500610351562, 0.14859771728515625, 0.15797042846679688, 0.1673431396484375, 0.17671585083007812, 0.18608856201171875, 0.19546127319335938, 0.204833984375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 5.0, 3.0, 6.0, 11.0, 9.0, 11.0, 12.0, 11.0, 18.0, 12.0, 19.0, 38.0, 39.0, 43.0, 45.0, 69.0, 74.0, 80.0, 88.0, 68.0, 82.0, 51.0, 42.0, 26.0, 26.0, 26.0, 13.0, 15.0, 13.0, 11.0, 7.0, 9.0, 5.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.1380615234375, -0.1341991424560547, -0.13033676147460938, -0.12647438049316406, -0.12261199951171875, -0.11874961853027344, -0.11488723754882812, -0.11102485656738281, -0.1071624755859375, -0.10330009460449219, -0.09943771362304688, -0.09557533264160156, -0.09171295166015625, -0.08785057067871094, -0.08398818969726562, -0.08012580871582031, -0.076263427734375, -0.07240104675292969, -0.06853866577148438, -0.06467628479003906, -0.06081390380859375, -0.05695152282714844, -0.053089141845703125, -0.04922676086425781, -0.0453643798828125, -0.04150199890136719, -0.037639617919921875, -0.03377723693847656, -0.02991485595703125, -0.026052474975585938, -0.022190093994140625, -0.018327713012695312, -0.01446533203125, -0.010602951049804688, -0.006740570068359375, -0.0028781890869140625, 0.00098419189453125, 0.0048465728759765625, 0.008708953857421875, 0.012571334838867188, 0.0164337158203125, 0.020296096801757812, 0.024158477783203125, 0.028020858764648438, 0.03188323974609375, 0.03574562072753906, 0.039608001708984375, 0.04347038269042969, 0.047332763671875, 0.05119514465332031, 0.055057525634765625, 0.05891990661621094, 0.06278228759765625, 0.06664466857910156, 0.07050704956054688, 0.07436943054199219, 0.0782318115234375, 0.08209419250488281, 0.08595657348632812, 0.08981895446777344, 0.09368133544921875, 0.09754371643066406, 0.10140609741210938, 0.10526847839355469, 0.109130859375]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 12.0, 24.0, 39.0, 74.0, 162.0, 217.0, 221.0, 119.0, 60.0, 35.0, 21.0, 12.0, 6.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.002054691314697, -3.9129621982574463, -3.8238697052001953, -3.7347772121429443, -3.6456847190856934, -3.5565922260284424, -3.4674997329711914, -3.3784074783325195, -3.2893147468566895, -3.2002222537994385, -3.1111297607421875, -3.0220372676849365, -2.9329447746276855, -2.8438522815704346, -2.7547597885131836, -2.6656675338745117, -2.5765750408172607, -2.4874825477600098, -2.398390054702759, -2.309297561645508, -2.220205068588257, -2.131112575531006, -2.042020320892334, -1.9529277086257935, -1.8638352155685425, -1.7747427225112915, -1.6856502294540405, -1.596557855606079, -1.5074653625488281, -1.4183728694915771, -1.3292803764343262, -1.2401878833770752, -1.1510956287384033, -1.0620031356811523, -0.9729106426239014, -0.8838182091712952, -0.7947257161140442, -0.7056332230567932, -0.616540789604187, -0.527448296546936, -0.43835580348968506, -0.3492633104324341, -0.2601708471775055, -0.1710783839225769, -0.08198589086532593, 0.007106602191925049, 0.09619903564453125, 0.18529152870178223, 0.2743840217590332, 0.3634765148162842, 0.45256897807121277, 0.5416614413261414, 0.6307539343833923, 0.7198464274406433, 0.8089388608932495, 0.8980313539505005, 0.9871238470077515, 1.0762163400650024, 1.1653088331222534, 1.2544012069702148, 1.3434937000274658, 1.4325861930847168, 1.5216786861419678, 1.6107711791992188, 1.6998636722564697]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 4.0, 3.0, 5.0, 10.0, 9.0, 14.0, 8.0, 11.0, 19.0, 19.0, 20.0, 23.0, 23.0, 39.0, 31.0, 28.0, 38.0, 40.0, 52.0, 57.0, 54.0, 55.0, 49.0, 52.0, 33.0, 37.0, 34.0, 29.0, 34.0, 28.0, 20.0, 18.0, 18.0, 12.0, 18.0, 7.0, 12.0, 6.0, 7.0, 13.0, 7.0, 5.0, 2.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-2.007315158843994, -1.9458867311477661, -1.884458303451538, -1.82302987575531, -1.761601448059082, -1.700173020362854, -1.638744592666626, -1.577316164970398, -1.51588773727417, -1.454459309577942, -1.3930308818817139, -1.3316024541854858, -1.2701740264892578, -1.2087455987930298, -1.1473171710968018, -1.0858887434005737, -1.0244603157043457, -0.9630318880081177, -0.9016034603118896, -0.8401750326156616, -0.7787466049194336, -0.7173181772232056, -0.6558897495269775, -0.5944613218307495, -0.533033013343811, -0.471604585647583, -0.410176157951355, -0.34874773025512695, -0.2873193025588989, -0.2258909046649933, -0.16446247696876526, -0.10303404927253723, -0.041605591773986816, 0.019822832196950912, 0.08125125616788864, 0.14267967641353607, 0.2041081041097641, 0.26553651690483093, 0.32696494460105896, 0.388393372297287, 0.449821799993515, 0.5112501978874207, 0.5726786255836487, 0.6341070532798767, 0.6955354809761047, 0.7569639086723328, 0.8183923363685608, 0.8798207640647888, 0.9412491917610168, 1.0026775598526, 1.0641059875488281, 1.1255344152450562, 1.1869628429412842, 1.2483912706375122, 1.3098196983337402, 1.3712481260299683, 1.4326765537261963, 1.4941049814224243, 1.5555334091186523, 1.6169618368148804, 1.6783902645111084, 1.7398186922073364, 1.8012471199035645, 1.8626755475997925, 1.9241039752960205]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 1.0, 1.0, 2.0, 4.0, 6.0, 7.0, 20.0, 14.0, 18.0, 55.0, 83.0, 134.0, 301.0, 569.0, 1464.0, 5282.0, 52702.0, 4005849.0, 118130.0, 7058.0, 1555.0, 549.0, 222.0, 110.0, 58.0, 29.0, 16.0, 11.0, 10.0, 7.0, 4.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.060546875, -1.0315780639648438, -1.0026092529296875, -0.9736404418945312, -0.944671630859375, -0.9157028198242188, -0.8867340087890625, -0.8577651977539062, -0.82879638671875, -0.7998275756835938, -0.7708587646484375, -0.7418899536132812, -0.712921142578125, -0.6839523315429688, -0.6549835205078125, -0.6260147094726562, -0.5970458984375, -0.5680770874023438, -0.5391082763671875, -0.5101394653320312, -0.481170654296875, -0.45220184326171875, -0.4232330322265625, -0.39426422119140625, -0.36529541015625, -0.33632659912109375, -0.3073577880859375, -0.27838897705078125, -0.249420166015625, -0.22045135498046875, -0.1914825439453125, -0.16251373291015625, -0.133544921875, -0.10457611083984375, -0.0756072998046875, -0.04663848876953125, -0.017669677734375, 0.01129913330078125, 0.0402679443359375, 0.06923675537109375, 0.09820556640625, 0.12717437744140625, 0.1561431884765625, 0.18511199951171875, 0.214080810546875, 0.24304962158203125, 0.2720184326171875, 0.30098724365234375, 0.3299560546875, 0.35892486572265625, 0.3878936767578125, 0.41686248779296875, 0.445831298828125, 0.47480010986328125, 0.5037689208984375, 0.5327377319335938, 0.56170654296875, 0.5906753540039062, 0.6196441650390625, 0.6486129760742188, 0.677581787109375, 0.7065505981445312, 0.7355194091796875, 0.7644882202148438, 0.79345703125]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 1.0, 7.0, 9.0, 6.0, 7.0, 21.0, 26.0, 45.0, 55.0, 68.0, 87.0, 108.0, 94.0, 110.0, 93.0, 68.0, 63.0, 52.0, 26.0, 18.0, 18.0, 5.0, 6.0, 2.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1240234375, -0.12079906463623047, -0.11757469177246094, -0.1143503189086914, -0.11112594604492188, -0.10790157318115234, -0.10467720031738281, -0.10145282745361328, -0.09822845458984375, -0.09500408172607422, -0.09177970886230469, -0.08855533599853516, -0.08533096313476562, -0.0821065902709961, -0.07888221740722656, -0.07565784454345703, -0.0724334716796875, -0.06920909881591797, -0.06598472595214844, -0.0627603530883789, -0.059535980224609375, -0.056311607360839844, -0.05308723449707031, -0.04986286163330078, -0.04663848876953125, -0.04341411590576172, -0.04018974304199219, -0.036965370178222656, -0.033740997314453125, -0.030516624450683594, -0.027292251586914062, -0.02406787872314453, -0.020843505859375, -0.01761913299560547, -0.014394760131835938, -0.011170387268066406, -0.007946014404296875, -0.004721641540527344, -0.0014972686767578125, 0.0017271041870117188, 0.00495147705078125, 0.008175849914550781, 0.011400222778320312, 0.014624595642089844, 0.017848968505859375, 0.021073341369628906, 0.024297714233398438, 0.02752208709716797, 0.0307464599609375, 0.03397083282470703, 0.03719520568847656, 0.040419578552246094, 0.043643951416015625, 0.046868324279785156, 0.05009269714355469, 0.05331707000732422, 0.05654144287109375, 0.05976581573486328, 0.06299018859863281, 0.06621456146240234, 0.06943893432617188, 0.0726633071899414, 0.07588768005371094, 0.07911205291748047, 0.08233642578125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 1.0, 5.0, 7.0, 5.0, 13.0, 22.0, 23.0, 43.0, 61.0, 130.0, 246.0, 554.0, 1441.0, 4666.0, 21573.0, 205492.0, 3623568.0, 299221.0, 27808.0, 5933.0, 1832.0, 733.0, 372.0, 213.0, 129.0, 71.0, 51.0, 21.0, 16.0, 18.0, 3.0, 10.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25537109375, -0.242950439453125, -0.23052978515625, -0.218109130859375, -0.2056884765625, -0.193267822265625, -0.18084716796875, -0.168426513671875, -0.156005859375, -0.143585205078125, -0.13116455078125, -0.118743896484375, -0.1063232421875, -0.093902587890625, -0.08148193359375, -0.069061279296875, -0.056640625, -0.044219970703125, -0.03179931640625, -0.019378662109375, -0.0069580078125, 0.005462646484375, 0.01788330078125, 0.030303955078125, 0.042724609375, 0.055145263671875, 0.06756591796875, 0.079986572265625, 0.0924072265625, 0.104827880859375, 0.11724853515625, 0.129669189453125, 0.14208984375, 0.154510498046875, 0.16693115234375, 0.179351806640625, 0.1917724609375, 0.204193115234375, 0.21661376953125, 0.229034423828125, 0.241455078125, 0.253875732421875, 0.26629638671875, 0.278717041015625, 0.2911376953125, 0.303558349609375, 0.31597900390625, 0.328399658203125, 0.3408203125, 0.353240966796875, 0.36566162109375, 0.378082275390625, 0.3905029296875, 0.402923583984375, 0.41534423828125, 0.427764892578125, 0.440185546875, 0.452606201171875, 0.46502685546875, 0.477447509765625, 0.4898681640625, 0.502288818359375, 0.51470947265625, 0.527130126953125, 0.53955078125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 4.0, 7.0, 7.0, 21.0, 23.0, 40.0, 69.0, 117.0, 340.0, 823.0, 1600.0, 533.0, 228.0, 93.0, 63.0, 27.0, 30.0, 13.0, 12.0, 12.0, 5.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0924072265625, -0.0882720947265625, -0.084136962890625, -0.0800018310546875, -0.07586669921875, -0.0717315673828125, -0.067596435546875, -0.0634613037109375, -0.059326171875, -0.0551910400390625, -0.051055908203125, -0.0469207763671875, -0.04278564453125, -0.0386505126953125, -0.034515380859375, -0.0303802490234375, -0.0262451171875, -0.0221099853515625, -0.017974853515625, -0.0138397216796875, -0.00970458984375, -0.0055694580078125, -0.001434326171875, 0.0027008056640625, 0.0068359375, 0.0109710693359375, 0.015106201171875, 0.0192413330078125, 0.02337646484375, 0.0275115966796875, 0.031646728515625, 0.0357818603515625, 0.0399169921875, 0.0440521240234375, 0.048187255859375, 0.0523223876953125, 0.05645751953125, 0.0605926513671875, 0.064727783203125, 0.0688629150390625, 0.072998046875, 0.0771331787109375, 0.081268310546875, 0.0854034423828125, 0.08953857421875, 0.0936737060546875, 0.097808837890625, 0.1019439697265625, 0.1060791015625, 0.1102142333984375, 0.114349365234375, 0.1184844970703125, 0.12261962890625, 0.1267547607421875, 0.130889892578125, 0.1350250244140625, 0.13916015625, 0.1432952880859375, 0.147430419921875, 0.1515655517578125, 0.15570068359375, 0.1598358154296875, 0.163970947265625, 0.1681060791015625, 0.1722412109375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 18.0, 64.0, 182.0, 336.0, 248.0, 123.0, 27.0, 6.0, 5.0, 0.0, 1.0, 1.0], "bins": [-1.9848458766937256, -1.949238896369934, -1.9136319160461426, -1.8780250549316406, -1.8424180746078491, -1.8068110942840576, -1.7712041139602661, -1.7355971336364746, -1.6999902725219727, -1.6643832921981812, -1.6287763118743896, -1.5931694507598877, -1.5575624704360962, -1.5219554901123047, -1.4863485097885132, -1.4507415294647217, -1.4151345491409302, -1.3795275688171387, -1.3439205884933472, -1.3083137273788452, -1.2727067470550537, -1.2370997667312622, -1.2014927864074707, -1.1658858060836792, -1.1302788257598877, -1.0946718454360962, -1.0590648651123047, -1.0234580039978027, -0.9878510236740112, -0.9522440433502197, -0.9166370630264282, -0.8810300827026367, -0.8454233407974243, -0.8098163604736328, -0.7742094397544861, -0.7386024594306946, -0.7029955387115479, -0.6673885583877563, -0.6317815780639648, -0.5961745977401733, -0.5605676770210266, -0.5249606966972351, -0.4893537759780884, -0.4537467956542969, -0.41813984513282776, -0.38253289461135864, -0.34692591428756714, -0.311318963766098, -0.2757120132446289, -0.2401050627231598, -0.20449809730052948, -0.16889113187789917, -0.13328418135643005, -0.09767723083496094, -0.06207026541233063, -0.026463299989700317, 0.009143650531768799, 0.04475060850381851, 0.08035756647586823, 0.11596452444791794, 0.15157148241996765, 0.18717843294143677, 0.22278539836406708, 0.2583923637866974, 0.2939993143081665]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 0.0, 4.0, 6.0, 3.0, 7.0, 6.0, 5.0, 14.0, 14.0, 9.0, 15.0, 13.0, 27.0, 21.0, 23.0, 32.0, 24.0, 28.0, 32.0, 43.0, 43.0, 35.0, 43.0, 52.0, 37.0, 42.0, 47.0, 31.0, 29.0, 55.0, 33.0, 35.0, 31.0, 19.0, 20.0, 22.0, 17.0, 15.0, 20.0, 11.0, 11.0, 10.0, 4.0, 6.0, 3.0, 2.0, 1.0, 6.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.30326271057128906, -0.29452818632125854, -0.28579363226890564, -0.2770591080188751, -0.2683245837688446, -0.2595900297164917, -0.2508555054664612, -0.24212098121643066, -0.23338644206523895, -0.22465190291404724, -0.21591737866401672, -0.207182839512825, -0.1984483003616333, -0.18971377611160278, -0.18097923696041107, -0.17224469780921936, -0.16351017355918884, -0.15477563440799713, -0.1460411101579666, -0.1373065710067749, -0.12857204675674438, -0.11983750760555267, -0.11110296845436096, -0.10236843675374985, -0.09363390505313873, -0.08489937335252762, -0.0761648416519165, -0.06743030250072479, -0.05869577080011368, -0.049961239099502563, -0.04122670367360115, -0.03249216824769974, -0.023757636547088623, -0.01502310298383236, -0.006288569420576096, 0.002445964142680168, 0.011180497705936432, 0.019915029406547546, 0.02864956483244896, 0.03738410025835037, 0.04611863195896149, 0.0548531636595726, 0.06358769536018372, 0.07232223451137543, 0.08105676621198654, 0.08979129791259766, 0.09852583706378937, 0.10726036876440048, 0.1159949004650116, 0.12472943216562271, 0.13346396386623383, 0.14219850301742554, 0.15093302726745605, 0.15966756641864777, 0.16840210556983948, 0.17713662981987, 0.1858711689710617, 0.19460570812225342, 0.20334023237228394, 0.21207477152347565, 0.22080931067466736, 0.22954383492469788, 0.2382783740758896, 0.2470129132270813, 0.2557474374771118]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 5.0, 6.0, 9.0, 13.0, 20.0, 23.0, 29.0, 39.0, 43.0, 70.0, 87.0, 113.0, 205.0, 262.0, 426.0, 578.0, 909.0, 1593.0, 2875.0, 5930.0, 14329.0, 39528.0, 123089.0, 342894.0, 333473.0, 117216.0, 37875.0, 13789.0, 5841.0, 2848.0, 1561.0, 939.0, 596.0, 388.0, 259.0, 188.0, 127.0, 114.0, 72.0, 43.0, 39.0, 26.0, 29.0, 17.0, 9.0, 6.0, 9.0, 4.0, 1.0, 6.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0], "bins": [-0.206787109375, -0.20032119750976562, -0.19385528564453125, -0.18738937377929688, -0.1809234619140625, -0.17445755004882812, -0.16799163818359375, -0.16152572631835938, -0.155059814453125, -0.14859390258789062, -0.14212799072265625, -0.13566207885742188, -0.1291961669921875, -0.12273025512695312, -0.11626434326171875, -0.10979843139648438, -0.10333251953125, -0.09686660766601562, -0.09040069580078125, -0.08393478393554688, -0.0774688720703125, -0.07100296020507812, -0.06453704833984375, -0.058071136474609375, -0.051605224609375, -0.045139312744140625, -0.03867340087890625, -0.032207489013671875, -0.0257415771484375, -0.019275665283203125, -0.01280975341796875, -0.006343841552734375, 0.0001220703125, 0.006587982177734375, 0.01305389404296875, 0.019519805908203125, 0.0259857177734375, 0.032451629638671875, 0.03891754150390625, 0.045383453369140625, 0.051849365234375, 0.058315277099609375, 0.06478118896484375, 0.07124710083007812, 0.0777130126953125, 0.08417892456054688, 0.09064483642578125, 0.09711074829101562, 0.10357666015625, 0.11004257202148438, 0.11650848388671875, 0.12297439575195312, 0.1294403076171875, 0.13590621948242188, 0.14237213134765625, 0.14883804321289062, 0.155303955078125, 0.16176986694335938, 0.16823577880859375, 0.17470169067382812, 0.1811676025390625, 0.18763351440429688, 0.19409942626953125, 0.20056533813476562, 0.20703125]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 6.0, 2.0, 7.0, 10.0, 18.0, 22.0, 28.0, 49.0, 55.0, 55.0, 93.0, 102.0, 113.0, 105.0, 75.0, 57.0, 61.0, 52.0, 36.0, 19.0, 11.0, 10.0, 3.0, 2.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.11529541015625, -0.11228752136230469, -0.10927963256835938, -0.10627174377441406, -0.10326385498046875, -0.10025596618652344, -0.09724807739257812, -0.09424018859863281, -0.0912322998046875, -0.08822441101074219, -0.08521652221679688, -0.08220863342285156, -0.07920074462890625, -0.07619285583496094, -0.07318496704101562, -0.07017707824707031, -0.067169189453125, -0.06416130065917969, -0.061153411865234375, -0.05814552307128906, -0.05513763427734375, -0.05212974548339844, -0.049121856689453125, -0.04611396789550781, -0.0431060791015625, -0.04009819030761719, -0.037090301513671875, -0.03408241271972656, -0.03107452392578125, -0.028066635131835938, -0.025058746337890625, -0.022050857543945312, -0.01904296875, -0.016035079956054688, -0.013027191162109375, -0.010019302368164062, -0.00701141357421875, -0.0040035247802734375, -0.000995635986328125, 0.0020122528076171875, 0.0050201416015625, 0.008028030395507812, 0.011035919189453125, 0.014043807983398438, 0.01705169677734375, 0.020059585571289062, 0.023067474365234375, 0.026075363159179688, 0.029083251953125, 0.03209114074707031, 0.035099029541015625, 0.03810691833496094, 0.04111480712890625, 0.04412269592285156, 0.047130584716796875, 0.05013847351074219, 0.0531463623046875, 0.05615425109863281, 0.059162139892578125, 0.06217002868652344, 0.06517791748046875, 0.06818580627441406, 0.07119369506835938, 0.07420158386230469, 0.07720947265625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 6.0, 6.0, 9.0, 6.0, 13.0, 24.0, 31.0, 41.0, 68.0, 92.0, 141.0, 194.0, 320.0, 562.0, 1082.0, 2410.0, 6438.0, 18827.0, 66395.0, 242935.0, 431743.0, 199201.0, 52718.0, 15341.0, 5518.0, 2127.0, 940.0, 463.0, 284.0, 200.0, 124.0, 107.0, 59.0, 38.0, 25.0, 29.0, 9.0, 10.0, 12.0, 2.0, 2.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.264404296875, -0.25672149658203125, -0.2490386962890625, -0.24135589599609375, -0.233673095703125, -0.22599029541015625, -0.2183074951171875, -0.21062469482421875, -0.20294189453125, -0.19525909423828125, -0.1875762939453125, -0.17989349365234375, -0.172210693359375, -0.16452789306640625, -0.1568450927734375, -0.14916229248046875, -0.1414794921875, -0.13379669189453125, -0.1261138916015625, -0.11843109130859375, -0.110748291015625, -0.10306549072265625, -0.0953826904296875, -0.08769989013671875, -0.08001708984375, -0.07233428955078125, -0.0646514892578125, -0.05696868896484375, -0.049285888671875, -0.04160308837890625, -0.0339202880859375, -0.02623748779296875, -0.0185546875, -0.01087188720703125, -0.0031890869140625, 0.00449371337890625, 0.012176513671875, 0.01985931396484375, 0.0275421142578125, 0.03522491455078125, 0.04290771484375, 0.05059051513671875, 0.0582733154296875, 0.06595611572265625, 0.073638916015625, 0.08132171630859375, 0.0890045166015625, 0.09668731689453125, 0.1043701171875, 0.11205291748046875, 0.1197357177734375, 0.12741851806640625, 0.135101318359375, 0.14278411865234375, 0.1504669189453125, 0.15814971923828125, 0.16583251953125, 0.17351531982421875, 0.1811981201171875, 0.18888092041015625, 0.196563720703125, 0.20424652099609375, 0.2119293212890625, 0.21961212158203125, 0.227294921875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 3.0, 0.0, 7.0, 8.0, 5.0, 15.0, 14.0, 15.0, 17.0, 26.0, 32.0, 26.0, 30.0, 40.0, 44.0, 43.0, 46.0, 56.0, 39.0, 49.0, 62.0, 56.0, 50.0, 39.0, 36.0, 38.0, 39.0, 25.0, 32.0, 23.0, 21.0, 14.0, 9.0, 18.0, 5.0, 6.0, 2.0, 3.0, 10.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.347412109375, -0.3372688293457031, -0.32712554931640625, -0.3169822692871094, -0.3068389892578125, -0.2966957092285156, -0.28655242919921875, -0.2764091491699219, -0.266265869140625, -0.2561225891113281, -0.24597930908203125, -0.23583602905273438, -0.2256927490234375, -0.21554946899414062, -0.20540618896484375, -0.19526290893554688, -0.18511962890625, -0.17497634887695312, -0.16483306884765625, -0.15468978881835938, -0.1445465087890625, -0.13440322875976562, -0.12425994873046875, -0.11411666870117188, -0.103973388671875, -0.09383010864257812, -0.08368682861328125, -0.07354354858398438, -0.0634002685546875, -0.053256988525390625, -0.04311370849609375, -0.032970428466796875, -0.0228271484375, -0.012683868408203125, -0.00254058837890625, 0.007602691650390625, 0.0177459716796875, 0.027889251708984375, 0.03803253173828125, 0.048175811767578125, 0.058319091796875, 0.06846237182617188, 0.07860565185546875, 0.08874893188476562, 0.0988922119140625, 0.10903549194335938, 0.11917877197265625, 0.12932205200195312, 0.13946533203125, 0.14960861206054688, 0.15975189208984375, 0.16989517211914062, 0.1800384521484375, 0.19018173217773438, 0.20032501220703125, 0.21046829223632812, 0.220611572265625, 0.23075485229492188, 0.24089813232421875, 0.2510414123535156, 0.2611846923828125, 0.2713279724121094, 0.28147125244140625, 0.2916145324707031, 0.3017578125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 4.0, 1.0, 3.0, 6.0, 9.0, 12.0, 18.0, 24.0, 36.0, 43.0, 84.0, 136.0, 261.0, 551.0, 1277.0, 3695.0, 14257.0, 80399.0, 512021.0, 367417.0, 53066.0, 10189.0, 2892.0, 1091.0, 474.0, 226.0, 132.0, 70.0, 54.0, 32.0, 14.0, 15.0, 13.0, 12.0, 4.0, 3.0, 5.0, 1.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1351318359375, -0.13114452362060547, -0.12715721130371094, -0.1231698989868164, -0.11918258666992188, -0.11519527435302734, -0.11120796203613281, -0.10722064971923828, -0.10323333740234375, -0.09924602508544922, -0.09525871276855469, -0.09127140045166016, -0.08728408813476562, -0.0832967758178711, -0.07930946350097656, -0.07532215118408203, -0.0713348388671875, -0.06734752655029297, -0.06336021423339844, -0.059372901916503906, -0.055385589599609375, -0.051398277282714844, -0.04741096496582031, -0.04342365264892578, -0.03943634033203125, -0.03544902801513672, -0.03146171569824219, -0.027474403381347656, -0.023487091064453125, -0.019499778747558594, -0.015512466430664062, -0.011525154113769531, -0.007537841796875, -0.0035505294799804688, 0.0004367828369140625, 0.004424095153808594, 0.008411407470703125, 0.012398719787597656, 0.016386032104492188, 0.02037334442138672, 0.02436065673828125, 0.02834796905517578, 0.03233528137207031, 0.036322593688964844, 0.040309906005859375, 0.044297218322753906, 0.04828453063964844, 0.05227184295654297, 0.0562591552734375, 0.06024646759033203, 0.06423377990722656, 0.0682210922241211, 0.07220840454101562, 0.07619571685791016, 0.08018302917480469, 0.08417034149169922, 0.08815765380859375, 0.09214496612548828, 0.09613227844238281, 0.10011959075927734, 0.10410690307617188, 0.1080942153930664, 0.11208152770996094, 0.11606884002685547, 0.12005615234375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 6.0, 4.0, 4.0, 7.0, 3.0, 9.0, 9.0, 15.0, 12.0, 20.0, 23.0, 16.0, 18.0, 25.0, 44.0, 46.0, 60.0, 73.0, 94.0, 79.0, 69.0, 59.0, 66.0, 36.0, 37.0, 36.0, 20.0, 19.0, 18.0, 10.0, 13.0, 8.0, 7.0, 14.0, 9.0, 5.0, 7.0, 0.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.587671279907227e-05, -7.366389036178589e-05, -7.145106792449951e-05, -6.923824548721313e-05, -6.702542304992676e-05, -6.481260061264038e-05, -6.2599778175354e-05, -6.038695573806763e-05, -5.817413330078125e-05, -5.596131086349487e-05, -5.3748488426208496e-05, -5.153566598892212e-05, -4.932284355163574e-05, -4.7110021114349365e-05, -4.489719867706299e-05, -4.268437623977661e-05, -4.0471553802490234e-05, -3.825873136520386e-05, -3.604590892791748e-05, -3.3833086490631104e-05, -3.1620264053344727e-05, -2.940744161605835e-05, -2.7194619178771973e-05, -2.4981796741485596e-05, -2.276897430419922e-05, -2.0556151866912842e-05, -1.8343329429626465e-05, -1.6130506992340088e-05, -1.3917684555053711e-05, -1.1704862117767334e-05, -9.492039680480957e-06, -7.27921724319458e-06, -5.066394805908203e-06, -2.853572368621826e-06, -6.407499313354492e-07, 1.5720725059509277e-06, 3.7848949432373047e-06, 5.997717380523682e-06, 8.210539817810059e-06, 1.0423362255096436e-05, 1.2636184692382812e-05, 1.484900712966919e-05, 1.7061829566955566e-05, 1.9274652004241943e-05, 2.148747444152832e-05, 2.3700296878814697e-05, 2.5913119316101074e-05, 2.812594175338745e-05, 3.0338764190673828e-05, 3.2551586627960205e-05, 3.476440906524658e-05, 3.697723150253296e-05, 3.9190053939819336e-05, 4.140287637710571e-05, 4.361569881439209e-05, 4.582852125167847e-05, 4.8041343688964844e-05, 5.025416612625122e-05, 5.24669885635376e-05, 5.4679811000823975e-05, 5.689263343811035e-05, 5.910545587539673e-05, 6.13182783126831e-05, 6.353110074996948e-05, 6.574392318725586e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 5.0, 6.0, 8.0, 11.0, 14.0, 20.0, 35.0, 54.0, 101.0, 212.0, 467.0, 1086.0, 3206.0, 11644.0, 63118.0, 448481.0, 441872.0, 61378.0, 11520.0, 3246.0, 1103.0, 479.0, 190.0, 127.0, 62.0, 40.0, 22.0, 23.0, 12.0, 5.0, 5.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.16845703125, -0.16402339935302734, -0.1595897674560547, -0.15515613555908203, -0.15072250366210938, -0.14628887176513672, -0.14185523986816406, -0.1374216079711914, -0.13298797607421875, -0.1285543441772461, -0.12412071228027344, -0.11968708038330078, -0.11525344848632812, -0.11081981658935547, -0.10638618469238281, -0.10195255279541016, -0.0975189208984375, -0.09308528900146484, -0.08865165710449219, -0.08421802520751953, -0.07978439331054688, -0.07535076141357422, -0.07091712951660156, -0.0664834976196289, -0.06204986572265625, -0.057616233825683594, -0.05318260192871094, -0.04874897003173828, -0.044315338134765625, -0.03988170623779297, -0.03544807434082031, -0.031014442443847656, -0.026580810546875, -0.022147178649902344, -0.017713546752929688, -0.013279914855957031, -0.008846282958984375, -0.004412651062011719, 2.09808349609375e-05, 0.004454612731933594, 0.00888824462890625, 0.013321876525878906, 0.017755508422851562, 0.02218914031982422, 0.026622772216796875, 0.03105640411376953, 0.03549003601074219, 0.039923667907714844, 0.0443572998046875, 0.048790931701660156, 0.05322456359863281, 0.05765819549560547, 0.062091827392578125, 0.06652545928955078, 0.07095909118652344, 0.0753927230834961, 0.07982635498046875, 0.0842599868774414, 0.08869361877441406, 0.09312725067138672, 0.09756088256835938, 0.10199451446533203, 0.10642814636230469, 0.11086177825927734, 0.11529541015625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 0.0, 4.0, 11.0, 9.0, 10.0, 10.0, 19.0, 29.0, 32.0, 38.0, 54.0, 82.0, 70.0, 101.0, 109.0, 81.0, 79.0, 66.0, 41.0, 43.0, 29.0, 18.0, 17.0, 16.0, 10.0, 5.0, 5.0, 0.0, 5.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0927734375, -0.08970928192138672, -0.08664512634277344, -0.08358097076416016, -0.08051681518554688, -0.0774526596069336, -0.07438850402832031, -0.07132434844970703, -0.06826019287109375, -0.06519603729248047, -0.06213188171386719, -0.059067726135253906, -0.056003570556640625, -0.052939414978027344, -0.04987525939941406, -0.04681110382080078, -0.0437469482421875, -0.04068279266357422, -0.03761863708496094, -0.034554481506347656, -0.031490325927734375, -0.028426170349121094, -0.025362014770507812, -0.02229785919189453, -0.01923370361328125, -0.01616954803466797, -0.013105392456054688, -0.010041236877441406, -0.006977081298828125, -0.003912925720214844, -0.0008487701416015625, 0.0022153854370117188, 0.005279541015625, 0.008343696594238281, 0.011407852172851562, 0.014472007751464844, 0.017536163330078125, 0.020600318908691406, 0.023664474487304688, 0.02672863006591797, 0.02979278564453125, 0.03285694122314453, 0.03592109680175781, 0.038985252380371094, 0.042049407958984375, 0.045113563537597656, 0.04817771911621094, 0.05124187469482422, 0.0543060302734375, 0.05737018585205078, 0.06043434143066406, 0.06349849700927734, 0.06656265258789062, 0.0696268081665039, 0.07269096374511719, 0.07575511932373047, 0.07881927490234375, 0.08188343048095703, 0.08494758605957031, 0.0880117416381836, 0.09107589721679688, 0.09414005279541016, 0.09720420837402344, 0.10026836395263672, 0.10333251953125]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 7.0, 9.0, 12.0, 23.0, 79.0, 149.0, 240.0, 236.0, 136.0, 52.0, 36.0, 11.0, 7.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.505434036254883, -3.4200596809387207, -3.3346853256225586, -3.2493109703063965, -3.1639363765716553, -3.078562021255493, -2.993187665939331, -2.907813310623169, -2.8224387168884277, -2.7370643615722656, -2.6516900062561035, -2.5663156509399414, -2.4809410572052, -2.395566701889038, -2.310192346572876, -2.224817991256714, -2.1394436359405518, -2.0540692806243896, -1.968694806098938, -1.8833204507827759, -1.7979459762573242, -1.712571620941162, -1.627197265625, -1.541822910308838, -1.4564484357833862, -1.3710740804672241, -1.2856996059417725, -1.2003252506256104, -1.1149508953094482, -1.0295764207839966, -0.9442020654678345, -0.8588276505470276, -0.7734529972076416, -0.6880785822868347, -0.6027041673660278, -0.5173298120498657, -0.43195539712905884, -0.34658098220825195, -0.26120662689208984, -0.17583221197128296, -0.09045779705047607, -0.005083397030830383, 0.08029100298881531, 0.1656653881072998, 0.2510398030281067, 0.3364142179489136, 0.4217885732650757, 0.5071629881858826, 0.5925374031066895, 0.6779118180274963, 0.7632862329483032, 0.8486605882644653, 0.9340350031852722, 1.019409418106079, 1.1047837734222412, 1.1901581287384033, 1.275532603263855, 1.360906958580017, 1.4462814331054688, 1.5316557884216309, 1.617030143737793, 1.7024046182632446, 1.7877789735794067, 1.8731534481048584, 1.9585278034210205]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 5.0, 2.0, 2.0, 6.0, 6.0, 5.0, 7.0, 12.0, 14.0, 18.0, 12.0, 20.0, 17.0, 19.0, 28.0, 28.0, 31.0, 26.0, 51.0, 37.0, 39.0, 43.0, 56.0, 38.0, 38.0, 40.0, 56.0, 49.0, 31.0, 34.0, 35.0, 28.0, 25.0, 27.0, 21.0, 19.0, 17.0, 13.0, 10.0, 5.0, 9.0, 3.0, 11.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.6746662855148315, -1.6245983839035034, -1.5745306015014648, -1.5244626998901367, -1.4743949174880981, -1.42432701587677, -1.3742592334747314, -1.3241913318634033, -1.2741234302520752, -1.224055528640747, -1.1739877462387085, -1.1239198446273804, -1.0738520622253418, -1.0237841606140137, -0.9737163186073303, -0.923648476600647, -0.8735806345939636, -0.8235127925872803, -0.7734449505805969, -0.7233771085739136, -0.6733092069625854, -0.6232413649559021, -0.5731735229492188, -0.5231056213378906, -0.47303780913352966, -0.4229699671268463, -0.3729020953178406, -0.3228342533111572, -0.2727664113044739, -0.22269853949546814, -0.1726306974887848, -0.12256282567977905, -0.0724949836730957, -0.022427130490541458, 0.027640722692012787, 0.07770857214927673, 0.12777642905712128, 0.17784428596496582, 0.22791212797164917, 0.2779799997806549, 0.32804784178733826, 0.3781156837940216, 0.42818355560302734, 0.4782513976097107, 0.528319239616394, 0.5783871412277222, 0.6284549236297607, 0.6785228252410889, 0.7285906672477722, 0.7786585092544556, 0.8287263512611389, 0.8787941932678223, 0.9288620948791504, 0.9789299368858337, 1.028997778892517, 1.0790656805038452, 1.1291334629058838, 1.179201364517212, 1.2292691469192505, 1.2793370485305786, 1.3294048309326172, 1.3794727325439453, 1.4295406341552734, 1.479608416557312, 1.5296763181686401]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 0.0, 6.0, 4.0, 10.0, 16.0, 16.0, 20.0, 19.0, 33.0, 47.0, 62.0, 137.0, 170.0, 261.0, 486.0, 959.0, 2253.0, 5825.0, 21995.0, 185691.0, 3841487.0, 109864.0, 16740.0, 4673.0, 1791.0, 802.0, 407.0, 202.0, 111.0, 85.0, 34.0, 34.0, 13.0, 7.0, 7.0, 7.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.466064453125, -0.4539299011230469, -0.44179534912109375, -0.4296607971191406, -0.4175262451171875, -0.4053916931152344, -0.39325714111328125, -0.3811225891113281, -0.368988037109375, -0.3568534851074219, -0.34471893310546875, -0.3325843811035156, -0.3204498291015625, -0.3083152770996094, -0.29618072509765625, -0.2840461730957031, -0.27191162109375, -0.2597770690917969, -0.24764251708984375, -0.23550796508789062, -0.2233734130859375, -0.21123886108398438, -0.19910430908203125, -0.18696975708007812, -0.174835205078125, -0.16270065307617188, -0.15056610107421875, -0.13843154907226562, -0.1262969970703125, -0.11416244506835938, -0.10202789306640625, -0.08989334106445312, -0.0777587890625, -0.06562423706054688, -0.05348968505859375, -0.041355133056640625, -0.0292205810546875, -0.017086029052734375, -0.00495147705078125, 0.007183074951171875, 0.019317626953125, 0.031452178955078125, 0.04358673095703125, 0.055721282958984375, 0.0678558349609375, 0.07999038696289062, 0.09212493896484375, 0.10425949096679688, 0.11639404296875, 0.12852859497070312, 0.14066314697265625, 0.15279769897460938, 0.1649322509765625, 0.17706680297851562, 0.18920135498046875, 0.20133590698242188, 0.213470458984375, 0.22560501098632812, 0.23773956298828125, 0.24987411499023438, 0.2620086669921875, 0.2741432189941406, 0.28627777099609375, 0.2984123229980469, 0.310546875]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 6.0, 6.0, 13.0, 17.0, 18.0, 42.0, 41.0, 56.0, 78.0, 86.0, 81.0, 94.0, 83.0, 82.0, 72.0, 49.0, 44.0, 31.0, 32.0, 25.0, 19.0, 9.0, 4.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1136474609375, -0.11069679260253906, -0.10774612426757812, -0.10479545593261719, -0.10184478759765625, -0.09889411926269531, -0.09594345092773438, -0.09299278259277344, -0.0900421142578125, -0.08709144592285156, -0.08414077758789062, -0.08119010925292969, -0.07823944091796875, -0.07528877258300781, -0.07233810424804688, -0.06938743591308594, -0.066436767578125, -0.06348609924316406, -0.060535430908203125, -0.05758476257324219, -0.05463409423828125, -0.05168342590332031, -0.048732757568359375, -0.04578208923339844, -0.0428314208984375, -0.03988075256347656, -0.036930084228515625, -0.03397941589355469, -0.03102874755859375, -0.028078079223632812, -0.025127410888671875, -0.022176742553710938, -0.01922607421875, -0.016275405883789062, -0.013324737548828125, -0.010374069213867188, -0.00742340087890625, -0.0044727325439453125, -0.001522064208984375, 0.0014286041259765625, 0.0043792724609375, 0.0073299407958984375, 0.010280609130859375, 0.013231277465820312, 0.01618194580078125, 0.019132614135742188, 0.022083282470703125, 0.025033950805664062, 0.027984619140625, 0.030935287475585938, 0.033885955810546875, 0.03683662414550781, 0.03978729248046875, 0.04273796081542969, 0.045688629150390625, 0.04863929748535156, 0.0515899658203125, 0.05454063415527344, 0.057491302490234375, 0.06044197082519531, 0.06339263916015625, 0.06634330749511719, 0.06929397583007812, 0.07224464416503906, 0.0751953125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 7.0, 8.0, 24.0, 31.0, 33.0, 79.0, 140.0, 295.0, 573.0, 1343.0, 3790.0, 13065.0, 73207.0, 1736699.0, 2261935.0, 81962.0, 14442.0, 3959.0, 1466.0, 622.0, 277.0, 128.0, 86.0, 51.0, 24.0, 14.0, 12.0, 5.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.369873046875, -0.36147117614746094, -0.3530693054199219, -0.3446674346923828, -0.33626556396484375, -0.3278636932373047, -0.3194618225097656, -0.31105995178222656, -0.3026580810546875, -0.29425621032714844, -0.2858543395996094, -0.2774524688720703, -0.26905059814453125, -0.2606487274169922, -0.2522468566894531, -0.24384498596191406, -0.235443115234375, -0.22704124450683594, -0.21863937377929688, -0.2102375030517578, -0.20183563232421875, -0.1934337615966797, -0.18503189086914062, -0.17663002014160156, -0.1682281494140625, -0.15982627868652344, -0.15142440795898438, -0.1430225372314453, -0.13462066650390625, -0.1262187957763672, -0.11781692504882812, -0.10941505432128906, -0.10101318359375, -0.09261131286621094, -0.08420944213867188, -0.07580757141113281, -0.06740570068359375, -0.05900382995605469, -0.050601959228515625, -0.04220008850097656, -0.0337982177734375, -0.025396347045898438, -0.016994476318359375, -0.008592605590820312, -0.00019073486328125, 0.008211135864257812, 0.016613006591796875, 0.025014877319335938, 0.033416748046875, 0.04181861877441406, 0.050220489501953125, 0.05862236022949219, 0.06702423095703125, 0.07542610168457031, 0.08382797241210938, 0.09222984313964844, 0.1006317138671875, 0.10903358459472656, 0.11743545532226562, 0.1258373260498047, 0.13423919677734375, 0.1426410675048828, 0.15104293823242188, 0.15944480895996094, 0.1678466796875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 4.0, 4.0, 5.0, 6.0, 12.0, 23.0, 18.0, 48.0, 58.0, 114.0, 252.0, 619.0, 1568.0, 675.0, 305.0, 137.0, 67.0, 55.0, 32.0, 29.0, 14.0, 4.0, 4.0, 6.0, 2.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.088623046875, -0.08598136901855469, -0.08333969116210938, -0.08069801330566406, -0.07805633544921875, -0.07541465759277344, -0.07277297973632812, -0.07013130187988281, -0.0674896240234375, -0.06484794616699219, -0.062206268310546875, -0.05956459045410156, -0.05692291259765625, -0.05428123474121094, -0.051639556884765625, -0.04899787902832031, -0.046356201171875, -0.04371452331542969, -0.041072845458984375, -0.03843116760253906, -0.03578948974609375, -0.03314781188964844, -0.030506134033203125, -0.027864456176757812, -0.0252227783203125, -0.022581100463867188, -0.019939422607421875, -0.017297744750976562, -0.01465606689453125, -0.012014389038085938, -0.009372711181640625, -0.0067310333251953125, -0.00408935546875, -0.0014476776123046875, 0.001194000244140625, 0.0038356781005859375, 0.00647735595703125, 0.009119033813476562, 0.011760711669921875, 0.014402389526367188, 0.0170440673828125, 0.019685745239257812, 0.022327423095703125, 0.024969100952148438, 0.02761077880859375, 0.030252456665039062, 0.032894134521484375, 0.03553581237792969, 0.038177490234375, 0.04081916809082031, 0.043460845947265625, 0.04610252380371094, 0.04874420166015625, 0.05138587951660156, 0.054027557373046875, 0.05666923522949219, 0.0593109130859375, 0.06195259094238281, 0.06459426879882812, 0.06723594665527344, 0.06987762451171875, 0.07251930236816406, 0.07516098022460938, 0.07780265808105469, 0.0804443359375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 7.0, 13.0, 82.0, 196.0, 333.0, 237.0, 109.0, 23.0, 8.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.5152854919433594, -1.4864425659179688, -1.4575996398925781, -1.4287567138671875, -1.3999139070510864, -1.3710709810256958, -1.3422280550003052, -1.3133851289749146, -1.284542202949524, -1.2556992769241333, -1.2268563508987427, -1.1980135440826416, -1.169170618057251, -1.1403276920318604, -1.1114847660064697, -1.082641839981079, -1.053799033164978, -1.0249561071395874, -0.9961132407188416, -0.9672703146934509, -0.9384273886680603, -0.9095845222473145, -0.8807415962219238, -0.8518986701965332, -0.8230557441711426, -0.794212818145752, -0.7653699517250061, -0.7365270256996155, -0.7076840996742249, -0.678841233253479, -0.6499983072280884, -0.6211553812026978, -0.5923125743865967, -0.563469648361206, -0.5346267819404602, -0.5057838559150696, -0.47694095969200134, -0.4480980634689331, -0.4192551374435425, -0.39041224122047424, -0.36156928539276123, -0.332726389169693, -0.30388346314430237, -0.27504056692123413, -0.2461976706981659, -0.21735475957393646, -0.18851184844970703, -0.1596689522266388, -0.13082605600357056, -0.10198315232992172, -0.07314024865627289, -0.04429733753204346, -0.015454433858394623, 0.013388469815254211, 0.04223138093948364, 0.07107427716255188, 0.09991718828678131, 0.12876009941101074, 0.15760299563407898, 0.1864459067583084, 0.21528881788253784, 0.24413171410560608, 0.2729746103286743, 0.30181753635406494, 0.3306604325771332]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 7.0, 3.0, 7.0, 9.0, 11.0, 17.0, 11.0, 19.0, 29.0, 26.0, 30.0, 33.0, 48.0, 38.0, 32.0, 43.0, 45.0, 51.0, 48.0, 45.0, 49.0, 41.0, 48.0, 38.0, 39.0, 39.0, 30.0, 26.0, 30.0, 17.0, 27.0, 9.0, 13.0, 11.0, 5.0, 5.0, 6.0, 0.0, 7.0, 3.0, 1.0, 2.0, 3.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23657631874084473, -0.22934478521347046, -0.222113236784935, -0.21488170325756073, -0.20765015482902527, -0.200418621301651, -0.19318708777427673, -0.18595553934574127, -0.1787239909172058, -0.17149245738983154, -0.16426090896129608, -0.15702937543392181, -0.14979782700538635, -0.14256629347801208, -0.13533475995063782, -0.12810321152210236, -0.12087167799472809, -0.11364013701677322, -0.10640859603881836, -0.09917706251144409, -0.09194551408290863, -0.08471398055553436, -0.0774824395775795, -0.07025089859962463, -0.06301935762166977, -0.055787816643714905, -0.04855627566576004, -0.041324738413095474, -0.03409319743514061, -0.026861656457185745, -0.01963011920452118, -0.012398578226566315, -0.00516703724861145, 0.0020645027980208397, 0.00929604284465313, 0.016527581959962845, 0.02375912293791771, 0.030990663915872574, 0.03822220116853714, 0.045453742146492004, 0.05268528312444687, 0.05991682410240173, 0.0671483650803566, 0.07437990605831146, 0.08161143958568573, 0.08884298801422119, 0.09607452154159546, 0.10330606251955032, 0.11053760349750519, 0.11776914447546005, 0.12500068545341492, 0.13223221898078918, 0.13946376740932465, 0.1466953009366989, 0.15392684936523438, 0.16115838289260864, 0.1683899164199829, 0.17562144994735718, 0.18285299837589264, 0.1900845319032669, 0.19731608033180237, 0.20454761385917664, 0.2117791473865509, 0.21901069581508636, 0.22624224424362183]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 7.0, 10.0, 8.0, 12.0, 19.0, 32.0, 45.0, 83.0, 71.0, 132.0, 196.0, 334.0, 576.0, 1023.0, 1889.0, 4092.0, 10874.0, 35040.0, 134277.0, 423411.0, 315671.0, 83350.0, 23070.0, 7712.0, 3074.0, 1408.0, 844.0, 481.0, 264.0, 176.0, 125.0, 68.0, 42.0, 49.0, 26.0, 13.0, 15.0, 10.0, 7.0, 4.0, 4.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.25634765625, -0.24898719787597656, -0.24162673950195312, -0.2342662811279297, -0.22690582275390625, -0.2195453643798828, -0.21218490600585938, -0.20482444763183594, -0.1974639892578125, -0.19010353088378906, -0.18274307250976562, -0.1753826141357422, -0.16802215576171875, -0.1606616973876953, -0.15330123901367188, -0.14594078063964844, -0.138580322265625, -0.13121986389160156, -0.12385940551757812, -0.11649894714355469, -0.10913848876953125, -0.10177803039550781, -0.09441757202148438, -0.08705711364746094, -0.0796966552734375, -0.07233619689941406, -0.06497573852539062, -0.05761528015136719, -0.05025482177734375, -0.04289436340332031, -0.035533905029296875, -0.028173446655273438, -0.02081298828125, -0.013452529907226562, -0.006092071533203125, 0.0012683868408203125, 0.00862884521484375, 0.015989303588867188, 0.023349761962890625, 0.030710220336914062, 0.0380706787109375, 0.04543113708496094, 0.052791595458984375, 0.06015205383300781, 0.06751251220703125, 0.07487297058105469, 0.08223342895507812, 0.08959388732910156, 0.096954345703125, 0.10431480407714844, 0.11167526245117188, 0.11903572082519531, 0.12639617919921875, 0.1337566375732422, 0.14111709594726562, 0.14847755432128906, 0.1558380126953125, 0.16319847106933594, 0.17055892944335938, 0.1779193878173828, 0.18527984619140625, 0.1926403045654297, 0.20000076293945312, 0.20736122131347656, 0.2147216796875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 8.0, 5.0, 15.0, 17.0, 27.0, 41.0, 47.0, 49.0, 100.0, 94.0, 86.0, 92.0, 86.0, 69.0, 68.0, 39.0, 46.0, 36.0, 25.0, 22.0, 15.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1195068359375, -0.11644935607910156, -0.11339187622070312, -0.11033439636230469, -0.10727691650390625, -0.10421943664550781, -0.10116195678710938, -0.09810447692871094, -0.0950469970703125, -0.09198951721191406, -0.08893203735351562, -0.08587455749511719, -0.08281707763671875, -0.07975959777832031, -0.07670211791992188, -0.07364463806152344, -0.070587158203125, -0.06752967834472656, -0.06447219848632812, -0.06141471862792969, -0.05835723876953125, -0.05529975891113281, -0.052242279052734375, -0.04918479919433594, -0.0461273193359375, -0.04306983947753906, -0.040012359619140625, -0.03695487976074219, -0.03389739990234375, -0.030839920043945312, -0.027782440185546875, -0.024724960327148438, -0.02166748046875, -0.018610000610351562, -0.015552520751953125, -0.012495040893554688, -0.00943756103515625, -0.0063800811767578125, -0.003322601318359375, -0.0002651214599609375, 0.0027923583984375, 0.0058498382568359375, 0.008907318115234375, 0.011964797973632812, 0.01502227783203125, 0.018079757690429688, 0.021137237548828125, 0.024194717407226562, 0.027252197265625, 0.030309677124023438, 0.033367156982421875, 0.03642463684082031, 0.03948211669921875, 0.04253959655761719, 0.045597076416015625, 0.04865455627441406, 0.0517120361328125, 0.05476951599121094, 0.057826995849609375, 0.06088447570800781, 0.06394195556640625, 0.06699943542480469, 0.07005691528320312, 0.07311439514160156, 0.076171875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 4.0, 4.0, 5.0, 12.0, 12.0, 24.0, 25.0, 37.0, 68.0, 97.0, 160.0, 238.0, 467.0, 974.0, 2543.0, 8963.0, 43455.0, 266133.0, 545444.0, 146201.0, 24511.0, 5761.0, 1824.0, 761.0, 372.0, 197.0, 100.0, 60.0, 42.0, 27.0, 12.0, 10.0, 4.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.261474609375, -0.2525596618652344, -0.24364471435546875, -0.23472976684570312, -0.2258148193359375, -0.21689987182617188, -0.20798492431640625, -0.19906997680664062, -0.190155029296875, -0.18124008178710938, -0.17232513427734375, -0.16341018676757812, -0.1544952392578125, -0.14558029174804688, -0.13666534423828125, -0.12775039672851562, -0.11883544921875, -0.10992050170898438, -0.10100555419921875, -0.09209060668945312, -0.0831756591796875, -0.07426071166992188, -0.06534576416015625, -0.056430816650390625, -0.047515869140625, -0.038600921630859375, -0.02968597412109375, -0.020771026611328125, -0.0118560791015625, -0.002941131591796875, 0.00597381591796875, 0.014888763427734375, 0.0238037109375, 0.032718658447265625, 0.04163360595703125, 0.050548553466796875, 0.0594635009765625, 0.06837844848632812, 0.07729339599609375, 0.08620834350585938, 0.095123291015625, 0.10403823852539062, 0.11295318603515625, 0.12186813354492188, 0.1307830810546875, 0.13969802856445312, 0.14861297607421875, 0.15752792358398438, 0.16644287109375, 0.17535781860351562, 0.18427276611328125, 0.19318771362304688, 0.2021026611328125, 0.21101760864257812, 0.21993255615234375, 0.22884750366210938, 0.237762451171875, 0.24667739868164062, 0.25559234619140625, 0.2645072937011719, 0.2734222412109375, 0.2823371887207031, 0.29125213623046875, 0.3001670837402344, 0.30908203125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 5.0, 4.0, 7.0, 6.0, 6.0, 3.0, 7.0, 9.0, 6.0, 15.0, 14.0, 19.0, 21.0, 22.0, 26.0, 27.0, 23.0, 35.0, 38.0, 36.0, 47.0, 48.0, 53.0, 47.0, 56.0, 54.0, 38.0, 49.0, 36.0, 28.0, 44.0, 32.0, 32.0, 16.0, 18.0, 15.0, 20.0, 10.0, 11.0, 6.0, 8.0, 3.0, 2.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.273193359375, -0.2650909423828125, -0.256988525390625, -0.2488861083984375, -0.24078369140625, -0.2326812744140625, -0.224578857421875, -0.2164764404296875, -0.2083740234375, -0.2002716064453125, -0.192169189453125, -0.1840667724609375, -0.17596435546875, -0.1678619384765625, -0.159759521484375, -0.1516571044921875, -0.1435546875, -0.1354522705078125, -0.127349853515625, -0.1192474365234375, -0.11114501953125, -0.1030426025390625, -0.094940185546875, -0.0868377685546875, -0.0787353515625, -0.0706329345703125, -0.062530517578125, -0.0544281005859375, -0.04632568359375, -0.0382232666015625, -0.030120849609375, -0.0220184326171875, -0.013916015625, -0.0058135986328125, 0.002288818359375, 0.0103912353515625, 0.01849365234375, 0.0265960693359375, 0.034698486328125, 0.0428009033203125, 0.0509033203125, 0.0590057373046875, 0.067108154296875, 0.0752105712890625, 0.08331298828125, 0.0914154052734375, 0.099517822265625, 0.1076202392578125, 0.11572265625, 0.1238250732421875, 0.131927490234375, 0.1400299072265625, 0.14813232421875, 0.1562347412109375, 0.164337158203125, 0.1724395751953125, 0.1805419921875, 0.1886444091796875, 0.196746826171875, 0.2048492431640625, 0.21295166015625, 0.2210540771484375, 0.229156494140625, 0.2372589111328125, 0.245361328125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 10.0, 6.0, 8.0, 16.0, 46.0, 97.0, 268.0, 1165.0, 10481.0, 249260.0, 750335.0, 33620.0, 2535.0, 477.0, 125.0, 55.0, 21.0, 11.0, 6.0, 2.0, 6.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.156982421875, -0.15099143981933594, -0.14500045776367188, -0.1390094757080078, -0.13301849365234375, -0.1270275115966797, -0.12103652954101562, -0.11504554748535156, -0.1090545654296875, -0.10306358337402344, -0.09707260131835938, -0.09108161926269531, -0.08509063720703125, -0.07909965515136719, -0.07310867309570312, -0.06711769104003906, -0.061126708984375, -0.05513572692871094, -0.049144744873046875, -0.04315376281738281, -0.03716278076171875, -0.031171798706054688, -0.025180816650390625, -0.019189834594726562, -0.0131988525390625, -0.0072078704833984375, -0.001216888427734375, 0.0047740936279296875, 0.01076507568359375, 0.016756057739257812, 0.022747039794921875, 0.028738021850585938, 0.03472900390625, 0.04071998596191406, 0.046710968017578125, 0.05270195007324219, 0.05869293212890625, 0.06468391418457031, 0.07067489624023438, 0.07666587829589844, 0.0826568603515625, 0.08864784240722656, 0.09463882446289062, 0.10062980651855469, 0.10662078857421875, 0.11261177062988281, 0.11860275268554688, 0.12459373474121094, 0.130584716796875, 0.13657569885253906, 0.14256668090820312, 0.1485576629638672, 0.15454864501953125, 0.1605396270751953, 0.16653060913085938, 0.17252159118652344, 0.1785125732421875, 0.18450355529785156, 0.19049453735351562, 0.1964855194091797, 0.20247650146484375, 0.2084674835205078, 0.21445846557617188, 0.22044944763183594, 0.2264404296875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 4.0, 7.0, 9.0, 8.0, 16.0, 21.0, 17.0, 22.0, 33.0, 42.0, 64.0, 76.0, 107.0, 135.0, 128.0, 83.0, 43.0, 45.0, 34.0, 19.0, 22.0, 14.0, 11.0, 15.0, 8.0, 2.0, 4.0, 1.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.033348083496094e-05, -6.787572056055069e-05, -6.541796028614044e-05, -6.29602000117302e-05, -6.0502439737319946e-05, -5.80446794629097e-05, -5.558691918849945e-05, -5.31291589140892e-05, -5.0671398639678955e-05, -4.821363836526871e-05, -4.575587809085846e-05, -4.329811781644821e-05, -4.0840357542037964e-05, -3.8382597267627716e-05, -3.592483699321747e-05, -3.346707671880722e-05, -3.100931644439697e-05, -2.8551556169986725e-05, -2.6093795895576477e-05, -2.363603562116623e-05, -2.117827534675598e-05, -1.8720515072345734e-05, -1.6262754797935486e-05, -1.3804994523525238e-05, -1.134723424911499e-05, -8.889473974704742e-06, -6.431713700294495e-06, -3.973953425884247e-06, -1.516193151473999e-06, 9.415671229362488e-07, 3.3993273973464966e-06, 5.857087671756744e-06, 8.314847946166992e-06, 1.077260822057724e-05, 1.3230368494987488e-05, 1.5688128769397736e-05, 1.8145889043807983e-05, 2.060364931821823e-05, 2.306140959262848e-05, 2.5519169867038727e-05, 2.7976930141448975e-05, 3.0434690415859222e-05, 3.289245069026947e-05, 3.535021096467972e-05, 3.7807971239089966e-05, 4.0265731513500214e-05, 4.272349178791046e-05, 4.518125206232071e-05, 4.763901233673096e-05, 5.0096772611141205e-05, 5.255453288555145e-05, 5.50122931599617e-05, 5.747005343437195e-05, 5.9927813708782196e-05, 6.238557398319244e-05, 6.484333425760269e-05, 6.730109453201294e-05, 6.975885480642319e-05, 7.221661508083344e-05, 7.467437535524368e-05, 7.713213562965393e-05, 7.958989590406418e-05, 8.204765617847443e-05, 8.450541645288467e-05, 8.696317672729492e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 4.0, 3.0, 7.0, 8.0, 18.0, 26.0, 27.0, 37.0, 67.0, 103.0, 183.0, 326.0, 639.0, 1376.0, 3797.0, 14460.0, 77141.0, 528948.0, 357151.0, 49018.0, 9992.0, 2891.0, 1105.0, 512.0, 260.0, 196.0, 98.0, 56.0, 32.0, 27.0, 17.0, 8.0, 8.0, 3.0, 4.0, 3.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10211181640625, -0.0984487533569336, -0.09478569030761719, -0.09112262725830078, -0.08745956420898438, -0.08379650115966797, -0.08013343811035156, -0.07647037506103516, -0.07280731201171875, -0.06914424896240234, -0.06548118591308594, -0.06181812286376953, -0.058155059814453125, -0.05449199676513672, -0.05082893371582031, -0.047165870666503906, -0.0435028076171875, -0.039839744567871094, -0.03617668151855469, -0.03251361846923828, -0.028850555419921875, -0.02518749237060547, -0.021524429321289062, -0.017861366271972656, -0.01419830322265625, -0.010535240173339844, -0.0068721771240234375, -0.0032091140747070312, 0.000453948974609375, 0.004117012023925781, 0.0077800750732421875, 0.011443138122558594, 0.015106201171875, 0.018769264221191406, 0.022432327270507812, 0.02609539031982422, 0.029758453369140625, 0.03342151641845703, 0.03708457946777344, 0.040747642517089844, 0.04441070556640625, 0.048073768615722656, 0.05173683166503906, 0.05539989471435547, 0.059062957763671875, 0.06272602081298828, 0.06638908386230469, 0.0700521469116211, 0.0737152099609375, 0.0773782730102539, 0.08104133605957031, 0.08470439910888672, 0.08836746215820312, 0.09203052520751953, 0.09569358825683594, 0.09935665130615234, 0.10301971435546875, 0.10668277740478516, 0.11034584045410156, 0.11400890350341797, 0.11767196655273438, 0.12133502960205078, 0.12499809265136719, 0.1286611557006836, 0.13232421875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 8.0, 5.0, 20.0, 23.0, 34.0, 68.0, 96.0, 174.0, 154.0, 171.0, 107.0, 68.0, 27.0, 22.0, 15.0, 10.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1771240234375, -0.1718120574951172, -0.16650009155273438, -0.16118812561035156, -0.15587615966796875, -0.15056419372558594, -0.14525222778320312, -0.1399402618408203, -0.1346282958984375, -0.1293163299560547, -0.12400436401367188, -0.11869239807128906, -0.11338043212890625, -0.10806846618652344, -0.10275650024414062, -0.09744453430175781, -0.092132568359375, -0.08682060241699219, -0.08150863647460938, -0.07619667053222656, -0.07088470458984375, -0.06557273864746094, -0.060260772705078125, -0.05494880676269531, -0.0496368408203125, -0.04432487487792969, -0.039012908935546875, -0.03370094299316406, -0.02838897705078125, -0.023077011108398438, -0.017765045166015625, -0.012453079223632812, -0.00714111328125, -0.0018291473388671875, 0.003482818603515625, 0.008794784545898438, 0.01410675048828125, 0.019418716430664062, 0.024730682373046875, 0.030042648315429688, 0.0353546142578125, 0.04066658020019531, 0.045978546142578125, 0.05129051208496094, 0.05660247802734375, 0.06191444396972656, 0.06722640991210938, 0.07253837585449219, 0.077850341796875, 0.08316230773925781, 0.08847427368164062, 0.09378623962402344, 0.09909820556640625, 0.10441017150878906, 0.10972213745117188, 0.11503410339355469, 0.1203460693359375, 0.1256580352783203, 0.13097000122070312, 0.13628196716308594, 0.14159393310546875, 0.14690589904785156, 0.15221786499023438, 0.1575298309326172, 0.162841796875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 22.0, 59.0, 147.0, 297.0, 281.0, 124.0, 45.0, 18.0, 8.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1073718070983887, -1.0068485736846924, -0.9063252210617065, -0.8058019876480103, -0.7052786946296692, -0.6047554016113281, -0.5042321681976318, -0.40370887517929077, -0.3031855821609497, -0.20266230404376984, -0.10213902592658997, -0.001615762710571289, 0.09890753030776978, 0.19943082332611084, 0.29995405673980713, 0.4004773497581482, 0.5010006427764893, 0.6015239357948303, 0.7020472288131714, 0.8025704622268677, 0.9030937552452087, 1.0036170482635498, 1.104140281677246, 1.2046635150909424, 1.3051868677139282, 1.4057101011276245, 1.5062334537506104, 1.6067566871643066, 1.707279920578003, 1.8078032732009888, 1.908326506614685, 2.008849859237671, 2.109373092651367, 2.2098963260650635, 2.3104195594787598, 2.410943031311035, 2.5114662647247314, 2.6119894981384277, 2.712512731552124, 2.8130359649658203, 2.9135594367980957, 3.014082670211792, 3.1146059036254883, 3.2151293754577637, 3.31565260887146, 3.4161758422851562, 3.5166990756988525, 3.617222309112549, 3.717745542526245, 3.8182687759399414, 3.9187920093536377, 4.019315242767334, 4.119838714599609, 4.220361709594727, 4.320885181427002, 4.421408653259277, 4.5219316482543945, 4.62245512008667, 4.722978115081787, 4.8235015869140625, 4.92402458190918, 5.024548053741455, 5.1250715255737305, 5.225594520568848, 5.326117992401123]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 3.0, 5.0, 10.0, 8.0, 14.0, 18.0, 14.0, 23.0, 26.0, 28.0, 34.0, 45.0, 52.0, 61.0, 64.0, 47.0, 53.0, 63.0, 49.0, 61.0, 52.0, 46.0, 37.0, 36.0, 27.0, 28.0, 18.0, 16.0, 19.0, 14.0, 3.0, 6.0, 5.0, 1.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.7119643688201904, -1.65807044506073, -1.604176640510559, -1.5502827167510986, -1.4963887929916382, -1.4424949884414673, -1.3886010646820068, -1.334707260131836, -1.2808133363723755, -1.226919412612915, -1.1730256080627441, -1.1191316843032837, -1.0652377605438232, -1.0113439559936523, -0.9574500322341919, -0.9035561680793762, -0.8496622443199158, -0.7957683801651001, -0.7418744564056396, -0.687980592250824, -0.6340867280960083, -0.5801928043365479, -0.5262989401817322, -0.4724050760269165, -0.41851118206977844, -0.3646172881126404, -0.3107234239578247, -0.25682953000068665, -0.20293565094470978, -0.1490417718887329, -0.09514787793159485, -0.041254013776779175, 0.012639880180358887, 0.06653375923633575, 0.12042764574289322, 0.17432153224945068, 0.22821541130542755, 0.2821092903614044, 0.3360031843185425, 0.38989704847335815, 0.4437909424304962, 0.4976848363876343, 0.55157870054245, 0.6054725646972656, 0.6593664884567261, 0.7132603526115417, 0.7671542167663574, 0.8210481405258179, 0.8749420046806335, 0.9288358688354492, 0.9827297925949097, 1.0366237163543701, 1.090517520904541, 1.1444114446640015, 1.198305368423462, 1.2521991729736328, 1.3060930967330933, 1.3599870204925537, 1.4138808250427246, 1.467774748802185, 1.5216686725616455, 1.5755624771118164, 1.6294564008712769, 1.6833503246307373, 1.7372441291809082]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 2.0, 3.0, 2.0, 1.0, 4.0, 6.0, 5.0, 7.0, 6.0, 13.0, 18.0, 24.0, 31.0, 49.0, 71.0, 92.0, 151.0, 302.0, 516.0, 1004.0, 2202.0, 6194.0, 25647.0, 273121.0, 3742627.0, 118084.0, 16520.0, 4465.0, 1591.0, 701.0, 345.0, 197.0, 99.0, 68.0, 40.0, 31.0, 23.0, 8.0, 5.0, 7.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.427978515625, -0.4165229797363281, -0.40506744384765625, -0.3936119079589844, -0.3821563720703125, -0.3707008361816406, -0.35924530029296875, -0.3477897644042969, -0.336334228515625, -0.3248786926269531, -0.31342315673828125, -0.3019676208496094, -0.2905120849609375, -0.2790565490722656, -0.26760101318359375, -0.2561454772949219, -0.24468994140625, -0.23323440551757812, -0.22177886962890625, -0.21032333374023438, -0.1988677978515625, -0.18741226196289062, -0.17595672607421875, -0.16450119018554688, -0.153045654296875, -0.14159011840820312, -0.13013458251953125, -0.11867904663085938, -0.1072235107421875, -0.09576797485351562, -0.08431243896484375, -0.07285690307617188, -0.0614013671875, -0.049945831298828125, -0.03849029541015625, -0.027034759521484375, -0.0155792236328125, -0.004123687744140625, 0.00733184814453125, 0.018787384033203125, 0.030242919921875, 0.041698455810546875, 0.05315399169921875, 0.06460952758789062, 0.0760650634765625, 0.08752059936523438, 0.09897613525390625, 0.11043167114257812, 0.12188720703125, 0.13334274291992188, 0.14479827880859375, 0.15625381469726562, 0.1677093505859375, 0.17916488647460938, 0.19062042236328125, 0.20207595825195312, 0.213531494140625, 0.22498703002929688, 0.23644256591796875, 0.24789810180664062, 0.2593536376953125, 0.2708091735839844, 0.28226470947265625, 0.2937202453613281, 0.30517578125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 9.0, 17.0, 17.0, 24.0, 40.0, 43.0, 46.0, 62.0, 96.0, 93.0, 76.0, 73.0, 78.0, 70.0, 52.0, 50.0, 34.0, 31.0, 20.0, 26.0, 19.0, 8.0, 3.0, 4.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.10858154296875, -0.10570144653320312, -0.10282135009765625, -0.09994125366210938, -0.0970611572265625, -0.09418106079101562, -0.09130096435546875, -0.08842086791992188, -0.085540771484375, -0.08266067504882812, -0.07978057861328125, -0.07690048217773438, -0.0740203857421875, -0.07114028930664062, -0.06826019287109375, -0.06538009643554688, -0.0625, -0.059619903564453125, -0.05673980712890625, -0.053859710693359375, -0.0509796142578125, -0.048099517822265625, -0.04521942138671875, -0.042339324951171875, -0.039459228515625, -0.036579132080078125, -0.03369903564453125, -0.030818939208984375, -0.0279388427734375, -0.025058746337890625, -0.02217864990234375, -0.019298553466796875, -0.01641845703125, -0.013538360595703125, -0.01065826416015625, -0.007778167724609375, -0.0048980712890625, -0.002017974853515625, 0.00086212158203125, 0.003742218017578125, 0.006622314453125, 0.009502410888671875, 0.01238250732421875, 0.015262603759765625, 0.0181427001953125, 0.021022796630859375, 0.02390289306640625, 0.026782989501953125, 0.0296630859375, 0.032543182373046875, 0.03542327880859375, 0.038303375244140625, 0.0411834716796875, 0.044063568115234375, 0.04694366455078125, 0.049823760986328125, 0.052703857421875, 0.055583953857421875, 0.05846405029296875, 0.061344146728515625, 0.0642242431640625, 0.06710433959960938, 0.06998443603515625, 0.07286453247070312, 0.07574462890625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 1.0, 1.0, 6.0, 7.0, 9.0, 15.0, 24.0, 40.0, 51.0, 107.0, 188.0, 357.0, 821.0, 1975.0, 7270.0, 42733.0, 875462.0, 3153177.0, 94617.0, 12295.0, 2940.0, 1035.0, 481.0, 263.0, 150.0, 94.0, 52.0, 44.0, 27.0, 11.0, 15.0, 7.0, 4.0, 7.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.235107421875, -0.22576522827148438, -0.21642303466796875, -0.20708084106445312, -0.1977386474609375, -0.18839645385742188, -0.17905426025390625, -0.16971206665039062, -0.160369873046875, -0.15102767944335938, -0.14168548583984375, -0.13234329223632812, -0.1230010986328125, -0.11365890502929688, -0.10431671142578125, -0.09497451782226562, -0.08563232421875, -0.07629013061523438, -0.06694793701171875, -0.057605743408203125, -0.0482635498046875, -0.038921356201171875, -0.02957916259765625, -0.020236968994140625, -0.010894775390625, -0.001552581787109375, 0.00778961181640625, 0.017131805419921875, 0.0264739990234375, 0.035816192626953125, 0.04515838623046875, 0.054500579833984375, 0.0638427734375, 0.07318496704101562, 0.08252716064453125, 0.09186935424804688, 0.1012115478515625, 0.11055374145507812, 0.11989593505859375, 0.12923812866210938, 0.138580322265625, 0.14792251586914062, 0.15726470947265625, 0.16660690307617188, 0.1759490966796875, 0.18529129028320312, 0.19463348388671875, 0.20397567749023438, 0.21331787109375, 0.22266006469726562, 0.23200225830078125, 0.24134445190429688, 0.2506866455078125, 0.2600288391113281, 0.26937103271484375, 0.2787132263183594, 0.288055419921875, 0.2973976135253906, 0.30673980712890625, 0.3160820007324219, 0.3254241943359375, 0.3347663879394531, 0.34410858154296875, 0.3534507751464844, 0.36279296875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 8.0, 4.0, 5.0, 16.0, 25.0, 27.0, 63.0, 118.0, 272.0, 766.0, 1636.0, 651.0, 234.0, 95.0, 62.0, 28.0, 28.0, 13.0, 12.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11785888671875, -0.11303424835205078, -0.10820960998535156, -0.10338497161865234, -0.09856033325195312, -0.0937356948852539, -0.08891105651855469, -0.08408641815185547, -0.07926177978515625, -0.07443714141845703, -0.06961250305175781, -0.0647878646850586, -0.059963226318359375, -0.055138587951660156, -0.05031394958496094, -0.04548931121826172, -0.0406646728515625, -0.03584003448486328, -0.031015396118164062, -0.026190757751464844, -0.021366119384765625, -0.016541481018066406, -0.011716842651367188, -0.006892204284667969, -0.00206756591796875, 0.0027570724487304688, 0.0075817108154296875, 0.012406349182128906, 0.017230987548828125, 0.022055625915527344, 0.026880264282226562, 0.03170490264892578, 0.036529541015625, 0.04135417938232422, 0.04617881774902344, 0.051003456115722656, 0.055828094482421875, 0.060652732849121094, 0.06547737121582031, 0.07030200958251953, 0.07512664794921875, 0.07995128631591797, 0.08477592468261719, 0.0896005630493164, 0.09442520141601562, 0.09924983978271484, 0.10407447814941406, 0.10889911651611328, 0.1137237548828125, 0.11854839324951172, 0.12337303161621094, 0.12819766998291016, 0.13302230834960938, 0.1378469467163086, 0.1426715850830078, 0.14749622344970703, 0.15232086181640625, 0.15714550018310547, 0.1619701385498047, 0.1667947769165039, 0.17161941528320312, 0.17644405364990234, 0.18126869201660156, 0.18609333038330078, 0.19091796875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 21.0, 55.0, 173.0, 318.0, 255.0, 124.0, 39.0, 12.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7482775449752808, -1.7084803581237793, -1.6686832904815674, -1.628886103630066, -1.5890889167785645, -1.549291729927063, -1.5094945430755615, -1.4696974754333496, -1.4299002885818481, -1.3901031017303467, -1.3503060340881348, -1.3105088472366333, -1.2707116603851318, -1.2309144735336304, -1.191117286682129, -1.151320219039917, -1.1115230321884155, -1.071725845336914, -1.0319287776947021, -0.9921315908432007, -0.9523344039916992, -0.9125372171401978, -0.8727400898933411, -0.8329429626464844, -0.7931457757949829, -0.7533485889434814, -0.7135514616966248, -0.6737543344497681, -0.6339571475982666, -0.5941599607467651, -0.5543628334999084, -0.5145657062530518, -0.47476840019226074, -0.43497124314308167, -0.3951740860939026, -0.3553769290447235, -0.31557977199554443, -0.27578261494636536, -0.23598545789718628, -0.1961883008480072, -0.15639114379882812, -0.11659398674964905, -0.07679682970046997, -0.036999672651290894, 0.0027974843978881836, 0.04259464144706726, 0.08239179849624634, 0.12218895554542542, 0.1619861125946045, 0.20178326964378357, 0.24158042669296265, 0.2813775837421417, 0.3211747407913208, 0.3609718978404999, 0.40076905488967896, 0.44056621193885803, 0.4803633689880371, 0.5201605558395386, 0.5599576830863953, 0.599754810333252, 0.6395519971847534, 0.6793491840362549, 0.7191463112831116, 0.7589434385299683, 0.7987406253814697]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 4.0, 4.0, 6.0, 7.0, 7.0, 12.0, 11.0, 19.0, 18.0, 20.0, 25.0, 19.0, 41.0, 39.0, 47.0, 47.0, 40.0, 52.0, 49.0, 46.0, 53.0, 50.0, 48.0, 44.0, 44.0, 37.0, 35.0, 36.0, 33.0, 23.0, 21.0, 18.0, 15.0, 7.0, 7.0, 3.0, 6.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.41998982429504395, -0.4070392847061157, -0.3940887153148651, -0.3811381757259369, -0.3681876063346863, -0.35523706674575806, -0.34228652715682983, -0.3293359577655792, -0.3163853883743286, -0.3034348487854004, -0.2904842793941498, -0.27753373980522156, -0.26458317041397095, -0.2516326308250427, -0.2386820763349533, -0.2257315218448639, -0.21278098225593567, -0.19983042776584625, -0.18687987327575684, -0.1739293336868286, -0.160978764295578, -0.14802822470664978, -0.13507767021656036, -0.12212711572647095, -0.10917656123638153, -0.09622600674629211, -0.0832754522562027, -0.07032490521669388, -0.05737435072660446, -0.044423796236515045, -0.031473249197006226, -0.01852269470691681, -0.005572140216827393, 0.007378412410616875, 0.020328965038061142, 0.03327951580286026, 0.046230070292949677, 0.05918062478303909, 0.07213117182254791, 0.08508172631263733, 0.09803228080272675, 0.11098283529281616, 0.12393338978290558, 0.136883944272995, 0.14983448386192322, 0.16278505325317383, 0.17573559284210205, 0.18868614733219147, 0.20163670182228088, 0.2145872563123703, 0.22753781080245972, 0.24048835039138794, 0.25343891978263855, 0.2663894593715668, 0.2793400287628174, 0.2922905683517456, 0.30524110794067383, 0.31819164752960205, 0.33114221692085266, 0.3440927565097809, 0.3570433259010315, 0.3699938654899597, 0.38294440507888794, 0.39589497447013855, 0.40884554386138916]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 1.0, 3.0, 6.0, 10.0, 11.0, 22.0, 34.0, 83.0, 98.0, 188.0, 353.0, 651.0, 1222.0, 2873.0, 9090.0, 41408.0, 258474.0, 579825.0, 122730.0, 21990.0, 5512.0, 2004.0, 884.0, 462.0, 251.0, 145.0, 90.0, 47.0, 33.0, 15.0, 17.0, 4.0, 8.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.377685546875, -0.3663444519042969, -0.35500335693359375, -0.3436622619628906, -0.3323211669921875, -0.3209800720214844, -0.30963897705078125, -0.2982978820800781, -0.286956787109375, -0.2756156921386719, -0.26427459716796875, -0.2529335021972656, -0.2415924072265625, -0.23025131225585938, -0.21891021728515625, -0.20756912231445312, -0.19622802734375, -0.18488693237304688, -0.17354583740234375, -0.16220474243164062, -0.1508636474609375, -0.13952255249023438, -0.12818145751953125, -0.11684036254882812, -0.105499267578125, -0.09415817260742188, -0.08281707763671875, -0.07147598266601562, -0.0601348876953125, -0.048793792724609375, -0.03745269775390625, -0.026111602783203125, -0.0147705078125, -0.003429412841796875, 0.00791168212890625, 0.019252777099609375, 0.0305938720703125, 0.041934967041015625, 0.05327606201171875, 0.06461715698242188, 0.075958251953125, 0.08729934692382812, 0.09864044189453125, 0.10998153686523438, 0.1213226318359375, 0.13266372680664062, 0.14400482177734375, 0.15534591674804688, 0.16668701171875, 0.17802810668945312, 0.18936920166015625, 0.20071029663085938, 0.2120513916015625, 0.22339248657226562, 0.23473358154296875, 0.24607467651367188, 0.257415771484375, 0.2687568664550781, 0.28009796142578125, 0.2914390563964844, 0.3027801513671875, 0.3141212463378906, 0.32546234130859375, 0.3368034362792969, 0.34814453125]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 6.0, 5.0, 9.0, 17.0, 23.0, 33.0, 43.0, 49.0, 66.0, 83.0, 93.0, 89.0, 81.0, 78.0, 68.0, 55.0, 44.0, 51.0, 29.0, 26.0, 20.0, 15.0, 6.0, 3.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.11236572265625, -0.10947513580322266, -0.10658454895019531, -0.10369396209716797, -0.10080337524414062, -0.09791278839111328, -0.09502220153808594, -0.0921316146850586, -0.08924102783203125, -0.0863504409790039, -0.08345985412597656, -0.08056926727294922, -0.07767868041992188, -0.07478809356689453, -0.07189750671386719, -0.06900691986083984, -0.0661163330078125, -0.06322574615478516, -0.06033515930175781, -0.05744457244873047, -0.054553985595703125, -0.05166339874267578, -0.04877281188964844, -0.045882225036621094, -0.04299163818359375, -0.040101051330566406, -0.03721046447753906, -0.03431987762451172, -0.031429290771484375, -0.02853870391845703, -0.025648117065429688, -0.022757530212402344, -0.019866943359375, -0.016976356506347656, -0.014085769653320312, -0.011195182800292969, -0.008304595947265625, -0.005414009094238281, -0.0025234222412109375, 0.00036716461181640625, 0.00325775146484375, 0.006148338317871094, 0.009038925170898438, 0.011929512023925781, 0.014820098876953125, 0.01771068572998047, 0.020601272583007812, 0.023491859436035156, 0.0263824462890625, 0.029273033142089844, 0.03216361999511719, 0.03505420684814453, 0.037944793701171875, 0.04083538055419922, 0.04372596740722656, 0.046616554260253906, 0.04950714111328125, 0.052397727966308594, 0.05528831481933594, 0.05817890167236328, 0.061069488525390625, 0.06396007537841797, 0.06685066223144531, 0.06974124908447266, 0.0726318359375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 6.0, 6.0, 10.0, 22.0, 36.0, 49.0, 83.0, 129.0, 235.0, 478.0, 1060.0, 2778.0, 8247.0, 30071.0, 132551.0, 447009.0, 321778.0, 77098.0, 18452.0, 5132.0, 1805.0, 725.0, 344.0, 175.0, 104.0, 65.0, 40.0, 25.0, 13.0, 11.0, 7.0, 5.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.258544921875, -0.2509002685546875, -0.243255615234375, -0.2356109619140625, -0.22796630859375, -0.2203216552734375, -0.212677001953125, -0.2050323486328125, -0.1973876953125, -0.1897430419921875, -0.182098388671875, -0.1744537353515625, -0.16680908203125, -0.1591644287109375, -0.151519775390625, -0.1438751220703125, -0.13623046875, -0.1285858154296875, -0.120941162109375, -0.1132965087890625, -0.10565185546875, -0.0980072021484375, -0.090362548828125, -0.0827178955078125, -0.0750732421875, -0.0674285888671875, -0.059783935546875, -0.0521392822265625, -0.04449462890625, -0.0368499755859375, -0.029205322265625, -0.0215606689453125, -0.013916015625, -0.0062713623046875, 0.001373291015625, 0.0090179443359375, 0.01666259765625, 0.0243072509765625, 0.031951904296875, 0.0395965576171875, 0.0472412109375, 0.0548858642578125, 0.062530517578125, 0.0701751708984375, 0.07781982421875, 0.0854644775390625, 0.093109130859375, 0.1007537841796875, 0.1083984375, 0.1160430908203125, 0.123687744140625, 0.1313323974609375, 0.13897705078125, 0.1466217041015625, 0.154266357421875, 0.1619110107421875, 0.1695556640625, 0.1772003173828125, 0.184844970703125, 0.1924896240234375, 0.20013427734375, 0.2077789306640625, 0.215423583984375, 0.2230682373046875, 0.230712890625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 5.0, 4.0, 7.0, 9.0, 9.0, 12.0, 15.0, 17.0, 13.0, 26.0, 32.0, 32.0, 34.0, 53.0, 48.0, 56.0, 48.0, 57.0, 57.0, 44.0, 55.0, 55.0, 52.0, 40.0, 54.0, 33.0, 18.0, 25.0, 26.0, 15.0, 13.0, 9.0, 11.0, 5.0, 3.0, 9.0, 1.0, 7.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2158203125, -0.2062225341796875, -0.196624755859375, -0.1870269775390625, -0.17742919921875, -0.1678314208984375, -0.158233642578125, -0.1486358642578125, -0.1390380859375, -0.1294403076171875, -0.119842529296875, -0.1102447509765625, -0.10064697265625, -0.0910491943359375, -0.081451416015625, -0.0718536376953125, -0.062255859375, -0.0526580810546875, -0.043060302734375, -0.0334625244140625, -0.02386474609375, -0.0142669677734375, -0.004669189453125, 0.0049285888671875, 0.0145263671875, 0.0241241455078125, 0.033721923828125, 0.0433197021484375, 0.05291748046875, 0.0625152587890625, 0.072113037109375, 0.0817108154296875, 0.09130859375, 0.1009063720703125, 0.110504150390625, 0.1201019287109375, 0.12969970703125, 0.1392974853515625, 0.148895263671875, 0.1584930419921875, 0.1680908203125, 0.1776885986328125, 0.187286376953125, 0.1968841552734375, 0.20648193359375, 0.2160797119140625, 0.225677490234375, 0.2352752685546875, 0.244873046875, 0.2544708251953125, 0.264068603515625, 0.2736663818359375, 0.28326416015625, 0.2928619384765625, 0.302459716796875, 0.3120574951171875, 0.3216552734375, 0.3312530517578125, 0.340850830078125, 0.3504486083984375, 0.36004638671875, 0.3696441650390625, 0.379241943359375, 0.3888397216796875, 0.3984375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 5.0, 4.0, 6.0, 8.0, 12.0, 16.0, 17.0, 55.0, 60.0, 80.0, 230.0, 492.0, 1308.0, 4885.0, 31375.0, 543214.0, 434261.0, 26100.0, 4309.0, 1217.0, 434.0, 193.0, 104.0, 60.0, 28.0, 24.0, 18.0, 11.0, 8.0, 4.0, 2.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1741943359375, -0.16856765747070312, -0.16294097900390625, -0.15731430053710938, -0.1516876220703125, -0.14606094360351562, -0.14043426513671875, -0.13480758666992188, -0.129180908203125, -0.12355422973632812, -0.11792755126953125, -0.11230087280273438, -0.1066741943359375, -0.10104751586914062, -0.09542083740234375, -0.08979415893554688, -0.08416748046875, -0.07854080200195312, -0.07291412353515625, -0.06728744506835938, -0.0616607666015625, -0.056034088134765625, -0.05040740966796875, -0.044780731201171875, -0.039154052734375, -0.033527374267578125, -0.02790069580078125, -0.022274017333984375, -0.0166473388671875, -0.011020660400390625, -0.00539398193359375, 0.000232696533203125, 0.005859375, 0.011486053466796875, 0.01711273193359375, 0.022739410400390625, 0.0283660888671875, 0.033992767333984375, 0.03961944580078125, 0.045246124267578125, 0.050872802734375, 0.056499481201171875, 0.06212615966796875, 0.06775283813476562, 0.0733795166015625, 0.07900619506835938, 0.08463287353515625, 0.09025955200195312, 0.09588623046875, 0.10151290893554688, 0.10713958740234375, 0.11276626586914062, 0.1183929443359375, 0.12401962280273438, 0.12964630126953125, 0.13527297973632812, 0.140899658203125, 0.14652633666992188, 0.15215301513671875, 0.15777969360351562, 0.1634063720703125, 0.16903305053710938, 0.17465972900390625, 0.18028640747070312, 0.1859130859375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 4.0, 4.0, 7.0, 8.0, 10.0, 8.0, 15.0, 17.0, 22.0, 31.0, 30.0, 71.0, 117.0, 141.0, 138.0, 102.0, 86.0, 48.0, 34.0, 20.0, 14.0, 22.0, 21.0, 10.0, 7.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.842613220214844e-05, -6.590224802494049e-05, -6.337836384773254e-05, -6.08544796705246e-05, -5.833059549331665e-05, -5.5806711316108704e-05, -5.328282713890076e-05, -5.075894296169281e-05, -4.823505878448486e-05, -4.5711174607276917e-05, -4.318729043006897e-05, -4.066340625286102e-05, -3.8139522075653076e-05, -3.561563789844513e-05, -3.309175372123718e-05, -3.0567869544029236e-05, -2.804398536682129e-05, -2.5520101189613342e-05, -2.2996217012405396e-05, -2.047233283519745e-05, -1.7948448657989502e-05, -1.5424564480781555e-05, -1.2900680303573608e-05, -1.0376796126365662e-05, -7.852911949157715e-06, -5.329027771949768e-06, -2.8051435947418213e-06, -2.812594175338745e-07, 2.2426247596740723e-06, 4.766508936882019e-06, 7.290393114089966e-06, 9.814277291297913e-06, 1.233816146850586e-05, 1.4862045645713806e-05, 1.7385929822921753e-05, 1.99098140001297e-05, 2.2433698177337646e-05, 2.4957582354545593e-05, 2.748146653175354e-05, 3.0005350708961487e-05, 3.2529234886169434e-05, 3.505311906337738e-05, 3.757700324058533e-05, 4.0100887417793274e-05, 4.262477159500122e-05, 4.514865577220917e-05, 4.7672539949417114e-05, 5.019642412662506e-05, 5.272030830383301e-05, 5.5244192481040955e-05, 5.77680766582489e-05, 6.029196083545685e-05, 6.28158450126648e-05, 6.533972918987274e-05, 6.786361336708069e-05, 7.038749754428864e-05, 7.291138172149658e-05, 7.543526589870453e-05, 7.795915007591248e-05, 8.048303425312042e-05, 8.300691843032837e-05, 8.553080260753632e-05, 8.805468678474426e-05, 9.057857096195221e-05, 9.310245513916016e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 6.0, 5.0, 11.0, 14.0, 9.0, 20.0, 25.0, 53.0, 94.0, 124.0, 209.0, 357.0, 788.0, 1621.0, 4190.0, 14382.0, 82731.0, 644509.0, 254851.0, 32089.0, 7429.0, 2659.0, 1117.0, 510.0, 310.0, 164.0, 86.0, 73.0, 34.0, 24.0, 18.0, 9.0, 13.0, 4.0, 7.0, 4.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1329345703125, -0.12874794006347656, -0.12456130981445312, -0.12037467956542969, -0.11618804931640625, -0.11200141906738281, -0.10781478881835938, -0.10362815856933594, -0.0994415283203125, -0.09525489807128906, -0.09106826782226562, -0.08688163757324219, -0.08269500732421875, -0.07850837707519531, -0.07432174682617188, -0.07013511657714844, -0.065948486328125, -0.06176185607910156, -0.057575225830078125, -0.05338859558105469, -0.04920196533203125, -0.04501533508300781, -0.040828704833984375, -0.03664207458496094, -0.0324554443359375, -0.028268814086914062, -0.024082183837890625, -0.019895553588867188, -0.01570892333984375, -0.011522293090820312, -0.007335662841796875, -0.0031490325927734375, 0.00103759765625, 0.0052242279052734375, 0.009410858154296875, 0.013597488403320312, 0.01778411865234375, 0.021970748901367188, 0.026157379150390625, 0.030344009399414062, 0.0345306396484375, 0.03871726989746094, 0.042903900146484375, 0.04709053039550781, 0.05127716064453125, 0.05546379089355469, 0.059650421142578125, 0.06383705139160156, 0.068023681640625, 0.07221031188964844, 0.07639694213867188, 0.08058357238769531, 0.08477020263671875, 0.08895683288574219, 0.09314346313476562, 0.09733009338378906, 0.1015167236328125, 0.10570335388183594, 0.10988998413085938, 0.11407661437988281, 0.11826324462890625, 0.12244987487792969, 0.12663650512695312, 0.13082313537597656, 0.135009765625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 4.0, 8.0, 10.0, 6.0, 27.0, 31.0, 47.0, 96.0, 128.0, 157.0, 139.0, 121.0, 66.0, 67.0, 29.0, 19.0, 24.0, 4.0, 3.0, 0.0, 4.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10101318359375, -0.09693622589111328, -0.09285926818847656, -0.08878231048583984, -0.08470535278320312, -0.0806283950805664, -0.07655143737792969, -0.07247447967529297, -0.06839752197265625, -0.06432056427001953, -0.06024360656738281, -0.056166648864746094, -0.052089691162109375, -0.048012733459472656, -0.04393577575683594, -0.03985881805419922, -0.0357818603515625, -0.03170490264892578, -0.027627944946289062, -0.023550987243652344, -0.019474029541015625, -0.015397071838378906, -0.011320114135742188, -0.007243156433105469, -0.00316619873046875, 0.0009107589721679688, 0.0049877166748046875, 0.009064674377441406, 0.013141632080078125, 0.017218589782714844, 0.021295547485351562, 0.02537250518798828, 0.029449462890625, 0.03352642059326172, 0.03760337829589844, 0.041680335998535156, 0.045757293701171875, 0.049834251403808594, 0.05391120910644531, 0.05798816680908203, 0.06206512451171875, 0.06614208221435547, 0.07021903991699219, 0.0742959976196289, 0.07837295532226562, 0.08244991302490234, 0.08652687072753906, 0.09060382843017578, 0.0946807861328125, 0.09875774383544922, 0.10283470153808594, 0.10691165924072266, 0.11098861694335938, 0.1150655746459961, 0.11914253234863281, 0.12321949005126953, 0.12729644775390625, 0.13137340545654297, 0.1354503631591797, 0.1395273208618164, 0.14360427856445312, 0.14768123626708984, 0.15175819396972656, 0.15583515167236328, 0.159912109375]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 1.0, 6.0, 5.0, 12.0, 19.0, 24.0, 43.0, 64.0, 121.0, 109.0, 146.0, 142.0, 97.0, 86.0, 48.0, 32.0, 21.0, 9.0, 8.0, 2.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.149479627609253, -1.1032607555389404, -1.057041883468628, -1.0108230113983154, -0.9646040797233582, -0.9183852076530457, -0.8721662759780884, -0.8259474039077759, -0.7797285318374634, -0.7335096597671509, -0.6872907876968384, -0.6410718560218811, -0.5948529839515686, -0.5486341118812561, -0.5024151802062988, -0.45619630813598633, -0.40997743606567383, -0.36375856399536133, -0.31753966212272644, -0.27132076025009155, -0.22510188817977905, -0.17888300120830536, -0.13266411423683167, -0.08644521236419678, -0.04022634029388428, 0.0059925466775894165, 0.05221143364906311, 0.0984303206205368, 0.1446492075920105, 0.1908680945634842, 0.23708698153495789, 0.2833058834075928, 0.3295247554779053, 0.3757436275482178, 0.42196252942085266, 0.46818143129348755, 0.5144003033638, 0.5606191754341125, 0.6068381071090698, 0.6530569791793823, 0.6992758512496948, 0.7454947233200073, 0.7917135953903198, 0.8379325270652771, 0.8841513991355896, 0.9303702712059021, 0.9765892028808594, 1.0228080749511719, 1.0690269470214844, 1.1152458190917969, 1.1614646911621094, 1.2076835632324219, 1.2539024353027344, 1.3001214265823364, 1.346340298652649, 1.3925591707229614, 1.438778042793274, 1.4849969148635864, 1.531215786933899, 1.5774346590042114, 1.6236536502838135, 1.669872522354126, 1.7160913944244385, 1.762310266494751, 1.8085291385650635]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 6.0, 5.0, 9.0, 11.0, 8.0, 8.0, 14.0, 13.0, 18.0, 19.0, 20.0, 32.0, 29.0, 37.0, 42.0, 35.0, 32.0, 49.0, 49.0, 41.0, 38.0, 44.0, 55.0, 46.0, 43.0, 52.0, 34.0, 27.0, 33.0, 21.0, 27.0, 24.0, 16.0, 18.0, 14.0, 9.0, 8.0, 10.0, 7.0, 4.0, 1.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.705547571182251, -1.65894615650177, -1.612344741821289, -1.5657432079315186, -1.5191417932510376, -1.4725403785705566, -1.4259389638900757, -1.3793375492095947, -1.3327360153198242, -1.2861346006393433, -1.2395331859588623, -1.1929316520690918, -1.1463302373886108, -1.0997288227081299, -1.053127408027649, -1.006525993347168, -0.9599245190620422, -0.9133231043815613, -0.8667216300964355, -0.8201202154159546, -0.7735187411308289, -0.7269173264503479, -0.6803158521652222, -0.6337144374847412, -0.5871130228042603, -0.5405116081237793, -0.49391013383865356, -0.4473087191581726, -0.4007072448730469, -0.3541058301925659, -0.3075043857097626, -0.26090294122695923, -0.2143014669418335, -0.16770002245903015, -0.1210985854268074, -0.07449714839458466, -0.02789570391178131, 0.018705740571022034, 0.06530717015266418, 0.11190861463546753, 0.15851005911827087, 0.20511150360107422, 0.25171294808387756, 0.2983143925666809, 0.34491580724716187, 0.3915172815322876, 0.43811869621276855, 0.4847201406955719, 0.5313215851783752, 0.5779229998588562, 0.6245244741439819, 0.6711258888244629, 0.7177273631095886, 0.7643287777900696, 0.8109302520751953, 0.8575316667556763, 0.9041330814361572, 0.9507344961166382, 0.9973359704017639, 1.0439374446868896, 1.0905388593673706, 1.1371402740478516, 1.1837416887283325, 1.2303431034088135, 1.276944637298584]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 6.0, 10.0, 3.0, 4.0, 13.0, 13.0, 16.0, 36.0, 37.0, 54.0, 68.0, 99.0, 187.0, 351.0, 622.0, 1223.0, 2665.0, 7349.0, 27075.0, 215813.0, 3771273.0, 136014.0, 21094.0, 6126.0, 2260.0, 946.0, 428.0, 214.0, 125.0, 67.0, 45.0, 21.0, 10.0, 5.0, 8.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.325927734375, -0.3172168731689453, -0.3085060119628906, -0.29979515075683594, -0.29108428955078125, -0.28237342834472656, -0.2736625671386719, -0.2649517059326172, -0.2562408447265625, -0.2475299835205078, -0.23881912231445312, -0.23010826110839844, -0.22139739990234375, -0.21268653869628906, -0.20397567749023438, -0.1952648162841797, -0.186553955078125, -0.1778430938720703, -0.16913223266601562, -0.16042137145996094, -0.15171051025390625, -0.14299964904785156, -0.13428878784179688, -0.1255779266357422, -0.1168670654296875, -0.10815620422363281, -0.09944534301757812, -0.09073448181152344, -0.08202362060546875, -0.07331275939941406, -0.06460189819335938, -0.05589103698730469, -0.04718017578125, -0.03846931457519531, -0.029758453369140625, -0.021047592163085938, -0.01233673095703125, -0.0036258697509765625, 0.005084991455078125, 0.013795852661132812, 0.0225067138671875, 0.031217575073242188, 0.039928436279296875, 0.04863929748535156, 0.05735015869140625, 0.06606101989746094, 0.07477188110351562, 0.08348274230957031, 0.092193603515625, 0.10090446472167969, 0.10961532592773438, 0.11832618713378906, 0.12703704833984375, 0.13574790954589844, 0.14445877075195312, 0.1531696319580078, 0.1618804931640625, 0.1705913543701172, 0.17930221557617188, 0.18801307678222656, 0.19672393798828125, 0.20543479919433594, 0.21414566040039062, 0.2228565216064453, 0.2315673828125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 9.0, 9.0, 10.0, 18.0, 18.0, 21.0, 36.0, 41.0, 60.0, 49.0, 75.0, 80.0, 70.0, 63.0, 74.0, 71.0, 56.0, 47.0, 40.0, 50.0, 23.0, 28.0, 19.0, 10.0, 8.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10504150390625, -0.10227012634277344, -0.09949874877929688, -0.09672737121582031, -0.09395599365234375, -0.09118461608886719, -0.08841323852539062, -0.08564186096191406, -0.0828704833984375, -0.08009910583496094, -0.07732772827148438, -0.07455635070800781, -0.07178497314453125, -0.06901359558105469, -0.06624221801757812, -0.06347084045410156, -0.060699462890625, -0.05792808532714844, -0.055156707763671875, -0.05238533020019531, -0.04961395263671875, -0.04684257507324219, -0.044071197509765625, -0.04129981994628906, -0.0385284423828125, -0.03575706481933594, -0.032985687255859375, -0.030214309692382812, -0.02744293212890625, -0.024671554565429688, -0.021900177001953125, -0.019128799438476562, -0.016357421875, -0.013586044311523438, -0.010814666748046875, -0.008043289184570312, -0.00527191162109375, -0.0025005340576171875, 0.000270843505859375, 0.0030422210693359375, 0.0058135986328125, 0.008584976196289062, 0.011356353759765625, 0.014127731323242188, 0.01689910888671875, 0.019670486450195312, 0.022441864013671875, 0.025213241577148438, 0.027984619140625, 0.030755996704101562, 0.033527374267578125, 0.03629875183105469, 0.03907012939453125, 0.04184150695800781, 0.044612884521484375, 0.04738426208496094, 0.0501556396484375, 0.05292701721191406, 0.055698394775390625, 0.05846977233886719, 0.06124114990234375, 0.06401252746582031, 0.06678390502929688, 0.06955528259277344, 0.07232666015625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 8.0, 2.0, 7.0, 7.0, 17.0, 33.0, 42.0, 70.0, 183.0, 326.0, 746.0, 2039.0, 7123.0, 36687.0, 463111.0, 3503983.0, 153659.0, 19180.0, 4453.0, 1445.0, 573.0, 296.0, 124.0, 73.0, 39.0, 21.0, 14.0, 7.0, 6.0, 8.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1756591796875, -0.16812705993652344, -0.16059494018554688, -0.1530628204345703, -0.14553070068359375, -0.1379985809326172, -0.13046646118164062, -0.12293434143066406, -0.1154022216796875, -0.10787010192871094, -0.10033798217773438, -0.09280586242675781, -0.08527374267578125, -0.07774162292480469, -0.07020950317382812, -0.06267738342285156, -0.055145263671875, -0.04761314392089844, -0.040081024169921875, -0.03254890441894531, -0.02501678466796875, -0.017484664916992188, -0.009952545166015625, -0.0024204254150390625, 0.0051116943359375, 0.012643814086914062, 0.020175933837890625, 0.027708053588867188, 0.03524017333984375, 0.04277229309082031, 0.050304412841796875, 0.05783653259277344, 0.06536865234375, 0.07290077209472656, 0.08043289184570312, 0.08796501159667969, 0.09549713134765625, 0.10302925109863281, 0.11056137084960938, 0.11809349060058594, 0.1256256103515625, 0.13315773010253906, 0.14068984985351562, 0.1482219696044922, 0.15575408935546875, 0.1632862091064453, 0.17081832885742188, 0.17835044860839844, 0.185882568359375, 0.19341468811035156, 0.20094680786132812, 0.2084789276123047, 0.21601104736328125, 0.2235431671142578, 0.23107528686523438, 0.23860740661621094, 0.2461395263671875, 0.25367164611816406, 0.2612037658691406, 0.2687358856201172, 0.27626800537109375, 0.2838001251220703, 0.2913322448730469, 0.29886436462402344, 0.306396484375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 5.0, 0.0, 2.0, 4.0, 7.0, 5.0, 18.0, 13.0, 28.0, 51.0, 89.0, 195.0, 479.0, 1504.0, 1055.0, 315.0, 127.0, 74.0, 38.0, 25.0, 14.0, 15.0, 10.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08538818359375, -0.08208370208740234, -0.07877922058105469, -0.07547473907470703, -0.07217025756835938, -0.06886577606201172, -0.06556129455566406, -0.062256813049316406, -0.05895233154296875, -0.055647850036621094, -0.05234336853027344, -0.04903888702392578, -0.045734405517578125, -0.04242992401123047, -0.03912544250488281, -0.035820960998535156, -0.0325164794921875, -0.029211997985839844, -0.025907516479492188, -0.02260303497314453, -0.019298553466796875, -0.01599407196044922, -0.012689590454101562, -0.009385108947753906, -0.00608062744140625, -0.0027761459350585938, 0.0005283355712890625, 0.0038328170776367188, 0.007137298583984375, 0.010441780090332031, 0.013746261596679688, 0.017050743103027344, 0.020355224609375, 0.023659706115722656, 0.026964187622070312, 0.03026866912841797, 0.033573150634765625, 0.03687763214111328, 0.04018211364746094, 0.043486595153808594, 0.04679107666015625, 0.050095558166503906, 0.05340003967285156, 0.05670452117919922, 0.060009002685546875, 0.06331348419189453, 0.06661796569824219, 0.06992244720458984, 0.0732269287109375, 0.07653141021728516, 0.07983589172363281, 0.08314037322998047, 0.08644485473632812, 0.08974933624267578, 0.09305381774902344, 0.0963582992553711, 0.09966278076171875, 0.1029672622680664, 0.10627174377441406, 0.10957622528076172, 0.11288070678710938, 0.11618518829345703, 0.11948966979980469, 0.12279415130615234, 0.1260986328125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 6.0, 19.0, 77.0, 146.0, 248.0, 246.0, 146.0, 67.0, 32.0, 10.0, 7.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31054216623306274, -0.2850634753704071, -0.2595847547054291, -0.23410606384277344, -0.2086273580789566, -0.18314865231513977, -0.15766996145248413, -0.1321912556886673, -0.10671254992485046, -0.08123384416103363, -0.055755145847797394, -0.030276447534561157, -0.004797741770744324, 0.02068096399307251, 0.04615965485572815, 0.07163836061954498, 0.09711706638336182, 0.12259577214717865, 0.14807447791099548, 0.17355316877365112, 0.19903187453746796, 0.2245105803012848, 0.24998927116394043, 0.27546799182891846, 0.3009466826915741, 0.32642537355422974, 0.35190409421920776, 0.3773827850818634, 0.40286147594451904, 0.42834019660949707, 0.4538188874721527, 0.47929757833480835, 0.5047763586044312, 0.5302550792694092, 0.5557337403297424, 0.5812124609947205, 0.6066911816596985, 0.6321698427200317, 0.6576485633850098, 0.6831272840499878, 0.7086060047149658, 0.7340847253799438, 0.7595633864402771, 0.7850421071052551, 0.8105208277702332, 0.8359994888305664, 0.8614782094955444, 0.8869569301605225, 0.9124355912208557, 0.9379143118858337, 0.963392972946167, 0.988871693611145, 1.014350414276123, 1.039829134941101, 1.065307855606079, 1.0907864570617676, 1.1162651777267456, 1.1417438983917236, 1.1672226190567017, 1.1927013397216797, 1.2181799411773682, 1.2436586618423462, 1.2691373825073242, 1.2946161031723022, 1.3200948238372803]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 5.0, 8.0, 6.0, 7.0, 9.0, 15.0, 17.0, 14.0, 11.0, 16.0, 17.0, 23.0, 22.0, 33.0, 31.0, 34.0, 44.0, 35.0, 49.0, 50.0, 42.0, 56.0, 47.0, 41.0, 49.0, 40.0, 33.0, 30.0, 31.0, 30.0, 33.0, 17.0, 23.0, 15.0, 15.0, 17.0, 12.0, 8.0, 2.0, 5.0, 4.0, 1.0, 5.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20412296056747437, -0.1965848058462143, -0.18904663622379303, -0.18150848150253296, -0.1739703118801117, -0.16643215715885162, -0.15889400243759155, -0.1513558328151703, -0.14381766319274902, -0.13627950847148895, -0.1287413388490677, -0.12120318412780762, -0.11366501450538635, -0.10612685978412628, -0.09858869761228561, -0.09105053544044495, -0.08351238071918488, -0.07597421854734421, -0.06843605637550354, -0.06089789792895317, -0.0533597357571125, -0.045821573585271835, -0.038283415138721466, -0.0307452529668808, -0.02320709079504013, -0.015668928623199463, -0.008130768314003944, -0.0005926080048084259, 0.006945554167032242, 0.01448371633887291, 0.02202187478542328, 0.029560036957263947, 0.037098199129104614, 0.04463636130094528, 0.05217452347278595, 0.05971268191933632, 0.06725084781646729, 0.07478900253772736, 0.08232716470956802, 0.08986532688140869, 0.09740348905324936, 0.10494165122509003, 0.1124798133969307, 0.12001797556877136, 0.12755613029003143, 0.1350942999124527, 0.14263245463371277, 0.15017062425613403, 0.1577087789773941, 0.16524693369865417, 0.17278510332107544, 0.1803232580423355, 0.18786142766475677, 0.19539958238601685, 0.2029377520084381, 0.21047590672969818, 0.21801406145095825, 0.22555221617221832, 0.2330903857946396, 0.24062854051589966, 0.24816671013832092, 0.2557048797607422, 0.26324301958084106, 0.27078118920326233, 0.2783193588256836]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 4.0, 9.0, 14.0, 16.0, 40.0, 58.0, 75.0, 109.0, 209.0, 262.0, 530.0, 927.0, 1849.0, 3996.0, 9714.0, 28754.0, 94770.0, 312146.0, 397775.0, 134595.0, 39738.0, 12976.0, 4975.0, 2235.0, 1173.0, 628.0, 350.0, 204.0, 145.0, 91.0, 64.0, 30.0, 26.0, 16.0, 15.0, 9.0, 6.0, 8.0, 4.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2247314453125, -0.21727561950683594, -0.20981979370117188, -0.2023639678955078, -0.19490814208984375, -0.1874523162841797, -0.17999649047851562, -0.17254066467285156, -0.1650848388671875, -0.15762901306152344, -0.15017318725585938, -0.1427173614501953, -0.13526153564453125, -0.1278057098388672, -0.12034988403320312, -0.11289405822753906, -0.105438232421875, -0.09798240661621094, -0.09052658081054688, -0.08307075500488281, -0.07561492919921875, -0.06815910339355469, -0.060703277587890625, -0.05324745178222656, -0.0457916259765625, -0.03833580017089844, -0.030879974365234375, -0.023424148559570312, -0.01596832275390625, -0.008512496948242188, -0.001056671142578125, 0.0063991546630859375, 0.01385498046875, 0.021310806274414062, 0.028766632080078125, 0.03622245788574219, 0.04367828369140625, 0.05113410949707031, 0.058589935302734375, 0.06604576110839844, 0.0735015869140625, 0.08095741271972656, 0.08841323852539062, 0.09586906433105469, 0.10332489013671875, 0.11078071594238281, 0.11823654174804688, 0.12569236755371094, 0.133148193359375, 0.14060401916503906, 0.14805984497070312, 0.1555156707763672, 0.16297149658203125, 0.1704273223876953, 0.17788314819335938, 0.18533897399902344, 0.1927947998046875, 0.20025062561035156, 0.20770645141601562, 0.2151622772216797, 0.22261810302734375, 0.2300739288330078, 0.23752975463867188, 0.24498558044433594, 0.25244140625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 14.0, 5.0, 14.0, 16.0, 22.0, 36.0, 32.0, 58.0, 58.0, 75.0, 63.0, 82.0, 69.0, 67.0, 75.0, 56.0, 50.0, 44.0, 43.0, 33.0, 23.0, 20.0, 16.0, 8.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10565185546875, -0.10288715362548828, -0.10012245178222656, -0.09735774993896484, -0.09459304809570312, -0.0918283462524414, -0.08906364440917969, -0.08629894256591797, -0.08353424072265625, -0.08076953887939453, -0.07800483703613281, -0.0752401351928711, -0.07247543334960938, -0.06971073150634766, -0.06694602966308594, -0.06418132781982422, -0.0614166259765625, -0.05865192413330078, -0.05588722229003906, -0.053122520446777344, -0.050357818603515625, -0.047593116760253906, -0.04482841491699219, -0.04206371307373047, -0.03929901123046875, -0.03653430938720703, -0.03376960754394531, -0.031004905700683594, -0.028240203857421875, -0.025475502014160156, -0.022710800170898438, -0.01994609832763672, -0.017181396484375, -0.014416694641113281, -0.011651992797851562, -0.008887290954589844, -0.006122589111328125, -0.0033578872680664062, -0.0005931854248046875, 0.0021715164184570312, 0.00493621826171875, 0.007700920104980469, 0.010465621948242188, 0.013230323791503906, 0.015995025634765625, 0.018759727478027344, 0.021524429321289062, 0.02428913116455078, 0.0270538330078125, 0.02981853485107422, 0.03258323669433594, 0.035347938537597656, 0.038112640380859375, 0.040877342224121094, 0.04364204406738281, 0.04640674591064453, 0.04917144775390625, 0.05193614959716797, 0.05470085144042969, 0.057465553283691406, 0.060230255126953125, 0.06299495697021484, 0.06575965881347656, 0.06852436065673828, 0.0712890625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 4.0, 7.0, 7.0, 16.0, 16.0, 20.0, 28.0, 30.0, 51.0, 73.0, 99.0, 148.0, 185.0, 302.0, 505.0, 768.0, 1515.0, 3334.0, 8080.0, 21790.0, 64469.0, 177732.0, 347298.0, 261332.0, 103074.0, 35495.0, 12355.0, 4863.0, 2116.0, 1076.0, 632.0, 374.0, 235.0, 158.0, 114.0, 78.0, 47.0, 37.0, 25.0, 17.0, 14.0, 14.0, 5.0, 5.0, 5.0, 1.0, 5.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1611328125, -0.1560535430908203, -0.15097427368164062, -0.14589500427246094, -0.14081573486328125, -0.13573646545410156, -0.13065719604492188, -0.1255779266357422, -0.1204986572265625, -0.11541938781738281, -0.11034011840820312, -0.10526084899902344, -0.10018157958984375, -0.09510231018066406, -0.09002304077148438, -0.08494377136230469, -0.079864501953125, -0.07478523254394531, -0.06970596313476562, -0.06462669372558594, -0.05954742431640625, -0.05446815490722656, -0.049388885498046875, -0.04430961608886719, -0.0392303466796875, -0.03415107727050781, -0.029071807861328125, -0.023992538452148438, -0.01891326904296875, -0.013833999633789062, -0.008754730224609375, -0.0036754608154296875, 0.00140380859375, 0.0064830780029296875, 0.011562347412109375, 0.016641616821289062, 0.02172088623046875, 0.026800155639648438, 0.031879425048828125, 0.03695869445800781, 0.0420379638671875, 0.04711723327636719, 0.052196502685546875, 0.05727577209472656, 0.06235504150390625, 0.06743431091308594, 0.07251358032226562, 0.07759284973144531, 0.082672119140625, 0.08775138854980469, 0.09283065795898438, 0.09790992736816406, 0.10298919677734375, 0.10806846618652344, 0.11314773559570312, 0.11822700500488281, 0.1233062744140625, 0.1283855438232422, 0.13346481323242188, 0.13854408264160156, 0.14362335205078125, 0.14870262145996094, 0.15378189086914062, 0.1588611602783203, 0.1639404296875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 4.0, 2.0, 8.0, 15.0, 6.0, 15.0, 12.0, 18.0, 21.0, 16.0, 20.0, 33.0, 36.0, 33.0, 33.0, 37.0, 37.0, 35.0, 43.0, 53.0, 47.0, 36.0, 48.0, 46.0, 33.0, 42.0, 43.0, 38.0, 32.0, 34.0, 24.0, 19.0, 6.0, 16.0, 10.0, 7.0, 16.0, 7.0, 8.0, 5.0, 2.0, 2.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.277587890625, -0.26958656311035156, -0.2615852355957031, -0.2535839080810547, -0.24558258056640625, -0.2375812530517578, -0.22957992553710938, -0.22157859802246094, -0.2135772705078125, -0.20557594299316406, -0.19757461547851562, -0.1895732879638672, -0.18157196044921875, -0.1735706329345703, -0.16556930541992188, -0.15756797790527344, -0.149566650390625, -0.14156532287597656, -0.13356399536132812, -0.1255626678466797, -0.11756134033203125, -0.10956001281738281, -0.10155868530273438, -0.09355735778808594, -0.0855560302734375, -0.07755470275878906, -0.06955337524414062, -0.06155204772949219, -0.05355072021484375, -0.04554939270019531, -0.037548065185546875, -0.029546737670898438, -0.02154541015625, -0.013544082641601562, -0.005542755126953125, 0.0024585723876953125, 0.01045989990234375, 0.018461227416992188, 0.026462554931640625, 0.03446388244628906, 0.0424652099609375, 0.05046653747558594, 0.058467864990234375, 0.06646919250488281, 0.07447052001953125, 0.08247184753417969, 0.09047317504882812, 0.09847450256347656, 0.106475830078125, 0.11447715759277344, 0.12247848510742188, 0.1304798126220703, 0.13848114013671875, 0.1464824676513672, 0.15448379516601562, 0.16248512268066406, 0.1704864501953125, 0.17848777770996094, 0.18648910522460938, 0.1944904327392578, 0.20249176025390625, 0.2104930877685547, 0.21849441528320312, 0.22649574279785156, 0.2344970703125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 2.0, 5.0, 8.0, 10.0, 24.0, 48.0, 94.0, 181.0, 380.0, 939.0, 2723.0, 10868.0, 61434.0, 543986.0, 373644.0, 42572.0, 8081.0, 2211.0, 715.0, 308.0, 139.0, 85.0, 40.0, 27.0, 14.0, 6.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11126708984375, -0.10679912567138672, -0.10233116149902344, -0.09786319732666016, -0.09339523315429688, -0.0889272689819336, -0.08445930480957031, -0.07999134063720703, -0.07552337646484375, -0.07105541229248047, -0.06658744812011719, -0.062119483947753906, -0.057651519775390625, -0.053183555603027344, -0.04871559143066406, -0.04424762725830078, -0.0397796630859375, -0.03531169891357422, -0.030843734741210938, -0.026375770568847656, -0.021907806396484375, -0.017439842224121094, -0.012971878051757812, -0.008503913879394531, -0.00403594970703125, 0.00043201446533203125, 0.0048999786376953125, 0.009367942810058594, 0.013835906982421875, 0.018303871154785156, 0.022771835327148438, 0.02723979949951172, 0.031707763671875, 0.03617572784423828, 0.04064369201660156, 0.045111656188964844, 0.049579620361328125, 0.054047584533691406, 0.05851554870605469, 0.06298351287841797, 0.06745147705078125, 0.07191944122314453, 0.07638740539550781, 0.0808553695678711, 0.08532333374023438, 0.08979129791259766, 0.09425926208496094, 0.09872722625732422, 0.1031951904296875, 0.10766315460205078, 0.11213111877441406, 0.11659908294677734, 0.12106704711914062, 0.1255350112915039, 0.1300029754638672, 0.13447093963623047, 0.13893890380859375, 0.14340686798095703, 0.1478748321533203, 0.1523427963256836, 0.15681076049804688, 0.16127872467041016, 0.16574668884277344, 0.17021465301513672, 0.1746826171875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 3.0, 1.0, 3.0, 11.0, 14.0, 10.0, 12.0, 22.0, 18.0, 23.0, 35.0, 43.0, 51.0, 108.0, 93.0, 108.0, 108.0, 71.0, 53.0, 38.0, 38.0, 29.0, 27.0, 20.0, 15.0, 12.0, 9.0, 9.0, 4.0, 7.0, 6.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.230043411254883e-05, -6.975512951612473e-05, -6.720982491970062e-05, -6.466452032327652e-05, -6.211921572685242e-05, -5.9573911130428314e-05, -5.702860653400421e-05, -5.448330193758011e-05, -5.1937997341156006e-05, -4.93926927447319e-05, -4.68473881483078e-05, -4.43020835518837e-05, -4.1756778955459595e-05, -3.921147435903549e-05, -3.666616976261139e-05, -3.4120865166187286e-05, -3.1575560569763184e-05, -2.903025597333908e-05, -2.6484951376914978e-05, -2.3939646780490875e-05, -2.1394342184066772e-05, -1.884903758764267e-05, -1.6303732991218567e-05, -1.3758428394794464e-05, -1.1213123798370361e-05, -8.667819201946259e-06, -6.122514605522156e-06, -3.577210009098053e-06, -1.0319054126739502e-06, 1.5133991837501526e-06, 4.058703780174255e-06, 6.604008376598358e-06, 9.149312973022461e-06, 1.1694617569446564e-05, 1.4239922165870667e-05, 1.678522676229477e-05, 1.9330531358718872e-05, 2.1875835955142975e-05, 2.4421140551567078e-05, 2.696644514799118e-05, 2.9511749744415283e-05, 3.2057054340839386e-05, 3.460235893726349e-05, 3.714766353368759e-05, 3.9692968130111694e-05, 4.22382727265358e-05, 4.47835773229599e-05, 4.7328881919384e-05, 4.9874186515808105e-05, 5.241949111223221e-05, 5.496479570865631e-05, 5.7510100305080414e-05, 6.0055404901504517e-05, 6.260070949792862e-05, 6.514601409435272e-05, 6.769131869077682e-05, 7.023662328720093e-05, 7.278192788362503e-05, 7.532723248004913e-05, 7.787253707647324e-05, 8.041784167289734e-05, 8.296314626932144e-05, 8.550845086574554e-05, 8.805375546216965e-05, 9.059906005859375e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 3.0, 8.0, 12.0, 11.0, 23.0, 22.0, 27.0, 37.0, 41.0, 64.0, 102.0, 179.0, 320.0, 559.0, 1092.0, 2309.0, 5470.0, 15569.0, 52849.0, 245615.0, 545436.0, 128936.0, 32111.0, 10299.0, 3841.0, 1631.0, 818.0, 491.0, 232.0, 161.0, 103.0, 61.0, 28.0, 28.0, 20.0, 14.0, 11.0, 13.0, 4.0, 3.0, 0.0, 4.0, 3.0, 1.0, 0.0, 3.0, 1.0, 2.0], "bins": [-0.11834716796875, -0.11508750915527344, -0.11182785034179688, -0.10856819152832031, -0.10530853271484375, -0.10204887390136719, -0.09878921508789062, -0.09552955627441406, -0.0922698974609375, -0.08901023864746094, -0.08575057983398438, -0.08249092102050781, -0.07923126220703125, -0.07597160339355469, -0.07271194458007812, -0.06945228576660156, -0.066192626953125, -0.06293296813964844, -0.059673309326171875, -0.05641365051269531, -0.05315399169921875, -0.04989433288574219, -0.046634674072265625, -0.04337501525878906, -0.0401153564453125, -0.03685569763183594, -0.033596038818359375, -0.030336380004882812, -0.02707672119140625, -0.023817062377929688, -0.020557403564453125, -0.017297744750976562, -0.0140380859375, -0.010778427124023438, -0.007518768310546875, -0.0042591094970703125, -0.00099945068359375, 0.0022602081298828125, 0.005519866943359375, 0.008779525756835938, 0.0120391845703125, 0.015298843383789062, 0.018558502197265625, 0.021818161010742188, 0.02507781982421875, 0.028337478637695312, 0.031597137451171875, 0.03485679626464844, 0.038116455078125, 0.04137611389160156, 0.044635772705078125, 0.04789543151855469, 0.05115509033203125, 0.05441474914550781, 0.057674407958984375, 0.06093406677246094, 0.0641937255859375, 0.06745338439941406, 0.07071304321289062, 0.07397270202636719, 0.07723236083984375, 0.08049201965332031, 0.08375167846679688, 0.08701133728027344, 0.09027099609375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 3.0, 15.0, 12.0, 10.0, 15.0, 25.0, 53.0, 49.0, 68.0, 86.0, 134.0, 131.0, 115.0, 93.0, 62.0, 50.0, 31.0, 13.0, 16.0, 6.0, 4.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.159423828125, -0.15544986724853516, -0.1514759063720703, -0.14750194549560547, -0.14352798461914062, -0.13955402374267578, -0.13558006286621094, -0.1316061019897461, -0.12763214111328125, -0.1236581802368164, -0.11968421936035156, -0.11571025848388672, -0.11173629760742188, -0.10776233673095703, -0.10378837585449219, -0.09981441497802734, -0.0958404541015625, -0.09186649322509766, -0.08789253234863281, -0.08391857147216797, -0.07994461059570312, -0.07597064971923828, -0.07199668884277344, -0.0680227279663086, -0.06404876708984375, -0.060074806213378906, -0.05610084533691406, -0.05212688446044922, -0.048152923583984375, -0.04417896270751953, -0.04020500183105469, -0.036231040954589844, -0.032257080078125, -0.028283119201660156, -0.024309158325195312, -0.02033519744873047, -0.016361236572265625, -0.012387275695800781, -0.008413314819335938, -0.004439353942871094, -0.00046539306640625, 0.0035085678100585938, 0.0074825286865234375, 0.011456489562988281, 0.015430450439453125, 0.01940441131591797, 0.023378372192382812, 0.027352333068847656, 0.0313262939453125, 0.035300254821777344, 0.03927421569824219, 0.04324817657470703, 0.047222137451171875, 0.05119609832763672, 0.05517005920410156, 0.059144020080566406, 0.06311798095703125, 0.0670919418334961, 0.07106590270996094, 0.07503986358642578, 0.07901382446289062, 0.08298778533935547, 0.08696174621582031, 0.09093570709228516, 0.09490966796875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 6.0, 11.0, 30.0, 72.0, 133.0, 234.0, 239.0, 145.0, 78.0, 34.0, 9.0, 6.0, 1.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3133618831634521, -1.232060194015503, -1.1507583856582642, -1.0694565773010254, -0.9881548881530762, -0.9068531394004822, -0.8255513906478882, -0.7442496418952942, -0.6629478931427002, -0.5816461443901062, -0.5003443956375122, -0.4190426468849182, -0.3377408981323242, -0.2564391493797302, -0.17513740062713623, -0.09383565187454224, -0.012533903121948242, 0.06876784563064575, 0.15006959438323975, 0.23137134313583374, 0.31267309188842773, 0.39397484064102173, 0.4752765893936157, 0.5565783381462097, 0.6378800868988037, 0.7191818356513977, 0.8004835844039917, 0.8817853331565857, 0.9630870819091797, 1.044388771057129, 1.1256905794143677, 1.2069923877716064, 1.2882943153381348, 1.369596004486084, 1.4508978128433228, 1.5321996212005615, 1.6135013103485107, 1.69480299949646, 1.7761048078536987, 1.8574066162109375, 1.9387083053588867, 2.020009994506836, 2.101311683654785, 2.1826136112213135, 2.2639153003692627, 2.345216989517212, 2.4265189170837402, 2.5078206062316895, 2.5891222953796387, 2.670423984527588, 2.751725673675537, 2.8330276012420654, 2.9143292903900146, 2.995630979537964, 3.076932907104492, 3.1582345962524414, 3.2395362854003906, 3.32083797454834, 3.402139663696289, 3.4834415912628174, 3.5647432804107666, 3.646044969558716, 3.727346897125244, 3.8086485862731934, 3.8899502754211426]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 5.0, 3.0, 8.0, 6.0, 16.0, 6.0, 12.0, 25.0, 26.0, 26.0, 26.0, 33.0, 30.0, 27.0, 27.0, 29.0, 37.0, 51.0, 49.0, 46.0, 46.0, 41.0, 44.0, 41.0, 45.0, 38.0, 32.0, 24.0, 36.0, 27.0, 16.0, 18.0, 21.0, 14.0, 14.0, 9.0, 10.0, 9.0, 5.0, 4.0, 5.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.3588221073150635, -1.3138513565063477, -1.2688804864883423, -1.2239097356796265, -1.178938865661621, -1.1339681148529053, -1.0889973640441895, -1.0440266132354736, -0.9990557432174683, -0.9540849328041077, -0.9091141223907471, -0.8641433715820312, -0.8191725611686707, -0.7742017507553101, -0.7292309999465942, -0.6842601895332336, -0.639289379119873, -0.5943185687065125, -0.5493477582931519, -0.504377007484436, -0.45940619707107544, -0.41443538665771484, -0.36946460604667664, -0.3244938254356384, -0.27952301502227783, -0.23455221951007843, -0.18958142399787903, -0.14461062848567963, -0.09963983297348022, -0.05466903746128082, -0.009698241949081421, 0.03527253866195679, 0.08024322986602783, 0.12521402537822723, 0.17018482089042664, 0.21515561640262604, 0.26012641191482544, 0.30509722232818604, 0.35006800293922424, 0.39503878355026245, 0.44000959396362305, 0.48498040437698364, 0.5299512147903442, 0.5749219655990601, 0.6198927760124207, 0.6648635864257812, 0.7098343372344971, 0.7548051476478577, 0.7997759580612183, 0.8447467684745789, 0.8897175788879395, 0.9346883296966553, 0.9796591401100159, 1.0246299505233765, 1.0696007013320923, 1.1145715713500977, 1.1595423221588135, 1.2045130729675293, 1.2494839429855347, 1.2944546937942505, 1.3394255638122559, 1.3843963146209717, 1.4293670654296875, 1.4743378162384033, 1.5193086862564087]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 5.0, 4.0, 9.0, 7.0, 11.0, 11.0, 21.0, 33.0, 46.0, 76.0, 97.0, 176.0, 237.0, 435.0, 797.0, 1538.0, 4005.0, 11420.0, 52770.0, 1684934.0, 2362533.0, 56290.0, 11832.0, 3956.0, 1517.0, 676.0, 368.0, 198.0, 110.0, 60.0, 40.0, 27.0, 10.0, 11.0, 13.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0], "bins": [-0.346923828125, -0.3386669158935547, -0.3304100036621094, -0.32215309143066406, -0.31389617919921875, -0.30563926696777344, -0.2973823547363281, -0.2891254425048828, -0.2808685302734375, -0.2726116180419922, -0.2643547058105469, -0.25609779357910156, -0.24784088134765625, -0.23958396911621094, -0.23132705688476562, -0.2230701446533203, -0.214813232421875, -0.2065563201904297, -0.19829940795898438, -0.19004249572753906, -0.18178558349609375, -0.17352867126464844, -0.16527175903320312, -0.1570148468017578, -0.1487579345703125, -0.1405010223388672, -0.13224411010742188, -0.12398719787597656, -0.11573028564453125, -0.10747337341308594, -0.09921646118164062, -0.09095954895019531, -0.08270263671875, -0.07444572448730469, -0.06618881225585938, -0.05793190002441406, -0.04967498779296875, -0.04141807556152344, -0.033161163330078125, -0.024904251098632812, -0.0166473388671875, -0.008390426635742188, -0.000133514404296875, 0.008123397827148438, 0.01638031005859375, 0.024637222290039062, 0.032894134521484375, 0.04115104675292969, 0.049407958984375, 0.05766487121582031, 0.06592178344726562, 0.07417869567871094, 0.08243560791015625, 0.09069252014160156, 0.09894943237304688, 0.10720634460449219, 0.1154632568359375, 0.12372016906738281, 0.13197708129882812, 0.14023399353027344, 0.14849090576171875, 0.15674781799316406, 0.16500473022460938, 0.1732616424560547, 0.1815185546875]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 6.0, 8.0, 6.0, 14.0, 16.0, 18.0, 22.0, 29.0, 32.0, 52.0, 56.0, 59.0, 76.0, 63.0, 65.0, 59.0, 59.0, 66.0, 55.0, 60.0, 43.0, 30.0, 42.0, 22.0, 14.0, 3.0, 6.0, 9.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1090087890625, -0.10617256164550781, -0.10333633422851562, -0.10050010681152344, -0.09766387939453125, -0.09482765197753906, -0.09199142456054688, -0.08915519714355469, -0.0863189697265625, -0.08348274230957031, -0.08064651489257812, -0.07781028747558594, -0.07497406005859375, -0.07213783264160156, -0.06930160522460938, -0.06646537780761719, -0.063629150390625, -0.06079292297363281, -0.057956695556640625, -0.05512046813964844, -0.05228424072265625, -0.04944801330566406, -0.046611785888671875, -0.04377555847167969, -0.0409393310546875, -0.03810310363769531, -0.035266876220703125, -0.03243064880371094, -0.02959442138671875, -0.026758193969726562, -0.023921966552734375, -0.021085739135742188, -0.01824951171875, -0.015413284301757812, -0.012577056884765625, -0.009740829467773438, -0.00690460205078125, -0.0040683746337890625, -0.001232147216796875, 0.0016040802001953125, 0.0044403076171875, 0.0072765350341796875, 0.010112762451171875, 0.012948989868164062, 0.01578521728515625, 0.018621444702148438, 0.021457672119140625, 0.024293899536132812, 0.027130126953125, 0.029966354370117188, 0.032802581787109375, 0.03563880920410156, 0.03847503662109375, 0.04131126403808594, 0.044147491455078125, 0.04698371887207031, 0.0498199462890625, 0.05265617370605469, 0.055492401123046875, 0.05832862854003906, 0.06116485595703125, 0.06400108337402344, 0.06683731079101562, 0.06967353820800781, 0.072509765625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 6.0, 7.0, 9.0, 20.0, 40.0, 92.0, 224.0, 613.0, 1562.0, 5945.0, 36917.0, 1093728.0, 2984976.0, 58307.0, 8268.0, 2154.0, 828.0, 349.0, 130.0, 60.0, 30.0, 13.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.298095703125, -0.2890892028808594, -0.28008270263671875, -0.2710762023925781, -0.2620697021484375, -0.2530632019042969, -0.24405670166015625, -0.23505020141601562, -0.226043701171875, -0.21703720092773438, -0.20803070068359375, -0.19902420043945312, -0.1900177001953125, -0.18101119995117188, -0.17200469970703125, -0.16299819946289062, -0.15399169921875, -0.14498519897460938, -0.13597869873046875, -0.12697219848632812, -0.1179656982421875, -0.10895919799804688, -0.09995269775390625, -0.09094619750976562, -0.081939697265625, -0.07293319702148438, -0.06392669677734375, -0.054920196533203125, -0.0459136962890625, -0.036907196044921875, -0.02790069580078125, -0.018894195556640625, -0.0098876953125, -0.000881195068359375, 0.00812530517578125, 0.017131805419921875, 0.0261383056640625, 0.035144805908203125, 0.04415130615234375, 0.053157806396484375, 0.062164306640625, 0.07117080688476562, 0.08017730712890625, 0.08918380737304688, 0.0981903076171875, 0.10719680786132812, 0.11620330810546875, 0.12520980834960938, 0.13421630859375, 0.14322280883789062, 0.15222930908203125, 0.16123580932617188, 0.1702423095703125, 0.17924880981445312, 0.18825531005859375, 0.19726181030273438, 0.206268310546875, 0.21527481079101562, 0.22428131103515625, 0.23328781127929688, 0.2422943115234375, 0.2513008117675781, 0.26030731201171875, 0.2693138122558594, 0.2783203125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 9.0, 4.0, 10.0, 5.0, 12.0, 19.0, 31.0, 55.0, 88.0, 177.0, 480.0, 1281.0, 1109.0, 387.0, 173.0, 72.0, 51.0, 24.0, 19.0, 22.0, 15.0, 5.0, 6.0, 6.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0904541015625, -0.08709716796875, -0.083740234375, -0.08038330078125, -0.0770263671875, -0.07366943359375, -0.0703125, -0.06695556640625, -0.0635986328125, -0.06024169921875, -0.056884765625, -0.05352783203125, -0.0501708984375, -0.04681396484375, -0.04345703125, -0.04010009765625, -0.0367431640625, -0.03338623046875, -0.030029296875, -0.02667236328125, -0.0233154296875, -0.01995849609375, -0.0166015625, -0.01324462890625, -0.0098876953125, -0.00653076171875, -0.003173828125, 0.00018310546875, 0.0035400390625, 0.00689697265625, 0.01025390625, 0.01361083984375, 0.0169677734375, 0.02032470703125, 0.023681640625, 0.02703857421875, 0.0303955078125, 0.03375244140625, 0.037109375, 0.04046630859375, 0.0438232421875, 0.04718017578125, 0.050537109375, 0.05389404296875, 0.0572509765625, 0.06060791015625, 0.06396484375, 0.06732177734375, 0.0706787109375, 0.07403564453125, 0.077392578125, 0.08074951171875, 0.0841064453125, 0.08746337890625, 0.0908203125, 0.09417724609375, 0.0975341796875, 0.10089111328125, 0.104248046875, 0.10760498046875, 0.1109619140625, 0.11431884765625, 0.11767578125, 0.12103271484375, 0.1243896484375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 5.0, 8.0, 21.0, 49.0, 121.0, 202.0, 266.0, 177.0, 105.0, 31.0, 12.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9393589496612549, -0.9111850261688232, -0.8830111622810364, -0.8548372983932495, -0.8266633749008179, -0.7984894514083862, -0.7703155875205994, -0.7421417236328125, -0.7139678001403809, -0.6857938766479492, -0.6576200127601624, -0.6294461488723755, -0.6012722253799438, -0.5730983018875122, -0.5449244379997253, -0.5167505741119385, -0.48857665061950684, -0.4604027569293976, -0.43222886323928833, -0.4040549695491791, -0.3758810758590698, -0.34770718216896057, -0.3195332884788513, -0.29135939478874207, -0.2631855010986328, -0.23501160740852356, -0.2068377137184143, -0.17866382002830505, -0.1504899263381958, -0.12231603264808655, -0.0941421389579773, -0.06596824526786804, -0.037794411182403564, -0.009620517492294312, 0.01855337619781494, 0.046727269887924194, 0.07490116357803345, 0.1030750572681427, 0.13124895095825195, 0.1594228446483612, 0.18759673833847046, 0.2157706320285797, 0.24394452571868896, 0.2721184194087982, 0.30029231309890747, 0.3284662067890167, 0.356640100479126, 0.38481399416923523, 0.4129878878593445, 0.44116178154945374, 0.469335675239563, 0.49750956892967224, 0.5256834626197815, 0.5538573265075684, 0.58203125, 0.6102051734924316, 0.6383790373802185, 0.6665529012680054, 0.694726824760437, 0.7229007482528687, 0.7510746121406555, 0.7792484760284424, 0.807422399520874, 0.8355963230133057, 0.8637701869010925]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 6.0, 3.0, 9.0, 7.0, 18.0, 13.0, 13.0, 15.0, 24.0, 27.0, 30.0, 34.0, 42.0, 31.0, 33.0, 36.0, 48.0, 45.0, 34.0, 48.0, 43.0, 32.0, 38.0, 37.0, 41.0, 31.0, 27.0, 36.0, 43.0, 30.0, 24.0, 21.0, 20.0, 11.0, 8.0, 10.0, 8.0, 5.0, 3.0, 3.0, 4.0, 1.0, 3.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 3.0], "bins": [-0.31077879667282104, -0.3014974594116211, -0.29221612215042114, -0.2829347550868988, -0.27365341782569885, -0.2643720805644989, -0.25509074330329895, -0.245809406042099, -0.23652805387973785, -0.2272467166185379, -0.21796536445617676, -0.2086840271949768, -0.19940268993377686, -0.1901213377714157, -0.18084000051021576, -0.17155864834785461, -0.16227731108665466, -0.1529959738254547, -0.14371462166309357, -0.13443328440189362, -0.12515193223953247, -0.11587059497833252, -0.10658925771713257, -0.09730791300535202, -0.08802656829357147, -0.07874522358179092, -0.06946387887001038, -0.060182541608810425, -0.05090119689702988, -0.04161985218524933, -0.03233851119875908, -0.02305717021226883, -0.013775825500488281, -0.004494482651352882, 0.0047868601977825165, 0.014068203046917915, 0.023349545896053314, 0.03263089060783386, 0.04191223159432411, 0.05119357258081436, 0.06047491729259491, 0.06975626200437546, 0.079037606716156, 0.08831894397735596, 0.0976002886891365, 0.10688163340091705, 0.116162970662117, 0.12544432282447815, 0.1347256600856781, 0.14400699734687805, 0.1532883495092392, 0.16256968677043915, 0.1718510389328003, 0.18113237619400024, 0.1904137134552002, 0.19969505071640015, 0.2089764028787613, 0.21825774013996124, 0.2275390923023224, 0.23682042956352234, 0.2461017668247223, 0.25538313388824463, 0.2646644711494446, 0.27394580841064453, 0.2832271456718445]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 2.0, 2.0, 2.0, 7.0, 6.0, 5.0, 9.0, 15.0, 15.0, 19.0, 30.0, 44.0, 64.0, 90.0, 174.0, 239.0, 387.0, 653.0, 1197.0, 2206.0, 4771.0, 11123.0, 29569.0, 91549.0, 340462.0, 398544.0, 109221.0, 34274.0, 12824.0, 5329.0, 2554.0, 1274.0, 748.0, 400.0, 256.0, 148.0, 93.0, 88.0, 56.0, 33.0, 26.0, 17.0, 11.0, 8.0, 9.0, 6.0, 5.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.238037109375, -0.23178482055664062, -0.22553253173828125, -0.21928024291992188, -0.2130279541015625, -0.20677566528320312, -0.20052337646484375, -0.19427108764648438, -0.188018798828125, -0.18176651000976562, -0.17551422119140625, -0.16926193237304688, -0.1630096435546875, -0.15675735473632812, -0.15050506591796875, -0.14425277709960938, -0.13800048828125, -0.13174819946289062, -0.12549591064453125, -0.11924362182617188, -0.1129913330078125, -0.10673904418945312, -0.10048675537109375, -0.09423446655273438, -0.087982177734375, -0.08172988891601562, -0.07547760009765625, -0.06922531127929688, -0.0629730224609375, -0.056720733642578125, -0.05046844482421875, -0.044216156005859375, -0.0379638671875, -0.031711578369140625, -0.02545928955078125, -0.019207000732421875, -0.0129547119140625, -0.006702423095703125, -0.00045013427734375, 0.005802154541015625, 0.012054443359375, 0.018306732177734375, 0.02455902099609375, 0.030811309814453125, 0.0370635986328125, 0.043315887451171875, 0.04956817626953125, 0.055820465087890625, 0.06207275390625, 0.06832504272460938, 0.07457733154296875, 0.08082962036132812, 0.0870819091796875, 0.09333419799804688, 0.09958648681640625, 0.10583877563476562, 0.112091064453125, 0.11834335327148438, 0.12459564208984375, 0.13084793090820312, 0.1371002197265625, 0.14335250854492188, 0.14960479736328125, 0.15585708618164062, 0.162109375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 2.0, 10.0, 6.0, 11.0, 15.0, 16.0, 20.0, 19.0, 35.0, 40.0, 60.0, 55.0, 70.0, 71.0, 61.0, 67.0, 59.0, 57.0, 64.0, 48.0, 56.0, 39.0, 46.0, 19.0, 13.0, 14.0, 6.0, 7.0, 6.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.10858154296875, -0.10579109191894531, -0.10300064086914062, -0.10021018981933594, -0.09741973876953125, -0.09462928771972656, -0.09183883666992188, -0.08904838562011719, -0.0862579345703125, -0.08346748352050781, -0.08067703247070312, -0.07788658142089844, -0.07509613037109375, -0.07230567932128906, -0.06951522827148438, -0.06672477722167969, -0.063934326171875, -0.06114387512207031, -0.058353424072265625, -0.05556297302246094, -0.05277252197265625, -0.04998207092285156, -0.047191619873046875, -0.04440116882324219, -0.0416107177734375, -0.03882026672363281, -0.036029815673828125, -0.03323936462402344, -0.03044891357421875, -0.027658462524414062, -0.024868011474609375, -0.022077560424804688, -0.019287109375, -0.016496658325195312, -0.013706207275390625, -0.010915756225585938, -0.00812530517578125, -0.0053348541259765625, -0.002544403076171875, 0.0002460479736328125, 0.0030364990234375, 0.0058269500732421875, 0.008617401123046875, 0.011407852172851562, 0.01419830322265625, 0.016988754272460938, 0.019779205322265625, 0.022569656372070312, 0.025360107421875, 0.028150558471679688, 0.030941009521484375, 0.03373146057128906, 0.03652191162109375, 0.03931236267089844, 0.042102813720703125, 0.04489326477050781, 0.0476837158203125, 0.05047416687011719, 0.053264617919921875, 0.05605506896972656, 0.05884552001953125, 0.06163597106933594, 0.06442642211914062, 0.06721687316894531, 0.07000732421875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 6.0, 7.0, 11.0, 18.0, 18.0, 31.0, 39.0, 67.0, 96.0, 132.0, 219.0, 400.0, 772.0, 1893.0, 6774.0, 38402.0, 326779.0, 584060.0, 72832.0, 11078.0, 2696.0, 1000.0, 468.0, 267.0, 170.0, 87.0, 63.0, 41.0, 35.0, 26.0, 22.0, 14.0, 6.0, 4.0, 7.0, 5.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.356689453125, -0.34734153747558594, -0.3379936218261719, -0.3286457061767578, -0.31929779052734375, -0.3099498748779297, -0.3006019592285156, -0.29125404357910156, -0.2819061279296875, -0.27255821228027344, -0.2632102966308594, -0.2538623809814453, -0.24451446533203125, -0.2351665496826172, -0.22581863403320312, -0.21647071838378906, -0.207122802734375, -0.19777488708496094, -0.18842697143554688, -0.1790790557861328, -0.16973114013671875, -0.1603832244873047, -0.15103530883789062, -0.14168739318847656, -0.1323394775390625, -0.12299156188964844, -0.11364364624023438, -0.10429573059082031, -0.09494781494140625, -0.08559989929199219, -0.07625198364257812, -0.06690406799316406, -0.05755615234375, -0.04820823669433594, -0.038860321044921875, -0.029512405395507812, -0.02016448974609375, -0.010816574096679688, -0.001468658447265625, 0.007879257202148438, 0.0172271728515625, 0.026575088500976562, 0.035923004150390625, 0.04527091979980469, 0.05461883544921875, 0.06396675109863281, 0.07331466674804688, 0.08266258239746094, 0.092010498046875, 0.10135841369628906, 0.11070632934570312, 0.12005424499511719, 0.12940216064453125, 0.1387500762939453, 0.14809799194335938, 0.15744590759277344, 0.1667938232421875, 0.17614173889160156, 0.18548965454101562, 0.1948375701904297, 0.20418548583984375, 0.2135334014892578, 0.22288131713867188, 0.23222923278808594, 0.2415771484375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 4.0, 5.0, 5.0, 5.0, 13.0, 14.0, 19.0, 22.0, 16.0, 25.0, 26.0, 38.0, 36.0, 36.0, 42.0, 44.0, 53.0, 47.0, 55.0, 45.0, 44.0, 42.0, 53.0, 46.0, 43.0, 50.0, 36.0, 28.0, 25.0, 16.0, 14.0, 13.0, 11.0, 7.0, 5.0, 5.0, 3.0, 2.0, 6.0, 3.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.26416015625, -0.2552604675292969, -0.24636077880859375, -0.23746109008789062, -0.2285614013671875, -0.21966171264648438, -0.21076202392578125, -0.20186233520507812, -0.192962646484375, -0.18406295776367188, -0.17516326904296875, -0.16626358032226562, -0.1573638916015625, -0.14846420288085938, -0.13956451416015625, -0.13066482543945312, -0.12176513671875, -0.11286544799804688, -0.10396575927734375, -0.09506607055664062, -0.0861663818359375, -0.07726669311523438, -0.06836700439453125, -0.059467315673828125, -0.050567626953125, -0.041667938232421875, -0.03276824951171875, -0.023868560791015625, -0.0149688720703125, -0.006069183349609375, 0.00283050537109375, 0.011730194091796875, 0.0206298828125, 0.029529571533203125, 0.03842926025390625, 0.047328948974609375, 0.0562286376953125, 0.06512832641601562, 0.07402801513671875, 0.08292770385742188, 0.091827392578125, 0.10072708129882812, 0.10962677001953125, 0.11852645874023438, 0.1274261474609375, 0.13632583618164062, 0.14522552490234375, 0.15412521362304688, 0.16302490234375, 0.17192459106445312, 0.18082427978515625, 0.18972396850585938, 0.1986236572265625, 0.20752334594726562, 0.21642303466796875, 0.22532272338867188, 0.234222412109375, 0.24312210083007812, 0.25202178955078125, 0.2609214782714844, 0.2698211669921875, 0.2787208557128906, 0.28762054443359375, 0.2965202331542969, 0.305419921875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 6.0, 13.0, 17.0, 42.0, 94.0, 272.0, 1763.0, 104284.0, 935661.0, 5692.0, 443.0, 146.0, 61.0, 28.0, 11.0, 7.0, 5.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.292236328125, -0.2801513671875, -0.26806640625, -0.2559814453125, -0.243896484375, -0.2318115234375, -0.2197265625, -0.2076416015625, -0.195556640625, -0.1834716796875, -0.17138671875, -0.1593017578125, -0.147216796875, -0.1351318359375, -0.123046875, -0.1109619140625, -0.098876953125, -0.0867919921875, -0.07470703125, -0.0626220703125, -0.050537109375, -0.0384521484375, -0.0263671875, -0.0142822265625, -0.002197265625, 0.0098876953125, 0.02197265625, 0.0340576171875, 0.046142578125, 0.0582275390625, 0.0703125, 0.0823974609375, 0.094482421875, 0.1065673828125, 0.11865234375, 0.1307373046875, 0.142822265625, 0.1549072265625, 0.1669921875, 0.1790771484375, 0.191162109375, 0.2032470703125, 0.21533203125, 0.2274169921875, 0.239501953125, 0.2515869140625, 0.263671875, 0.2757568359375, 0.287841796875, 0.2999267578125, 0.31201171875, 0.3240966796875, 0.336181640625, 0.3482666015625, 0.3603515625, 0.3724365234375, 0.384521484375, 0.3966064453125, 0.40869140625, 0.4207763671875, 0.432861328125, 0.4449462890625, 0.45703125, 0.4691162109375, 0.481201171875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 5.0, 5.0, 6.0, 7.0, 15.0, 15.0, 15.0, 25.0, 25.0, 35.0, 36.0, 51.0, 55.0, 73.0, 109.0, 114.0, 81.0, 76.0, 64.0, 42.0, 36.0, 26.0, 18.0, 11.0, 13.0, 13.0, 10.0, 6.0, 2.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.802248001098633e-05, -7.591862231492996e-05, -7.38147646188736e-05, -7.171090692281723e-05, -6.960704922676086e-05, -6.75031915307045e-05, -6.539933383464813e-05, -6.329547613859177e-05, -6.11916184425354e-05, -5.9087760746479034e-05, -5.698390305042267e-05, -5.48800453543663e-05, -5.2776187658309937e-05, -5.067232996225357e-05, -4.8568472266197205e-05, -4.646461457014084e-05, -4.436075687408447e-05, -4.225689917802811e-05, -4.015304148197174e-05, -3.8049183785915375e-05, -3.594532608985901e-05, -3.384146839380264e-05, -3.173761069774628e-05, -2.963375300168991e-05, -2.7529895305633545e-05, -2.542603760957718e-05, -2.3322179913520813e-05, -2.1218322217464447e-05, -1.911446452140808e-05, -1.7010606825351715e-05, -1.4906749129295349e-05, -1.2802891433238983e-05, -1.0699033737182617e-05, -8.595176041126251e-06, -6.491318345069885e-06, -4.387460649013519e-06, -2.2836029529571533e-06, -1.7974525690078735e-07, 1.9241124391555786e-06, 4.027970135211945e-06, 6.1318278312683105e-06, 8.235685527324677e-06, 1.0339543223381042e-05, 1.2443400919437408e-05, 1.4547258615493774e-05, 1.665111631155014e-05, 1.8754974007606506e-05, 2.0858831703662872e-05, 2.2962689399719238e-05, 2.5066547095775604e-05, 2.717040479183197e-05, 2.9274262487888336e-05, 3.13781201839447e-05, 3.348197788000107e-05, 3.5585835576057434e-05, 3.76896932721138e-05, 3.9793550968170166e-05, 4.189740866422653e-05, 4.40012663602829e-05, 4.6105124056339264e-05, 4.820898175239563e-05, 5.0312839448451996e-05, 5.241669714450836e-05, 5.452055484056473e-05, 5.6624412536621094e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 8.0, 2.0, 6.0, 7.0, 18.0, 28.0, 55.0, 82.0, 175.0, 495.0, 2383.0, 77130.0, 953512.0, 13060.0, 1049.0, 274.0, 121.0, 56.0, 42.0, 19.0, 17.0, 11.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.373046875, -0.3621673583984375, -0.351287841796875, -0.3404083251953125, -0.32952880859375, -0.3186492919921875, -0.307769775390625, -0.2968902587890625, -0.2860107421875, -0.2751312255859375, -0.264251708984375, -0.2533721923828125, -0.24249267578125, -0.2316131591796875, -0.220733642578125, -0.2098541259765625, -0.198974609375, -0.1880950927734375, -0.177215576171875, -0.1663360595703125, -0.15545654296875, -0.1445770263671875, -0.133697509765625, -0.1228179931640625, -0.1119384765625, -0.1010589599609375, -0.090179443359375, -0.0792999267578125, -0.06842041015625, -0.0575408935546875, -0.046661376953125, -0.0357818603515625, -0.02490234375, -0.0140228271484375, -0.003143310546875, 0.0077362060546875, 0.01861572265625, 0.0294952392578125, 0.040374755859375, 0.0512542724609375, 0.0621337890625, 0.0730133056640625, 0.083892822265625, 0.0947723388671875, 0.10565185546875, 0.1165313720703125, 0.127410888671875, 0.1382904052734375, 0.149169921875, 0.1600494384765625, 0.170928955078125, 0.1818084716796875, 0.19268798828125, 0.2035675048828125, 0.214447021484375, 0.2253265380859375, 0.2362060546875, 0.2470855712890625, 0.257965087890625, 0.2688446044921875, 0.27972412109375, 0.2906036376953125, 0.301483154296875, 0.3123626708984375, 0.3232421875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 9.0, 8.0, 16.0, 34.0, 57.0, 187.0, 386.0, 172.0, 61.0, 37.0, 25.0, 9.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3779296875, -0.3704566955566406, -0.36298370361328125, -0.3555107116699219, -0.3480377197265625, -0.3405647277832031, -0.33309173583984375, -0.3256187438964844, -0.318145751953125, -0.3106727600097656, -0.30319976806640625, -0.2957267761230469, -0.2882537841796875, -0.2807807922363281, -0.27330780029296875, -0.2658348083496094, -0.25836181640625, -0.2508888244628906, -0.24341583251953125, -0.23594284057617188, -0.2284698486328125, -0.22099685668945312, -0.21352386474609375, -0.20605087280273438, -0.198577880859375, -0.19110488891601562, -0.18363189697265625, -0.17615890502929688, -0.1686859130859375, -0.16121292114257812, -0.15373992919921875, -0.14626693725585938, -0.1387939453125, -0.13132095336914062, -0.12384796142578125, -0.11637496948242188, -0.1089019775390625, -0.10142898559570312, -0.09395599365234375, -0.08648300170898438, -0.079010009765625, -0.07153701782226562, -0.06406402587890625, -0.056591033935546875, -0.0491180419921875, -0.041645050048828125, -0.03417205810546875, -0.026699066162109375, -0.01922607421875, -0.011753082275390625, -0.00428009033203125, 0.003192901611328125, 0.0106658935546875, 0.018138885498046875, 0.02561187744140625, 0.033084869384765625, 0.040557861328125, 0.048030853271484375, 0.05550384521484375, 0.06297683715820312, 0.0704498291015625, 0.07792282104492188, 0.08539581298828125, 0.09286880493164062, 0.100341796875]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 2.0, 1.0, 3.0, 8.0, 12.0, 36.0, 71.0, 92.0, 160.0, 184.0, 191.0, 118.0, 66.0, 18.0, 17.0, 13.0, 5.0, 5.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.6501035690307617, -2.590501308441162, -2.5308990478515625, -2.471296787261963, -2.4116945266723633, -2.3520922660827637, -2.292490005493164, -2.2328879833221436, -2.173285722732544, -2.1136834621429443, -2.0540812015533447, -1.9944789409637451, -1.934876799583435, -1.8752745389938354, -1.8156722784042358, -1.7560700178146362, -1.6964677572250366, -1.636865496635437, -1.5772632360458374, -1.5176610946655273, -1.4580588340759277, -1.3984565734863281, -1.3388543128967285, -1.279252052307129, -1.2196497917175293, -1.1600475311279297, -1.10044527053833, -1.0408430099487305, -0.9812408685684204, -0.9216386079788208, -0.8620363473892212, -0.8024340867996216, -0.7428319454193115, -0.6832296848297119, -0.6236274838447571, -0.5640252232551575, -0.5044230222702026, -0.444820761680603, -0.3852185010910034, -0.3256162703037262, -0.266014039516449, -0.20641180872917175, -0.14680956304073334, -0.08720731735229492, -0.0276050865650177, 0.03199714422225952, 0.09159940481185913, 0.15120163559913635, 0.21080386638641357, 0.2704060971736908, 0.330008327960968, 0.3896105885505676, 0.44921281933784485, 0.5088150501251221, 0.5684173107147217, 0.6280195713043213, 0.6876217722892761, 0.7472240328788757, 0.8068262338638306, 0.8664284944534302, 0.9260307550430298, 0.9856329560279846, 1.0452351570129395, 1.104837417602539, 1.1644396781921387]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 4.0, 1.0, 4.0, 6.0, 6.0, 9.0, 7.0, 16.0, 17.0, 17.0, 22.0, 22.0, 22.0, 32.0, 30.0, 38.0, 36.0, 35.0, 29.0, 38.0, 51.0, 34.0, 41.0, 35.0, 47.0, 40.0, 27.0, 36.0, 24.0, 26.0, 28.0, 27.0, 28.0, 19.0, 23.0, 17.0, 16.0, 16.0, 12.0, 17.0, 13.0, 3.0, 8.0, 4.0, 8.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 3.0], "bins": [-1.2632848024368286, -1.226023554801941, -1.1887624263763428, -1.151501178741455, -1.1142399311065674, -1.0769786834716797, -1.039717435836792, -1.0024563074111938, -0.9651950597763062, -0.9279338121414185, -0.8906726241111755, -0.8534114360809326, -0.8161501884460449, -0.7788889408111572, -0.7416277527809143, -0.7043665647506714, -0.6671053171157837, -0.629844069480896, -0.5925828814506531, -0.5553216934204102, -0.5180604457855225, -0.48079922795295715, -0.44353801012039185, -0.40627679228782654, -0.36901557445526123, -0.3317543566226959, -0.2944931387901306, -0.2572319209575653, -0.219970703125, -0.1827094852924347, -0.14544826745986938, -0.10818704962730408, -0.07092595100402832, -0.03366473317146301, 0.003596484661102295, 0.0408577024936676, 0.07811892032623291, 0.11538013815879822, 0.15264135599136353, 0.18990257382392883, 0.22716379165649414, 0.26442500948905945, 0.30168622732162476, 0.33894744515419006, 0.37620866298675537, 0.4134698808193207, 0.450731098651886, 0.4879923164844513, 0.5252535343170166, 0.5625147819519043, 0.5997759699821472, 0.6370371580123901, 0.6742984056472778, 0.7115596532821655, 0.7488208413124084, 0.7860820293426514, 0.8233432769775391, 0.8606045246124268, 0.8978657126426697, 0.9351269006729126, 0.9723881483078003, 1.009649395942688, 1.0469105243682861, 1.0841717720031738, 1.1214330196380615]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 8.0, 10.0, 4.0, 6.0, 10.0, 19.0, 21.0, 29.0, 42.0, 50.0, 70.0, 105.0, 163.0, 267.0, 440.0, 696.0, 1275.0, 2391.0, 5196.0, 11996.0, 35396.0, 192521.0, 3571995.0, 300830.0, 45103.0, 14079.0, 5804.0, 2716.0, 1368.0, 689.0, 360.0, 229.0, 151.0, 79.0, 56.0, 35.0, 27.0, 10.0, 11.0, 10.0, 5.0, 5.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.2342529296875, -0.2281818389892578, -0.22211074829101562, -0.21603965759277344, -0.20996856689453125, -0.20389747619628906, -0.19782638549804688, -0.1917552947998047, -0.1856842041015625, -0.1796131134033203, -0.17354202270507812, -0.16747093200683594, -0.16139984130859375, -0.15532875061035156, -0.14925765991210938, -0.1431865692138672, -0.137115478515625, -0.1310443878173828, -0.12497329711914062, -0.11890220642089844, -0.11283111572265625, -0.10676002502441406, -0.10068893432617188, -0.09461784362792969, -0.0885467529296875, -0.08247566223144531, -0.07640457153320312, -0.07033348083496094, -0.06426239013671875, -0.05819129943847656, -0.052120208740234375, -0.04604911804199219, -0.03997802734375, -0.03390693664550781, -0.027835845947265625, -0.021764755249023438, -0.01569366455078125, -0.009622573852539062, -0.003551483154296875, 0.0025196075439453125, 0.0085906982421875, 0.014661788940429688, 0.020732879638671875, 0.026803970336914062, 0.03287506103515625, 0.03894615173339844, 0.045017242431640625, 0.05108833312988281, 0.057159423828125, 0.06323051452636719, 0.06930160522460938, 0.07537269592285156, 0.08144378662109375, 0.08751487731933594, 0.09358596801757812, 0.09965705871582031, 0.1057281494140625, 0.11179924011230469, 0.11787033081054688, 0.12394142150878906, 0.13001251220703125, 0.13608360290527344, 0.14215469360351562, 0.1482257843017578, 0.154296875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 8.0, 6.0, 10.0, 16.0, 23.0, 17.0, 35.0, 30.0, 48.0, 51.0, 54.0, 70.0, 75.0, 68.0, 58.0, 62.0, 68.0, 56.0, 50.0, 50.0, 39.0, 38.0, 25.0, 8.0, 17.0, 3.0, 3.0, 6.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11181640625, -0.10884952545166016, -0.10588264465332031, -0.10291576385498047, -0.09994888305664062, -0.09698200225830078, -0.09401512145996094, -0.0910482406616211, -0.08808135986328125, -0.0851144790649414, -0.08214759826660156, -0.07918071746826172, -0.07621383666992188, -0.07324695587158203, -0.07028007507324219, -0.06731319427490234, -0.0643463134765625, -0.061379432678222656, -0.05841255187988281, -0.05544567108154297, -0.052478790283203125, -0.04951190948486328, -0.04654502868652344, -0.043578147888183594, -0.04061126708984375, -0.037644386291503906, -0.03467750549316406, -0.03171062469482422, -0.028743743896484375, -0.02577686309814453, -0.022809982299804688, -0.019843101501464844, -0.016876220703125, -0.013909339904785156, -0.010942459106445312, -0.007975578308105469, -0.005008697509765625, -0.0020418167114257812, 0.0009250640869140625, 0.0038919448852539062, 0.00685882568359375, 0.009825706481933594, 0.012792587280273438, 0.01575946807861328, 0.018726348876953125, 0.02169322967529297, 0.024660110473632812, 0.027626991271972656, 0.0305938720703125, 0.033560752868652344, 0.03652763366699219, 0.03949451446533203, 0.042461395263671875, 0.04542827606201172, 0.04839515686035156, 0.051362037658691406, 0.05432891845703125, 0.057295799255371094, 0.06026268005371094, 0.06322956085205078, 0.06619644165039062, 0.06916332244873047, 0.07213020324707031, 0.07509708404541016, 0.07806396484375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 12.0, 10.0, 25.0, 69.0, 112.0, 249.0, 563.0, 1478.0, 4396.0, 20066.0, 211244.0, 3792200.0, 141614.0, 16151.0, 3900.0, 1245.0, 520.0, 229.0, 96.0, 56.0, 20.0, 16.0, 7.0, 4.0, 0.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.234375, -0.22583389282226562, -0.21729278564453125, -0.20875167846679688, -0.2002105712890625, -0.19166946411132812, -0.18312835693359375, -0.17458724975585938, -0.166046142578125, -0.15750503540039062, -0.14896392822265625, -0.14042282104492188, -0.1318817138671875, -0.12334060668945312, -0.11479949951171875, -0.10625839233398438, -0.09771728515625, -0.08917617797851562, -0.08063507080078125, -0.07209396362304688, -0.0635528564453125, -0.055011749267578125, -0.04647064208984375, -0.037929534912109375, -0.029388427734375, -0.020847320556640625, -0.01230621337890625, -0.003765106201171875, 0.0047760009765625, 0.013317108154296875, 0.02185821533203125, 0.030399322509765625, 0.0389404296875, 0.047481536865234375, 0.05602264404296875, 0.06456375122070312, 0.0731048583984375, 0.08164596557617188, 0.09018707275390625, 0.09872817993164062, 0.107269287109375, 0.11581039428710938, 0.12435150146484375, 0.13289260864257812, 0.1414337158203125, 0.14997482299804688, 0.15851593017578125, 0.16705703735351562, 0.17559814453125, 0.18413925170898438, 0.19268035888671875, 0.20122146606445312, 0.2097625732421875, 0.21830368041992188, 0.22684478759765625, 0.23538589477539062, 0.243927001953125, 0.2524681091308594, 0.26100921630859375, 0.2695503234863281, 0.2780914306640625, 0.2866325378417969, 0.29517364501953125, 0.3037147521972656, 0.312255859375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 3.0, 7.0, 7.0, 16.0, 23.0, 24.0, 50.0, 97.0, 253.0, 905.0, 1973.0, 444.0, 132.0, 62.0, 25.0, 15.0, 8.0, 11.0, 10.0, 4.0, 5.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11285400390625, -0.10912609100341797, -0.10539817810058594, -0.1016702651977539, -0.09794235229492188, -0.09421443939208984, -0.09048652648925781, -0.08675861358642578, -0.08303070068359375, -0.07930278778076172, -0.07557487487792969, -0.07184696197509766, -0.06811904907226562, -0.0643911361694336, -0.06066322326660156, -0.05693531036376953, -0.0532073974609375, -0.04947948455810547, -0.04575157165527344, -0.042023658752441406, -0.038295745849609375, -0.034567832946777344, -0.030839920043945312, -0.02711200714111328, -0.02338409423828125, -0.01965618133544922, -0.015928268432617188, -0.012200355529785156, -0.008472442626953125, -0.004744529724121094, -0.0010166168212890625, 0.0027112960815429688, 0.006439208984375, 0.010167121887207031, 0.013895034790039062, 0.017622947692871094, 0.021350860595703125, 0.025078773498535156, 0.028806686401367188, 0.03253459930419922, 0.03626251220703125, 0.03999042510986328, 0.04371833801269531, 0.047446250915527344, 0.051174163818359375, 0.054902076721191406, 0.05862998962402344, 0.06235790252685547, 0.0660858154296875, 0.06981372833251953, 0.07354164123535156, 0.0772695541381836, 0.08099746704101562, 0.08472537994384766, 0.08845329284667969, 0.09218120574951172, 0.09590911865234375, 0.09963703155517578, 0.10336494445800781, 0.10709285736083984, 0.11082077026367188, 0.1145486831665039, 0.11827659606933594, 0.12200450897216797, 0.125732421875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 9.0, 61.0, 253.0, 390.0, 220.0, 60.0, 16.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.628408432006836, -1.5903983116149902, -1.5523881912231445, -1.5143780708312988, -1.4763679504394531, -1.4383577108383179, -1.4003475904464722, -1.3623374700546265, -1.3243273496627808, -1.286317229270935, -1.2483071088790894, -1.2102969884872437, -1.1722867488861084, -1.1342766284942627, -1.096266508102417, -1.0582563877105713, -1.0202462673187256, -0.9822361469268799, -0.9442260265350342, -0.9062158465385437, -0.868205726146698, -0.8301956057548523, -0.7921854257583618, -0.7541753053665161, -0.7161651849746704, -0.6781550645828247, -0.640144944190979, -0.6021347641944885, -0.5641246438026428, -0.5261145234107971, -0.48810437321662903, -0.45009422302246094, -0.41208410263061523, -0.37407398223876953, -0.33606383204460144, -0.29805368185043335, -0.26004356145858765, -0.22203342616558075, -0.18402329087257385, -0.14601314067840576, -0.10800302028656006, -0.06999288499355316, -0.031982749700546265, 0.006027385592460632, 0.04403752088546753, 0.08204765617847443, 0.12005779147148132, 0.15806794166564941, 0.19607806205749512, 0.23408819735050201, 0.2720983326435089, 0.310108482837677, 0.3481186032295227, 0.3861287236213684, 0.4241388738155365, 0.4621490240097046, 0.5001591444015503, 0.538169264793396, 0.5761793851852417, 0.6141895651817322, 0.6521996855735779, 0.6902098059654236, 0.7282199859619141, 0.7662301063537598, 0.8042402267456055]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 9.0, 3.0, 10.0, 2.0, 6.0, 6.0, 12.0, 9.0, 14.0, 12.0, 18.0, 16.0, 25.0, 27.0, 25.0, 24.0, 28.0, 36.0, 35.0, 45.0, 41.0, 41.0, 37.0, 51.0, 39.0, 41.0, 41.0, 48.0, 34.0, 35.0, 30.0, 28.0, 19.0, 18.0, 14.0, 22.0, 12.0, 22.0, 17.0, 7.0, 14.0, 9.0, 10.0, 4.0, 3.0, 4.0, 1.0, 6.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.24504172801971436, -0.2374468445777893, -0.22985196113586426, -0.22225706279277802, -0.21466217935085297, -0.20706729590892792, -0.19947239756584167, -0.19187751412391663, -0.18428263068199158, -0.17668774724006653, -0.16909286379814148, -0.16149796545505524, -0.1539030820131302, -0.14630819857120514, -0.1387133002281189, -0.13111841678619385, -0.1235235333442688, -0.11592864990234375, -0.1083337590098381, -0.10073886811733246, -0.09314398467540741, -0.08554910123348236, -0.07795421034097672, -0.07035931944847107, -0.06276443600654602, -0.05516954883933067, -0.047574661672115326, -0.03997977450489998, -0.03238488733768463, -0.024790000170469284, -0.017195113003253937, -0.00960022583603859, -0.002005338668823242, 0.005589548498392105, 0.013184435665607452, 0.0207793228328228, 0.028374210000038147, 0.035969097167253494, 0.04356398433446884, 0.05115887150168419, 0.058753758668899536, 0.06634864211082458, 0.07394353300333023, 0.08153842389583588, 0.08913330733776093, 0.09672819077968597, 0.10432308167219162, 0.11191797256469727, 0.11951285600662231, 0.12710773944854736, 0.1347026228904724, 0.14229752123355865, 0.1498924046754837, 0.15748728811740875, 0.165082186460495, 0.17267706990242004, 0.1802719533443451, 0.18786683678627014, 0.1954617202281952, 0.20305661857128143, 0.21065150201320648, 0.21824638545513153, 0.22584128379821777, 0.23343616724014282, 0.24103105068206787]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 6.0, 4.0, 6.0, 17.0, 20.0, 26.0, 42.0, 64.0, 117.0, 201.0, 396.0, 813.0, 2214.0, 7504.0, 35840.0, 242770.0, 626100.0, 107117.0, 18207.0, 4266.0, 1445.0, 617.0, 297.0, 182.0, 88.0, 59.0, 45.0, 27.0, 18.0, 15.0, 6.0, 5.0, 2.0, 6.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.39892578125, -0.3887748718261719, -0.37862396240234375, -0.3684730529785156, -0.3583221435546875, -0.3481712341308594, -0.33802032470703125, -0.3278694152832031, -0.317718505859375, -0.3075675964355469, -0.29741668701171875, -0.2872657775878906, -0.2771148681640625, -0.2669639587402344, -0.25681304931640625, -0.24666213989257812, -0.23651123046875, -0.22636032104492188, -0.21620941162109375, -0.20605850219726562, -0.1959075927734375, -0.18575668334960938, -0.17560577392578125, -0.16545486450195312, -0.155303955078125, -0.14515304565429688, -0.13500213623046875, -0.12485122680664062, -0.1147003173828125, -0.10454940795898438, -0.09439849853515625, -0.08424758911132812, -0.0740966796875, -0.06394577026367188, -0.05379486083984375, -0.043643951416015625, -0.0334930419921875, -0.023342132568359375, -0.01319122314453125, -0.003040313720703125, 0.007110595703125, 0.017261505126953125, 0.02741241455078125, 0.037563323974609375, 0.0477142333984375, 0.057865142822265625, 0.06801605224609375, 0.07816696166992188, 0.08831787109375, 0.09846878051757812, 0.10861968994140625, 0.11877059936523438, 0.1289215087890625, 0.13907241821289062, 0.14922332763671875, 0.15937423706054688, 0.169525146484375, 0.17967605590820312, 0.18982696533203125, 0.19997787475585938, 0.2101287841796875, 0.22027969360351562, 0.23043060302734375, 0.24058151245117188, 0.250732421875]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 1.0, 7.0, 7.0, 8.0, 19.0, 17.0, 27.0, 29.0, 26.0, 53.0, 53.0, 52.0, 70.0, 68.0, 64.0, 74.0, 51.0, 71.0, 62.0, 53.0, 42.0, 43.0, 37.0, 16.0, 22.0, 7.0, 8.0, 3.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1064453125, -0.103546142578125, -0.10064697265625, -0.097747802734375, -0.0948486328125, -0.091949462890625, -0.08905029296875, -0.086151123046875, -0.083251953125, -0.080352783203125, -0.07745361328125, -0.074554443359375, -0.0716552734375, -0.068756103515625, -0.06585693359375, -0.062957763671875, -0.06005859375, -0.057159423828125, -0.05426025390625, -0.051361083984375, -0.0484619140625, -0.045562744140625, -0.04266357421875, -0.039764404296875, -0.036865234375, -0.033966064453125, -0.03106689453125, -0.028167724609375, -0.0252685546875, -0.022369384765625, -0.01947021484375, -0.016571044921875, -0.013671875, -0.010772705078125, -0.00787353515625, -0.004974365234375, -0.0020751953125, 0.000823974609375, 0.00372314453125, 0.006622314453125, 0.009521484375, 0.012420654296875, 0.01531982421875, 0.018218994140625, 0.0211181640625, 0.024017333984375, 0.02691650390625, 0.029815673828125, 0.03271484375, 0.035614013671875, 0.03851318359375, 0.041412353515625, 0.0443115234375, 0.047210693359375, 0.05010986328125, 0.053009033203125, 0.055908203125, 0.058807373046875, 0.06170654296875, 0.064605712890625, 0.0675048828125, 0.070404052734375, 0.07330322265625, 0.076202392578125, 0.0791015625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 1.0, 1.0, 2.0, 6.0, 7.0, 8.0, 12.0, 15.0, 31.0, 33.0, 43.0, 77.0, 109.0, 192.0, 343.0, 692.0, 1774.0, 5332.0, 18847.0, 75990.0, 337740.0, 460527.0, 108629.0, 26656.0, 7317.0, 2293.0, 870.0, 388.0, 225.0, 111.0, 89.0, 63.0, 44.0, 15.0, 24.0, 11.0, 9.0, 6.0, 10.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1990966796875, -0.1924877166748047, -0.18587875366210938, -0.17926979064941406, -0.17266082763671875, -0.16605186462402344, -0.15944290161132812, -0.1528339385986328, -0.1462249755859375, -0.1396160125732422, -0.13300704956054688, -0.12639808654785156, -0.11978912353515625, -0.11318016052246094, -0.10657119750976562, -0.09996223449707031, -0.093353271484375, -0.08674430847167969, -0.08013534545898438, -0.07352638244628906, -0.06691741943359375, -0.06030845642089844, -0.053699493408203125, -0.04709053039550781, -0.0404815673828125, -0.03387260437011719, -0.027263641357421875, -0.020654678344726562, -0.01404571533203125, -0.0074367523193359375, -0.000827789306640625, 0.0057811737060546875, 0.01239013671875, 0.018999099731445312, 0.025608062744140625, 0.03221702575683594, 0.03882598876953125, 0.04543495178222656, 0.052043914794921875, 0.05865287780761719, 0.0652618408203125, 0.07187080383300781, 0.07847976684570312, 0.08508872985839844, 0.09169769287109375, 0.09830665588378906, 0.10491561889648438, 0.11152458190917969, 0.118133544921875, 0.12474250793457031, 0.13135147094726562, 0.13796043395996094, 0.14456939697265625, 0.15117835998535156, 0.15778732299804688, 0.1643962860107422, 0.1710052490234375, 0.1776142120361328, 0.18422317504882812, 0.19083213806152344, 0.19744110107421875, 0.20405006408691406, 0.21065902709960938, 0.2172679901123047, 0.223876953125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 2.0, 3.0, 6.0, 8.0, 6.0, 11.0, 12.0, 11.0, 11.0, 19.0, 12.0, 29.0, 25.0, 36.0, 29.0, 35.0, 29.0, 28.0, 40.0, 39.0, 44.0, 41.0, 53.0, 37.0, 39.0, 43.0, 40.0, 41.0, 33.0, 27.0, 35.0, 24.0, 28.0, 19.0, 17.0, 16.0, 11.0, 14.0, 13.0, 11.0, 4.0, 4.0, 2.0, 6.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2291259765625, -0.22152137756347656, -0.21391677856445312, -0.2063121795654297, -0.19870758056640625, -0.1911029815673828, -0.18349838256835938, -0.17589378356933594, -0.1682891845703125, -0.16068458557128906, -0.15307998657226562, -0.1454753875732422, -0.13787078857421875, -0.1302661895751953, -0.12266159057617188, -0.11505699157714844, -0.107452392578125, -0.09984779357910156, -0.09224319458007812, -0.08463859558105469, -0.07703399658203125, -0.06942939758300781, -0.061824798583984375, -0.05422019958496094, -0.0466156005859375, -0.03901100158691406, -0.031406402587890625, -0.023801803588867188, -0.01619720458984375, -0.008592605590820312, -0.000988006591796875, 0.0066165924072265625, 0.01422119140625, 0.021825790405273438, 0.029430389404296875, 0.03703498840332031, 0.04463958740234375, 0.05224418640136719, 0.059848785400390625, 0.06745338439941406, 0.0750579833984375, 0.08266258239746094, 0.09026718139648438, 0.09787178039550781, 0.10547637939453125, 0.11308097839355469, 0.12068557739257812, 0.12829017639160156, 0.135894775390625, 0.14349937438964844, 0.15110397338867188, 0.1587085723876953, 0.16631317138671875, 0.1739177703857422, 0.18152236938476562, 0.18912696838378906, 0.1967315673828125, 0.20433616638183594, 0.21194076538085938, 0.2195453643798828, 0.22714996337890625, 0.2347545623779297, 0.24235916137695312, 0.24996376037597656, 0.257568359375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 9.0, 15.0, 30.0, 102.0, 189.0, 542.0, 1255.0, 3471.0, 15023.0, 189174.0, 787009.0, 42283.0, 6275.0, 1870.0, 732.0, 309.0, 143.0, 56.0, 27.0, 8.0, 7.0, 11.0, 2.0, 6.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.150390625, -0.14572525024414062, -0.14105987548828125, -0.13639450073242188, -0.1317291259765625, -0.12706375122070312, -0.12239837646484375, -0.11773300170898438, -0.113067626953125, -0.10840225219726562, -0.10373687744140625, -0.09907150268554688, -0.0944061279296875, -0.08974075317382812, -0.08507537841796875, -0.08041000366210938, -0.07574462890625, -0.07107925415039062, -0.06641387939453125, -0.061748504638671875, -0.0570831298828125, -0.052417755126953125, -0.04775238037109375, -0.043087005615234375, -0.038421630859375, -0.033756256103515625, -0.02909088134765625, -0.024425506591796875, -0.0197601318359375, -0.015094757080078125, -0.01042938232421875, -0.005764007568359375, -0.0010986328125, 0.003566741943359375, 0.00823211669921875, 0.012897491455078125, 0.0175628662109375, 0.022228240966796875, 0.02689361572265625, 0.031558990478515625, 0.036224365234375, 0.040889739990234375, 0.04555511474609375, 0.050220489501953125, 0.0548858642578125, 0.059551239013671875, 0.06421661376953125, 0.06888198852539062, 0.07354736328125, 0.07821273803710938, 0.08287811279296875, 0.08754348754882812, 0.0922088623046875, 0.09687423706054688, 0.10153961181640625, 0.10620498657226562, 0.110870361328125, 0.11553573608398438, 0.12020111083984375, 0.12486648559570312, 0.1295318603515625, 0.13419723510742188, 0.13886260986328125, 0.14352798461914062, 0.148193359375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 5.0, 1.0, 4.0, 0.0, 3.0, 2.0, 4.0, 9.0, 5.0, 13.0, 13.0, 19.0, 22.0, 26.0, 21.0, 38.0, 59.0, 73.0, 88.0, 101.0, 111.0, 78.0, 59.0, 71.0, 51.0, 28.0, 20.0, 20.0, 10.0, 15.0, 10.0, 8.0, 4.0, 3.0, 4.0, 2.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.282329559326172e-05, -6.0916878283023834e-05, -5.901046097278595e-05, -5.7104043662548065e-05, -5.519762635231018e-05, -5.3291209042072296e-05, -5.138479173183441e-05, -4.947837442159653e-05, -4.757195711135864e-05, -4.566553980112076e-05, -4.3759122490882874e-05, -4.185270518064499e-05, -3.9946287870407104e-05, -3.803987056016922e-05, -3.6133453249931335e-05, -3.422703593969345e-05, -3.2320618629455566e-05, -3.0414201319217682e-05, -2.8507784008979797e-05, -2.6601366698741913e-05, -2.469494938850403e-05, -2.2788532078266144e-05, -2.088211476802826e-05, -1.8975697457790375e-05, -1.706928014755249e-05, -1.5162862837314606e-05, -1.3256445527076721e-05, -1.1350028216838837e-05, -9.443610906600952e-06, -7.537193596363068e-06, -5.630776286125183e-06, -3.7243589758872986e-06, -1.817941665649414e-06, 8.847564458847046e-08, 1.994892954826355e-06, 3.9013102650642395e-06, 5.807727575302124e-06, 7.714144885540009e-06, 9.620562195777893e-06, 1.1526979506015778e-05, 1.3433396816253662e-05, 1.5339814126491547e-05, 1.724623143672943e-05, 1.9152648746967316e-05, 2.10590660572052e-05, 2.2965483367443085e-05, 2.487190067768097e-05, 2.6778317987918854e-05, 2.8684735298156738e-05, 3.059115260839462e-05, 3.249756991863251e-05, 3.440398722887039e-05, 3.6310404539108276e-05, 3.821682184934616e-05, 4.0123239159584045e-05, 4.202965646982193e-05, 4.3936073780059814e-05, 4.58424910902977e-05, 4.7748908400535583e-05, 4.965532571077347e-05, 5.156174302101135e-05, 5.346816033124924e-05, 5.537457764148712e-05, 5.7280994951725006e-05, 5.918741226196289e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 6.0, 2.0, 6.0, 2.0, 7.0, 9.0, 20.0, 26.0, 52.0, 64.0, 112.0, 165.0, 370.0, 686.0, 1361.0, 2853.0, 7410.0, 29048.0, 225060.0, 689726.0, 69537.0, 13706.0, 4387.0, 1913.0, 880.0, 490.0, 255.0, 152.0, 87.0, 50.0, 29.0, 24.0, 11.0, 14.0, 8.0, 5.0, 7.0, 2.0, 3.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.103515625, -0.10020256042480469, -0.09688949584960938, -0.09357643127441406, -0.09026336669921875, -0.08695030212402344, -0.08363723754882812, -0.08032417297363281, -0.0770111083984375, -0.07369804382324219, -0.07038497924804688, -0.06707191467285156, -0.06375885009765625, -0.06044578552246094, -0.057132720947265625, -0.05381965637207031, -0.050506591796875, -0.04719352722167969, -0.043880462646484375, -0.04056739807128906, -0.03725433349609375, -0.03394126892089844, -0.030628204345703125, -0.027315139770507812, -0.0240020751953125, -0.020689010620117188, -0.017375946044921875, -0.014062881469726562, -0.01074981689453125, -0.0074367523193359375, -0.004123687744140625, -0.0008106231689453125, 0.00250244140625, 0.0058155059814453125, 0.009128570556640625, 0.012441635131835938, 0.01575469970703125, 0.019067764282226562, 0.022380828857421875, 0.025693893432617188, 0.0290069580078125, 0.03232002258300781, 0.035633087158203125, 0.03894615173339844, 0.04225921630859375, 0.04557228088378906, 0.048885345458984375, 0.05219841003417969, 0.055511474609375, 0.05882453918457031, 0.062137603759765625, 0.06545066833496094, 0.06876373291015625, 0.07207679748535156, 0.07538986206054688, 0.07870292663574219, 0.0820159912109375, 0.08532905578613281, 0.08864212036132812, 0.09195518493652344, 0.09526824951171875, 0.09858131408691406, 0.10189437866210938, 0.10520744323730469, 0.1085205078125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0, 4.0, 7.0, 5.0, 18.0, 16.0, 20.0, 23.0, 47.0, 45.0, 76.0, 143.0, 121.0, 133.0, 98.0, 64.0, 50.0, 35.0, 27.0, 18.0, 14.0, 12.0, 7.0, 7.0, 3.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08892822265625, -0.085845947265625, -0.082763671875, -0.079681396484375, -0.07659912109375, -0.073516845703125, -0.0704345703125, -0.067352294921875, -0.06427001953125, -0.061187744140625, -0.05810546875, -0.055023193359375, -0.05194091796875, -0.048858642578125, -0.0457763671875, -0.042694091796875, -0.03961181640625, -0.036529541015625, -0.033447265625, -0.030364990234375, -0.02728271484375, -0.024200439453125, -0.0211181640625, -0.018035888671875, -0.01495361328125, -0.011871337890625, -0.0087890625, -0.005706787109375, -0.00262451171875, 0.000457763671875, 0.0035400390625, 0.006622314453125, 0.00970458984375, 0.012786865234375, 0.015869140625, 0.018951416015625, 0.02203369140625, 0.025115966796875, 0.0281982421875, 0.031280517578125, 0.03436279296875, 0.037445068359375, 0.04052734375, 0.043609619140625, 0.04669189453125, 0.049774169921875, 0.0528564453125, 0.055938720703125, 0.05902099609375, 0.062103271484375, 0.065185546875, 0.068267822265625, 0.07135009765625, 0.074432373046875, 0.0775146484375, 0.080596923828125, 0.08367919921875, 0.086761474609375, 0.08984375, 0.092926025390625, 0.09600830078125, 0.099090576171875, 0.1021728515625, 0.105255126953125, 0.10833740234375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 8.0, 15.0, 60.0, 114.0, 232.0, 245.0, 185.0, 98.0, 32.0, 16.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8235732316970825, -1.7516988515853882, -1.6798243522644043, -1.60794997215271, -1.5360755920410156, -1.4642012119293213, -1.3923267126083374, -1.320452332496643, -1.2485778331756592, -1.1767034530639648, -1.104828953742981, -1.0329545736312866, -0.9610801935195923, -0.8892057538032532, -0.8173313140869141, -0.7454569339752197, -0.6735825538635254, -0.6017081141471863, -0.5298337340354919, -0.45795929431915283, -0.3860848844051361, -0.3142104744911194, -0.24233603477478027, -0.17046165466308594, -0.09858721494674683, -0.026712797582149506, 0.045161619782447815, 0.11703604459762573, 0.18891045451164246, 0.2607848644256592, 0.3326593041419983, 0.4045336842536926, 0.4764082431793213, 0.5482826828956604, 0.6201570630073547, 0.6920315027236938, 0.7639058828353882, 0.8357803225517273, 0.9076547622680664, 0.9795291423797607, 1.051403522491455, 1.1232779026031494, 1.1951524019241333, 1.2670267820358276, 1.338901162147522, 1.4107756614685059, 1.4826500415802002, 1.5545244216918945, 1.6263989210128784, 1.6982733011245728, 1.7701478004455566, 1.842022180557251, 1.9138965606689453, 1.9857709407806396, 2.057645320892334, 2.1295199394226074, 2.2013943195343018, 2.273268699645996, 2.3451430797576904, 2.4170174598693848, 2.488892078399658, 2.5607664585113525, 2.632640838623047, 2.704515218734741, 2.7763895988464355]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 3.0, 7.0, 5.0, 4.0, 11.0, 8.0, 8.0, 11.0, 11.0, 20.0, 16.0, 16.0, 14.0, 21.0, 22.0, 34.0, 29.0, 34.0, 36.0, 46.0, 35.0, 36.0, 53.0, 39.0, 42.0, 52.0, 37.0, 45.0, 29.0, 32.0, 36.0, 32.0, 26.0, 28.0, 17.0, 26.0, 16.0, 12.0, 12.0, 6.0, 8.0, 9.0, 6.0, 6.0, 8.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.0415022373199463, -1.007263422012329, -0.9730246663093567, -0.9387859106063843, -0.9045470952987671, -0.8703083395957947, -0.8360695838928223, -0.8018307685852051, -0.7675919532775879, -0.7333531975746155, -0.6991143822669983, -0.6648756265640259, -0.6306368112564087, -0.5963980555534363, -0.5621592998504639, -0.5279204845428467, -0.49368172883987427, -0.45944294333457947, -0.42520415782928467, -0.39096540212631226, -0.35672658681869507, -0.32248783111572266, -0.28824904561042786, -0.25401026010513306, -0.21977147459983826, -0.18553268909454346, -0.15129390358924866, -0.11705513298511505, -0.08281634747982025, -0.04857756197452545, -0.014338791370391846, 0.019899994134902954, 0.054138779640197754, 0.08837756514549255, 0.12261634320020676, 0.15685512125492096, 0.19109390676021576, 0.22533269226551056, 0.25957146286964417, 0.29381024837493896, 0.32804903388023376, 0.36228781938552856, 0.39652660489082336, 0.43076539039611816, 0.4650041460990906, 0.49924296140670776, 0.5334817171096802, 0.5677205324172974, 0.6019592881202698, 0.6361980438232422, 0.6704368591308594, 0.7046756148338318, 0.738914430141449, 0.7731531858444214, 0.8073920011520386, 0.841630756855011, 0.8758695125579834, 0.9101082682609558, 0.944347083568573, 0.9785858392715454, 1.0128246545791626, 1.0470634698867798, 1.0813021659851074, 1.1155409812927246, 1.1497797966003418]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 5.0, 5.0, 4.0, 8.0, 8.0, 10.0, 10.0, 23.0, 38.0, 50.0, 65.0, 111.0, 180.0, 265.0, 455.0, 911.0, 1744.0, 4205.0, 11601.0, 44051.0, 423144.0, 3569093.0, 106386.0, 20529.0, 6392.0, 2535.0, 1125.0, 585.0, 301.0, 179.0, 95.0, 55.0, 42.0, 23.0, 21.0, 10.0, 8.0, 5.0, 5.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34130859375, -0.3318901062011719, -0.32247161865234375, -0.3130531311035156, -0.3036346435546875, -0.2942161560058594, -0.28479766845703125, -0.2753791809082031, -0.265960693359375, -0.2565422058105469, -0.24712371826171875, -0.23770523071289062, -0.2282867431640625, -0.21886825561523438, -0.20944976806640625, -0.20003128051757812, -0.19061279296875, -0.18119430541992188, -0.17177581787109375, -0.16235733032226562, -0.1529388427734375, -0.14352035522460938, -0.13410186767578125, -0.12468338012695312, -0.115264892578125, -0.10584640502929688, -0.09642791748046875, -0.08700942993164062, -0.0775909423828125, -0.06817245483398438, -0.05875396728515625, -0.049335479736328125, -0.0399169921875, -0.030498504638671875, -0.02108001708984375, -0.011661529541015625, -0.0022430419921875, 0.007175445556640625, 0.01659393310546875, 0.026012420654296875, 0.035430908203125, 0.044849395751953125, 0.05426788330078125, 0.06368637084960938, 0.0731048583984375, 0.08252334594726562, 0.09194183349609375, 0.10136032104492188, 0.11077880859375, 0.12019729614257812, 0.12961578369140625, 0.13903427124023438, 0.1484527587890625, 0.15787124633789062, 0.16728973388671875, 0.17670822143554688, 0.186126708984375, 0.19554519653320312, 0.20496368408203125, 0.21438217163085938, 0.2238006591796875, 0.23321914672851562, 0.24263763427734375, 0.2520561218261719, 0.261474609375]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 4.0, 4.0, 7.0, 9.0, 16.0, 21.0, 17.0, 33.0, 34.0, 41.0, 54.0, 65.0, 76.0, 71.0, 80.0, 66.0, 67.0, 49.0, 58.0, 54.0, 45.0, 30.0, 37.0, 22.0, 11.0, 15.0, 5.0, 6.0, 0.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.110107421875, -0.10701370239257812, -0.10391998291015625, -0.10082626342773438, -0.0977325439453125, -0.09463882446289062, -0.09154510498046875, -0.08845138549804688, -0.085357666015625, -0.08226394653320312, -0.07917022705078125, -0.07607650756835938, -0.0729827880859375, -0.06988906860351562, -0.06679534912109375, -0.06370162963867188, -0.06060791015625, -0.057514190673828125, -0.05442047119140625, -0.051326751708984375, -0.0482330322265625, -0.045139312744140625, -0.04204559326171875, -0.038951873779296875, -0.035858154296875, -0.032764434814453125, -0.02967071533203125, -0.026576995849609375, -0.0234832763671875, -0.020389556884765625, -0.01729583740234375, -0.014202117919921875, -0.0111083984375, -0.008014678955078125, -0.00492095947265625, -0.001827239990234375, 0.0012664794921875, 0.004360198974609375, 0.00745391845703125, 0.010547637939453125, 0.013641357421875, 0.016735076904296875, 0.01982879638671875, 0.022922515869140625, 0.0260162353515625, 0.029109954833984375, 0.03220367431640625, 0.035297393798828125, 0.03839111328125, 0.041484832763671875, 0.04457855224609375, 0.047672271728515625, 0.0507659912109375, 0.053859710693359375, 0.05695343017578125, 0.060047149658203125, 0.063140869140625, 0.06623458862304688, 0.06932830810546875, 0.07242202758789062, 0.0755157470703125, 0.07860946655273438, 0.08170318603515625, 0.08479690551757812, 0.087890625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 9.0, 22.0, 60.0, 111.0, 218.0, 487.0, 1037.0, 2590.0, 7368.0, 25929.0, 159213.0, 3554763.0, 381803.0, 43286.0, 10902.0, 3702.0, 1555.0, 664.0, 296.0, 129.0, 76.0, 40.0, 12.0, 10.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20166015625, -0.1938018798828125, -0.185943603515625, -0.1780853271484375, -0.17022705078125, -0.1623687744140625, -0.154510498046875, -0.1466522216796875, -0.1387939453125, -0.1309356689453125, -0.123077392578125, -0.1152191162109375, -0.10736083984375, -0.0995025634765625, -0.091644287109375, -0.0837860107421875, -0.075927734375, -0.0680694580078125, -0.060211181640625, -0.0523529052734375, -0.04449462890625, -0.0366363525390625, -0.028778076171875, -0.0209197998046875, -0.0130615234375, -0.0052032470703125, 0.002655029296875, 0.0105133056640625, 0.01837158203125, 0.0262298583984375, 0.034088134765625, 0.0419464111328125, 0.0498046875, 0.0576629638671875, 0.065521240234375, 0.0733795166015625, 0.08123779296875, 0.0890960693359375, 0.096954345703125, 0.1048126220703125, 0.1126708984375, 0.1205291748046875, 0.128387451171875, 0.1362457275390625, 0.14410400390625, 0.1519622802734375, 0.159820556640625, 0.1676788330078125, 0.175537109375, 0.1833953857421875, 0.191253662109375, 0.1991119384765625, 0.20697021484375, 0.2148284912109375, 0.222686767578125, 0.2305450439453125, 0.2384033203125, 0.2462615966796875, 0.254119873046875, 0.2619781494140625, 0.26983642578125, 0.2776947021484375, 0.285552978515625, 0.2934112548828125, 0.30126953125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 3.0, 9.0, 8.0, 8.0, 19.0, 27.0, 40.0, 52.0, 91.0, 143.0, 353.0, 1329.0, 1231.0, 354.0, 135.0, 86.0, 43.0, 47.0, 19.0, 13.0, 7.0, 9.0, 12.0, 10.0, 6.0, 3.0, 2.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08038330078125, -0.07761001586914062, -0.07483673095703125, -0.07206344604492188, -0.0692901611328125, -0.06651687622070312, -0.06374359130859375, -0.060970306396484375, -0.058197021484375, -0.055423736572265625, -0.05265045166015625, -0.049877166748046875, -0.0471038818359375, -0.044330596923828125, -0.04155731201171875, -0.038784027099609375, -0.0360107421875, -0.033237457275390625, -0.03046417236328125, -0.027690887451171875, -0.0249176025390625, -0.022144317626953125, -0.01937103271484375, -0.016597747802734375, -0.013824462890625, -0.011051177978515625, -0.00827789306640625, -0.005504608154296875, -0.0027313232421875, 4.1961669921875e-05, 0.00281524658203125, 0.005588531494140625, 0.00836181640625, 0.011135101318359375, 0.01390838623046875, 0.016681671142578125, 0.0194549560546875, 0.022228240966796875, 0.02500152587890625, 0.027774810791015625, 0.030548095703125, 0.033321380615234375, 0.03609466552734375, 0.038867950439453125, 0.0416412353515625, 0.044414520263671875, 0.04718780517578125, 0.049961090087890625, 0.052734375, 0.055507659912109375, 0.05828094482421875, 0.061054229736328125, 0.0638275146484375, 0.06660079956054688, 0.06937408447265625, 0.07214736938476562, 0.074920654296875, 0.07769393920898438, 0.08046722412109375, 0.08324050903320312, 0.0860137939453125, 0.08878707885742188, 0.09156036376953125, 0.09433364868164062, 0.09710693359375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 7.0, 5.0, 27.0, 49.0, 105.0, 133.0, 171.0, 164.0, 137.0, 94.0, 61.0, 21.0, 9.0, 10.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.36987996101379395, -0.35131651163101196, -0.33275306224823, -0.314189612865448, -0.295626163482666, -0.27706271409988403, -0.25849923491477966, -0.23993578553199768, -0.2213723361492157, -0.20280888676643372, -0.18424543738365173, -0.16568197309970856, -0.14711852371692657, -0.1285550743341446, -0.10999161750078201, -0.09142816066741943, -0.07286471128463745, -0.05430125817656517, -0.03573780506849289, -0.01717435196042061, 0.0013891011476516724, 0.019952550530433655, 0.038516007363796234, 0.057079464197158813, 0.0756429135799408, 0.09420636296272278, 0.11276981979608536, 0.13133327662944794, 0.14989672601222992, 0.1684601753950119, 0.18702363967895508, 0.20558708906173706, 0.22415059804916382, 0.2427140474319458, 0.2612774968147278, 0.27984094619750977, 0.29840439558029175, 0.31696784496307373, 0.3355313241481781, 0.3540947735309601, 0.37265822291374207, 0.39122167229652405, 0.40978512167930603, 0.428348571062088, 0.4469120502471924, 0.46547549962997437, 0.48403894901275635, 0.5026023983955383, 0.5211658477783203, 0.5397292971611023, 0.5582927465438843, 0.5768561959266663, 0.5954196453094482, 0.6139830946922302, 0.6325465440750122, 0.651110053062439, 0.6696734428405762, 0.6882368922233582, 0.7068003416061401, 0.7253637909889221, 0.7439272403717041, 0.7624906897544861, 0.7810541391372681, 0.7996176481246948, 0.8181810975074768]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 3.0, 11.0, 13.0, 12.0, 7.0, 20.0, 21.0, 21.0, 24.0, 23.0, 35.0, 44.0, 41.0, 61.0, 57.0, 38.0, 52.0, 47.0, 41.0, 53.0, 51.0, 46.0, 53.0, 27.0, 27.0, 26.0, 27.0, 29.0, 22.0, 22.0, 10.0, 10.0, 6.0, 9.0, 4.0, 3.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26835745573043823, -0.2592984139919281, -0.25023937225341797, -0.24118031561374664, -0.23212125897407532, -0.22306221723556519, -0.21400317549705505, -0.20494411885738373, -0.1958850622177124, -0.18682602047920227, -0.17776696383953094, -0.1687079221010208, -0.1596488654613495, -0.15058982372283936, -0.14153078198432922, -0.1324717253446579, -0.12341268360614777, -0.11435363441705704, -0.10529458522796631, -0.09623554348945618, -0.08717648684978485, -0.07811744511127472, -0.06905839592218399, -0.05999934673309326, -0.05094029754400253, -0.041881248354911804, -0.032822199165821075, -0.023763153702020645, -0.014704104512929916, -0.005645055323839188, 0.0034139901399612427, 0.012473039329051971, 0.0215320885181427, 0.03059113770723343, 0.03965018689632416, 0.04870923236012459, 0.05776828154921532, 0.06682732701301575, 0.07588637620210648, 0.0849454253911972, 0.09400447458028793, 0.10306352376937866, 0.11212257295846939, 0.12118162214756012, 0.13024066388607025, 0.13929972052574158, 0.1483587622642517, 0.15741780400276184, 0.16647686064243317, 0.1755359023809433, 0.18459495902061462, 0.19365400075912476, 0.20271305739879608, 0.2117720991373062, 0.22083115577697754, 0.22989019751548767, 0.2389492392539978, 0.24800828099250793, 0.25706732273101807, 0.2661263942718506, 0.2751854360103607, 0.28424447774887085, 0.293303519487381, 0.3023625612258911, 0.31142163276672363]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 7.0, 7.0, 8.0, 13.0, 22.0, 45.0, 73.0, 110.0, 171.0, 292.0, 598.0, 1257.0, 3072.0, 8976.0, 35228.0, 163981.0, 523255.0, 240149.0, 51698.0, 12485.0, 4003.0, 1564.0, 730.0, 357.0, 163.0, 106.0, 71.0, 33.0, 27.0, 20.0, 12.0, 9.0, 6.0, 2.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.298583984375, -0.28850555419921875, -0.2784271240234375, -0.26834869384765625, -0.258270263671875, -0.24819183349609375, -0.2381134033203125, -0.22803497314453125, -0.21795654296875, -0.20787811279296875, -0.1977996826171875, -0.18772125244140625, -0.177642822265625, -0.16756439208984375, -0.1574859619140625, -0.14740753173828125, -0.1373291015625, -0.12725067138671875, -0.1171722412109375, -0.10709381103515625, -0.097015380859375, -0.08693695068359375, -0.0768585205078125, -0.06678009033203125, -0.05670166015625, -0.04662322998046875, -0.0365447998046875, -0.02646636962890625, -0.016387939453125, -0.00630950927734375, 0.0037689208984375, 0.01384735107421875, 0.02392578125, 0.03400421142578125, 0.0440826416015625, 0.05416107177734375, 0.064239501953125, 0.07431793212890625, 0.0843963623046875, 0.09447479248046875, 0.10455322265625, 0.11463165283203125, 0.1247100830078125, 0.13478851318359375, 0.144866943359375, 0.15494537353515625, 0.1650238037109375, 0.17510223388671875, 0.1851806640625, 0.19525909423828125, 0.2053375244140625, 0.21541595458984375, 0.225494384765625, 0.23557281494140625, 0.2456512451171875, 0.25572967529296875, 0.26580810546875, 0.27588653564453125, 0.2859649658203125, 0.29604339599609375, 0.306121826171875, 0.31620025634765625, 0.3262786865234375, 0.33635711669921875, 0.346435546875]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 7.0, 8.0, 15.0, 12.0, 15.0, 21.0, 27.0, 44.0, 45.0, 70.0, 71.0, 77.0, 67.0, 80.0, 72.0, 59.0, 58.0, 54.0, 44.0, 39.0, 39.0, 29.0, 18.0, 11.0, 9.0, 5.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10919189453125, -0.1060028076171875, -0.102813720703125, -0.0996246337890625, -0.096435546875, -0.0932464599609375, -0.090057373046875, -0.0868682861328125, -0.08367919921875, -0.0804901123046875, -0.077301025390625, -0.0741119384765625, -0.0709228515625, -0.0677337646484375, -0.064544677734375, -0.0613555908203125, -0.05816650390625, -0.0549774169921875, -0.051788330078125, -0.0485992431640625, -0.04541015625, -0.0422210693359375, -0.039031982421875, -0.0358428955078125, -0.03265380859375, -0.0294647216796875, -0.026275634765625, -0.0230865478515625, -0.0198974609375, -0.0167083740234375, -0.013519287109375, -0.0103302001953125, -0.00714111328125, -0.0039520263671875, -0.000762939453125, 0.0024261474609375, 0.005615234375, 0.0088043212890625, 0.011993408203125, 0.0151824951171875, 0.01837158203125, 0.0215606689453125, 0.024749755859375, 0.0279388427734375, 0.0311279296875, 0.0343170166015625, 0.037506103515625, 0.0406951904296875, 0.04388427734375, 0.0470733642578125, 0.050262451171875, 0.0534515380859375, 0.056640625, 0.0598297119140625, 0.063018798828125, 0.0662078857421875, 0.06939697265625, 0.0725860595703125, 0.075775146484375, 0.0789642333984375, 0.0821533203125, 0.0853424072265625, 0.088531494140625, 0.0917205810546875, 0.09490966796875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 5.0, 2.0, 9.0, 10.0, 12.0, 14.0, 26.0, 37.0, 63.0, 91.0, 181.0, 316.0, 571.0, 1206.0, 3024.0, 10419.0, 53849.0, 324805.0, 524000.0, 104163.0, 17969.0, 4498.0, 1667.0, 732.0, 370.0, 189.0, 118.0, 71.0, 55.0, 23.0, 19.0, 11.0, 10.0, 9.0, 3.0, 5.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28125, -0.2719306945800781, -0.26261138916015625, -0.2532920837402344, -0.2439727783203125, -0.23465347290039062, -0.22533416748046875, -0.21601486206054688, -0.206695556640625, -0.19737625122070312, -0.18805694580078125, -0.17873764038085938, -0.1694183349609375, -0.16009902954101562, -0.15077972412109375, -0.14146041870117188, -0.13214111328125, -0.12282180786132812, -0.11350250244140625, -0.10418319702148438, -0.0948638916015625, -0.08554458618164062, -0.07622528076171875, -0.06690597534179688, -0.057586669921875, -0.048267364501953125, -0.03894805908203125, -0.029628753662109375, -0.0203094482421875, -0.010990142822265625, -0.00167083740234375, 0.007648468017578125, 0.0169677734375, 0.026287078857421875, 0.03560638427734375, 0.044925689697265625, 0.0542449951171875, 0.06356430053710938, 0.07288360595703125, 0.08220291137695312, 0.091522216796875, 0.10084152221679688, 0.11016082763671875, 0.11948013305664062, 0.1287994384765625, 0.13811874389648438, 0.14743804931640625, 0.15675735473632812, 0.16607666015625, 0.17539596557617188, 0.18471527099609375, 0.19403457641601562, 0.2033538818359375, 0.21267318725585938, 0.22199249267578125, 0.23131179809570312, 0.240631103515625, 0.24995040893554688, 0.25926971435546875, 0.2685890197753906, 0.2779083251953125, 0.2872276306152344, 0.29654693603515625, 0.3058662414550781, 0.315185546875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 6.0, 5.0, 1.0, 6.0, 12.0, 16.0, 22.0, 21.0, 30.0, 40.0, 38.0, 42.0, 60.0, 48.0, 58.0, 66.0, 74.0, 73.0, 51.0, 68.0, 52.0, 47.0, 37.0, 38.0, 22.0, 22.0, 13.0, 10.0, 8.0, 5.0, 5.0, 2.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.44970703125, -0.4364585876464844, -0.42321014404296875, -0.4099617004394531, -0.3967132568359375, -0.3834648132324219, -0.37021636962890625, -0.3569679260253906, -0.343719482421875, -0.3304710388183594, -0.31722259521484375, -0.3039741516113281, -0.2907257080078125, -0.2774772644042969, -0.26422882080078125, -0.2509803771972656, -0.23773193359375, -0.22448348999023438, -0.21123504638671875, -0.19798660278320312, -0.1847381591796875, -0.17148971557617188, -0.15824127197265625, -0.14499282836914062, -0.131744384765625, -0.11849594116210938, -0.10524749755859375, -0.09199905395507812, -0.0787506103515625, -0.06550216674804688, -0.05225372314453125, -0.039005279541015625, -0.0257568359375, -0.012508392333984375, 0.00074005126953125, 0.013988494873046875, 0.0272369384765625, 0.040485382080078125, 0.05373382568359375, 0.06698226928710938, 0.080230712890625, 0.09347915649414062, 0.10672760009765625, 0.11997604370117188, 0.1332244873046875, 0.14647293090820312, 0.15972137451171875, 0.17296981811523438, 0.18621826171875, 0.19946670532226562, 0.21271514892578125, 0.22596359252929688, 0.2392120361328125, 0.2524604797363281, 0.26570892333984375, 0.2789573669433594, 0.292205810546875, 0.3054542541503906, 0.31870269775390625, 0.3319511413574219, 0.3451995849609375, 0.3584480285644531, 0.37169647216796875, 0.3849449157714844, 0.398193359375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 10.0, 21.0, 30.0, 41.0, 98.0, 164.0, 498.0, 2123.0, 30909.0, 941883.0, 68446.0, 3279.0, 611.0, 226.0, 116.0, 44.0, 24.0, 17.0, 13.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47119140625, -0.45757293701171875, -0.4439544677734375, -0.43033599853515625, -0.416717529296875, -0.40309906005859375, -0.3894805908203125, -0.37586212158203125, -0.36224365234375, -0.34862518310546875, -0.3350067138671875, -0.32138824462890625, -0.307769775390625, -0.29415130615234375, -0.2805328369140625, -0.26691436767578125, -0.2532958984375, -0.23967742919921875, -0.2260589599609375, -0.21244049072265625, -0.198822021484375, -0.18520355224609375, -0.1715850830078125, -0.15796661376953125, -0.14434814453125, -0.13072967529296875, -0.1171112060546875, -0.10349273681640625, -0.089874267578125, -0.07625579833984375, -0.0626373291015625, -0.04901885986328125, -0.035400390625, -0.02178192138671875, -0.0081634521484375, 0.00545501708984375, 0.019073486328125, 0.03269195556640625, 0.0463104248046875, 0.05992889404296875, 0.07354736328125, 0.08716583251953125, 0.1007843017578125, 0.11440277099609375, 0.128021240234375, 0.14163970947265625, 0.1552581787109375, 0.16887664794921875, 0.1824951171875, 0.19611358642578125, 0.2097320556640625, 0.22335052490234375, 0.236968994140625, 0.25058746337890625, 0.2642059326171875, 0.27782440185546875, 0.29144287109375, 0.30506134033203125, 0.3186798095703125, 0.33229827880859375, 0.345916748046875, 0.35953521728515625, 0.3731536865234375, 0.38677215576171875, 0.400390625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 3.0, 2.0, 6.0, 6.0, 11.0, 19.0, 12.0, 22.0, 22.0, 35.0, 43.0, 43.0, 58.0, 81.0, 130.0, 132.0, 89.0, 62.0, 51.0, 36.0, 30.0, 35.0, 11.0, 16.0, 15.0, 12.0, 4.0, 6.0, 4.0, 1.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.43865966796875e-05, -7.129088044166565e-05, -6.81951642036438e-05, -6.509944796562195e-05, -6.20037317276001e-05, -5.890801548957825e-05, -5.5812299251556396e-05, -5.2716583013534546e-05, -4.9620866775512695e-05, -4.6525150537490845e-05, -4.3429434299468994e-05, -4.0333718061447144e-05, -3.723800182342529e-05, -3.414228558540344e-05, -3.104656934738159e-05, -2.795085310935974e-05, -2.485513687133789e-05, -2.175942063331604e-05, -1.866370439529419e-05, -1.556798815727234e-05, -1.2472271919250488e-05, -9.376555681228638e-06, -6.280839443206787e-06, -3.1851232051849365e-06, -8.940696716308594e-08, 3.0063092708587646e-06, 6.102025508880615e-06, 9.197741746902466e-06, 1.2293457984924316e-05, 1.5389174222946167e-05, 1.8484890460968018e-05, 2.1580606698989868e-05, 2.467632293701172e-05, 2.777203917503357e-05, 3.086775541305542e-05, 3.396347165107727e-05, 3.705918788909912e-05, 4.015490412712097e-05, 4.325062036514282e-05, 4.634633660316467e-05, 4.9442052841186523e-05, 5.2537769079208374e-05, 5.5633485317230225e-05, 5.8729201555252075e-05, 6.182491779327393e-05, 6.492063403129578e-05, 6.801635026931763e-05, 7.111206650733948e-05, 7.420778274536133e-05, 7.730349898338318e-05, 8.039921522140503e-05, 8.349493145942688e-05, 8.659064769744873e-05, 8.968636393547058e-05, 9.278208017349243e-05, 9.587779641151428e-05, 9.897351264953613e-05, 0.00010206922888755798, 0.00010516494512557983, 0.00010826066136360168, 0.00011135637760162354, 0.00011445209383964539, 0.00011754781007766724, 0.00012064352631568909, 0.00012373924255371094]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 3.0, 8.0, 17.0, 17.0, 22.0, 41.0, 73.0, 136.0, 247.0, 626.0, 1936.0, 13528.0, 371340.0, 636580.0, 20335.0, 2369.0, 678.0, 297.0, 136.0, 75.0, 37.0, 20.0, 14.0, 6.0, 9.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20849609375, -0.19810867309570312, -0.18772125244140625, -0.17733383178710938, -0.1669464111328125, -0.15655899047851562, -0.14617156982421875, -0.13578414916992188, -0.125396728515625, -0.11500930786132812, -0.10462188720703125, -0.09423446655273438, -0.0838470458984375, -0.07345962524414062, -0.06307220458984375, -0.052684783935546875, -0.04229736328125, -0.031909942626953125, -0.02152252197265625, -0.011135101318359375, -0.0007476806640625, 0.009639739990234375, 0.02002716064453125, 0.030414581298828125, 0.040802001953125, 0.051189422607421875, 0.06157684326171875, 0.07196426391601562, 0.0823516845703125, 0.09273910522460938, 0.10312652587890625, 0.11351394653320312, 0.1239013671875, 0.13428878784179688, 0.14467620849609375, 0.15506362915039062, 0.1654510498046875, 0.17583847045898438, 0.18622589111328125, 0.19661331176757812, 0.207000732421875, 0.21738815307617188, 0.22777557373046875, 0.23816299438476562, 0.2485504150390625, 0.2589378356933594, 0.26932525634765625, 0.2797126770019531, 0.29010009765625, 0.3004875183105469, 0.31087493896484375, 0.3212623596191406, 0.3316497802734375, 0.3420372009277344, 0.35242462158203125, 0.3628120422363281, 0.373199462890625, 0.3835868835449219, 0.39397430419921875, 0.4043617248535156, 0.4147491455078125, 0.4251365661621094, 0.43552398681640625, 0.4459114074707031, 0.456298828125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 5.0, 13.0, 8.0, 22.0, 45.0, 76.0, 147.0, 216.0, 207.0, 115.0, 66.0, 38.0, 26.0, 9.0, 6.0, 5.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.458251953125, -0.4477958679199219, -0.43733978271484375, -0.4268836975097656, -0.4164276123046875, -0.4059715270996094, -0.39551544189453125, -0.3850593566894531, -0.374603271484375, -0.3641471862792969, -0.35369110107421875, -0.3432350158691406, -0.3327789306640625, -0.3223228454589844, -0.31186676025390625, -0.3014106750488281, -0.29095458984375, -0.2804985046386719, -0.27004241943359375, -0.2595863342285156, -0.2491302490234375, -0.23867416381835938, -0.22821807861328125, -0.21776199340820312, -0.207305908203125, -0.19684982299804688, -0.18639373779296875, -0.17593765258789062, -0.1654815673828125, -0.15502548217773438, -0.14456939697265625, -0.13411331176757812, -0.1236572265625, -0.11320114135742188, -0.10274505615234375, -0.09228897094726562, -0.0818328857421875, -0.07137680053710938, -0.06092071533203125, -0.050464630126953125, -0.040008544921875, -0.029552459716796875, -0.01909637451171875, -0.008640289306640625, 0.0018157958984375, 0.012271881103515625, 0.02272796630859375, 0.033184051513671875, 0.04364013671875, 0.054096221923828125, 0.06455230712890625, 0.07500839233398438, 0.0854644775390625, 0.09592056274414062, 0.10637664794921875, 0.11683273315429688, 0.127288818359375, 0.13774490356445312, 0.14820098876953125, 0.15865707397460938, 0.1691131591796875, 0.17956924438476562, 0.19002532958984375, 0.20048141479492188, 0.2109375]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 16.0, 14.0, 29.0, 43.0, 74.0, 87.0, 149.0, 163.0, 131.0, 100.0, 71.0, 40.0, 34.0, 26.0, 10.0, 8.0, 6.0, 4.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-2.7389912605285645, -2.6697049140930176, -2.6004185676574707, -2.5311319828033447, -2.461845636367798, -2.392559289932251, -2.323272943496704, -2.2539865970611572, -2.1847000122070312, -2.1154136657714844, -2.0461273193359375, -1.976840853691101, -1.9075543880462646, -1.8382680416107178, -1.768981695175171, -1.699695348739624, -1.6304090023040771, -1.5611226558685303, -1.4918361902236938, -1.422549843788147, -1.3532633781433105, -1.2839770317077637, -1.2146906852722168, -1.14540433883667, -1.0761178731918335, -1.0068315267562866, -0.9375450611114502, -0.8682587146759033, -0.7989723086357117, -0.72968590259552, -0.6603995561599731, -0.5911131501197815, -0.5218267440795898, -0.4525403380393982, -0.38325396180152893, -0.31396758556365967, -0.24468117952346802, -0.17539477348327637, -0.1061083972454071, -0.03682202100753784, 0.03246438503265381, 0.10175077617168427, 0.17103716731071472, 0.24032355844974518, 0.30960994958877563, 0.3788963556289673, 0.44818273186683655, 0.5174691081047058, 0.5867555141448975, 0.6560419201850891, 0.7253283262252808, 0.7946146726608276, 0.8639010787010193, 0.9331874847412109, 1.0024738311767578, 1.0717601776123047, 1.1410466432571411, 1.210332989692688, 1.2796194553375244, 1.3489058017730713, 1.4181921482086182, 1.4874786138534546, 1.5567649602890015, 1.626051425933838, 1.6953377723693848]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 5.0, 5.0, 3.0, 7.0, 8.0, 15.0, 14.0, 17.0, 13.0, 17.0, 22.0, 18.0, 31.0, 36.0, 38.0, 35.0, 35.0, 44.0, 40.0, 44.0, 51.0, 41.0, 40.0, 46.0, 34.0, 39.0, 33.0, 35.0, 38.0, 33.0, 22.0, 25.0, 27.0, 20.0, 14.0, 13.0, 12.0, 7.0, 10.0, 6.0, 2.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.6305263042449951, -1.5753449201583862, -1.5201635360717773, -1.464982271194458, -1.4098008871078491, -1.3546195030212402, -1.299438238143921, -1.244256854057312, -1.1890754699707031, -1.1338940858840942, -1.0787127017974854, -1.023531436920166, -0.9683500528335571, -0.9131686687469482, -0.8579873442649841, -0.80280601978302, -0.7476246356964111, -0.6924432516098022, -0.6372619271278381, -0.582080602645874, -0.5268992185592651, -0.47171786427497864, -0.41653650999069214, -0.36135515570640564, -0.30617380142211914, -0.25099244713783264, -0.19581109285354614, -0.14062973856925964, -0.08544838428497314, -0.030267030000686646, 0.024914324283599854, 0.08009567856788635, 0.1352771520614624, 0.1904585063457489, 0.2456398606300354, 0.3008212149143219, 0.3560025691986084, 0.4111839234828949, 0.4663652777671814, 0.5215466022491455, 0.5767279863357544, 0.6319093704223633, 0.6870906949043274, 0.7422720193862915, 0.7974534034729004, 0.8526347875595093, 0.9078161120414734, 0.9629974365234375, 1.0181788206100464, 1.0733602046966553, 1.1285414695739746, 1.1837228536605835, 1.2389042377471924, 1.2940856218338013, 1.3492670059204102, 1.4044482707977295, 1.4596296548843384, 1.5148110389709473, 1.5699923038482666, 1.6251736879348755, 1.6803550720214844, 1.7355364561080933, 1.7907178401947021, 1.8458991050720215, 1.9010804891586304]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 6.0, 7.0, 16.0, 16.0, 33.0, 31.0, 59.0, 80.0, 159.0, 367.0, 791.0, 2644.0, 12916.0, 161491.0, 3892981.0, 109178.0, 10213.0, 2030.0, 657.0, 257.0, 102.0, 81.0, 47.0, 35.0, 24.0, 21.0, 13.0, 6.0, 9.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.49853515625, -0.4836273193359375, -0.468719482421875, -0.4538116455078125, -0.43890380859375, -0.4239959716796875, -0.409088134765625, -0.3941802978515625, -0.3792724609375, -0.3643646240234375, -0.349456787109375, -0.3345489501953125, -0.31964111328125, -0.3047332763671875, -0.289825439453125, -0.2749176025390625, -0.260009765625, -0.2451019287109375, -0.230194091796875, -0.2152862548828125, -0.20037841796875, -0.1854705810546875, -0.170562744140625, -0.1556549072265625, -0.1407470703125, -0.1258392333984375, -0.110931396484375, -0.0960235595703125, -0.08111572265625, -0.0662078857421875, -0.051300048828125, -0.0363922119140625, -0.021484375, -0.0065765380859375, 0.008331298828125, 0.0232391357421875, 0.03814697265625, 0.0530548095703125, 0.067962646484375, 0.0828704833984375, 0.0977783203125, 0.1126861572265625, 0.127593994140625, 0.1425018310546875, 0.15740966796875, 0.1723175048828125, 0.187225341796875, 0.2021331787109375, 0.217041015625, 0.2319488525390625, 0.246856689453125, 0.2617645263671875, 0.27667236328125, 0.2915802001953125, 0.306488037109375, 0.3213958740234375, 0.3363037109375, 0.3512115478515625, 0.366119384765625, 0.3810272216796875, 0.39593505859375, 0.4108428955078125, 0.425750732421875, 0.4406585693359375, 0.45556640625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 6.0, 4.0, 7.0, 11.0, 22.0, 19.0, 18.0, 35.0, 41.0, 47.0, 43.0, 57.0, 70.0, 69.0, 62.0, 86.0, 67.0, 61.0, 42.0, 42.0, 40.0, 44.0, 30.0, 21.0, 25.0, 9.0, 5.0, 8.0, 6.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11517333984375, -0.111846923828125, -0.1085205078125, -0.105194091796875, -0.10186767578125, -0.098541259765625, -0.09521484375, -0.091888427734375, -0.08856201171875, -0.085235595703125, -0.0819091796875, -0.078582763671875, -0.07525634765625, -0.071929931640625, -0.068603515625, -0.065277099609375, -0.06195068359375, -0.058624267578125, -0.0552978515625, -0.051971435546875, -0.04864501953125, -0.045318603515625, -0.0419921875, -0.038665771484375, -0.03533935546875, -0.032012939453125, -0.0286865234375, -0.025360107421875, -0.02203369140625, -0.018707275390625, -0.015380859375, -0.012054443359375, -0.00872802734375, -0.005401611328125, -0.0020751953125, 0.001251220703125, 0.00457763671875, 0.007904052734375, 0.01123046875, 0.014556884765625, 0.01788330078125, 0.021209716796875, 0.0245361328125, 0.027862548828125, 0.03118896484375, 0.034515380859375, 0.037841796875, 0.041168212890625, 0.04449462890625, 0.047821044921875, 0.0511474609375, 0.054473876953125, 0.05780029296875, 0.061126708984375, 0.064453125, 0.067779541015625, 0.07110595703125, 0.074432373046875, 0.0777587890625, 0.081085205078125, 0.08441162109375, 0.087738037109375, 0.091064453125, 0.094390869140625, 0.09771728515625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 8.0, 2.0, 5.0, 7.0, 22.0, 21.0, 31.0, 65.0, 83.0, 134.0, 210.0, 419.0, 726.0, 1416.0, 2842.0, 6403.0, 17119.0, 55403.0, 280771.0, 3053429.0, 640532.0, 92599.0, 25299.0, 9037.0, 3794.0, 1776.0, 889.0, 498.0, 254.0, 178.0, 112.0, 72.0, 41.0, 22.0, 17.0, 19.0, 16.0, 8.0, 7.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1591796875, -0.1534290313720703, -0.14767837524414062, -0.14192771911621094, -0.13617706298828125, -0.13042640686035156, -0.12467575073242188, -0.11892509460449219, -0.1131744384765625, -0.10742378234863281, -0.10167312622070312, -0.09592247009277344, -0.09017181396484375, -0.08442115783691406, -0.07867050170898438, -0.07291984558105469, -0.067169189453125, -0.06141853332519531, -0.055667877197265625, -0.04991722106933594, -0.04416656494140625, -0.03841590881347656, -0.032665252685546875, -0.026914596557617188, -0.0211639404296875, -0.015413284301757812, -0.009662628173828125, -0.0039119720458984375, 0.00183868408203125, 0.0075893402099609375, 0.013339996337890625, 0.019090652465820312, 0.02484130859375, 0.030591964721679688, 0.036342620849609375, 0.04209327697753906, 0.04784393310546875, 0.05359458923339844, 0.059345245361328125, 0.06509590148925781, 0.0708465576171875, 0.07659721374511719, 0.08234786987304688, 0.08809852600097656, 0.09384918212890625, 0.09959983825683594, 0.10535049438476562, 0.11110115051269531, 0.116851806640625, 0.12260246276855469, 0.12835311889648438, 0.13410377502441406, 0.13985443115234375, 0.14560508728027344, 0.15135574340820312, 0.1571063995361328, 0.1628570556640625, 0.1686077117919922, 0.17435836791992188, 0.18010902404785156, 0.18585968017578125, 0.19161033630371094, 0.19736099243164062, 0.2031116485595703, 0.2088623046875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 6.0, 2.0, 5.0, 7.0, 10.0, 9.0, 17.0, 37.0, 41.0, 101.0, 187.0, 478.0, 1628.0, 886.0, 292.0, 139.0, 83.0, 45.0, 30.0, 20.0, 17.0, 14.0, 7.0, 8.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1412353515625, -0.1366443634033203, -0.13205337524414062, -0.12746238708496094, -0.12287139892578125, -0.11828041076660156, -0.11368942260742188, -0.10909843444824219, -0.1045074462890625, -0.09991645812988281, -0.09532546997070312, -0.09073448181152344, -0.08614349365234375, -0.08155250549316406, -0.07696151733398438, -0.07237052917480469, -0.067779541015625, -0.06318855285644531, -0.058597564697265625, -0.05400657653808594, -0.04941558837890625, -0.04482460021972656, -0.040233612060546875, -0.03564262390136719, -0.0310516357421875, -0.026460647583007812, -0.021869659423828125, -0.017278671264648438, -0.01268768310546875, -0.008096694946289062, -0.003505706787109375, 0.0010852813720703125, 0.00567626953125, 0.010267257690429688, 0.014858245849609375, 0.019449234008789062, 0.02404022216796875, 0.028631210327148438, 0.033222198486328125, 0.03781318664550781, 0.0424041748046875, 0.04699516296386719, 0.051586151123046875, 0.05617713928222656, 0.06076812744140625, 0.06535911560058594, 0.06995010375976562, 0.07454109191894531, 0.079132080078125, 0.08372306823730469, 0.08831405639648438, 0.09290504455566406, 0.09749603271484375, 0.10208702087402344, 0.10667800903320312, 0.11126899719238281, 0.1158599853515625, 0.12045097351074219, 0.12504196166992188, 0.12963294982910156, 0.13422393798828125, 0.13881492614746094, 0.14340591430664062, 0.1479969024658203, 0.152587890625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 5.0, 13.0, 35.0, 39.0, 54.0, 104.0, 140.0, 126.0, 127.0, 128.0, 82.0, 60.0, 37.0, 30.0, 14.0, 7.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4504780173301697, -0.4290088713169098, -0.4075397551059723, -0.3860706090927124, -0.3646014928817749, -0.343132346868515, -0.3216632008552551, -0.3001940846443176, -0.27872493863105774, -0.25725579261779785, -0.23578667640686035, -0.21431753039360046, -0.19284839928150177, -0.17137926816940308, -0.1499101221561432, -0.1284409910440445, -0.1069718599319458, -0.0855027288198471, -0.06403359025716782, -0.042564451694488525, -0.02109532058238983, 0.0003738105297088623, 0.02184295654296875, 0.043312087655067444, 0.06478121876716614, 0.08625034987926483, 0.10771948844194412, 0.1291886270046234, 0.1506577581167221, 0.1721268892288208, 0.1935960352420807, 0.21506516635417938, 0.23653429746627808, 0.25800344347953796, 0.27947255969047546, 0.30094170570373535, 0.32241082191467285, 0.34387996792793274, 0.3653491139411926, 0.3868182301521301, 0.40828737616539, 0.4297565221786499, 0.4512256383895874, 0.4726947844028473, 0.4941639304161072, 0.5156330466270447, 0.537102222442627, 0.5585713386535645, 0.580040454864502, 0.6015095710754395, 0.6229787468910217, 0.6444478631019592, 0.6659169793128967, 0.687386155128479, 0.7088552713394165, 0.730324387550354, 0.7517935037612915, 0.773262619972229, 0.7947317957878113, 0.8162009119987488, 0.8376700282096863, 0.8591392040252686, 0.880608320236206, 0.9020774364471436, 0.9235466122627258]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 5.0, 10.0, 3.0, 13.0, 13.0, 12.0, 22.0, 22.0, 18.0, 25.0, 37.0, 28.0, 27.0, 34.0, 35.0, 34.0, 51.0, 36.0, 53.0, 41.0, 38.0, 28.0, 41.0, 49.0, 49.0, 21.0, 32.0, 21.0, 27.0, 19.0, 24.0, 25.0, 13.0, 10.0, 15.0, 10.0, 14.0, 9.0, 11.0, 10.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.33872050046920776, -0.32775643467903137, -0.31679239869117737, -0.305828332901001, -0.294864296913147, -0.2839002311229706, -0.2729361653327942, -0.2619721293449402, -0.2510080933570862, -0.24004404246807098, -0.2290799915790558, -0.2181159257888794, -0.2071518898010254, -0.196187824010849, -0.1852237731218338, -0.1742597222328186, -0.1632956564426422, -0.15233160555362701, -0.14136755466461182, -0.13040348887443542, -0.11943944543600082, -0.10847539454698563, -0.09751133620738983, -0.08654728531837463, -0.07558323442935944, -0.06461918354034424, -0.05365512892603874, -0.042691074311733246, -0.03172702342271805, -0.02076297253370285, -0.009798914194107056, 0.001165136694908142, 0.01212918758392334, 0.023093240335583687, 0.034057293087244034, 0.04502134770154953, 0.05598539859056473, 0.06694944947957993, 0.07791350781917572, 0.08887755870819092, 0.09984160959720612, 0.11080566048622131, 0.12176971137523651, 0.1327337622642517, 0.1436978280544281, 0.1546618640422821, 0.1656259298324585, 0.1765899807214737, 0.1875540316104889, 0.1985180824995041, 0.2094821333885193, 0.22044619917869568, 0.23141023516654968, 0.24237430095672607, 0.2533383369445801, 0.26430240273475647, 0.27526646852493286, 0.28623053431510925, 0.29719457030296326, 0.30815863609313965, 0.31912267208099365, 0.33008673787117004, 0.34105080366134644, 0.35201483964920044, 0.36297887563705444]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 6.0, 9.0, 16.0, 25.0, 49.0, 66.0, 94.0, 195.0, 377.0, 727.0, 1615.0, 4173.0, 14413.0, 70004.0, 328533.0, 459177.0, 132789.0, 25661.0, 6392.0, 2281.0, 935.0, 454.0, 236.0, 126.0, 69.0, 40.0, 28.0, 17.0, 14.0, 10.0, 10.0, 5.0, 3.0, 6.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3525390625, -0.3422279357910156, -0.33191680908203125, -0.3216056823730469, -0.3112945556640625, -0.3009834289550781, -0.29067230224609375, -0.2803611755371094, -0.270050048828125, -0.2597389221191406, -0.24942779541015625, -0.23911666870117188, -0.2288055419921875, -0.21849441528320312, -0.20818328857421875, -0.19787216186523438, -0.18756103515625, -0.17724990844726562, -0.16693878173828125, -0.15662765502929688, -0.1463165283203125, -0.13600540161132812, -0.12569427490234375, -0.11538314819335938, -0.105072021484375, -0.09476089477539062, -0.08444976806640625, -0.07413864135742188, -0.0638275146484375, -0.053516387939453125, -0.04320526123046875, -0.032894134521484375, -0.0225830078125, -0.012271881103515625, -0.00196075439453125, 0.008350372314453125, 0.0186614990234375, 0.028972625732421875, 0.03928375244140625, 0.049594879150390625, 0.059906005859375, 0.07021713256835938, 0.08052825927734375, 0.09083938598632812, 0.1011505126953125, 0.11146163940429688, 0.12177276611328125, 0.13208389282226562, 0.14239501953125, 0.15270614624023438, 0.16301727294921875, 0.17332839965820312, 0.1836395263671875, 0.19395065307617188, 0.20426177978515625, 0.21457290649414062, 0.224884033203125, 0.23519515991210938, 0.24550628662109375, 0.2558174133300781, 0.2661285400390625, 0.2764396667480469, 0.28675079345703125, 0.2970619201660156, 0.307373046875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 7.0, 13.0, 16.0, 16.0, 21.0, 31.0, 40.0, 42.0, 45.0, 45.0, 68.0, 81.0, 86.0, 67.0, 61.0, 62.0, 56.0, 48.0, 43.0, 37.0, 31.0, 30.0, 10.0, 15.0, 8.0, 11.0, 3.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1170654296875, -0.11361026763916016, -0.11015510559082031, -0.10669994354248047, -0.10324478149414062, -0.09978961944580078, -0.09633445739746094, -0.0928792953491211, -0.08942413330078125, -0.0859689712524414, -0.08251380920410156, -0.07905864715576172, -0.07560348510742188, -0.07214832305908203, -0.06869316101074219, -0.06523799896240234, -0.0617828369140625, -0.058327674865722656, -0.05487251281738281, -0.05141735076904297, -0.047962188720703125, -0.04450702667236328, -0.04105186462402344, -0.037596702575683594, -0.03414154052734375, -0.030686378479003906, -0.027231216430664062, -0.02377605438232422, -0.020320892333984375, -0.01686573028564453, -0.013410568237304688, -0.009955406188964844, -0.006500244140625, -0.0030450820922851562, 0.0004100799560546875, 0.0038652420043945312, 0.007320404052734375, 0.010775566101074219, 0.014230728149414062, 0.017685890197753906, 0.02114105224609375, 0.024596214294433594, 0.028051376342773438, 0.03150653839111328, 0.034961700439453125, 0.03841686248779297, 0.04187202453613281, 0.045327186584472656, 0.0487823486328125, 0.052237510681152344, 0.05569267272949219, 0.05914783477783203, 0.06260299682617188, 0.06605815887451172, 0.06951332092285156, 0.0729684829711914, 0.07642364501953125, 0.0798788070678711, 0.08333396911621094, 0.08678913116455078, 0.09024429321289062, 0.09369945526123047, 0.09715461730957031, 0.10060977935791016, 0.10406494140625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 7.0, 11.0, 11.0, 19.0, 27.0, 24.0, 49.0, 86.0, 139.0, 234.0, 442.0, 936.0, 2271.0, 7800.0, 41968.0, 300403.0, 558811.0, 112053.0, 16436.0, 4003.0, 1395.0, 621.0, 335.0, 181.0, 113.0, 55.0, 48.0, 21.0, 14.0, 12.0, 10.0, 7.0, 3.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.338134765625, -0.3265724182128906, -0.31501007080078125, -0.3034477233886719, -0.2918853759765625, -0.2803230285644531, -0.26876068115234375, -0.2571983337402344, -0.245635986328125, -0.23407363891601562, -0.22251129150390625, -0.21094894409179688, -0.1993865966796875, -0.18782424926757812, -0.17626190185546875, -0.16469955444335938, -0.15313720703125, -0.14157485961914062, -0.13001251220703125, -0.11845016479492188, -0.1068878173828125, -0.09532546997070312, -0.08376312255859375, -0.07220077514648438, -0.060638427734375, -0.049076080322265625, -0.03751373291015625, -0.025951385498046875, -0.0143890380859375, -0.002826690673828125, 0.00873565673828125, 0.020298004150390625, 0.0318603515625, 0.043422698974609375, 0.05498504638671875, 0.06654739379882812, 0.0781097412109375, 0.08967208862304688, 0.10123443603515625, 0.11279678344726562, 0.124359130859375, 0.13592147827148438, 0.14748382568359375, 0.15904617309570312, 0.1706085205078125, 0.18217086791992188, 0.19373321533203125, 0.20529556274414062, 0.21685791015625, 0.22842025756835938, 0.23998260498046875, 0.2515449523925781, 0.2631072998046875, 0.2746696472167969, 0.28623199462890625, 0.2977943420410156, 0.309356689453125, 0.3209190368652344, 0.33248138427734375, 0.3440437316894531, 0.3556060791015625, 0.3671684265136719, 0.37873077392578125, 0.3902931213378906, 0.40185546875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 4.0, 8.0, 8.0, 17.0, 9.0, 17.0, 20.0, 22.0, 15.0, 19.0, 30.0, 31.0, 34.0, 27.0, 31.0, 42.0, 43.0, 49.0, 51.0, 62.0, 45.0, 43.0, 43.0, 41.0, 35.0, 40.0, 38.0, 28.0, 20.0, 25.0, 18.0, 17.0, 18.0, 15.0, 7.0, 7.0, 5.0, 3.0, 3.0, 5.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.396240234375, -0.38466644287109375, -0.3730926513671875, -0.36151885986328125, -0.349945068359375, -0.33837127685546875, -0.3267974853515625, -0.31522369384765625, -0.30364990234375, -0.29207611083984375, -0.2805023193359375, -0.26892852783203125, -0.257354736328125, -0.24578094482421875, -0.2342071533203125, -0.22263336181640625, -0.2110595703125, -0.19948577880859375, -0.1879119873046875, -0.17633819580078125, -0.164764404296875, -0.15319061279296875, -0.1416168212890625, -0.13004302978515625, -0.11846923828125, -0.10689544677734375, -0.0953216552734375, -0.08374786376953125, -0.072174072265625, -0.06060028076171875, -0.0490264892578125, -0.03745269775390625, -0.02587890625, -0.01430511474609375, -0.0027313232421875, 0.00884246826171875, 0.020416259765625, 0.03199005126953125, 0.0435638427734375, 0.05513763427734375, 0.06671142578125, 0.07828521728515625, 0.0898590087890625, 0.10143280029296875, 0.113006591796875, 0.12458038330078125, 0.1361541748046875, 0.14772796630859375, 0.1593017578125, 0.17087554931640625, 0.1824493408203125, 0.19402313232421875, 0.205596923828125, 0.21717071533203125, 0.2287445068359375, 0.24031829833984375, 0.25189208984375, 0.26346588134765625, 0.2750396728515625, 0.28661346435546875, 0.298187255859375, 0.30976104736328125, 0.3213348388671875, 0.33290863037109375, 0.344482421875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 0.0, 2.0, 2.0, 0.0, 4.0, 13.0, 8.0, 17.0, 20.0, 33.0, 63.0, 104.0, 212.0, 453.0, 1315.0, 6240.0, 67839.0, 750189.0, 205555.0, 13050.0, 2154.0, 670.0, 283.0, 133.0, 77.0, 37.0, 29.0, 13.0, 11.0, 8.0, 13.0, 7.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0], "bins": [-0.373779296875, -0.3652229309082031, -0.35666656494140625, -0.3481101989746094, -0.3395538330078125, -0.3309974670410156, -0.32244110107421875, -0.3138847351074219, -0.305328369140625, -0.2967720031738281, -0.28821563720703125, -0.2796592712402344, -0.2711029052734375, -0.2625465393066406, -0.25399017333984375, -0.24543380737304688, -0.23687744140625, -0.22832107543945312, -0.21976470947265625, -0.21120834350585938, -0.2026519775390625, -0.19409561157226562, -0.18553924560546875, -0.17698287963867188, -0.168426513671875, -0.15987014770507812, -0.15131378173828125, -0.14275741577148438, -0.1342010498046875, -0.12564468383789062, -0.11708831787109375, -0.10853195190429688, -0.0999755859375, -0.09141921997070312, -0.08286285400390625, -0.07430648803710938, -0.0657501220703125, -0.057193756103515625, -0.04863739013671875, -0.040081024169921875, -0.031524658203125, -0.022968292236328125, -0.01441192626953125, -0.005855560302734375, 0.0027008056640625, 0.011257171630859375, 0.01981353759765625, 0.028369903564453125, 0.03692626953125, 0.045482635498046875, 0.05403900146484375, 0.06259536743164062, 0.0711517333984375, 0.07970809936523438, 0.08826446533203125, 0.09682083129882812, 0.105377197265625, 0.11393356323242188, 0.12248992919921875, 0.13104629516601562, 0.1396026611328125, 0.14815902709960938, 0.15671539306640625, 0.16527175903320312, 0.173828125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 4.0, 6.0, 10.0, 15.0, 16.0, 31.0, 36.0, 32.0, 62.0, 72.0, 58.0, 83.0, 95.0, 80.0, 62.0, 69.0, 52.0, 55.0, 41.0, 26.0, 22.0, 17.0, 16.0, 7.0, 10.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-9.071826934814453e-05, -8.79308208823204e-05, -8.514337241649628e-05, -8.235592395067215e-05, -7.956847548484802e-05, -7.67810270190239e-05, -7.399357855319977e-05, -7.120613008737564e-05, -6.841868162155151e-05, -6.563123315572739e-05, -6.284378468990326e-05, -6.005633622407913e-05, -5.7268887758255005e-05, -5.448143929243088e-05, -5.169399082660675e-05, -4.890654236078262e-05, -4.6119093894958496e-05, -4.333164542913437e-05, -4.054419696331024e-05, -3.7756748497486115e-05, -3.496930003166199e-05, -3.218185156583786e-05, -2.9394403100013733e-05, -2.6606954634189606e-05, -2.381950616836548e-05, -2.103205770254135e-05, -1.8244609236717224e-05, -1.5457160770893097e-05, -1.266971230506897e-05, -9.882263839244843e-06, -7.094815373420715e-06, -4.307366907596588e-06, -1.519918441772461e-06, 1.2675300240516663e-06, 4.0549784898757935e-06, 6.842426955699921e-06, 9.629875421524048e-06, 1.2417323887348175e-05, 1.5204772353172302e-05, 1.799222081899643e-05, 2.0779669284820557e-05, 2.3567117750644684e-05, 2.635456621646881e-05, 2.9142014682292938e-05, 3.1929463148117065e-05, 3.471691161394119e-05, 3.750436007976532e-05, 4.029180854558945e-05, 4.3079257011413574e-05, 4.58667054772377e-05, 4.865415394306183e-05, 5.1441602408885956e-05, 5.422905087471008e-05, 5.701649934053421e-05, 5.980394780635834e-05, 6.259139627218246e-05, 6.537884473800659e-05, 6.816629320383072e-05, 7.095374166965485e-05, 7.374119013547897e-05, 7.65286386013031e-05, 7.931608706712723e-05, 8.210353553295135e-05, 8.489098399877548e-05, 8.767843246459961e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 6.0, 4.0, 5.0, 6.0, 10.0, 13.0, 36.0, 35.0, 55.0, 94.0, 123.0, 184.0, 305.0, 580.0, 1040.0, 2280.0, 6029.0, 20240.0, 86001.0, 325236.0, 429309.0, 131866.0, 30540.0, 8570.0, 2999.0, 1283.0, 704.0, 365.0, 225.0, 143.0, 85.0, 50.0, 44.0, 26.0, 21.0, 11.0, 6.0, 7.0, 8.0, 3.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.1124267578125, -0.10843276977539062, -0.10443878173828125, -0.10044479370117188, -0.0964508056640625, -0.09245681762695312, -0.08846282958984375, -0.08446884155273438, -0.080474853515625, -0.07648086547851562, -0.07248687744140625, -0.06849288940429688, -0.0644989013671875, -0.060504913330078125, -0.05651092529296875, -0.052516937255859375, -0.04852294921875, -0.044528961181640625, -0.04053497314453125, -0.036540985107421875, -0.0325469970703125, -0.028553009033203125, -0.02455902099609375, -0.020565032958984375, -0.016571044921875, -0.012577056884765625, -0.00858306884765625, -0.004589080810546875, -0.0005950927734375, 0.003398895263671875, 0.00739288330078125, 0.011386871337890625, 0.015380859375, 0.019374847412109375, 0.02336883544921875, 0.027362823486328125, 0.0313568115234375, 0.035350799560546875, 0.03934478759765625, 0.043338775634765625, 0.047332763671875, 0.051326751708984375, 0.05532073974609375, 0.059314727783203125, 0.0633087158203125, 0.06730270385742188, 0.07129669189453125, 0.07529067993164062, 0.07928466796875, 0.08327865600585938, 0.08727264404296875, 0.09126663208007812, 0.0952606201171875, 0.09925460815429688, 0.10324859619140625, 0.10724258422851562, 0.111236572265625, 0.11523056030273438, 0.11922454833984375, 0.12321853637695312, 0.1272125244140625, 0.13120651245117188, 0.13520050048828125, 0.13919448852539062, 0.1431884765625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 6.0, 2.0, 1.0, 2.0, 7.0, 2.0, 11.0, 26.0, 24.0, 25.0, 39.0, 56.0, 75.0, 84.0, 99.0, 110.0, 101.0, 83.0, 55.0, 58.0, 40.0, 26.0, 25.0, 16.0, 14.0, 8.0, 2.0, 5.0, 6.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18115234375, -0.17539024353027344, -0.16962814331054688, -0.1638660430908203, -0.15810394287109375, -0.1523418426513672, -0.14657974243164062, -0.14081764221191406, -0.1350555419921875, -0.12929344177246094, -0.12353134155273438, -0.11776924133300781, -0.11200714111328125, -0.10624504089355469, -0.10048294067382812, -0.09472084045410156, -0.088958740234375, -0.08319664001464844, -0.07743453979492188, -0.07167243957519531, -0.06591033935546875, -0.06014823913574219, -0.054386138916015625, -0.04862403869628906, -0.0428619384765625, -0.03709983825683594, -0.031337738037109375, -0.025575637817382812, -0.01981353759765625, -0.014051437377929688, -0.008289337158203125, -0.0025272369384765625, 0.00323486328125, 0.008996963500976562, 0.014759063720703125, 0.020521163940429688, 0.02628326416015625, 0.03204536437988281, 0.037807464599609375, 0.04356956481933594, 0.0493316650390625, 0.05509376525878906, 0.060855865478515625, 0.06661796569824219, 0.07238006591796875, 0.07814216613769531, 0.08390426635742188, 0.08966636657714844, 0.095428466796875, 0.10119056701660156, 0.10695266723632812, 0.11271476745605469, 0.11847686767578125, 0.12423896789550781, 0.13000106811523438, 0.13576316833496094, 0.1415252685546875, 0.14728736877441406, 0.15304946899414062, 0.1588115692138672, 0.16457366943359375, 0.1703357696533203, 0.17609786987304688, 0.18185997009277344, 0.1876220703125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 20.0, 59.0, 93.0, 159.0, 208.0, 178.0, 145.0, 69.0, 39.0, 13.0, 5.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.966043710708618, -2.8552286624908447, -2.7444136142730713, -2.633598804473877, -2.5227837562561035, -2.41196870803833, -2.3011536598205566, -2.190338611602783, -2.0795235633850098, -1.9687085151672363, -1.8578935861587524, -1.747078537940979, -1.6362636089324951, -1.5254485607147217, -1.4146335124969482, -1.3038184642791748, -1.1930036544799805, -1.082188606262207, -0.9713736772537231, -0.8605586290359497, -0.749743640422821, -0.6389286518096924, -0.528113603591919, -0.4172986149787903, -0.3064836263656616, -0.19566862285137177, -0.08485361933708191, 0.02596139907836914, 0.1367763876914978, 0.24759137630462646, 0.3584064245223999, 0.46922141313552856, 0.5800361633300781, 0.6908511519432068, 0.8016661405563354, 0.9124811887741089, 1.0232961177825928, 1.1341111660003662, 1.2449262142181396, 1.355741262435913, 1.466556191444397, 1.5773712396621704, 1.6881861686706543, 1.7990012168884277, 1.9098162651062012, 2.0206313133239746, 2.131446361541748, 2.2422611713409424, 2.353076219558716, 2.4638912677764893, 2.5747063159942627, 2.685521125793457, 2.7963361740112305, 2.907151222229004, 3.0179662704467773, 3.128781318664551, 3.239596366882324, 3.3504114151000977, 3.461226463317871, 3.5720415115356445, 3.682856321334839, 3.7936713695526123, 3.9044864177703857, 4.01530122756958, 4.1261162757873535]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 1.0, 0.0, 5.0, 2.0, 0.0, 3.0, 6.0, 9.0, 8.0, 12.0, 24.0, 19.0, 27.0, 31.0, 35.0, 38.0, 39.0, 45.0, 57.0, 50.0, 46.0, 56.0, 53.0, 40.0, 46.0, 45.0, 43.0, 41.0, 31.0, 49.0, 35.0, 32.0, 8.0, 20.0, 14.0, 7.0, 11.0, 8.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.801408052444458, -1.7303305864334106, -1.6592532396316528, -1.5881757736206055, -1.5170984268188477, -1.4460209608078003, -1.374943494796753, -1.3038661479949951, -1.2327886819839478, -1.1617112159729004, -1.0906338691711426, -1.0195564031600952, -0.9484789967536926, -0.87740159034729, -0.8063241243362427, -0.7352467179298401, -0.6641693115234375, -0.5930919051170349, -0.5220144987106323, -0.45093703269958496, -0.3798596262931824, -0.3087822198867798, -0.2377047836780548, -0.16662734746932983, -0.09554994106292725, -0.024472519755363464, 0.04660490155220032, 0.1176823228597641, 0.18875974416732788, 0.25983715057373047, 0.33091458678245544, 0.4019920229911804, 0.473069429397583, 0.5441468358039856, 0.6152242422103882, 0.6863017082214355, 0.7573791146278381, 0.8284565210342407, 0.8995339870452881, 0.9706113934516907, 1.0416887998580933, 1.1127662658691406, 1.1838436126708984, 1.2549210786819458, 1.3259985446929932, 1.397075891494751, 1.4681533575057983, 1.5392308235168457, 1.6103081703186035, 1.6813856363296509, 1.7524629831314087, 1.823540449142456, 1.8946177959442139, 1.9656952619552612, 2.0367727279663086, 2.1078500747680664, 2.178927421569824, 2.250004768371582, 2.321082353591919, 2.3921597003936768, 2.4632370471954346, 2.5343146324157715, 2.6053919792175293, 2.676469326019287, 2.747546911239624]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 7.0, 8.0, 12.0, 20.0, 33.0, 50.0, 89.0, 213.0, 435.0, 1173.0, 4216.0, 21015.0, 334693.0, 3786081.0, 37439.0, 6162.0, 1605.0, 540.0, 230.0, 105.0, 57.0, 42.0, 17.0, 18.0, 11.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.391357421875, -0.3763847351074219, -0.36141204833984375, -0.3464393615722656, -0.3314666748046875, -0.3164939880371094, -0.30152130126953125, -0.2865486145019531, -0.271575927734375, -0.2566032409667969, -0.24163055419921875, -0.22665786743164062, -0.2116851806640625, -0.19671249389648438, -0.18173980712890625, -0.16676712036132812, -0.15179443359375, -0.13682174682617188, -0.12184906005859375, -0.10687637329101562, -0.0919036865234375, -0.07693099975585938, -0.06195831298828125, -0.046985626220703125, -0.032012939453125, -0.017040252685546875, -0.00206756591796875, 0.012905120849609375, 0.0278778076171875, 0.042850494384765625, 0.05782318115234375, 0.07279586791992188, 0.0877685546875, 0.10274124145507812, 0.11771392822265625, 0.13268661499023438, 0.1476593017578125, 0.16263198852539062, 0.17760467529296875, 0.19257736206054688, 0.207550048828125, 0.22252273559570312, 0.23749542236328125, 0.2524681091308594, 0.2674407958984375, 0.2824134826660156, 0.29738616943359375, 0.3123588562011719, 0.32733154296875, 0.3423042297363281, 0.35727691650390625, 0.3722496032714844, 0.3872222900390625, 0.4021949768066406, 0.41716766357421875, 0.4321403503417969, 0.447113037109375, 0.4620857238769531, 0.47705841064453125, 0.4920310974121094, 0.5070037841796875, 0.5219764709472656, 0.5369491577148438, 0.5519218444824219, 0.56689453125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 7.0, 5.0, 2.0, 7.0, 10.0, 13.0, 7.0, 24.0, 25.0, 24.0, 46.0, 46.0, 48.0, 59.0, 56.0, 72.0, 59.0, 63.0, 68.0, 63.0, 46.0, 40.0, 40.0, 37.0, 24.0, 27.0, 31.0, 20.0, 9.0, 12.0, 5.0, 5.0, 4.0, 3.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.123291015625, -0.11966419219970703, -0.11603736877441406, -0.1124105453491211, -0.10878372192382812, -0.10515689849853516, -0.10153007507324219, -0.09790325164794922, -0.09427642822265625, -0.09064960479736328, -0.08702278137207031, -0.08339595794677734, -0.07976913452148438, -0.0761423110961914, -0.07251548767089844, -0.06888866424560547, -0.0652618408203125, -0.06163501739501953, -0.05800819396972656, -0.054381370544433594, -0.050754547119140625, -0.047127723693847656, -0.04350090026855469, -0.03987407684326172, -0.03624725341796875, -0.03262042999267578, -0.028993606567382812, -0.025366783142089844, -0.021739959716796875, -0.018113136291503906, -0.014486312866210938, -0.010859489440917969, -0.007232666015625, -0.0036058425903320312, 2.09808349609375e-05, 0.0036478042602539062, 0.007274627685546875, 0.010901451110839844, 0.014528274536132812, 0.01815509796142578, 0.02178192138671875, 0.02540874481201172, 0.029035568237304688, 0.032662391662597656, 0.036289215087890625, 0.039916038513183594, 0.04354286193847656, 0.04716968536376953, 0.0507965087890625, 0.05442333221435547, 0.05805015563964844, 0.061676979064941406, 0.06530380249023438, 0.06893062591552734, 0.07255744934082031, 0.07618427276611328, 0.07981109619140625, 0.08343791961669922, 0.08706474304199219, 0.09069156646728516, 0.09431838989257812, 0.0979452133178711, 0.10157203674316406, 0.10519886016845703, 0.10882568359375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 1.0, 0.0, 3.0, 10.0, 7.0, 11.0, 9.0, 16.0, 22.0, 35.0, 43.0, 75.0, 90.0, 143.0, 234.0, 351.0, 654.0, 1100.0, 1973.0, 3999.0, 8882.0, 25094.0, 106423.0, 3414723.0, 537367.0, 62136.0, 17260.0, 6690.0, 3059.0, 1582.0, 902.0, 461.0, 301.0, 185.0, 125.0, 82.0, 68.0, 48.0, 34.0, 21.0, 18.0, 8.0, 16.0, 7.0, 4.0, 6.0, 2.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.234619140625, -0.2272491455078125, -0.219879150390625, -0.2125091552734375, -0.20513916015625, -0.1977691650390625, -0.190399169921875, -0.1830291748046875, -0.1756591796875, -0.1682891845703125, -0.160919189453125, -0.1535491943359375, -0.14617919921875, -0.1388092041015625, -0.131439208984375, -0.1240692138671875, -0.11669921875, -0.1093292236328125, -0.101959228515625, -0.0945892333984375, -0.08721923828125, -0.0798492431640625, -0.072479248046875, -0.0651092529296875, -0.0577392578125, -0.0503692626953125, -0.042999267578125, -0.0356292724609375, -0.02825927734375, -0.0208892822265625, -0.013519287109375, -0.0061492919921875, 0.001220703125, 0.0085906982421875, 0.015960693359375, 0.0233306884765625, 0.03070068359375, 0.0380706787109375, 0.045440673828125, 0.0528106689453125, 0.0601806640625, 0.0675506591796875, 0.074920654296875, 0.0822906494140625, 0.08966064453125, 0.0970306396484375, 0.104400634765625, 0.1117706298828125, 0.119140625, 0.1265106201171875, 0.133880615234375, 0.1412506103515625, 0.14862060546875, 0.1559906005859375, 0.163360595703125, 0.1707305908203125, 0.1781005859375, 0.1854705810546875, 0.192840576171875, 0.2002105712890625, 0.20758056640625, 0.2149505615234375, 0.222320556640625, 0.2296905517578125, 0.237060546875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 9.0, 9.0, 14.0, 33.0, 51.0, 131.0, 639.0, 2799.0, 221.0, 83.0, 39.0, 21.0, 10.0, 7.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11627197265625, -0.11305904388427734, -0.10984611511230469, -0.10663318634033203, -0.10342025756835938, -0.10020732879638672, -0.09699440002441406, -0.0937814712524414, -0.09056854248046875, -0.0873556137084961, -0.08414268493652344, -0.08092975616455078, -0.07771682739257812, -0.07450389862060547, -0.07129096984863281, -0.06807804107666016, -0.0648651123046875, -0.061652183532714844, -0.05843925476074219, -0.05522632598876953, -0.052013397216796875, -0.04880046844482422, -0.04558753967285156, -0.042374610900878906, -0.03916168212890625, -0.035948753356933594, -0.03273582458496094, -0.02952289581298828, -0.026309967041015625, -0.02309703826904297, -0.019884109497070312, -0.016671180725097656, -0.013458251953125, -0.010245323181152344, -0.0070323944091796875, -0.0038194656372070312, -0.000606536865234375, 0.0026063919067382812, 0.0058193206787109375, 0.009032249450683594, 0.01224517822265625, 0.015458106994628906, 0.018671035766601562, 0.02188396453857422, 0.025096893310546875, 0.02830982208251953, 0.03152275085449219, 0.034735679626464844, 0.0379486083984375, 0.041161537170410156, 0.04437446594238281, 0.04758739471435547, 0.050800323486328125, 0.05401325225830078, 0.05722618103027344, 0.060439109802246094, 0.06365203857421875, 0.0668649673461914, 0.07007789611816406, 0.07329082489013672, 0.07650375366210938, 0.07971668243408203, 0.08292961120605469, 0.08614253997802734, 0.08935546875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 5.0, 10.0, 18.0, 18.0, 35.0, 54.0, 69.0, 96.0, 130.0, 121.0, 130.0, 122.0, 80.0, 54.0, 28.0, 11.0, 12.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31168490648269653, -0.3032430410385132, -0.29480117559432983, -0.28635933995246887, -0.2779174745082855, -0.2694756090641022, -0.2610337734222412, -0.25259190797805786, -0.2441500425338745, -0.23570817708969116, -0.227266326546669, -0.21882447600364685, -0.2103826105594635, -0.20194074511528015, -0.193498894572258, -0.18505704402923584, -0.1766151785850525, -0.16817331314086914, -0.15973146259784698, -0.15128961205482483, -0.14284774661064148, -0.13440588116645813, -0.12596403062343597, -0.11752217262983322, -0.10908031463623047, -0.10063845664262772, -0.09219659864902496, -0.08375474065542221, -0.07531288266181946, -0.0668710246682167, -0.05842916667461395, -0.0499873086810112, -0.04154545068740845, -0.033103592693805695, -0.024661734700202942, -0.01621987670660019, -0.0077780187129974365, 0.0006638392806053162, 0.009105697274208069, 0.01754755526781082, 0.025989413261413574, 0.03443127125501633, 0.04287312924861908, 0.05131498724222183, 0.059756845235824585, 0.06819870322942734, 0.07664056122303009, 0.08508241921663284, 0.0935242772102356, 0.10196613520383835, 0.1104079931974411, 0.11884985119104385, 0.1272917091846466, 0.13573357462882996, 0.1441754251718521, 0.15261727571487427, 0.16105914115905762, 0.16950100660324097, 0.17794285714626312, 0.18638470768928528, 0.19482657313346863, 0.20326843857765198, 0.21171028912067413, 0.2201521396636963, 0.22859400510787964]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 3.0, 5.0, 7.0, 8.0, 11.0, 17.0, 11.0, 11.0, 22.0, 19.0, 23.0, 31.0, 37.0, 41.0, 41.0, 36.0, 40.0, 47.0, 46.0, 49.0, 45.0, 46.0, 49.0, 40.0, 34.0, 35.0, 31.0, 37.0, 32.0, 24.0, 24.0, 21.0, 21.0, 19.0, 9.0, 7.0, 6.0, 11.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0], "bins": [-0.16033828258514404, -0.15594208240509033, -0.15154588222503662, -0.1471496969461441, -0.1427534967660904, -0.13835729658603668, -0.13396109640598297, -0.12956489622592926, -0.12516871094703674, -0.12077251076698303, -0.11637631803750992, -0.11198011785745621, -0.1075839251279831, -0.10318772494792938, -0.09879152476787567, -0.09439532458782196, -0.08999912440776825, -0.08560292422771454, -0.08120673149824142, -0.07681053131818771, -0.0724143385887146, -0.06801813840866089, -0.06362193822860718, -0.059225741773843765, -0.05482954531908035, -0.05043334886431694, -0.04603715240955353, -0.04164095222949982, -0.037244755774736404, -0.03284855931997299, -0.02845236100256443, -0.02405616268515587, -0.019659966230392456, -0.015263768844306469, -0.010867571458220482, -0.006471374072134495, -0.0020751766860485077, 0.002321019768714905, 0.0067172180861234665, 0.011113416403532028, 0.01550961285829544, 0.019905809313058853, 0.024302007630467415, 0.028698205947875977, 0.03309440240263939, 0.0374905988574028, 0.04188679903745651, 0.046282995492219925, 0.05067919194698334, 0.05507538840174675, 0.05947158485651016, 0.06386778503656387, 0.06826397776603699, 0.0726601779460907, 0.07705637812614441, 0.08145257830619812, 0.08584877103567123, 0.09024497121572495, 0.09464116394519806, 0.09903736412525177, 0.10343356430530548, 0.1078297570347786, 0.1122259572148323, 0.11662214994430542, 0.12101835012435913]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 6.0, 6.0, 2.0, 10.0, 14.0, 24.0, 22.0, 52.0, 82.0, 152.0, 337.0, 799.0, 2335.0, 7439.0, 29894.0, 139224.0, 431527.0, 327915.0, 82948.0, 18250.0, 4723.0, 1607.0, 600.0, 266.0, 111.0, 81.0, 58.0, 30.0, 20.0, 11.0, 7.0, 7.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.318603515625, -0.30859375, -0.298583984375, -0.28857421875, -0.278564453125, -0.2685546875, -0.258544921875, -0.24853515625, -0.238525390625, -0.228515625, -0.218505859375, -0.20849609375, -0.198486328125, -0.1884765625, -0.178466796875, -0.16845703125, -0.158447265625, -0.1484375, -0.138427734375, -0.12841796875, -0.118408203125, -0.1083984375, -0.098388671875, -0.08837890625, -0.078369140625, -0.068359375, -0.058349609375, -0.04833984375, -0.038330078125, -0.0283203125, -0.018310546875, -0.00830078125, 0.001708984375, 0.01171875, 0.021728515625, 0.03173828125, 0.041748046875, 0.0517578125, 0.061767578125, 0.07177734375, 0.081787109375, 0.091796875, 0.101806640625, 0.11181640625, 0.121826171875, 0.1318359375, 0.141845703125, 0.15185546875, 0.161865234375, 0.171875, 0.181884765625, 0.19189453125, 0.201904296875, 0.2119140625, 0.221923828125, 0.23193359375, 0.241943359375, 0.251953125, 0.261962890625, 0.27197265625, 0.281982421875, 0.2919921875, 0.302001953125, 0.31201171875, 0.322021484375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 8.0, 4.0, 9.0, 13.0, 17.0, 24.0, 21.0, 26.0, 44.0, 52.0, 64.0, 69.0, 68.0, 52.0, 77.0, 68.0, 66.0, 52.0, 52.0, 46.0, 29.0, 25.0, 36.0, 23.0, 16.0, 20.0, 7.0, 8.0, 6.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1275634765625, -0.12363147735595703, -0.11969947814941406, -0.1157674789428711, -0.11183547973632812, -0.10790348052978516, -0.10397148132324219, -0.10003948211669922, -0.09610748291015625, -0.09217548370361328, -0.08824348449707031, -0.08431148529052734, -0.08037948608398438, -0.0764474868774414, -0.07251548767089844, -0.06858348846435547, -0.0646514892578125, -0.06071949005126953, -0.05678749084472656, -0.052855491638183594, -0.048923492431640625, -0.044991493225097656, -0.04105949401855469, -0.03712749481201172, -0.03319549560546875, -0.02926349639892578, -0.025331497192382812, -0.021399497985839844, -0.017467498779296875, -0.013535499572753906, -0.009603500366210938, -0.005671501159667969, -0.001739501953125, 0.0021924972534179688, 0.0061244964599609375, 0.010056495666503906, 0.013988494873046875, 0.017920494079589844, 0.021852493286132812, 0.02578449249267578, 0.02971649169921875, 0.03364849090576172, 0.03758049011230469, 0.041512489318847656, 0.045444488525390625, 0.049376487731933594, 0.05330848693847656, 0.05724048614501953, 0.0611724853515625, 0.06510448455810547, 0.06903648376464844, 0.0729684829711914, 0.07690048217773438, 0.08083248138427734, 0.08476448059082031, 0.08869647979736328, 0.09262847900390625, 0.09656047821044922, 0.10049247741699219, 0.10442447662353516, 0.10835647583007812, 0.1122884750366211, 0.11622047424316406, 0.12015247344970703, 0.12408447265625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 6.0, 8.0, 11.0, 15.0, 17.0, 28.0, 38.0, 69.0, 117.0, 218.0, 352.0, 656.0, 1392.0, 3760.0, 14057.0, 88506.0, 553851.0, 327574.0, 44475.0, 8481.0, 2609.0, 1105.0, 498.0, 291.0, 137.0, 82.0, 59.0, 47.0, 25.0, 16.0, 10.0, 6.0, 7.0, 3.0, 3.0, 7.0, 5.0, 4.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.35009765625, -0.3383598327636719, -0.32662200927734375, -0.3148841857910156, -0.3031463623046875, -0.2914085388183594, -0.27967071533203125, -0.2679328918457031, -0.256195068359375, -0.24445724487304688, -0.23271942138671875, -0.22098159790039062, -0.2092437744140625, -0.19750595092773438, -0.18576812744140625, -0.17403030395507812, -0.16229248046875, -0.15055465698242188, -0.13881683349609375, -0.12707901000976562, -0.1153411865234375, -0.10360336303710938, -0.09186553955078125, -0.08012771606445312, -0.068389892578125, -0.056652069091796875, -0.04491424560546875, -0.033176422119140625, -0.0214385986328125, -0.009700775146484375, 0.00203704833984375, 0.013774871826171875, 0.0255126953125, 0.037250518798828125, 0.04898834228515625, 0.060726165771484375, 0.0724639892578125, 0.08420181274414062, 0.09593963623046875, 0.10767745971679688, 0.119415283203125, 0.13115310668945312, 0.14289093017578125, 0.15462875366210938, 0.1663665771484375, 0.17810440063476562, 0.18984222412109375, 0.20158004760742188, 0.21331787109375, 0.22505569458007812, 0.23679351806640625, 0.24853134155273438, 0.2602691650390625, 0.2720069885253906, 0.28374481201171875, 0.2954826354980469, 0.307220458984375, 0.3189582824707031, 0.33069610595703125, 0.3424339294433594, 0.3541717529296875, 0.3659095764160156, 0.37764739990234375, 0.3893852233886719, 0.401123046875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 7.0, 3.0, 12.0, 15.0, 16.0, 17.0, 16.0, 20.0, 29.0, 40.0, 42.0, 42.0, 45.0, 41.0, 44.0, 61.0, 53.0, 44.0, 57.0, 49.0, 53.0, 39.0, 42.0, 24.0, 40.0, 27.0, 20.0, 14.0, 17.0, 21.0, 9.0, 9.0, 7.0, 6.0, 2.0, 5.0, 0.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.46630859375, -0.45105743408203125, -0.4358062744140625, -0.42055511474609375, -0.405303955078125, -0.39005279541015625, -0.3748016357421875, -0.35955047607421875, -0.34429931640625, -0.32904815673828125, -0.3137969970703125, -0.29854583740234375, -0.283294677734375, -0.26804351806640625, -0.2527923583984375, -0.23754119873046875, -0.2222900390625, -0.20703887939453125, -0.1917877197265625, -0.17653656005859375, -0.161285400390625, -0.14603424072265625, -0.1307830810546875, -0.11553192138671875, -0.10028076171875, -0.08502960205078125, -0.0697784423828125, -0.05452728271484375, -0.039276123046875, -0.02402496337890625, -0.0087738037109375, 0.00647735595703125, 0.021728515625, 0.03697967529296875, 0.0522308349609375, 0.06748199462890625, 0.082733154296875, 0.09798431396484375, 0.1132354736328125, 0.12848663330078125, 0.14373779296875, 0.15898895263671875, 0.1742401123046875, 0.18949127197265625, 0.204742431640625, 0.21999359130859375, 0.2352447509765625, 0.25049591064453125, 0.2657470703125, 0.28099822998046875, 0.2962493896484375, 0.31150054931640625, 0.326751708984375, 0.34200286865234375, 0.3572540283203125, 0.37250518798828125, 0.38775634765625, 0.40300750732421875, 0.4182586669921875, 0.43350982666015625, 0.448760986328125, 0.46401214599609375, 0.4792633056640625, 0.49451446533203125, 0.509765625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 4.0, 3.0, 6.0, 8.0, 14.0, 14.0, 11.0, 22.0, 28.0, 56.0, 71.0, 129.0, 219.0, 388.0, 1022.0, 3518.0, 33294.0, 866228.0, 133544.0, 7227.0, 1513.0, 545.0, 249.0, 132.0, 100.0, 61.0, 34.0, 30.0, 26.0, 9.0, 11.0, 8.0, 8.0, 2.0, 6.0, 6.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.36376953125, -0.3519172668457031, -0.34006500244140625, -0.3282127380371094, -0.3163604736328125, -0.3045082092285156, -0.29265594482421875, -0.2808036804199219, -0.268951416015625, -0.2570991516113281, -0.24524688720703125, -0.23339462280273438, -0.2215423583984375, -0.20969009399414062, -0.19783782958984375, -0.18598556518554688, -0.17413330078125, -0.16228103637695312, -0.15042877197265625, -0.13857650756835938, -0.1267242431640625, -0.11487197875976562, -0.10301971435546875, -0.09116744995117188, -0.079315185546875, -0.06746292114257812, -0.05561065673828125, -0.043758392333984375, -0.0319061279296875, -0.020053863525390625, -0.00820159912109375, 0.003650665283203125, 0.0155029296875, 0.027355194091796875, 0.03920745849609375, 0.051059722900390625, 0.0629119873046875, 0.07476425170898438, 0.08661651611328125, 0.09846878051757812, 0.110321044921875, 0.12217330932617188, 0.13402557373046875, 0.14587783813476562, 0.1577301025390625, 0.16958236694335938, 0.18143463134765625, 0.19328689575195312, 0.20513916015625, 0.21699142456054688, 0.22884368896484375, 0.24069595336914062, 0.2525482177734375, 0.2644004821777344, 0.27625274658203125, 0.2881050109863281, 0.299957275390625, 0.3118095397949219, 0.32366180419921875, 0.3355140686035156, 0.3473663330078125, 0.3592185974121094, 0.37107086181640625, 0.3829231262207031, 0.394775390625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 4.0, 7.0, 28.0, 43.0, 92.0, 147.0, 236.0, 206.0, 126.0, 64.0, 26.0, 11.0, 7.0, 9.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.85860824584961e-05, -9.193085134029388e-05, -8.527562022209167e-05, -7.862038910388947e-05, -7.196515798568726e-05, -6.530992686748505e-05, -5.865469574928284e-05, -5.199946463108063e-05, -4.534423351287842e-05, -3.868900239467621e-05, -3.2033771276474e-05, -2.537854015827179e-05, -1.872330904006958e-05, -1.206807792186737e-05, -5.412846803665161e-06, 1.2423843145370483e-06, 7.897615432739258e-06, 1.4552846550941467e-05, 2.1208077669143677e-05, 2.7863308787345886e-05, 3.4518539905548096e-05, 4.1173771023750305e-05, 4.7829002141952515e-05, 5.4484233260154724e-05, 6.113946437835693e-05, 6.779469549655914e-05, 7.444992661476135e-05, 8.110515773296356e-05, 8.776038885116577e-05, 9.441561996936798e-05, 0.00010107085108757019, 0.0001077260822057724, 0.00011438131332397461, 0.00012103654444217682, 0.00012769177556037903, 0.00013434700667858124, 0.00014100223779678345, 0.00014765746891498566, 0.00015431270003318787, 0.00016096793115139008, 0.00016762316226959229, 0.0001742783933877945, 0.0001809336245059967, 0.00018758885562419891, 0.00019424408674240112, 0.00020089931786060333, 0.00020755454897880554, 0.00021420978009700775, 0.00022086501121520996, 0.00022752024233341217, 0.00023417547345161438, 0.0002408307045698166, 0.0002474859356880188, 0.000254141166806221, 0.0002607963979244232, 0.00026745162904262543, 0.00027410686016082764, 0.00028076209127902985, 0.00028741732239723206, 0.00029407255351543427, 0.0003007277846336365, 0.0003073830157518387, 0.0003140382468700409, 0.0003206934779882431, 0.0003273487091064453]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 7.0, 10.0, 5.0, 21.0, 19.0, 24.0, 52.0, 81.0, 122.0, 285.0, 638.0, 1471.0, 5035.0, 27751.0, 344875.0, 607786.0, 49581.0, 7312.0, 1965.0, 752.0, 324.0, 174.0, 98.0, 62.0, 31.0, 24.0, 12.0, 10.0, 10.0, 7.0, 4.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2783203125, -0.2712078094482422, -0.2640953063964844, -0.25698280334472656, -0.24987030029296875, -0.24275779724121094, -0.23564529418945312, -0.2285327911376953, -0.2214202880859375, -0.2143077850341797, -0.20719528198242188, -0.20008277893066406, -0.19297027587890625, -0.18585777282714844, -0.17874526977539062, -0.1716327667236328, -0.164520263671875, -0.1574077606201172, -0.15029525756835938, -0.14318275451660156, -0.13607025146484375, -0.12895774841308594, -0.12184524536132812, -0.11473274230957031, -0.1076202392578125, -0.10050773620605469, -0.09339523315429688, -0.08628273010253906, -0.07917022705078125, -0.07205772399902344, -0.06494522094726562, -0.05783271789550781, -0.05072021484375, -0.04360771179199219, -0.036495208740234375, -0.029382705688476562, -0.02227020263671875, -0.015157699584960938, -0.008045196533203125, -0.0009326934814453125, 0.0061798095703125, 0.013292312622070312, 0.020404815673828125, 0.027517318725585938, 0.03462982177734375, 0.04174232482910156, 0.048854827880859375, 0.05596733093261719, 0.063079833984375, 0.07019233703613281, 0.07730484008789062, 0.08441734313964844, 0.09152984619140625, 0.09864234924316406, 0.10575485229492188, 0.11286735534667969, 0.1199798583984375, 0.1270923614501953, 0.13420486450195312, 0.14131736755371094, 0.14842987060546875, 0.15554237365722656, 0.16265487670898438, 0.1697673797607422, 0.1768798828125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 5.0, 1.0, 7.0, 6.0, 5.0, 6.0, 7.0, 21.0, 14.0, 31.0, 43.0, 83.0, 85.0, 124.0, 126.0, 125.0, 101.0, 68.0, 50.0, 23.0, 17.0, 17.0, 7.0, 7.0, 7.0, 5.0, 2.0, 4.0, 4.0, 1.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.156005859375, -0.147491455078125, -0.13897705078125, -0.130462646484375, -0.1219482421875, -0.113433837890625, -0.10491943359375, -0.096405029296875, -0.087890625, -0.079376220703125, -0.07086181640625, -0.062347412109375, -0.0538330078125, -0.045318603515625, -0.03680419921875, -0.028289794921875, -0.019775390625, -0.011260986328125, -0.00274658203125, 0.005767822265625, 0.0142822265625, 0.022796630859375, 0.03131103515625, 0.039825439453125, 0.04833984375, 0.056854248046875, 0.06536865234375, 0.073883056640625, 0.0823974609375, 0.090911865234375, 0.09942626953125, 0.107940673828125, 0.116455078125, 0.124969482421875, 0.13348388671875, 0.141998291015625, 0.1505126953125, 0.159027099609375, 0.16754150390625, 0.176055908203125, 0.1845703125, 0.193084716796875, 0.20159912109375, 0.210113525390625, 0.2186279296875, 0.227142333984375, 0.23565673828125, 0.244171142578125, 0.252685546875, 0.261199951171875, 0.26971435546875, 0.278228759765625, 0.2867431640625, 0.295257568359375, 0.30377197265625, 0.312286376953125, 0.32080078125, 0.329315185546875, 0.33782958984375, 0.346343994140625, 0.3548583984375, 0.363372802734375, 0.37188720703125, 0.380401611328125, 0.388916015625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 7.0, 1.0, 7.0, 4.0, 21.0, 53.0, 139.0, 197.0, 238.0, 184.0, 94.0, 44.0, 14.0, 7.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.593186616897583, -3.4267771244049072, -3.2603676319122314, -3.0939581394195557, -2.92754864692688, -2.761139154434204, -2.5947296619415283, -2.4283201694488525, -2.2619106769561768, -2.095501184463501, -1.9290916919708252, -1.7626821994781494, -1.5962727069854736, -1.4298632144927979, -1.263453722000122, -1.0970442295074463, -0.9306347370147705, -0.7642252445220947, -0.597815752029419, -0.43140625953674316, -0.2649967670440674, -0.0985872745513916, 0.06782221794128418, 0.23423171043395996, 0.40064120292663574, 0.5670506954193115, 0.7334601879119873, 0.8998696804046631, 1.0662791728973389, 1.2326886653900146, 1.3990981578826904, 1.5655076503753662, 1.731917381286621, 1.8983268737792969, 2.0647363662719727, 2.2311458587646484, 2.397555351257324, 2.56396484375, 2.730374336242676, 2.8967838287353516, 3.0631933212280273, 3.229602813720703, 3.396012306213379, 3.5624217987060547, 3.7288312911987305, 3.8952407836914062, 4.061650276184082, 4.228059768676758, 4.394469261169434, 4.560878753662109, 4.727288246154785, 4.893697738647461, 5.060107231140137, 5.2265167236328125, 5.392926216125488, 5.559335708618164, 5.72574520111084, 5.892154693603516, 6.058564186096191, 6.224973678588867, 6.391383171081543, 6.557792663574219, 6.7242021560668945, 6.89061164855957, 7.057021141052246]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 7.0, 4.0, 3.0, 5.0, 9.0, 9.0, 10.0, 8.0, 21.0, 25.0, 22.0, 27.0, 31.0, 34.0, 27.0, 41.0, 52.0, 63.0, 60.0, 68.0, 66.0, 54.0, 56.0, 53.0, 31.0, 36.0, 37.0, 21.0, 23.0, 24.0, 18.0, 13.0, 8.0, 15.0, 3.0, 7.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-3.0950942039489746, -3.002689838409424, -2.910285472869873, -2.8178813457489014, -2.7254769802093506, -2.6330726146698, -2.540668487548828, -2.4482641220092773, -2.3558597564697266, -2.263455390930176, -2.171051025390625, -2.0786468982696533, -1.9862425327301025, -1.8938381671905518, -1.8014339208602905, -1.7090296745300293, -1.6166253089904785, -1.5242209434509277, -1.4318166971206665, -1.3394124507904053, -1.2470080852508545, -1.1546037197113037, -1.0621994733810425, -0.9697951674461365, -0.8773908615112305, -0.7849865555763245, -0.6925822496414185, -0.6001779437065125, -0.5077736377716064, -0.41536933183670044, -0.32296502590179443, -0.23056071996688843, -0.13815641403198242, -0.045752108097076416, 0.04665219783782959, 0.1390565037727356, 0.2314608097076416, 0.3238651156425476, 0.4162694215774536, 0.5086737275123596, 0.6010780334472656, 0.6934823393821716, 0.7858866453170776, 0.8782909512519836, 0.9706952571868896, 1.0630996227264404, 1.1555038690567017, 1.247908115386963, 1.3403124809265137, 1.4327168464660645, 1.5251210927963257, 1.617525339126587, 1.7099297046661377, 1.8023340702056885, 1.8947383165359497, 1.987142562866211, 2.0795469284057617, 2.1719512939453125, 2.2643556594848633, 2.356759786605835, 2.4491641521453857, 2.5415685176849365, 2.633972644805908, 2.726377010345459, 2.8187813758850098]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 11.0, 6.0, 9.0, 16.0, 29.0, 38.0, 78.0, 111.0, 200.0, 362.0, 767.0, 1612.0, 4343.0, 15440.0, 94755.0, 3836837.0, 204416.0, 24747.0, 6272.0, 2166.0, 942.0, 469.0, 271.0, 145.0, 94.0, 42.0, 31.0, 17.0, 14.0, 10.0, 11.0, 8.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2391357421875, -0.22902488708496094, -0.21891403198242188, -0.2088031768798828, -0.19869232177734375, -0.1885814666748047, -0.17847061157226562, -0.16835975646972656, -0.1582489013671875, -0.14813804626464844, -0.13802719116210938, -0.1279163360595703, -0.11780548095703125, -0.10769462585449219, -0.09758377075195312, -0.08747291564941406, -0.077362060546875, -0.06725120544433594, -0.057140350341796875, -0.04702949523925781, -0.03691864013671875, -0.026807785034179688, -0.016696929931640625, -0.0065860748291015625, 0.0035247802734375, 0.013635635375976562, 0.023746490478515625, 0.03385734558105469, 0.04396820068359375, 0.05407905578613281, 0.06418991088867188, 0.07430076599121094, 0.08441162109375, 0.09452247619628906, 0.10463333129882812, 0.11474418640136719, 0.12485504150390625, 0.1349658966064453, 0.14507675170898438, 0.15518760681152344, 0.1652984619140625, 0.17540931701660156, 0.18552017211914062, 0.1956310272216797, 0.20574188232421875, 0.2158527374267578, 0.22596359252929688, 0.23607444763183594, 0.246185302734375, 0.25629615783691406, 0.2664070129394531, 0.2765178680419922, 0.28662872314453125, 0.2967395782470703, 0.3068504333496094, 0.31696128845214844, 0.3270721435546875, 0.33718299865722656, 0.3472938537597656, 0.3574047088623047, 0.36751556396484375, 0.3776264190673828, 0.3877372741699219, 0.39784812927246094, 0.407958984375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 7.0, 8.0, 3.0, 8.0, 15.0, 20.0, 30.0, 26.0, 37.0, 54.0, 44.0, 40.0, 62.0, 67.0, 69.0, 69.0, 67.0, 46.0, 61.0, 52.0, 40.0, 33.0, 30.0, 21.0, 11.0, 19.0, 12.0, 13.0, 8.0, 4.0, 7.0, 3.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1285400390625, -0.1246480941772461, -0.12075614929199219, -0.11686420440673828, -0.11297225952148438, -0.10908031463623047, -0.10518836975097656, -0.10129642486572266, -0.09740447998046875, -0.09351253509521484, -0.08962059020996094, -0.08572864532470703, -0.08183670043945312, -0.07794475555419922, -0.07405281066894531, -0.0701608657836914, -0.0662689208984375, -0.062376976013183594, -0.05848503112792969, -0.05459308624267578, -0.050701141357421875, -0.04680919647216797, -0.04291725158691406, -0.039025306701660156, -0.03513336181640625, -0.031241416931152344, -0.027349472045898438, -0.02345752716064453, -0.019565582275390625, -0.01567363739013672, -0.011781692504882812, -0.007889747619628906, -0.003997802734375, -0.00010585784912109375, 0.0037860870361328125, 0.007678031921386719, 0.011569976806640625, 0.015461921691894531, 0.019353866577148438, 0.023245811462402344, 0.02713775634765625, 0.031029701232910156, 0.03492164611816406, 0.03881359100341797, 0.042705535888671875, 0.04659748077392578, 0.05048942565917969, 0.054381370544433594, 0.0582733154296875, 0.062165260314941406, 0.06605720520019531, 0.06994915008544922, 0.07384109497070312, 0.07773303985595703, 0.08162498474121094, 0.08551692962646484, 0.08940887451171875, 0.09330081939697266, 0.09719276428222656, 0.10108470916748047, 0.10497665405273438, 0.10886859893798828, 0.11276054382324219, 0.1166524887084961, 0.12054443359375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 8.0, 8.0, 10.0, 10.0, 14.0, 29.0, 36.0, 34.0, 58.0, 90.0, 122.0, 186.0, 302.0, 537.0, 942.0, 1979.0, 4353.0, 10732.0, 34759.0, 177456.0, 3546202.0, 339642.0, 51547.0, 14550.0, 5517.0, 2377.0, 1160.0, 610.0, 330.0, 221.0, 147.0, 87.0, 74.0, 32.0, 39.0, 27.0, 13.0, 12.0, 14.0, 6.0, 8.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.251708984375, -0.24422645568847656, -0.23674392700195312, -0.2292613983154297, -0.22177886962890625, -0.2142963409423828, -0.20681381225585938, -0.19933128356933594, -0.1918487548828125, -0.18436622619628906, -0.17688369750976562, -0.1694011688232422, -0.16191864013671875, -0.1544361114501953, -0.14695358276367188, -0.13947105407714844, -0.131988525390625, -0.12450599670410156, -0.11702346801757812, -0.10954093933105469, -0.10205841064453125, -0.09457588195800781, -0.08709335327148438, -0.07961082458496094, -0.0721282958984375, -0.06464576721191406, -0.057163238525390625, -0.04968070983886719, -0.04219818115234375, -0.03471565246582031, -0.027233123779296875, -0.019750595092773438, -0.01226806640625, -0.0047855377197265625, 0.002696990966796875, 0.010179519653320312, 0.01766204833984375, 0.025144577026367188, 0.032627105712890625, 0.04010963439941406, 0.0475921630859375, 0.05507469177246094, 0.06255722045898438, 0.07003974914550781, 0.07752227783203125, 0.08500480651855469, 0.09248733520507812, 0.09996986389160156, 0.107452392578125, 0.11493492126464844, 0.12241744995117188, 0.1298999786376953, 0.13738250732421875, 0.1448650360107422, 0.15234756469726562, 0.15983009338378906, 0.1673126220703125, 0.17479515075683594, 0.18227767944335938, 0.1897602081298828, 0.19724273681640625, 0.2047252655029297, 0.21220779418945312, 0.21969032287597656, 0.2271728515625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 4.0, 3.0, 6.0, 9.0, 19.0, 16.0, 25.0, 56.0, 90.0, 179.0, 385.0, 2362.0, 497.0, 190.0, 97.0, 45.0, 20.0, 19.0, 12.0, 15.0, 9.0, 5.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0634765625, -0.06109428405761719, -0.058712005615234375, -0.05632972717285156, -0.05394744873046875, -0.05156517028808594, -0.049182891845703125, -0.04680061340332031, -0.0444183349609375, -0.04203605651855469, -0.039653778076171875, -0.03727149963378906, -0.03488922119140625, -0.03250694274902344, -0.030124664306640625, -0.027742385864257812, -0.025360107421875, -0.022977828979492188, -0.020595550537109375, -0.018213272094726562, -0.01583099365234375, -0.013448715209960938, -0.011066436767578125, -0.008684158325195312, -0.0063018798828125, -0.0039196014404296875, -0.001537322998046875, 0.0008449554443359375, 0.00322723388671875, 0.0056095123291015625, 0.007991790771484375, 0.010374069213867188, 0.01275634765625, 0.015138626098632812, 0.017520904541015625, 0.019903182983398438, 0.02228546142578125, 0.024667739868164062, 0.027050018310546875, 0.029432296752929688, 0.0318145751953125, 0.03419685363769531, 0.036579132080078125, 0.03896141052246094, 0.04134368896484375, 0.04372596740722656, 0.046108245849609375, 0.04849052429199219, 0.050872802734375, 0.05325508117675781, 0.055637359619140625, 0.05801963806152344, 0.06040191650390625, 0.06278419494628906, 0.06516647338867188, 0.06754875183105469, 0.0699310302734375, 0.07231330871582031, 0.07469558715820312, 0.07707786560058594, 0.07946014404296875, 0.08184242248535156, 0.08422470092773438, 0.08660697937011719, 0.0889892578125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 5.0, 7.0, 19.0, 28.0, 37.0, 32.0, 58.0, 67.0, 95.0, 97.0, 96.0, 106.0, 74.0, 71.0, 56.0, 47.0, 23.0, 23.0, 14.0, 11.0, 10.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32781243324279785, -0.3197641670703888, -0.31171587109565735, -0.3036676049232483, -0.29561933875083923, -0.2875710427761078, -0.27952277660369873, -0.2714745104312897, -0.2634262144565582, -0.25537794828414917, -0.24732966721057892, -0.23928138613700867, -0.23123310506343842, -0.22318482398986816, -0.2151365578174591, -0.20708827674388885, -0.1990400105714798, -0.19099172949790955, -0.1829434633255005, -0.17489518225193024, -0.16684690117835999, -0.15879863500595093, -0.15075035393238068, -0.14270207285881042, -0.13465380668640137, -0.12660552561283112, -0.11855725198984146, -0.1105089783668518, -0.10246069729328156, -0.0944124236702919, -0.08636415004730225, -0.078315868973732, -0.07026758790016174, -0.06221931055188179, -0.05417103320360184, -0.04612275958061218, -0.03807448223233223, -0.030026204884052277, -0.021977931261062622, -0.013929653912782669, -0.005881376564502716, 0.0021668998524546623, 0.01021517626941204, 0.018263451755046844, 0.026311729103326797, 0.03436000645160675, 0.042408280074596405, 0.05045655742287636, 0.05850483477115631, 0.06655310839414597, 0.07460138946771622, 0.08264966309070587, 0.09069794416427612, 0.09874621778726578, 0.10679449141025543, 0.11484277248382568, 0.12289104610681534, 0.130939319729805, 0.13898760080337524, 0.1470358669757843, 0.15508414804935455, 0.1631324291229248, 0.17118069529533386, 0.1792289763689041, 0.18727725744247437]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 8.0, 11.0, 5.0, 8.0, 8.0, 18.0, 16.0, 9.0, 18.0, 33.0, 25.0, 26.0, 33.0, 36.0, 47.0, 47.0, 34.0, 41.0, 34.0, 34.0, 48.0, 47.0, 45.0, 35.0, 39.0, 40.0, 36.0, 29.0, 31.0, 19.0, 29.0, 16.0, 14.0, 13.0, 16.0, 13.0, 6.0, 8.0, 2.0, 7.0, 2.0, 6.0, 5.0, 6.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.209530770778656, -0.20335735380649567, -0.19718393683433533, -0.19101053476333618, -0.18483711779117584, -0.1786637008190155, -0.17249029874801636, -0.16631688177585602, -0.16014346480369568, -0.15397004783153534, -0.147796630859375, -0.14162322878837585, -0.13544981181621552, -0.12927639484405518, -0.12310298532247543, -0.11692957580089569, -0.11075615882873535, -0.10458274185657501, -0.09840933233499527, -0.09223592281341553, -0.08606250584125519, -0.07988908886909485, -0.0737156793475151, -0.06754226982593536, -0.061368852853775024, -0.055195439606904984, -0.04902202636003494, -0.0428486131131649, -0.03667519986629486, -0.03050178661942482, -0.02432837337255478, -0.018154960125684738, -0.011981546878814697, -0.005808133631944656, 0.0003652796149253845, 0.006538692861795425, 0.012712106108665466, 0.018885519355535507, 0.025058932602405548, 0.03123234584927559, 0.03740575909614563, 0.04357917234301567, 0.04975258558988571, 0.05592599883675575, 0.06209941208362579, 0.06827282905578613, 0.07444623857736588, 0.08061964809894562, 0.08679306507110596, 0.0929664820432663, 0.09913989156484604, 0.10531330108642578, 0.11148671805858612, 0.11766013503074646, 0.1238335445523262, 0.13000695407390594, 0.13618037104606628, 0.14235378801822662, 0.14852720499038696, 0.1547006070613861, 0.16087402403354645, 0.1670474410057068, 0.17322084307670593, 0.17939426004886627, 0.1855676770210266]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 9.0, 8.0, 13.0, 21.0, 23.0, 47.0, 65.0, 129.0, 264.0, 494.0, 1185.0, 3064.0, 9838.0, 36682.0, 149234.0, 404492.0, 317176.0, 92687.0, 22877.0, 6299.0, 2178.0, 899.0, 398.0, 198.0, 100.0, 61.0, 39.0, 22.0, 14.0, 11.0, 8.0, 3.0, 8.0, 6.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.269775390625, -0.26224517822265625, -0.2547149658203125, -0.24718475341796875, -0.239654541015625, -0.23212432861328125, -0.2245941162109375, -0.21706390380859375, -0.20953369140625, -0.20200347900390625, -0.1944732666015625, -0.18694305419921875, -0.179412841796875, -0.17188262939453125, -0.1643524169921875, -0.15682220458984375, -0.1492919921875, -0.14176177978515625, -0.1342315673828125, -0.12670135498046875, -0.119171142578125, -0.11164093017578125, -0.1041107177734375, -0.09658050537109375, -0.08905029296875, -0.08152008056640625, -0.0739898681640625, -0.06645965576171875, -0.058929443359375, -0.05139923095703125, -0.0438690185546875, -0.03633880615234375, -0.02880859375, -0.02127838134765625, -0.0137481689453125, -0.00621795654296875, 0.001312255859375, 0.00884246826171875, 0.0163726806640625, 0.02390289306640625, 0.03143310546875, 0.03896331787109375, 0.0464935302734375, 0.05402374267578125, 0.061553955078125, 0.06908416748046875, 0.0766143798828125, 0.08414459228515625, 0.0916748046875, 0.09920501708984375, 0.1067352294921875, 0.11426544189453125, 0.121795654296875, 0.12932586669921875, 0.1368560791015625, 0.14438629150390625, 0.15191650390625, 0.15944671630859375, 0.1669769287109375, 0.17450714111328125, 0.182037353515625, 0.18956756591796875, 0.1970977783203125, 0.20462799072265625, 0.212158203125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 2.0, 1.0, 1.0, 3.0, 5.0, 3.0, 8.0, 5.0, 10.0, 17.0, 14.0, 28.0, 35.0, 40.0, 44.0, 49.0, 53.0, 63.0, 67.0, 51.0, 73.0, 60.0, 71.0, 45.0, 43.0, 47.0, 25.0, 33.0, 23.0, 23.0, 19.0, 13.0, 11.0, 6.0, 4.0, 3.0, 6.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1295166015625, -0.12546157836914062, -0.12140655517578125, -0.11735153198242188, -0.1132965087890625, -0.10924148559570312, -0.10518646240234375, -0.10113143920898438, -0.097076416015625, -0.09302139282226562, -0.08896636962890625, -0.08491134643554688, -0.0808563232421875, -0.07680130004882812, -0.07274627685546875, -0.06869125366210938, -0.06463623046875, -0.060581207275390625, -0.05652618408203125, -0.052471160888671875, -0.0484161376953125, -0.044361114501953125, -0.04030609130859375, -0.036251068115234375, -0.032196044921875, -0.028141021728515625, -0.02408599853515625, -0.020030975341796875, -0.0159759521484375, -0.011920928955078125, -0.00786590576171875, -0.003810882568359375, 0.000244140625, 0.004299163818359375, 0.00835418701171875, 0.012409210205078125, 0.0164642333984375, 0.020519256591796875, 0.02457427978515625, 0.028629302978515625, 0.032684326171875, 0.036739349365234375, 0.04079437255859375, 0.044849395751953125, 0.0489044189453125, 0.052959442138671875, 0.05701446533203125, 0.061069488525390625, 0.06512451171875, 0.06917953491210938, 0.07323455810546875, 0.07728958129882812, 0.0813446044921875, 0.08539962768554688, 0.08945465087890625, 0.09350967407226562, 0.097564697265625, 0.10161972045898438, 0.10567474365234375, 0.10972976684570312, 0.1137847900390625, 0.11783981323242188, 0.12189483642578125, 0.12594985961914062, 0.1300048828125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0, 5.0, 9.0, 6.0, 8.0, 17.0, 31.0, 44.0, 89.0, 154.0, 350.0, 868.0, 3074.0, 36944.0, 860635.0, 138122.0, 6038.0, 1247.0, 454.0, 217.0, 95.0, 49.0, 31.0, 15.0, 24.0, 7.0, 8.0, 5.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.66015625, -0.639312744140625, -0.61846923828125, -0.597625732421875, -0.5767822265625, -0.555938720703125, -0.53509521484375, -0.514251708984375, -0.493408203125, -0.472564697265625, -0.45172119140625, -0.430877685546875, -0.4100341796875, -0.389190673828125, -0.36834716796875, -0.347503662109375, -0.32666015625, -0.305816650390625, -0.28497314453125, -0.264129638671875, -0.2432861328125, -0.222442626953125, -0.20159912109375, -0.180755615234375, -0.159912109375, -0.139068603515625, -0.11822509765625, -0.097381591796875, -0.0765380859375, -0.055694580078125, -0.03485107421875, -0.014007568359375, 0.0068359375, 0.027679443359375, 0.04852294921875, 0.069366455078125, 0.0902099609375, 0.111053466796875, 0.13189697265625, 0.152740478515625, 0.173583984375, 0.194427490234375, 0.21527099609375, 0.236114501953125, 0.2569580078125, 0.277801513671875, 0.29864501953125, 0.319488525390625, 0.34033203125, 0.361175537109375, 0.38201904296875, 0.402862548828125, 0.4237060546875, 0.444549560546875, 0.46539306640625, 0.486236572265625, 0.507080078125, 0.527923583984375, 0.54876708984375, 0.569610595703125, 0.5904541015625, 0.611297607421875, 0.63214111328125, 0.652984619140625, 0.673828125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 3.0, 7.0, 8.0, 8.0, 12.0, 8.0, 16.0, 19.0, 22.0, 15.0, 24.0, 36.0, 37.0, 38.0, 44.0, 57.0, 57.0, 56.0, 54.0, 61.0, 55.0, 53.0, 45.0, 50.0, 41.0, 38.0, 23.0, 16.0, 20.0, 16.0, 14.0, 22.0, 9.0, 5.0, 2.0, 3.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.58056640625, -0.563720703125, -0.546875, -0.530029296875, -0.51318359375, -0.496337890625, -0.4794921875, -0.462646484375, -0.44580078125, -0.428955078125, -0.412109375, -0.395263671875, -0.37841796875, -0.361572265625, -0.3447265625, -0.327880859375, -0.31103515625, -0.294189453125, -0.27734375, -0.260498046875, -0.24365234375, -0.226806640625, -0.2099609375, -0.193115234375, -0.17626953125, -0.159423828125, -0.142578125, -0.125732421875, -0.10888671875, -0.092041015625, -0.0751953125, -0.058349609375, -0.04150390625, -0.024658203125, -0.0078125, 0.009033203125, 0.02587890625, 0.042724609375, 0.0595703125, 0.076416015625, 0.09326171875, 0.110107421875, 0.126953125, 0.143798828125, 0.16064453125, 0.177490234375, 0.1943359375, 0.211181640625, 0.22802734375, 0.244873046875, 0.26171875, 0.278564453125, 0.29541015625, 0.312255859375, 0.3291015625, 0.345947265625, 0.36279296875, 0.379638671875, 0.396484375, 0.413330078125, 0.43017578125, 0.447021484375, 0.4638671875, 0.480712890625, 0.49755859375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 7.0, 19.0, 6.0, 23.0, 35.0, 56.0, 72.0, 135.0, 235.0, 488.0, 1324.0, 5566.0, 75424.0, 887632.0, 69759.0, 5390.0, 1327.0, 469.0, 219.0, 122.0, 66.0, 41.0, 32.0, 26.0, 17.0, 13.0, 14.0, 8.0, 9.0, 2.0, 3.0, 5.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.37109375, -0.36092376708984375, -0.3507537841796875, -0.34058380126953125, -0.330413818359375, -0.32024383544921875, -0.3100738525390625, -0.29990386962890625, -0.28973388671875, -0.27956390380859375, -0.2693939208984375, -0.25922393798828125, -0.249053955078125, -0.23888397216796875, -0.2287139892578125, -0.21854400634765625, -0.2083740234375, -0.19820404052734375, -0.1880340576171875, -0.17786407470703125, -0.167694091796875, -0.15752410888671875, -0.1473541259765625, -0.13718414306640625, -0.12701416015625, -0.11684417724609375, -0.1066741943359375, -0.09650421142578125, -0.086334228515625, -0.07616424560546875, -0.0659942626953125, -0.05582427978515625, -0.045654296875, -0.03548431396484375, -0.0253143310546875, -0.01514434814453125, -0.004974365234375, 0.00519561767578125, 0.0153656005859375, 0.02553558349609375, 0.03570556640625, 0.04587554931640625, 0.0560455322265625, 0.06621551513671875, 0.076385498046875, 0.08655548095703125, 0.0967254638671875, 0.10689544677734375, 0.1170654296875, 0.12723541259765625, 0.1374053955078125, 0.14757537841796875, 0.157745361328125, 0.16791534423828125, 0.1780853271484375, 0.18825531005859375, 0.19842529296875, 0.20859527587890625, 0.2187652587890625, 0.22893524169921875, 0.239105224609375, 0.24927520751953125, 0.2594451904296875, 0.26961517333984375, 0.27978515625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 3.0, 1.0, 4.0, 7.0, 11.0, 13.0, 17.0, 32.0, 39.0, 65.0, 92.0, 117.0, 139.0, 113.0, 99.0, 93.0, 65.0, 32.0, 32.0, 15.0, 12.0, 2.0, 3.0, 2.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.933906555175781e-05, -3.6840327084064484e-05, -3.4341588616371155e-05, -3.1842850148677826e-05, -2.9344111680984497e-05, -2.6845373213291168e-05, -2.434663474559784e-05, -2.184789627790451e-05, -1.934915781021118e-05, -1.6850419342517853e-05, -1.4351680874824524e-05, -1.1852942407131195e-05, -9.354203939437866e-06, -6.855465471744537e-06, -4.3567270040512085e-06, -1.8579885363578796e-06, 6.407499313354492e-07, 3.139488399028778e-06, 5.638226866722107e-06, 8.136965334415436e-06, 1.0635703802108765e-05, 1.3134442269802094e-05, 1.5633180737495422e-05, 1.813191920518875e-05, 2.063065767288208e-05, 2.312939614057541e-05, 2.5628134608268738e-05, 2.8126873075962067e-05, 3.0625611543655396e-05, 3.3124350011348724e-05, 3.562308847904205e-05, 3.812182694673538e-05, 4.062056541442871e-05, 4.311930388212204e-05, 4.561804234981537e-05, 4.81167808175087e-05, 5.0615519285202026e-05, 5.3114257752895355e-05, 5.5612996220588684e-05, 5.811173468828201e-05, 6.061047315597534e-05, 6.310921162366867e-05, 6.5607950091362e-05, 6.810668855905533e-05, 7.060542702674866e-05, 7.310416549444199e-05, 7.560290396213531e-05, 7.810164242982864e-05, 8.060038089752197e-05, 8.30991193652153e-05, 8.559785783290863e-05, 8.809659630060196e-05, 9.059533476829529e-05, 9.309407323598862e-05, 9.559281170368195e-05, 9.809155017137527e-05, 0.0001005902886390686, 0.00010308902710676193, 0.00010558776557445526, 0.00010808650404214859, 0.00011058524250984192, 0.00011308398097753525, 0.00011558271944522858, 0.0001180814579129219, 0.00012058019638061523]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 7.0, 6.0, 17.0, 27.0, 48.0, 75.0, 144.0, 243.0, 547.0, 1447.0, 6331.0, 85197.0, 866357.0, 79594.0, 6016.0, 1389.0, 542.0, 221.0, 135.0, 76.0, 48.0, 27.0, 20.0, 13.0, 9.0, 3.0, 3.0, 2.0, 5.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.26416015625, -0.2545509338378906, -0.24494171142578125, -0.23533248901367188, -0.2257232666015625, -0.21611404418945312, -0.20650482177734375, -0.19689559936523438, -0.187286376953125, -0.17767715454101562, -0.16806793212890625, -0.15845870971679688, -0.1488494873046875, -0.13924026489257812, -0.12963104248046875, -0.12002182006835938, -0.11041259765625, -0.10080337524414062, -0.09119415283203125, -0.08158493041992188, -0.0719757080078125, -0.062366485595703125, -0.05275726318359375, -0.043148040771484375, -0.033538818359375, -0.023929595947265625, -0.01432037353515625, -0.004711151123046875, 0.0048980712890625, 0.014507293701171875, 0.02411651611328125, 0.033725738525390625, 0.0433349609375, 0.052944183349609375, 0.06255340576171875, 0.07216262817382812, 0.0817718505859375, 0.09138107299804688, 0.10099029541015625, 0.11059951782226562, 0.120208740234375, 0.12981796264648438, 0.13942718505859375, 0.14903640747070312, 0.1586456298828125, 0.16825485229492188, 0.17786407470703125, 0.18747329711914062, 0.19708251953125, 0.20669174194335938, 0.21630096435546875, 0.22591018676757812, 0.2355194091796875, 0.24512863159179688, 0.25473785400390625, 0.2643470764160156, 0.273956298828125, 0.2835655212402344, 0.29317474365234375, 0.3027839660644531, 0.3123931884765625, 0.3220024108886719, 0.33161163330078125, 0.3412208557128906, 0.350830078125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 3.0, 5.0, 3.0, 14.0, 9.0, 11.0, 26.0, 32.0, 44.0, 70.0, 94.0, 118.0, 109.0, 114.0, 96.0, 61.0, 65.0, 48.0, 28.0, 23.0, 13.0, 9.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2388916015625, -0.2315826416015625, -0.224273681640625, -0.2169647216796875, -0.20965576171875, -0.2023468017578125, -0.195037841796875, -0.1877288818359375, -0.180419921875, -0.1731109619140625, -0.165802001953125, -0.1584930419921875, -0.15118408203125, -0.1438751220703125, -0.136566162109375, -0.1292572021484375, -0.1219482421875, -0.1146392822265625, -0.107330322265625, -0.1000213623046875, -0.09271240234375, -0.0854034423828125, -0.078094482421875, -0.0707855224609375, -0.0634765625, -0.0561676025390625, -0.048858642578125, -0.0415496826171875, -0.03424072265625, -0.0269317626953125, -0.019622802734375, -0.0123138427734375, -0.0050048828125, 0.0023040771484375, 0.009613037109375, 0.0169219970703125, 0.02423095703125, 0.0315399169921875, 0.038848876953125, 0.0461578369140625, 0.053466796875, 0.0607757568359375, 0.068084716796875, 0.0753936767578125, 0.08270263671875, 0.0900115966796875, 0.097320556640625, 0.1046295166015625, 0.1119384765625, 0.1192474365234375, 0.126556396484375, 0.1338653564453125, 0.14117431640625, 0.1484832763671875, 0.155792236328125, 0.1631011962890625, 0.17041015625, 0.1777191162109375, 0.185028076171875, 0.1923370361328125, 0.19964599609375, 0.2069549560546875, 0.214263916015625, 0.2215728759765625, 0.2288818359375]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 5.0, 14.0, 52.0, 140.0, 276.0, 273.0, 154.0, 62.0, 22.0, 4.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-9.45622444152832, -9.274282455444336, -9.092340469360352, -8.910398483276367, -8.728456497192383, -8.546514511108398, -8.364572525024414, -8.18263053894043, -8.000688552856445, -7.818746566772461, -7.636804580688477, -7.454862594604492, -7.272920608520508, -7.090978622436523, -6.909036636352539, -6.727094650268555, -6.545152187347412, -6.363210201263428, -6.181268215179443, -5.999326229095459, -5.817384243011475, -5.63544225692749, -5.453499794006348, -5.271557807922363, -5.089615821838379, -4.9076738357543945, -4.72573184967041, -4.543789863586426, -4.361847877502441, -4.179905891418457, -3.9979636669158936, -3.816021680831909, -3.634079933166504, -3.4521379470825195, -3.270195960998535, -3.088253974914551, -2.9063119888305664, -2.724370002746582, -2.5424277782440186, -2.360485792160034, -2.17854380607605, -1.9966018199920654, -1.814659833908081, -1.6327177286148071, -1.4507757425308228, -1.2688337564468384, -1.0868916511535645, -0.9049496650695801, -0.7230076789855957, -0.5410656929016113, -0.3591236472129822, -0.17718160152435303, 0.004760384559631348, 0.18670237064361572, 0.36864447593688965, 0.550586462020874, 0.7325284481048584, 0.9144704341888428, 1.0964124202728271, 1.278354525566101, 1.4602965116500854, 1.6422384977340698, 1.8241806030273438, 2.006122589111328, 2.1880645751953125]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 6.0, 2.0, 2.0, 1.0, 10.0, 3.0, 4.0, 11.0, 13.0, 17.0, 17.0, 20.0, 28.0, 36.0, 30.0, 35.0, 46.0, 46.0, 51.0, 56.0, 66.0, 65.0, 56.0, 54.0, 46.0, 52.0, 46.0, 27.0, 25.0, 22.0, 17.0, 24.0, 21.0, 13.0, 8.0, 9.0, 4.0, 6.0, 3.0, 8.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7098795175552368, -1.6386661529541016, -1.5674527883529663, -1.496239423751831, -1.4250260591506958, -1.3538126945495605, -1.2825993299484253, -1.21138596534729, -1.1401726007461548, -1.0689592361450195, -0.9977458715438843, -0.926532506942749, -0.8553191423416138, -0.7841057777404785, -0.7128924131393433, -0.641679048538208, -0.5704656839370728, -0.4992523193359375, -0.42803895473480225, -0.356825590133667, -0.28561222553253174, -0.21439886093139648, -0.14318549633026123, -0.07197213172912598, -0.0007587671279907227, 0.07045459747314453, 0.14166796207427979, 0.21288132667541504, 0.2840946912765503, 0.35530805587768555, 0.4265214204788208, 0.49773478507995605, 0.5689482688903809, 0.6401616334915161, 0.7113749980926514, 0.7825883626937866, 0.8538017272949219, 0.9250150918960571, 0.9962284564971924, 1.0674418210983276, 1.138655185699463, 1.2098685503005981, 1.2810819149017334, 1.3522952795028687, 1.423508644104004, 1.4947220087051392, 1.5659353733062744, 1.6371487379074097, 1.708362102508545, 1.7795754671096802, 1.8507888317108154, 1.9220021963119507, 1.993215560913086, 2.0644288063049316, 2.1356422901153564, 2.2068557739257812, 2.278069019317627, 2.3492822647094727, 2.4204957485198975, 2.4917092323303223, 2.562922477722168, 2.6341357231140137, 2.7053492069244385, 2.7765626907348633, 2.847775936126709]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 2.0, 7.0, 8.0, 19.0, 45.0, 62.0, 109.0, 200.0, 419.0, 1066.0, 3698.0, 22712.0, 3944382.0, 205414.0, 11972.0, 2554.0, 833.0, 374.0, 166.0, 105.0, 50.0, 29.0, 21.0, 8.0, 13.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.59765625, -0.5800018310546875, -0.562347412109375, -0.5446929931640625, -0.52703857421875, -0.5093841552734375, -0.491729736328125, -0.4740753173828125, -0.4564208984375, -0.4387664794921875, -0.421112060546875, -0.4034576416015625, -0.38580322265625, -0.3681488037109375, -0.350494384765625, -0.3328399658203125, -0.315185546875, -0.2975311279296875, -0.279876708984375, -0.2622222900390625, -0.24456787109375, -0.2269134521484375, -0.209259033203125, -0.1916046142578125, -0.1739501953125, -0.1562957763671875, -0.138641357421875, -0.1209869384765625, -0.10333251953125, -0.0856781005859375, -0.068023681640625, -0.0503692626953125, -0.03271484375, -0.0150604248046875, 0.002593994140625, 0.0202484130859375, 0.03790283203125, 0.0555572509765625, 0.073211669921875, 0.0908660888671875, 0.1085205078125, 0.1261749267578125, 0.143829345703125, 0.1614837646484375, 0.17913818359375, 0.1967926025390625, 0.214447021484375, 0.2321014404296875, 0.249755859375, 0.2674102783203125, 0.285064697265625, 0.3027191162109375, 0.32037353515625, 0.3380279541015625, 0.355682373046875, 0.3733367919921875, 0.3909912109375, 0.4086456298828125, 0.426300048828125, 0.4439544677734375, 0.46160888671875, 0.4792633056640625, 0.496917724609375, 0.5145721435546875, 0.5322265625]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 6.0, 5.0, 8.0, 6.0, 15.0, 14.0, 16.0, 31.0, 41.0, 40.0, 52.0, 68.0, 77.0, 69.0, 78.0, 82.0, 71.0, 62.0, 45.0, 42.0, 41.0, 45.0, 20.0, 16.0, 14.0, 11.0, 7.0, 6.0, 4.0, 4.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1376953125, -0.1325531005859375, -0.127410888671875, -0.1222686767578125, -0.11712646484375, -0.1119842529296875, -0.106842041015625, -0.1016998291015625, -0.0965576171875, -0.0914154052734375, -0.086273193359375, -0.0811309814453125, -0.07598876953125, -0.0708465576171875, -0.065704345703125, -0.0605621337890625, -0.055419921875, -0.0502777099609375, -0.045135498046875, -0.0399932861328125, -0.03485107421875, -0.0297088623046875, -0.024566650390625, -0.0194244384765625, -0.0142822265625, -0.0091400146484375, -0.003997802734375, 0.0011444091796875, 0.00628662109375, 0.0114288330078125, 0.016571044921875, 0.0217132568359375, 0.02685546875, 0.0319976806640625, 0.037139892578125, 0.0422821044921875, 0.04742431640625, 0.0525665283203125, 0.057708740234375, 0.0628509521484375, 0.0679931640625, 0.0731353759765625, 0.078277587890625, 0.0834197998046875, 0.08856201171875, 0.0937042236328125, 0.098846435546875, 0.1039886474609375, 0.109130859375, 0.1142730712890625, 0.119415283203125, 0.1245574951171875, 0.12969970703125, 0.1348419189453125, 0.139984130859375, 0.1451263427734375, 0.1502685546875, 0.1554107666015625, 0.160552978515625, 0.1656951904296875, 0.17083740234375, 0.1759796142578125, 0.181121826171875, 0.1862640380859375, 0.19140625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 3.0, 11.0, 16.0, 18.0, 30.0, 33.0, 62.0, 87.0, 122.0, 187.0, 328.0, 517.0, 973.0, 1843.0, 3672.0, 8527.0, 23566.0, 89257.0, 3416170.0, 549729.0, 66122.0, 18900.0, 7099.0, 3339.0, 1581.0, 864.0, 437.0, 305.0, 179.0, 97.0, 76.0, 50.0, 31.0, 16.0, 9.0, 9.0, 4.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.2340087890625, -0.22710609436035156, -0.22020339965820312, -0.2133007049560547, -0.20639801025390625, -0.1994953155517578, -0.19259262084960938, -0.18568992614746094, -0.1787872314453125, -0.17188453674316406, -0.16498184204101562, -0.1580791473388672, -0.15117645263671875, -0.1442737579345703, -0.13737106323242188, -0.13046836853027344, -0.123565673828125, -0.11666297912597656, -0.10976028442382812, -0.10285758972167969, -0.09595489501953125, -0.08905220031738281, -0.08214950561523438, -0.07524681091308594, -0.0683441162109375, -0.06144142150878906, -0.054538726806640625, -0.04763603210449219, -0.04073333740234375, -0.03383064270019531, -0.026927947998046875, -0.020025253295898438, -0.01312255859375, -0.0062198638916015625, 0.000682830810546875, 0.0075855255126953125, 0.01448822021484375, 0.021390914916992188, 0.028293609619140625, 0.03519630432128906, 0.0420989990234375, 0.04900169372558594, 0.055904388427734375, 0.06280708312988281, 0.06970977783203125, 0.07661247253417969, 0.08351516723632812, 0.09041786193847656, 0.097320556640625, 0.10422325134277344, 0.11112594604492188, 0.11802864074707031, 0.12493133544921875, 0.1318340301513672, 0.13873672485351562, 0.14563941955566406, 0.1525421142578125, 0.15944480895996094, 0.16634750366210938, 0.1732501983642578, 0.18015289306640625, 0.1870555877685547, 0.19395828247070312, 0.20086097717285156, 0.207763671875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 1.0, 4.0, 11.0, 12.0, 21.0, 24.0, 33.0, 58.0, 124.0, 252.0, 2854.0, 352.0, 124.0, 87.0, 37.0, 26.0, 17.0, 11.0, 9.0, 5.0, 9.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.09454345703125, -0.09227180480957031, -0.09000015258789062, -0.08772850036621094, -0.08545684814453125, -0.08318519592285156, -0.08091354370117188, -0.07864189147949219, -0.0763702392578125, -0.07409858703613281, -0.07182693481445312, -0.06955528259277344, -0.06728363037109375, -0.06501197814941406, -0.06274032592773438, -0.06046867370605469, -0.058197021484375, -0.05592536926269531, -0.053653717041015625, -0.05138206481933594, -0.04911041259765625, -0.04683876037597656, -0.044567108154296875, -0.04229545593261719, -0.0400238037109375, -0.03775215148925781, -0.035480499267578125, -0.03320884704589844, -0.03093719482421875, -0.028665542602539062, -0.026393890380859375, -0.024122238159179688, -0.0218505859375, -0.019578933715820312, -0.017307281494140625, -0.015035629272460938, -0.01276397705078125, -0.010492324829101562, -0.008220672607421875, -0.0059490203857421875, -0.0036773681640625, -0.0014057159423828125, 0.000865936279296875, 0.0031375885009765625, 0.00540924072265625, 0.0076808929443359375, 0.009952545166015625, 0.012224197387695312, 0.014495849609375, 0.016767501831054688, 0.019039154052734375, 0.021310806274414062, 0.02358245849609375, 0.025854110717773438, 0.028125762939453125, 0.030397415161132812, 0.0326690673828125, 0.03494071960449219, 0.037212371826171875, 0.03948402404785156, 0.04175567626953125, 0.04402732849121094, 0.046298980712890625, 0.04857063293457031, 0.05084228515625]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 5.0, 15.0, 19.0, 24.0, 32.0, 57.0, 86.0, 91.0, 130.0, 109.0, 103.0, 91.0, 81.0, 64.0, 29.0, 31.0, 11.0, 7.0, 3.0, 1.0, 1.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.23041397333145142, -0.22208306193351746, -0.2137521505355835, -0.20542123913764954, -0.19709032773971558, -0.18875941634178162, -0.18042851984500885, -0.1720976084470749, -0.16376669704914093, -0.15543578565120697, -0.147104874253273, -0.13877396285533905, -0.13044306635856628, -0.12211214751005173, -0.11378124356269836, -0.1054503321647644, -0.09711942076683044, -0.08878850936889648, -0.08045759797096252, -0.07212669402360916, -0.0637957826256752, -0.05546487122774124, -0.04713396355509758, -0.03880305588245392, -0.03047214448451996, -0.022141234949231148, -0.013810325413942337, -0.005479415878653526, 0.0028514936566352844, 0.011182405054569244, 0.019513312727212906, 0.027844220399856567, 0.036175161600112915, 0.044506072998046875, 0.052836980670690536, 0.0611678883433342, 0.06949879974126816, 0.07782971113920212, 0.08616061508655548, 0.09449152648448944, 0.1028224378824234, 0.11115334928035736, 0.11948426067829132, 0.12781517207622528, 0.13614606857299805, 0.144476979970932, 0.15280789136886597, 0.16113880276679993, 0.1694697141647339, 0.17780062556266785, 0.1861315369606018, 0.19446244835853577, 0.20279335975646973, 0.2111242711544037, 0.21945516765117645, 0.2277860790491104, 0.23611699044704437, 0.24444790184497833, 0.2527787983417511, 0.26110970973968506, 0.269440621137619, 0.277771532535553, 0.28610244393348694, 0.2944333553314209, 0.30276426672935486]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 4.0, 8.0, 12.0, 7.0, 9.0, 22.0, 20.0, 14.0, 28.0, 27.0, 29.0, 36.0, 34.0, 36.0, 32.0, 42.0, 42.0, 43.0, 39.0, 47.0, 39.0, 33.0, 47.0, 37.0, 38.0, 26.0, 37.0, 27.0, 18.0, 28.0, 22.0, 20.0, 13.0, 13.0, 10.0, 7.0, 11.0, 5.0, 11.0, 10.0, 2.0, 3.0, 3.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1151648759841919, -0.11126790195703506, -0.10737093538045883, -0.103473961353302, -0.09957699477672577, -0.09568002074956894, -0.09178304672241211, -0.08788608014583588, -0.08398910611867905, -0.08009213209152222, -0.07619516551494598, -0.07229819148778915, -0.06840121746063232, -0.06450425088405609, -0.06060727685689926, -0.05671030655503273, -0.0528133362531662, -0.04891636595129967, -0.045019395649433136, -0.041122421622276306, -0.037225451320409775, -0.03332848101854324, -0.029431508854031563, -0.025534536689519882, -0.02163756638765335, -0.01774059608578682, -0.013843623921275139, -0.009946652688086033, -0.006049681454896927, -0.0021527111530303955, 0.001744261011481285, 0.005641233175992966, 0.009538203477859497, 0.013435174711048603, 0.01733214594423771, 0.02122911810874939, 0.02512608841061592, 0.029023058712482452, 0.03292003273963928, 0.036817003041505814, 0.040713973343372345, 0.044610943645238876, 0.04850791394710541, 0.05240488797426224, 0.05630185827612877, 0.0601988285779953, 0.06409580260515213, 0.06799277663230896, 0.07188974320888519, 0.07578671723604202, 0.07968368381261826, 0.08358065783977509, 0.08747762441635132, 0.09137459844350815, 0.09527157247066498, 0.09916853904724121, 0.10306551307439804, 0.10696248710155487, 0.1108594536781311, 0.11475642770528793, 0.11865340173244476, 0.122550368309021, 0.12644733488559723, 0.13034431636333466, 0.1342412829399109]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 6.0, 7.0, 8.0, 13.0, 35.0, 45.0, 73.0, 84.0, 144.0, 256.0, 476.0, 1096.0, 2508.0, 7595.0, 31130.0, 170640.0, 544946.0, 232152.0, 42187.0, 9501.0, 3067.0, 1243.0, 582.0, 287.0, 173.0, 84.0, 71.0, 43.0, 29.0, 22.0, 14.0, 10.0, 5.0, 4.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2271728515625, -0.2186298370361328, -0.21008682250976562, -0.20154380798339844, -0.19300079345703125, -0.18445777893066406, -0.17591476440429688, -0.1673717498779297, -0.1588287353515625, -0.1502857208251953, -0.14174270629882812, -0.13319969177246094, -0.12465667724609375, -0.11611366271972656, -0.10757064819335938, -0.09902763366699219, -0.090484619140625, -0.08194160461425781, -0.07339859008789062, -0.06485557556152344, -0.05631256103515625, -0.04776954650878906, -0.039226531982421875, -0.030683517456054688, -0.0221405029296875, -0.013597488403320312, -0.005054473876953125, 0.0034885406494140625, 0.01203155517578125, 0.020574569702148438, 0.029117584228515625, 0.03766059875488281, 0.04620361328125, 0.05474662780761719, 0.06328964233398438, 0.07183265686035156, 0.08037567138671875, 0.08891868591308594, 0.09746170043945312, 0.10600471496582031, 0.1145477294921875, 0.12309074401855469, 0.13163375854492188, 0.14017677307128906, 0.14871978759765625, 0.15726280212402344, 0.16580581665039062, 0.1743488311767578, 0.182891845703125, 0.1914348602294922, 0.19997787475585938, 0.20852088928222656, 0.21706390380859375, 0.22560691833496094, 0.23414993286132812, 0.2426929473876953, 0.2512359619140625, 0.2597789764404297, 0.2683219909667969, 0.27686500549316406, 0.28540802001953125, 0.29395103454589844, 0.3024940490722656, 0.3110370635986328, 0.319580078125]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 2.0, 10.0, 7.0, 7.0, 7.0, 10.0, 13.0, 25.0, 28.0, 43.0, 36.0, 62.0, 65.0, 69.0, 75.0, 60.0, 80.0, 73.0, 59.0, 42.0, 46.0, 39.0, 39.0, 26.0, 22.0, 17.0, 7.0, 9.0, 4.0, 6.0, 4.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1307373046875, -0.1258392333984375, -0.120941162109375, -0.1160430908203125, -0.11114501953125, -0.1062469482421875, -0.101348876953125, -0.0964508056640625, -0.091552734375, -0.0866546630859375, -0.081756591796875, -0.0768585205078125, -0.07196044921875, -0.0670623779296875, -0.062164306640625, -0.0572662353515625, -0.0523681640625, -0.0474700927734375, -0.042572021484375, -0.0376739501953125, -0.03277587890625, -0.0278778076171875, -0.022979736328125, -0.0180816650390625, -0.01318359375, -0.0082855224609375, -0.003387451171875, 0.0015106201171875, 0.00640869140625, 0.0113067626953125, 0.016204833984375, 0.0211029052734375, 0.0260009765625, 0.0308990478515625, 0.035797119140625, 0.0406951904296875, 0.04559326171875, 0.0504913330078125, 0.055389404296875, 0.0602874755859375, 0.065185546875, 0.0700836181640625, 0.074981689453125, 0.0798797607421875, 0.08477783203125, 0.0896759033203125, 0.094573974609375, 0.0994720458984375, 0.1043701171875, 0.1092681884765625, 0.114166259765625, 0.1190643310546875, 0.12396240234375, 0.1288604736328125, 0.133758544921875, 0.1386566162109375, 0.1435546875, 0.1484527587890625, 0.153350830078125, 0.1582489013671875, 0.16314697265625, 0.1680450439453125, 0.172943115234375, 0.1778411865234375, 0.1827392578125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 7.0, 7.0, 10.0, 16.0, 11.0, 24.0, 22.0, 42.0, 69.0, 130.0, 242.0, 404.0, 833.0, 2429.0, 15780.0, 504129.0, 504781.0, 15519.0, 2309.0, 814.0, 401.0, 201.0, 121.0, 83.0, 54.0, 36.0, 35.0, 13.0, 10.0, 5.0, 7.0, 5.0, 5.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.50439453125, -0.4886322021484375, -0.472869873046875, -0.4571075439453125, -0.44134521484375, -0.4255828857421875, -0.409820556640625, -0.3940582275390625, -0.3782958984375, -0.3625335693359375, -0.346771240234375, -0.3310089111328125, -0.31524658203125, -0.2994842529296875, -0.283721923828125, -0.2679595947265625, -0.252197265625, -0.2364349365234375, -0.220672607421875, -0.2049102783203125, -0.18914794921875, -0.1733856201171875, -0.157623291015625, -0.1418609619140625, -0.1260986328125, -0.1103363037109375, -0.094573974609375, -0.0788116455078125, -0.06304931640625, -0.0472869873046875, -0.031524658203125, -0.0157623291015625, 0.0, 0.0157623291015625, 0.031524658203125, 0.0472869873046875, 0.06304931640625, 0.0788116455078125, 0.094573974609375, 0.1103363037109375, 0.1260986328125, 0.1418609619140625, 0.157623291015625, 0.1733856201171875, 0.18914794921875, 0.2049102783203125, 0.220672607421875, 0.2364349365234375, 0.252197265625, 0.2679595947265625, 0.283721923828125, 0.2994842529296875, 0.31524658203125, 0.3310089111328125, 0.346771240234375, 0.3625335693359375, 0.3782958984375, 0.3940582275390625, 0.409820556640625, 0.4255828857421875, 0.44134521484375, 0.4571075439453125, 0.472869873046875, 0.4886322021484375, 0.50439453125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 5.0, 14.0, 15.0, 11.0, 16.0, 16.0, 31.0, 30.0, 36.0, 36.0, 41.0, 43.0, 47.0, 48.0, 42.0, 58.0, 68.0, 55.0, 57.0, 53.0, 46.0, 39.0, 41.0, 35.0, 24.0, 17.0, 16.0, 20.0, 11.0, 11.0, 8.0, 2.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.423583984375, -0.4073448181152344, -0.39110565185546875, -0.3748664855957031, -0.3586273193359375, -0.3423881530761719, -0.32614898681640625, -0.3099098205566406, -0.293670654296875, -0.2774314880371094, -0.26119232177734375, -0.24495315551757812, -0.2287139892578125, -0.21247482299804688, -0.19623565673828125, -0.17999649047851562, -0.16375732421875, -0.14751815795898438, -0.13127899169921875, -0.11503982543945312, -0.0988006591796875, -0.08256149291992188, -0.06632232666015625, -0.050083160400390625, -0.033843994140625, -0.017604827880859375, -0.00136566162109375, 0.014873504638671875, 0.0311126708984375, 0.047351837158203125, 0.06359100341796875, 0.07983016967773438, 0.0960693359375, 0.11230850219726562, 0.12854766845703125, 0.14478683471679688, 0.1610260009765625, 0.17726516723632812, 0.19350433349609375, 0.20974349975585938, 0.225982666015625, 0.24222183227539062, 0.25846099853515625, 0.2747001647949219, 0.2909393310546875, 0.3071784973144531, 0.32341766357421875, 0.3396568298339844, 0.35589599609375, 0.3721351623535156, 0.38837432861328125, 0.4046134948730469, 0.4208526611328125, 0.4370918273925781, 0.45333099365234375, 0.4695701599121094, 0.485809326171875, 0.5020484924316406, 0.5182876586914062, 0.5345268249511719, 0.5507659912109375, 0.5670051574707031, 0.5832443237304688, 0.5994834899902344, 0.61572265625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 3.0, 2.0, 8.0, 21.0, 23.0, 34.0, 47.0, 65.0, 122.0, 210.0, 467.0, 1272.0, 5610.0, 89865.0, 890815.0, 53547.0, 4308.0, 1112.0, 467.0, 210.0, 131.0, 71.0, 56.0, 22.0, 23.0, 14.0, 7.0, 5.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.213134765625, -0.20507049560546875, -0.1970062255859375, -0.18894195556640625, -0.180877685546875, -0.17281341552734375, -0.1647491455078125, -0.15668487548828125, -0.14862060546875, -0.14055633544921875, -0.1324920654296875, -0.12442779541015625, -0.116363525390625, -0.10829925537109375, -0.1002349853515625, -0.09217071533203125, -0.0841064453125, -0.07604217529296875, -0.0679779052734375, -0.05991363525390625, -0.051849365234375, -0.04378509521484375, -0.0357208251953125, -0.02765655517578125, -0.01959228515625, -0.01152801513671875, -0.0034637451171875, 0.00460052490234375, 0.012664794921875, 0.02072906494140625, 0.0287933349609375, 0.03685760498046875, 0.044921875, 0.05298614501953125, 0.0610504150390625, 0.06911468505859375, 0.077178955078125, 0.08524322509765625, 0.0933074951171875, 0.10137176513671875, 0.10943603515625, 0.11750030517578125, 0.1255645751953125, 0.13362884521484375, 0.141693115234375, 0.14975738525390625, 0.1578216552734375, 0.16588592529296875, 0.1739501953125, 0.18201446533203125, 0.1900787353515625, 0.19814300537109375, 0.206207275390625, 0.21427154541015625, 0.2223358154296875, 0.23040008544921875, 0.23846435546875, 0.24652862548828125, 0.2545928955078125, 0.26265716552734375, 0.270721435546875, 0.27878570556640625, 0.2868499755859375, 0.29491424560546875, 0.302978515625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 4.0, 12.0, 13.0, 11.0, 21.0, 25.0, 34.0, 44.0, 56.0, 81.0, 89.0, 88.0, 86.0, 85.0, 72.0, 70.0, 53.0, 41.0, 34.0, 26.0, 17.0, 12.0, 5.0, 10.0, 4.0, 2.0, 1.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2438507080078125e-05, -4.0940940380096436e-05, -3.9443373680114746e-05, -3.794580698013306e-05, -3.644824028015137e-05, -3.495067358016968e-05, -3.345310688018799e-05, -3.19555401802063e-05, -3.045797348022461e-05, -2.896040678024292e-05, -2.746284008026123e-05, -2.596527338027954e-05, -2.446770668029785e-05, -2.2970139980316162e-05, -2.1472573280334473e-05, -1.9975006580352783e-05, -1.8477439880371094e-05, -1.6979873180389404e-05, -1.5482306480407715e-05, -1.3984739780426025e-05, -1.2487173080444336e-05, -1.0989606380462646e-05, -9.492039680480957e-06, -7.994472980499268e-06, -6.496906280517578e-06, -4.999339580535889e-06, -3.5017728805541992e-06, -2.0042061805725098e-06, -5.066394805908203e-07, 9.909272193908691e-07, 2.4884939193725586e-06, 3.986060619354248e-06, 5.4836273193359375e-06, 6.981194019317627e-06, 8.478760719299316e-06, 9.976327419281006e-06, 1.1473894119262695e-05, 1.2971460819244385e-05, 1.4469027519226074e-05, 1.5966594219207764e-05, 1.7464160919189453e-05, 1.8961727619171143e-05, 2.0459294319152832e-05, 2.195686101913452e-05, 2.345442771911621e-05, 2.49519944190979e-05, 2.644956111907959e-05, 2.794712781906128e-05, 2.944469451904297e-05, 3.094226121902466e-05, 3.243982791900635e-05, 3.393739461898804e-05, 3.5434961318969727e-05, 3.6932528018951416e-05, 3.8430094718933105e-05, 3.9927661418914795e-05, 4.1425228118896484e-05, 4.2922794818878174e-05, 4.442036151885986e-05, 4.591792821884155e-05, 4.741549491882324e-05, 4.891306161880493e-05, 5.041062831878662e-05, 5.190819501876831e-05, 5.340576171875e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 5.0, 11.0, 14.0, 34.0, 45.0, 82.0, 141.0, 296.0, 689.0, 1821.0, 8085.0, 117706.0, 845522.0, 65383.0, 5954.0, 1552.0, 621.0, 273.0, 139.0, 66.0, 39.0, 20.0, 17.0, 11.0, 9.0, 5.0, 8.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.26123046875, -0.25363922119140625, -0.2460479736328125, -0.23845672607421875, -0.230865478515625, -0.22327423095703125, -0.2156829833984375, -0.20809173583984375, -0.20050048828125, -0.19290924072265625, -0.1853179931640625, -0.17772674560546875, -0.170135498046875, -0.16254425048828125, -0.1549530029296875, -0.14736175537109375, -0.1397705078125, -0.13217926025390625, -0.1245880126953125, -0.11699676513671875, -0.109405517578125, -0.10181427001953125, -0.0942230224609375, -0.08663177490234375, -0.07904052734375, -0.07144927978515625, -0.0638580322265625, -0.05626678466796875, -0.048675537109375, -0.04108428955078125, -0.0334930419921875, -0.02590179443359375, -0.018310546875, -0.01071929931640625, -0.0031280517578125, 0.00446319580078125, 0.012054443359375, 0.01964569091796875, 0.0272369384765625, 0.03482818603515625, 0.04241943359375, 0.05001068115234375, 0.0576019287109375, 0.06519317626953125, 0.072784423828125, 0.08037567138671875, 0.0879669189453125, 0.09555816650390625, 0.1031494140625, 0.11074066162109375, 0.1183319091796875, 0.12592315673828125, 0.133514404296875, 0.14110565185546875, 0.1486968994140625, 0.15628814697265625, 0.16387939453125, 0.17147064208984375, 0.1790618896484375, 0.18665313720703125, 0.194244384765625, 0.20183563232421875, 0.2094268798828125, 0.21701812744140625, 0.224609375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 8.0, 10.0, 16.0, 39.0, 36.0, 57.0, 93.0, 80.0, 123.0, 132.0, 106.0, 89.0, 77.0, 38.0, 32.0, 24.0, 16.0, 9.0, 3.0, 9.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2061767578125, -0.19938278198242188, -0.19258880615234375, -0.18579483032226562, -0.1790008544921875, -0.17220687866210938, -0.16541290283203125, -0.15861892700195312, -0.151824951171875, -0.14503097534179688, -0.13823699951171875, -0.13144302368164062, -0.1246490478515625, -0.11785507202148438, -0.11106109619140625, -0.10426712036132812, -0.09747314453125, -0.09067916870117188, -0.08388519287109375, -0.07709121704101562, -0.0702972412109375, -0.06350326538085938, -0.05670928955078125, -0.049915313720703125, -0.043121337890625, -0.036327362060546875, -0.02953338623046875, -0.022739410400390625, -0.0159454345703125, -0.009151458740234375, -0.00235748291015625, 0.004436492919921875, 0.01123046875, 0.018024444580078125, 0.02481842041015625, 0.031612396240234375, 0.0384063720703125, 0.045200347900390625, 0.05199432373046875, 0.058788299560546875, 0.065582275390625, 0.07237625122070312, 0.07917022705078125, 0.08596420288085938, 0.0927581787109375, 0.09955215454101562, 0.10634613037109375, 0.11314010620117188, 0.11993408203125, 0.12672805786132812, 0.13352203369140625, 0.14031600952148438, 0.1471099853515625, 0.15390396118164062, 0.16069793701171875, 0.16749191284179688, 0.174285888671875, 0.18107986450195312, 0.18787384033203125, 0.19466781616210938, 0.2014617919921875, 0.20825576782226562, 0.21504974365234375, 0.22184371948242188, 0.2286376953125]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 8.0, 4.0, 9.0, 20.0, 64.0, 124.0, 208.0, 228.0, 183.0, 87.0, 41.0, 18.0, 9.0, 3.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.8693244457244873, -3.755748748779297, -3.6421730518341064, -3.528597354888916, -3.4150216579437256, -3.301445960998535, -3.187870502471924, -3.0742945671081543, -2.960719108581543, -2.8471434116363525, -2.733567714691162, -2.6199920177459717, -2.5064163208007812, -2.392840623855591, -2.2792649269104004, -2.165689468383789, -2.0521135330200195, -1.938537836074829, -1.8249621391296387, -1.7113864421844482, -1.5978107452392578, -1.4842350482940674, -1.3706594705581665, -1.257083773612976, -1.1435080766677856, -1.0299323797225952, -0.9163566827774048, -0.8027810454368591, -0.6892053484916687, -0.5756296515464783, -0.4620540142059326, -0.3484783172607422, -0.23490262031555176, -0.12132693827152252, -0.007751256227493286, 0.10582441091537476, 0.21940010786056519, 0.3329758048057556, 0.44655144214630127, 0.5601271390914917, 0.6737028360366821, 0.7872785329818726, 0.900854229927063, 1.0144298076629639, 1.1280055046081543, 1.2415812015533447, 1.3551568984985352, 1.4687325954437256, 1.582308292388916, 1.6958839893341064, 1.8094596862792969, 1.9230353832244873, 2.0366110801696777, 2.150186777114868, 2.2637624740600586, 2.37733793258667, 2.4909138679504395, 2.60448956489563, 2.7180652618408203, 2.8316409587860107, 2.945216655731201, 3.0587923526763916, 3.172368049621582, 3.2859435081481934, 3.399519205093384]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 6.0, 8.0, 12.0, 6.0, 13.0, 15.0, 23.0, 23.0, 31.0, 22.0, 38.0, 38.0, 47.0, 44.0, 45.0, 56.0, 48.0, 58.0, 58.0, 57.0, 51.0, 40.0, 40.0, 43.0, 34.0, 28.0, 20.0, 26.0, 20.0, 19.0, 10.0, 8.0, 4.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.0460784435272217, -1.9790561199188232, -1.9120337963104248, -1.845011591911316, -1.7779892683029175, -1.710966944694519, -1.6439447402954102, -1.5769224166870117, -1.5099000930786133, -1.4428777694702148, -1.3758554458618164, -1.3088332414627075, -1.241810917854309, -1.1747885942459106, -1.1077663898468018, -1.0407440662384033, -0.9737217426300049, -0.9066994190216064, -0.8396771550178528, -0.7726548910140991, -0.7056325674057007, -0.6386102437973022, -0.5715879797935486, -0.5045657157897949, -0.4375433921813965, -0.37052109837532043, -0.3034988045692444, -0.23647651076316833, -0.16945421695709229, -0.10243192315101624, -0.035409629344940186, 0.031612664461135864, 0.09863471984863281, 0.16565701365470886, 0.2326793074607849, 0.29970160126686096, 0.366723895072937, 0.43374618887901306, 0.5007684826850891, 0.5677907466888428, 0.6348130702972412, 0.7018353939056396, 0.7688576579093933, 0.835879921913147, 0.9029022455215454, 0.9699245691299438, 1.0369467735290527, 1.1039690971374512, 1.1709914207458496, 1.238013744354248, 1.3050360679626465, 1.3720582723617554, 1.4390805959701538, 1.5061029195785522, 1.5731251239776611, 1.6401474475860596, 1.707169771194458, 1.7741920948028564, 1.8412144184112549, 1.9082366228103638, 1.9752589464187622, 2.042281150817871, 2.1093034744262695, 2.176325798034668, 2.2433481216430664]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 5.0, 6.0, 12.0, 10.0, 9.0, 16.0, 24.0, 38.0, 45.0, 72.0, 133.0, 195.0, 479.0, 996.0, 2569.0, 8085.0, 38062.0, 603813.0, 3470764.0, 53146.0, 10246.0, 3132.0, 1189.0, 571.0, 268.0, 136.0, 95.0, 47.0, 27.0, 26.0, 15.0, 13.0, 7.0, 6.0, 3.0, 8.0, 3.0, 8.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2073974609375, -0.19800758361816406, -0.18861770629882812, -0.1792278289794922, -0.16983795166015625, -0.1604480743408203, -0.15105819702148438, -0.14166831970214844, -0.1322784423828125, -0.12288856506347656, -0.11349868774414062, -0.10410881042480469, -0.09471893310546875, -0.08532905578613281, -0.07593917846679688, -0.06654930114746094, -0.057159423828125, -0.04776954650878906, -0.038379669189453125, -0.028989791870117188, -0.01959991455078125, -0.010210037231445312, -0.000820159912109375, 0.008569717407226562, 0.0179595947265625, 0.027349472045898438, 0.036739349365234375, 0.04612922668457031, 0.05551910400390625, 0.06490898132324219, 0.07429885864257812, 0.08368873596191406, 0.09307861328125, 0.10246849060058594, 0.11185836791992188, 0.12124824523925781, 0.13063812255859375, 0.1400279998779297, 0.14941787719726562, 0.15880775451660156, 0.1681976318359375, 0.17758750915527344, 0.18697738647460938, 0.1963672637939453, 0.20575714111328125, 0.2151470184326172, 0.22453689575195312, 0.23392677307128906, 0.243316650390625, 0.25270652770996094, 0.2620964050292969, 0.2714862823486328, 0.28087615966796875, 0.2902660369873047, 0.2996559143066406, 0.30904579162597656, 0.3184356689453125, 0.32782554626464844, 0.3372154235839844, 0.3466053009033203, 0.35599517822265625, 0.3653850555419922, 0.3747749328613281, 0.38416481018066406, 0.3935546875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 4.0, 3.0, 9.0, 7.0, 8.0, 15.0, 18.0, 27.0, 34.0, 41.0, 55.0, 70.0, 60.0, 70.0, 65.0, 64.0, 57.0, 75.0, 66.0, 39.0, 41.0, 34.0, 48.0, 17.0, 17.0, 14.0, 10.0, 9.0, 7.0, 5.0, 3.0, 5.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.154296875, -0.1498088836669922, -0.14532089233398438, -0.14083290100097656, -0.13634490966796875, -0.13185691833496094, -0.12736892700195312, -0.12288093566894531, -0.1183929443359375, -0.11390495300292969, -0.10941696166992188, -0.10492897033691406, -0.10044097900390625, -0.09595298767089844, -0.09146499633789062, -0.08697700500488281, -0.082489013671875, -0.07800102233886719, -0.07351303100585938, -0.06902503967285156, -0.06453704833984375, -0.06004905700683594, -0.055561065673828125, -0.05107307434082031, -0.0465850830078125, -0.04209709167480469, -0.037609100341796875, -0.03312110900878906, -0.02863311767578125, -0.024145126342773438, -0.019657135009765625, -0.015169143676757812, -0.01068115234375, -0.0061931610107421875, -0.001705169677734375, 0.0027828216552734375, 0.00727081298828125, 0.011758804321289062, 0.016246795654296875, 0.020734786987304688, 0.0252227783203125, 0.029710769653320312, 0.034198760986328125, 0.03868675231933594, 0.04317474365234375, 0.04766273498535156, 0.052150726318359375, 0.05663871765136719, 0.061126708984375, 0.06561470031738281, 0.07010269165039062, 0.07459068298339844, 0.07907867431640625, 0.08356666564941406, 0.08805465698242188, 0.09254264831542969, 0.0970306396484375, 0.10151863098144531, 0.10600662231445312, 0.11049461364746094, 0.11498260498046875, 0.11947059631347656, 0.12395858764648438, 0.1284465789794922, 0.1329345703125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 10.0, 10.0, 14.0, 22.0, 26.0, 30.0, 45.0, 56.0, 96.0, 153.0, 233.0, 409.0, 585.0, 1012.0, 1710.0, 3198.0, 5990.0, 12294.0, 28938.0, 83848.0, 397545.0, 3253454.0, 287270.0, 69228.0, 24811.0, 10856.0, 5340.0, 2869.0, 1649.0, 900.0, 576.0, 354.0, 257.0, 145.0, 105.0, 65.0, 57.0, 39.0, 25.0, 18.0, 12.0, 11.0, 6.0, 4.0, 3.0, 1.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1317138671875, -0.12752151489257812, -0.12332916259765625, -0.11913681030273438, -0.1149444580078125, -0.11075210571289062, -0.10655975341796875, -0.10236740112304688, -0.098175048828125, -0.09398269653320312, -0.08979034423828125, -0.08559799194335938, -0.0814056396484375, -0.07721328735351562, -0.07302093505859375, -0.06882858276367188, -0.06463623046875, -0.060443878173828125, -0.05625152587890625, -0.052059173583984375, -0.0478668212890625, -0.043674468994140625, -0.03948211669921875, -0.035289764404296875, -0.031097412109375, -0.026905059814453125, -0.02271270751953125, -0.018520355224609375, -0.0143280029296875, -0.010135650634765625, -0.00594329833984375, -0.001750946044921875, 0.00244140625, 0.006633758544921875, 0.01082611083984375, 0.015018463134765625, 0.0192108154296875, 0.023403167724609375, 0.02759552001953125, 0.031787872314453125, 0.035980224609375, 0.040172576904296875, 0.04436492919921875, 0.048557281494140625, 0.0527496337890625, 0.056941986083984375, 0.06113433837890625, 0.06532669067382812, 0.06951904296875, 0.07371139526367188, 0.07790374755859375, 0.08209609985351562, 0.0862884521484375, 0.09048080444335938, 0.09467315673828125, 0.09886550903320312, 0.103057861328125, 0.10725021362304688, 0.11144256591796875, 0.11563491821289062, 0.1198272705078125, 0.12401962280273438, 0.12821197509765625, 0.13240432739257812, 0.1365966796875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 2.0, 6.0, 2.0, 9.0, 7.0, 12.0, 9.0, 16.0, 19.0, 24.0, 32.0, 45.0, 74.0, 104.0, 157.0, 331.0, 1500.0, 922.0, 311.0, 154.0, 87.0, 74.0, 42.0, 35.0, 19.0, 15.0, 10.0, 11.0, 13.0, 6.0, 3.0, 5.0, 5.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05926513671875, -0.05697822570800781, -0.054691314697265625, -0.05240440368652344, -0.05011749267578125, -0.04783058166503906, -0.045543670654296875, -0.04325675964355469, -0.0409698486328125, -0.03868293762207031, -0.036396026611328125, -0.03410911560058594, -0.03182220458984375, -0.029535293579101562, -0.027248382568359375, -0.024961471557617188, -0.022674560546875, -0.020387649536132812, -0.018100738525390625, -0.015813827514648438, -0.01352691650390625, -0.011240005493164062, -0.008953094482421875, -0.0066661834716796875, -0.0043792724609375, -0.0020923614501953125, 0.000194549560546875, 0.0024814605712890625, 0.00476837158203125, 0.0070552825927734375, 0.009342193603515625, 0.011629104614257812, 0.013916015625, 0.016202926635742188, 0.018489837646484375, 0.020776748657226562, 0.02306365966796875, 0.025350570678710938, 0.027637481689453125, 0.029924392700195312, 0.0322113037109375, 0.03449821472167969, 0.036785125732421875, 0.03907203674316406, 0.04135894775390625, 0.04364585876464844, 0.045932769775390625, 0.04821968078613281, 0.050506591796875, 0.05279350280761719, 0.055080413818359375, 0.05736732482910156, 0.05965423583984375, 0.06194114685058594, 0.06422805786132812, 0.06651496887207031, 0.0688018798828125, 0.07108879089355469, 0.07337570190429688, 0.07566261291503906, 0.07794952392578125, 0.08023643493652344, 0.08252334594726562, 0.08481025695800781, 0.08709716796875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 6.0, 2.0, 2.0, 8.0, 14.0, 36.0, 50.0, 101.0, 151.0, 164.0, 138.0, 122.0, 89.0, 44.0, 26.0, 19.0, 10.0, 8.0, 6.0, 3.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3507859706878662, -0.33178627490997314, -0.3127865791320801, -0.293786883354187, -0.27478715777397156, -0.2557874619960785, -0.23678776621818542, -0.21778805553913116, -0.1987883597612381, -0.17978866398334503, -0.16078895330429077, -0.1417892575263977, -0.12278955429792404, -0.10378985106945038, -0.08479015529155731, -0.06579044461250305, -0.046790748834609985, -0.02779104746878147, -0.008791346102952957, 0.010208353400230408, 0.02920805662870407, 0.048207759857177734, 0.0672074556350708, 0.08620716631412506, 0.10520686209201813, 0.12420656532049179, 0.14320626854896545, 0.16220596432685852, 0.1812056601047516, 0.20020537078380585, 0.2192050665616989, 0.23820477724075317, 0.25720447301864624, 0.2762041687965393, 0.2952038645744324, 0.31420356035232544, 0.3332032859325409, 0.35220298171043396, 0.371202677488327, 0.3902024030685425, 0.40920209884643555, 0.4282017946243286, 0.4472014904022217, 0.46620118618011475, 0.4852009117603302, 0.5042005777359009, 0.523200273513794, 0.5422000288963318, 0.5611996650695801, 0.5801993608474731, 0.5991990566253662, 0.6181987524032593, 0.6371984481811523, 0.6561981439590454, 0.6751978397369385, 0.6941975951194763, 0.7131972908973694, 0.7321969866752625, 0.7511966824531555, 0.7701963782310486, 0.7891960740089417, 0.8081958293914795, 0.8271955251693726, 0.8461952209472656, 0.8651949167251587]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 9.0, 4.0, 2.0, 5.0, 8.0, 5.0, 10.0, 14.0, 14.0, 12.0, 10.0, 16.0, 19.0, 24.0, 25.0, 26.0, 31.0, 32.0, 25.0, 34.0, 30.0, 50.0, 34.0, 35.0, 37.0, 39.0, 35.0, 40.0, 41.0, 33.0, 37.0, 40.0, 38.0, 28.0, 23.0, 16.0, 27.0, 14.0, 15.0, 8.0, 12.0, 10.0, 9.0, 9.0, 5.0, 2.0, 3.0, 5.0, 2.0, 2.0, 1.0, 4.0, 5.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.25023192167282104, -0.24231058359146118, -0.23438923060894012, -0.22646789252758026, -0.2185465395450592, -0.21062520146369934, -0.20270386338233948, -0.19478252530097961, -0.18686117231845856, -0.1789398342370987, -0.17101848125457764, -0.16309714317321777, -0.1551758050918579, -0.14725445210933685, -0.139333114027977, -0.13141176104545593, -0.12349042296409607, -0.11556907743215561, -0.10764773190021515, -0.09972639381885529, -0.09180504828691483, -0.08388370275497437, -0.0759623646736145, -0.06804101914167404, -0.06011967360973358, -0.05219832807779312, -0.04427698627114296, -0.0363556444644928, -0.028434298932552338, -0.020512953400611877, -0.012591611593961716, -0.004670269787311554, 0.0032510757446289062, 0.011172419413924217, 0.019093763083219528, 0.02701510675251484, 0.03493645042181015, 0.04285779595375061, 0.05077913776040077, 0.058700479567050934, 0.0666218250989914, 0.07454317063093185, 0.08246451616287231, 0.09038585424423218, 0.09830719977617264, 0.1062285453081131, 0.11414988338947296, 0.12207122892141342, 0.12999257445335388, 0.13791391253471375, 0.1458352655172348, 0.15375660359859467, 0.16167795658111572, 0.16959929466247559, 0.17752063274383545, 0.1854419708251953, 0.19336332380771637, 0.20128466188907623, 0.2092060148715973, 0.21712735295295715, 0.22504869103431702, 0.23297004401683807, 0.24089138209819794, 0.248812735080719, 0.25673407316207886]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 4.0, 6.0, 6.0, 7.0, 10.0, 13.0, 29.0, 34.0, 51.0, 58.0, 135.0, 254.0, 572.0, 1595.0, 5480.0, 28910.0, 215964.0, 628011.0, 141176.0, 19775.0, 4195.0, 1272.0, 451.0, 220.0, 133.0, 62.0, 27.0, 25.0, 18.0, 15.0, 11.0, 9.0, 7.0, 7.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.41357421875, -0.4018898010253906, -0.39020538330078125, -0.3785209655761719, -0.3668365478515625, -0.3551521301269531, -0.34346771240234375, -0.3317832946777344, -0.320098876953125, -0.3084144592285156, -0.29673004150390625, -0.2850456237792969, -0.2733612060546875, -0.2616767883300781, -0.24999237060546875, -0.23830795288085938, -0.22662353515625, -0.21493911743164062, -0.20325469970703125, -0.19157028198242188, -0.1798858642578125, -0.16820144653320312, -0.15651702880859375, -0.14483261108398438, -0.133148193359375, -0.12146377563476562, -0.10977935791015625, -0.09809494018554688, -0.0864105224609375, -0.07472610473632812, -0.06304168701171875, -0.051357269287109375, -0.0396728515625, -0.027988433837890625, -0.01630401611328125, -0.004619598388671875, 0.0070648193359375, 0.018749237060546875, 0.03043365478515625, 0.042118072509765625, 0.053802490234375, 0.06548690795898438, 0.07717132568359375, 0.08885574340820312, 0.1005401611328125, 0.11222457885742188, 0.12390899658203125, 0.13559341430664062, 0.14727783203125, 0.15896224975585938, 0.17064666748046875, 0.18233108520507812, 0.1940155029296875, 0.20569992065429688, 0.21738433837890625, 0.22906875610351562, 0.240753173828125, 0.2524375915527344, 0.26412200927734375, 0.2758064270019531, 0.2874908447265625, 0.2991752624511719, 0.31085968017578125, 0.3225440979003906, 0.334228515625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 3.0, 9.0, 10.0, 9.0, 22.0, 20.0, 27.0, 35.0, 39.0, 51.0, 52.0, 69.0, 65.0, 58.0, 69.0, 65.0, 57.0, 62.0, 45.0, 48.0, 45.0, 28.0, 33.0, 17.0, 12.0, 19.0, 3.0, 11.0, 4.0, 2.0, 6.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1434326171875, -0.1389923095703125, -0.134552001953125, -0.1301116943359375, -0.12567138671875, -0.1212310791015625, -0.116790771484375, -0.1123504638671875, -0.10791015625, -0.1034698486328125, -0.099029541015625, -0.0945892333984375, -0.09014892578125, -0.0857086181640625, -0.081268310546875, -0.0768280029296875, -0.0723876953125, -0.0679473876953125, -0.063507080078125, -0.0590667724609375, -0.05462646484375, -0.0501861572265625, -0.045745849609375, -0.0413055419921875, -0.036865234375, -0.0324249267578125, -0.027984619140625, -0.0235443115234375, -0.01910400390625, -0.0146636962890625, -0.010223388671875, -0.0057830810546875, -0.0013427734375, 0.0030975341796875, 0.007537841796875, 0.0119781494140625, 0.01641845703125, 0.0208587646484375, 0.025299072265625, 0.0297393798828125, 0.0341796875, 0.0386199951171875, 0.043060302734375, 0.0475006103515625, 0.05194091796875, 0.0563812255859375, 0.060821533203125, 0.0652618408203125, 0.0697021484375, 0.0741424560546875, 0.078582763671875, 0.0830230712890625, 0.08746337890625, 0.0919036865234375, 0.096343994140625, 0.1007843017578125, 0.105224609375, 0.1096649169921875, 0.114105224609375, 0.1185455322265625, 0.12298583984375, 0.1274261474609375, 0.131866455078125, 0.1363067626953125, 0.1407470703125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 5.0, 2.0, 6.0, 8.0, 4.0, 16.0, 12.0, 30.0, 48.0, 62.0, 128.0, 267.0, 497.0, 1362.0, 5365.0, 83482.0, 896562.0, 54146.0, 4340.0, 1161.0, 490.0, 234.0, 113.0, 63.0, 50.0, 31.0, 20.0, 14.0, 12.0, 6.0, 5.0, 6.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.6611328125, -0.641937255859375, -0.62274169921875, -0.603546142578125, -0.5843505859375, -0.565155029296875, -0.54595947265625, -0.526763916015625, -0.507568359375, -0.488372802734375, -0.46917724609375, -0.449981689453125, -0.4307861328125, -0.411590576171875, -0.39239501953125, -0.373199462890625, -0.35400390625, -0.334808349609375, -0.31561279296875, -0.296417236328125, -0.2772216796875, -0.258026123046875, -0.23883056640625, -0.219635009765625, -0.200439453125, -0.181243896484375, -0.16204833984375, -0.142852783203125, -0.1236572265625, -0.104461669921875, -0.08526611328125, -0.066070556640625, -0.046875, -0.027679443359375, -0.00848388671875, 0.010711669921875, 0.0299072265625, 0.049102783203125, 0.06829833984375, 0.087493896484375, 0.106689453125, 0.125885009765625, 0.14508056640625, 0.164276123046875, 0.1834716796875, 0.202667236328125, 0.22186279296875, 0.241058349609375, 0.26025390625, 0.279449462890625, 0.29864501953125, 0.317840576171875, 0.3370361328125, 0.356231689453125, 0.37542724609375, 0.394622802734375, 0.413818359375, 0.433013916015625, 0.45220947265625, 0.471405029296875, 0.4906005859375, 0.509796142578125, 0.52899169921875, 0.548187255859375, 0.5673828125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 5.0, 3.0, 6.0, 3.0, 5.0, 11.0, 20.0, 11.0, 16.0, 15.0, 19.0, 27.0, 33.0, 30.0, 47.0, 31.0, 50.0, 50.0, 40.0, 55.0, 54.0, 57.0, 43.0, 45.0, 42.0, 33.0, 39.0, 36.0, 36.0, 25.0, 21.0, 23.0, 15.0, 12.0, 13.0, 9.0, 5.0, 7.0, 8.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.41357421875, -0.40007781982421875, -0.3865814208984375, -0.37308502197265625, -0.359588623046875, -0.34609222412109375, -0.3325958251953125, -0.31909942626953125, -0.30560302734375, -0.29210662841796875, -0.2786102294921875, -0.26511383056640625, -0.251617431640625, -0.23812103271484375, -0.2246246337890625, -0.21112823486328125, -0.1976318359375, -0.18413543701171875, -0.1706390380859375, -0.15714263916015625, -0.143646240234375, -0.13014984130859375, -0.1166534423828125, -0.10315704345703125, -0.08966064453125, -0.07616424560546875, -0.0626678466796875, -0.04917144775390625, -0.035675048828125, -0.02217864990234375, -0.0086822509765625, 0.00481414794921875, 0.018310546875, 0.03180694580078125, 0.0453033447265625, 0.05879974365234375, 0.072296142578125, 0.08579254150390625, 0.0992889404296875, 0.11278533935546875, 0.12628173828125, 0.13977813720703125, 0.1532745361328125, 0.16677093505859375, 0.180267333984375, 0.19376373291015625, 0.2072601318359375, 0.22075653076171875, 0.2342529296875, 0.24774932861328125, 0.2612457275390625, 0.27474212646484375, 0.288238525390625, 0.30173492431640625, 0.3152313232421875, 0.32872772216796875, 0.34222412109375, 0.35572052001953125, 0.3692169189453125, 0.38271331787109375, 0.396209716796875, 0.40970611572265625, 0.4232025146484375, 0.43669891357421875, 0.4501953125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 3.0, 7.0, 4.0, 13.0, 21.0, 27.0, 37.0, 47.0, 89.0, 115.0, 207.0, 419.0, 931.0, 2198.0, 7099.0, 31334.0, 214864.0, 661620.0, 104127.0, 17734.0, 4550.0, 1579.0, 686.0, 357.0, 174.0, 97.0, 75.0, 39.0, 23.0, 24.0, 10.0, 17.0, 5.0, 6.0, 8.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11004638671875, -0.1060190200805664, -0.10199165344238281, -0.09796428680419922, -0.09393692016601562, -0.08990955352783203, -0.08588218688964844, -0.08185482025146484, -0.07782745361328125, -0.07380008697509766, -0.06977272033691406, -0.06574535369873047, -0.061717987060546875, -0.05769062042236328, -0.05366325378417969, -0.049635887145996094, -0.0456085205078125, -0.041581153869628906, -0.03755378723144531, -0.03352642059326172, -0.029499053955078125, -0.02547168731689453, -0.021444320678710938, -0.017416954040527344, -0.01338958740234375, -0.009362220764160156, -0.0053348541259765625, -0.0013074874877929688, 0.002719879150390625, 0.006747245788574219, 0.010774612426757812, 0.014801979064941406, 0.018829345703125, 0.022856712341308594, 0.026884078979492188, 0.03091144561767578, 0.034938812255859375, 0.03896617889404297, 0.04299354553222656, 0.047020912170410156, 0.05104827880859375, 0.055075645446777344, 0.05910301208496094, 0.06313037872314453, 0.06715774536132812, 0.07118511199951172, 0.07521247863769531, 0.0792398452758789, 0.0832672119140625, 0.0872945785522461, 0.09132194519042969, 0.09534931182861328, 0.09937667846679688, 0.10340404510498047, 0.10743141174316406, 0.11145877838134766, 0.11548614501953125, 0.11951351165771484, 0.12354087829589844, 0.12756824493408203, 0.13159561157226562, 0.13562297821044922, 0.1396503448486328, 0.1436777114868164, 0.147705078125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 4.0, 4.0, 8.0, 7.0, 5.0, 5.0, 11.0, 15.0, 10.0, 19.0, 20.0, 28.0, 27.0, 35.0, 38.0, 56.0, 62.0, 78.0, 90.0, 87.0, 69.0, 53.0, 52.0, 28.0, 34.0, 30.0, 15.0, 20.0, 12.0, 17.0, 17.0, 16.0, 8.0, 7.0, 4.0, 5.0, 5.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.26173210144043e-05, -4.1268765926361084e-05, -3.992021083831787e-05, -3.857165575027466e-05, -3.7223100662231445e-05, -3.587454557418823e-05, -3.452599048614502e-05, -3.317743539810181e-05, -3.1828880310058594e-05, -3.048032522201538e-05, -2.9131770133972168e-05, -2.7783215045928955e-05, -2.6434659957885742e-05, -2.508610486984253e-05, -2.3737549781799316e-05, -2.2388994693756104e-05, -2.104043960571289e-05, -1.9691884517669678e-05, -1.8343329429626465e-05, -1.6994774341583252e-05, -1.564621925354004e-05, -1.4297664165496826e-05, -1.2949109077453613e-05, -1.16005539894104e-05, -1.0251998901367188e-05, -8.903443813323975e-06, -7.554888725280762e-06, -6.206333637237549e-06, -4.857778549194336e-06, -3.509223461151123e-06, -2.16066837310791e-06, -8.121132850646973e-07, 5.364418029785156e-07, 1.8849968910217285e-06, 3.2335519790649414e-06, 4.582107067108154e-06, 5.930662155151367e-06, 7.27921724319458e-06, 8.627772331237793e-06, 9.976327419281006e-06, 1.1324882507324219e-05, 1.2673437595367432e-05, 1.4021992683410645e-05, 1.5370547771453857e-05, 1.671910285949707e-05, 1.8067657947540283e-05, 1.9416213035583496e-05, 2.076476812362671e-05, 2.2113323211669922e-05, 2.3461878299713135e-05, 2.4810433387756348e-05, 2.615898847579956e-05, 2.7507543563842773e-05, 2.8856098651885986e-05, 3.02046537399292e-05, 3.155320882797241e-05, 3.2901763916015625e-05, 3.425031900405884e-05, 3.559887409210205e-05, 3.6947429180145264e-05, 3.8295984268188477e-05, 3.964453935623169e-05, 4.09930944442749e-05, 4.2341649532318115e-05, 4.369020462036133e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 9.0, 6.0, 17.0, 22.0, 32.0, 35.0, 41.0, 85.0, 151.0, 239.0, 483.0, 1014.0, 2593.0, 9716.0, 73469.0, 731006.0, 202840.0, 19648.0, 4232.0, 1464.0, 622.0, 338.0, 173.0, 110.0, 79.0, 48.0, 26.0, 20.0, 10.0, 7.0, 1.0, 5.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.130859375, -0.12556076049804688, -0.12026214599609375, -0.11496353149414062, -0.1096649169921875, -0.10436630249023438, -0.09906768798828125, -0.09376907348632812, -0.088470458984375, -0.08317184448242188, -0.07787322998046875, -0.07257461547851562, -0.0672760009765625, -0.061977386474609375, -0.05667877197265625, -0.051380157470703125, -0.04608154296875, -0.040782928466796875, -0.03548431396484375, -0.030185699462890625, -0.0248870849609375, -0.019588470458984375, -0.01428985595703125, -0.008991241455078125, -0.003692626953125, 0.001605987548828125, 0.00690460205078125, 0.012203216552734375, 0.0175018310546875, 0.022800445556640625, 0.02809906005859375, 0.033397674560546875, 0.0386962890625, 0.043994903564453125, 0.04929351806640625, 0.054592132568359375, 0.0598907470703125, 0.06518936157226562, 0.07048797607421875, 0.07578659057617188, 0.081085205078125, 0.08638381958007812, 0.09168243408203125, 0.09698104858398438, 0.1022796630859375, 0.10757827758789062, 0.11287689208984375, 0.11817550659179688, 0.12347412109375, 0.12877273559570312, 0.13407135009765625, 0.13936996459960938, 0.1446685791015625, 0.14996719360351562, 0.15526580810546875, 0.16056442260742188, 0.165863037109375, 0.17116165161132812, 0.17646026611328125, 0.18175888061523438, 0.1870574951171875, 0.19235610961914062, 0.19765472412109375, 0.20295333862304688, 0.208251953125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 8.0, 4.0, 10.0, 8.0, 9.0, 11.0, 8.0, 8.0, 10.0, 18.0, 21.0, 35.0, 39.0, 61.0, 54.0, 71.0, 76.0, 83.0, 66.0, 75.0, 38.0, 54.0, 47.0, 42.0, 23.0, 19.0, 15.0, 20.0, 16.0, 13.0, 9.0, 6.0, 5.0, 4.0, 6.0, 6.0, 2.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09130859375, -0.0880289077758789, -0.08474922180175781, -0.08146953582763672, -0.07818984985351562, -0.07491016387939453, -0.07163047790527344, -0.06835079193115234, -0.06507110595703125, -0.061791419982910156, -0.05851173400878906, -0.05523204803466797, -0.051952362060546875, -0.04867267608642578, -0.04539299011230469, -0.042113304138183594, -0.0388336181640625, -0.035553932189941406, -0.03227424621582031, -0.02899456024169922, -0.025714874267578125, -0.02243518829345703, -0.019155502319335938, -0.015875816345214844, -0.01259613037109375, -0.009316444396972656, -0.0060367584228515625, -0.0027570724487304688, 0.000522613525390625, 0.0038022994995117188, 0.0070819854736328125, 0.010361671447753906, 0.013641357421875, 0.016921043395996094, 0.020200729370117188, 0.02348041534423828, 0.026760101318359375, 0.03003978729248047, 0.03331947326660156, 0.036599159240722656, 0.03987884521484375, 0.043158531188964844, 0.04643821716308594, 0.04971790313720703, 0.052997589111328125, 0.05627727508544922, 0.05955696105957031, 0.0628366470336914, 0.0661163330078125, 0.0693960189819336, 0.07267570495605469, 0.07595539093017578, 0.07923507690429688, 0.08251476287841797, 0.08579444885253906, 0.08907413482666016, 0.09235382080078125, 0.09563350677490234, 0.09891319274902344, 0.10219287872314453, 0.10547256469726562, 0.10875225067138672, 0.11203193664550781, 0.1153116226196289, 0.11859130859375]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 3.0, 7.0, 6.0, 9.0, 17.0, 44.0, 96.0, 144.0, 211.0, 199.0, 133.0, 80.0, 27.0, 15.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9341628551483154, -2.8327794075012207, -2.731395959854126, -2.6300125122070312, -2.5286288261413574, -2.4272453784942627, -2.325861930847168, -2.2244784832000732, -2.1230950355529785, -2.021711587905884, -1.9203280210494995, -1.8189445734024048, -1.7175610065460205, -1.6161775588989258, -1.514794111251831, -1.4134106636047363, -1.3120269775390625, -1.2106435298919678, -1.1092599630355835, -1.0078765153884888, -0.9064930081367493, -0.8051095008850098, -0.703726053237915, -0.6023425459861755, -0.500959038734436, -0.39957553148269653, -0.2981920540332794, -0.1968085765838623, -0.0954250693321228, 0.005958437919616699, 0.10734188556671143, 0.20872539281845093, 0.31010913848876953, 0.41149264574050903, 0.5128761529922485, 0.6142596006393433, 0.7156431078910828, 0.8170266151428223, 0.918410062789917, 1.0197935104370117, 1.121177077293396, 1.2225605249404907, 1.323944091796875, 1.4253275394439697, 1.5267109870910645, 1.6280945539474487, 1.7294780015945435, 1.8308615684509277, 1.9322450160980225, 2.033628463745117, 2.135011911392212, 2.2363953590393066, 2.3377790451049805, 2.439162492752075, 2.54054594039917, 2.6419293880462646, 2.7433128356933594, 2.844696283340454, 2.946079730987549, 3.0474634170532227, 3.1488468647003174, 3.250230312347412, 3.351613759994507, 3.4529972076416016, 3.5543808937072754]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 3.0, 6.0, 9.0, 5.0, 14.0, 12.0, 16.0, 20.0, 22.0, 20.0, 27.0, 33.0, 22.0, 28.0, 48.0, 48.0, 48.0, 52.0, 56.0, 50.0, 60.0, 41.0, 43.0, 47.0, 33.0, 51.0, 33.0, 25.0, 21.0, 19.0, 17.0, 16.0, 9.0, 9.0, 5.0, 12.0, 3.0, 5.0, 2.0, 3.0, 4.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9295673370361328, -1.8716405630111694, -1.813713788986206, -1.7557870149612427, -1.6978602409362793, -1.639933466911316, -1.5820066928863525, -1.5240797996520996, -1.4661531448364258, -1.4082263708114624, -1.350299596786499, -1.2923728227615356, -1.2344460487365723, -1.1765192747116089, -1.1185925006866455, -1.0606656074523926, -1.0027388334274292, -0.9448120594024658, -0.8868852853775024, -0.8289585113525391, -0.7710317373275757, -0.7131049633026123, -0.6551781296730042, -0.5972513556480408, -0.5393245816230774, -0.481397807598114, -0.42347103357315063, -0.36554422974586487, -0.3076174557209015, -0.2496906816959381, -0.19176387786865234, -0.13383710384368896, -0.07591032981872559, -0.01798354834318161, 0.039943233132362366, 0.09787002205848694, 0.15579679608345032, 0.2137235701084137, 0.27165037393569946, 0.32957714796066284, 0.3875039219856262, 0.4454306960105896, 0.503357470035553, 0.5612843036651611, 0.6192110776901245, 0.6771378517150879, 0.7350646257400513, 0.7929913997650146, 0.850918173789978, 0.9088449478149414, 0.9667717218399048, 1.0246984958648682, 1.0826252698898315, 1.140552043914795, 1.1984789371490479, 1.2564055919647217, 1.3143324851989746, 1.372259259223938, 1.4301860332489014, 1.4881128072738647, 1.5460395812988281, 1.6039663553237915, 1.6618931293487549, 1.7198200225830078, 1.7777466773986816]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 4.0, 5.0, 2.0, 6.0, 5.0, 10.0, 12.0, 26.0, 27.0, 44.0, 64.0, 101.0, 204.0, 451.0, 1436.0, 6231.0, 51583.0, 1801543.0, 2260067.0, 62900.0, 7049.0, 1518.0, 464.0, 203.0, 116.0, 71.0, 42.0, 23.0, 23.0, 12.0, 10.0, 5.0, 9.0, 7.0, 5.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.240234375, -0.23196029663085938, -0.22368621826171875, -0.21541213989257812, -0.2071380615234375, -0.19886398315429688, -0.19058990478515625, -0.18231582641601562, -0.174041748046875, -0.16576766967773438, -0.15749359130859375, -0.14921951293945312, -0.1409454345703125, -0.13267135620117188, -0.12439727783203125, -0.11612319946289062, -0.10784912109375, -0.09957504272460938, -0.09130096435546875, -0.08302688598632812, -0.0747528076171875, -0.06647872924804688, -0.05820465087890625, -0.049930572509765625, -0.041656494140625, -0.033382415771484375, -0.02510833740234375, -0.016834259033203125, -0.0085601806640625, -0.000286102294921875, 0.00798797607421875, 0.016262054443359375, 0.0245361328125, 0.032810211181640625, 0.04108428955078125, 0.049358367919921875, 0.0576324462890625, 0.06590652465820312, 0.07418060302734375, 0.08245468139648438, 0.090728759765625, 0.09900283813476562, 0.10727691650390625, 0.11555099487304688, 0.1238250732421875, 0.13209915161132812, 0.14037322998046875, 0.14864730834960938, 0.15692138671875, 0.16519546508789062, 0.17346954345703125, 0.18174362182617188, 0.1900177001953125, 0.19829177856445312, 0.20656585693359375, 0.21483993530273438, 0.223114013671875, 0.23138809204101562, 0.23966217041015625, 0.24793624877929688, 0.2562103271484375, 0.2644844055175781, 0.27275848388671875, 0.2810325622558594, 0.289306640625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 6.0, 8.0, 9.0, 12.0, 20.0, 26.0, 47.0, 59.0, 64.0, 73.0, 73.0, 91.0, 103.0, 68.0, 78.0, 69.0, 53.0, 43.0, 32.0, 29.0, 17.0, 12.0, 7.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1463623046875, -0.1411590576171875, -0.135955810546875, -0.1307525634765625, -0.12554931640625, -0.1203460693359375, -0.115142822265625, -0.1099395751953125, -0.104736328125, -0.0995330810546875, -0.094329833984375, -0.0891265869140625, -0.08392333984375, -0.0787200927734375, -0.073516845703125, -0.0683135986328125, -0.0631103515625, -0.0579071044921875, -0.052703857421875, -0.0475006103515625, -0.04229736328125, -0.0370941162109375, -0.031890869140625, -0.0266876220703125, -0.021484375, -0.0162811279296875, -0.011077880859375, -0.0058746337890625, -0.00067138671875, 0.0045318603515625, 0.009735107421875, 0.0149383544921875, 0.0201416015625, 0.0253448486328125, 0.030548095703125, 0.0357513427734375, 0.04095458984375, 0.0461578369140625, 0.051361083984375, 0.0565643310546875, 0.061767578125, 0.0669708251953125, 0.072174072265625, 0.0773773193359375, 0.08258056640625, 0.0877838134765625, 0.092987060546875, 0.0981903076171875, 0.1033935546875, 0.1085968017578125, 0.113800048828125, 0.1190032958984375, 0.12420654296875, 0.1294097900390625, 0.134613037109375, 0.1398162841796875, 0.14501953125, 0.1502227783203125, 0.155426025390625, 0.1606292724609375, 0.16583251953125, 0.1710357666015625, 0.176239013671875, 0.1814422607421875, 0.1866455078125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 4.0, 7.0, 10.0, 12.0, 22.0, 42.0, 51.0, 116.0, 244.0, 691.0, 2316.0, 11559.0, 102990.0, 3042637.0, 982803.0, 42337.0, 6151.0, 1410.0, 499.0, 166.0, 81.0, 49.0, 19.0, 16.0, 11.0, 13.0, 10.0, 7.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.3447265625, -0.33628273010253906, -0.3278388977050781, -0.3193950653076172, -0.31095123291015625, -0.3025074005126953, -0.2940635681152344, -0.28561973571777344, -0.2771759033203125, -0.26873207092285156, -0.2602882385253906, -0.2518444061279297, -0.24340057373046875, -0.2349567413330078, -0.22651290893554688, -0.21806907653808594, -0.209625244140625, -0.20118141174316406, -0.19273757934570312, -0.1842937469482422, -0.17584991455078125, -0.1674060821533203, -0.15896224975585938, -0.15051841735839844, -0.1420745849609375, -0.13363075256347656, -0.12518692016601562, -0.11674308776855469, -0.10829925537109375, -0.09985542297363281, -0.09141159057617188, -0.08296775817871094, -0.07452392578125, -0.06608009338378906, -0.057636260986328125, -0.04919242858886719, -0.04074859619140625, -0.03230476379394531, -0.023860931396484375, -0.015417098999023438, -0.0069732666015625, 0.0014705657958984375, 0.009914398193359375, 0.018358230590820312, 0.02680206298828125, 0.03524589538574219, 0.043689727783203125, 0.05213356018066406, 0.060577392578125, 0.06902122497558594, 0.07746505737304688, 0.08590888977050781, 0.09435272216796875, 0.10279655456542969, 0.11124038696289062, 0.11968421936035156, 0.1281280517578125, 0.13657188415527344, 0.14501571655273438, 0.1534595489501953, 0.16190338134765625, 0.1703472137451172, 0.17879104614257812, 0.18723487854003906, 0.1956787109375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 7.0, 11.0, 10.0, 15.0, 23.0, 24.0, 54.0, 88.0, 130.0, 240.0, 419.0, 670.0, 805.0, 674.0, 397.0, 196.0, 122.0, 55.0, 45.0, 28.0, 17.0, 12.0, 6.0, 10.0, 5.0, 1.0, 6.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2489013671875, -0.2412395477294922, -0.23357772827148438, -0.22591590881347656, -0.21825408935546875, -0.21059226989746094, -0.20293045043945312, -0.1952686309814453, -0.1876068115234375, -0.1799449920654297, -0.17228317260742188, -0.16462135314941406, -0.15695953369140625, -0.14929771423339844, -0.14163589477539062, -0.1339740753173828, -0.126312255859375, -0.11865043640136719, -0.11098861694335938, -0.10332679748535156, -0.09566497802734375, -0.08800315856933594, -0.08034133911132812, -0.07267951965332031, -0.0650177001953125, -0.05735588073730469, -0.049694061279296875, -0.04203224182128906, -0.03437042236328125, -0.026708602905273438, -0.019046783447265625, -0.011384963989257812, -0.00372314453125, 0.0039386749267578125, 0.011600494384765625, 0.019262313842773438, 0.02692413330078125, 0.03458595275878906, 0.042247772216796875, 0.04990959167480469, 0.0575714111328125, 0.06523323059082031, 0.07289505004882812, 0.08055686950683594, 0.08821868896484375, 0.09588050842285156, 0.10354232788085938, 0.11120414733886719, 0.118865966796875, 0.1265277862548828, 0.13418960571289062, 0.14185142517089844, 0.14951324462890625, 0.15717506408691406, 0.16483688354492188, 0.1724987030029297, 0.1801605224609375, 0.1878223419189453, 0.19548416137695312, 0.20314598083496094, 0.21080780029296875, 0.21846961975097656, 0.22613143920898438, 0.2337932586669922, 0.241455078125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 8.0, 5.0, 5.0, 6.0, 8.0, 3.0, 20.0, 21.0, 35.0, 86.0, 108.0, 179.0, 199.0, 149.0, 92.0, 42.0, 18.0, 4.0, 7.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.0547385215759277, -2.9882168769836426, -2.9216954708099365, -2.8551738262176514, -2.788652181625366, -2.72213077545166, -2.655609130859375, -2.58908748626709, -2.522566080093384, -2.4560444355010986, -2.3895230293273926, -2.3230013847351074, -2.2564797401428223, -2.189958333969116, -2.123436689376831, -2.056915044784546, -1.9903935194015503, -1.9238719940185547, -1.8573503494262695, -1.790828824043274, -1.7243072986602783, -1.6577856540679932, -1.5912641286849976, -1.524742603302002, -1.4582209587097168, -1.3916994333267212, -1.325177788734436, -1.2586562633514404, -1.1921347379684448, -1.1256132125854492, -1.059091567993164, -0.9925700426101685, -0.9260485172271729, -0.8595269322395325, -0.7930054068565369, -0.7264838218688965, -0.6599622964859009, -0.5934407114982605, -0.5269191265106201, -0.4603975713253021, -0.39387601613998413, -0.32735446095466614, -0.26083290576934814, -0.19431132078170776, -0.12778976559638977, -0.06126821041107178, 0.0052533745765686035, 0.0717749297618866, 0.1382964849472046, 0.20481804013252258, 0.2713395953178406, 0.33786118030548096, 0.40438273549079895, 0.47090429067611694, 0.5374258756637573, 0.6039474010467529, 0.6704689860343933, 0.7369905710220337, 0.8035120964050293, 0.8700336813926697, 0.9365552663803101, 1.0030767917633057, 1.0695984363555908, 1.1361199617385864, 1.202641487121582]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 6.0, 8.0, 9.0, 15.0, 16.0, 20.0, 21.0, 34.0, 38.0, 44.0, 39.0, 53.0, 57.0, 62.0, 62.0, 56.0, 72.0, 54.0, 58.0, 49.0, 42.0, 37.0, 27.0, 23.0, 32.0, 14.0, 16.0, 10.0, 13.0, 7.0, 3.0, 2.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 3.0], "bins": [-1.5951663255691528, -1.5554850101470947, -1.5158038139343262, -1.476122498512268, -1.43644118309021, -1.3967599868774414, -1.3570786714553833, -1.3173973560333252, -1.2777161598205566, -1.2380348443984985, -1.19835364818573, -1.1586723327636719, -1.1189910173416138, -1.0793097019195557, -1.039628505706787, -0.999947190284729, -0.9602658748626709, -0.9205846190452576, -0.8809033036231995, -0.8412220478057861, -0.801540732383728, -0.7618594765663147, -0.7221782207489014, -0.6824969053268433, -0.6428156495094299, -0.6031343936920166, -0.5634530782699585, -0.5237718224525452, -0.48409053683280945, -0.44440925121307373, -0.4047279953956604, -0.3650467097759247, -0.3253653049468994, -0.2856840193271637, -0.24600274860858917, -0.20632147789001465, -0.16664019227027893, -0.1269589066505432, -0.08727763593196869, -0.047596365213394165, -0.007915079593658447, 0.031766198575496674, 0.0714474767446518, 0.11112875491380692, 0.15081003308296204, 0.19049131870269775, 0.23017258942127228, 0.2698538601398468, 0.3095351457595825, 0.34921643137931824, 0.38889771699905396, 0.4285789728164673, 0.468260258436203, 0.5079415440559387, 0.547622799873352, 0.5873041152954102, 0.6269853711128235, 0.6666666269302368, 0.7063479423522949, 0.7460291981697083, 0.7857104539871216, 0.8253917694091797, 0.865073025226593, 0.9047542810440063, 0.9444355964660645]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 11.0, 18.0, 20.0, 24.0, 46.0, 50.0, 91.0, 159.0, 278.0, 501.0, 860.0, 1655.0, 3266.0, 6505.0, 13787.0, 32123.0, 79313.0, 207159.0, 372106.0, 197888.0, 75827.0, 30669.0, 13319.0, 6112.0, 3060.0, 1602.0, 878.0, 483.0, 314.0, 173.0, 79.0, 69.0, 38.0, 26.0, 12.0, 8.0, 9.0, 8.0, 1.0, 6.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12469482421875, -0.12015628814697266, -0.11561775207519531, -0.11107921600341797, -0.10654067993164062, -0.10200214385986328, -0.09746360778808594, -0.0929250717163086, -0.08838653564453125, -0.0838479995727539, -0.07930946350097656, -0.07477092742919922, -0.07023239135742188, -0.06569385528564453, -0.06115531921386719, -0.056616783142089844, -0.0520782470703125, -0.047539710998535156, -0.04300117492675781, -0.03846263885498047, -0.033924102783203125, -0.02938556671142578, -0.024847030639648438, -0.020308494567871094, -0.01576995849609375, -0.011231422424316406, -0.0066928863525390625, -0.0021543502807617188, 0.002384185791015625, 0.006922721862792969, 0.011461257934570312, 0.015999794006347656, 0.020538330078125, 0.025076866149902344, 0.029615402221679688, 0.03415393829345703, 0.038692474365234375, 0.04323101043701172, 0.04776954650878906, 0.052308082580566406, 0.05684661865234375, 0.061385154724121094, 0.06592369079589844, 0.07046222686767578, 0.07500076293945312, 0.07953929901123047, 0.08407783508300781, 0.08861637115478516, 0.0931549072265625, 0.09769344329833984, 0.10223197937011719, 0.10677051544189453, 0.11130905151367188, 0.11584758758544922, 0.12038612365722656, 0.1249246597290039, 0.12946319580078125, 0.1340017318725586, 0.13854026794433594, 0.14307880401611328, 0.14761734008789062, 0.15215587615966797, 0.1566944122314453, 0.16123294830322266, 0.165771484375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 6.0, 1.0, 3.0, 5.0, 3.0, 15.0, 10.0, 12.0, 19.0, 20.0, 32.0, 37.0, 41.0, 44.0, 44.0, 48.0, 64.0, 48.0, 66.0, 70.0, 57.0, 40.0, 59.0, 46.0, 40.0, 31.0, 31.0, 20.0, 27.0, 18.0, 18.0, 9.0, 4.0, 6.0, 3.0, 2.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.13134765625, -0.12786006927490234, -0.12437248229980469, -0.12088489532470703, -0.11739730834960938, -0.11390972137451172, -0.11042213439941406, -0.1069345474243164, -0.10344696044921875, -0.0999593734741211, -0.09647178649902344, -0.09298419952392578, -0.08949661254882812, -0.08600902557373047, -0.08252143859863281, -0.07903385162353516, -0.0755462646484375, -0.07205867767333984, -0.06857109069824219, -0.06508350372314453, -0.061595916748046875, -0.05810832977294922, -0.05462074279785156, -0.051133155822753906, -0.04764556884765625, -0.044157981872558594, -0.04067039489746094, -0.03718280792236328, -0.033695220947265625, -0.03020763397216797, -0.026720046997070312, -0.023232460021972656, -0.019744873046875, -0.016257286071777344, -0.012769699096679688, -0.009282112121582031, -0.005794525146484375, -0.0023069381713867188, 0.0011806488037109375, 0.004668235778808594, 0.00815582275390625, 0.011643409729003906, 0.015130996704101562, 0.01861858367919922, 0.022106170654296875, 0.02559375762939453, 0.029081344604492188, 0.032568931579589844, 0.0360565185546875, 0.039544105529785156, 0.04303169250488281, 0.04651927947998047, 0.050006866455078125, 0.05349445343017578, 0.05698204040527344, 0.060469627380371094, 0.06395721435546875, 0.0674448013305664, 0.07093238830566406, 0.07441997528076172, 0.07790756225585938, 0.08139514923095703, 0.08488273620605469, 0.08837032318115234, 0.09185791015625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 3.0, 2.0, 6.0, 8.0, 11.0, 11.0, 16.0, 26.0, 38.0, 47.0, 65.0, 87.0, 137.0, 208.0, 330.0, 563.0, 1032.0, 2115.0, 6830.0, 39973.0, 559949.0, 394705.0, 31945.0, 6003.0, 1954.0, 975.0, 540.0, 337.0, 213.0, 126.0, 97.0, 61.0, 39.0, 31.0, 23.0, 16.0, 11.0, 5.0, 6.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.377685546875, -0.3668785095214844, -0.35607147216796875, -0.3452644348144531, -0.3344573974609375, -0.3236503601074219, -0.31284332275390625, -0.3020362854003906, -0.291229248046875, -0.2804222106933594, -0.26961517333984375, -0.2588081359863281, -0.2480010986328125, -0.23719406127929688, -0.22638702392578125, -0.21557998657226562, -0.20477294921875, -0.19396591186523438, -0.18315887451171875, -0.17235183715820312, -0.1615447998046875, -0.15073776245117188, -0.13993072509765625, -0.12912368774414062, -0.118316650390625, -0.10750961303710938, -0.09670257568359375, -0.08589553833007812, -0.0750885009765625, -0.06428146362304688, -0.05347442626953125, -0.042667388916015625, -0.0318603515625, -0.021053314208984375, -0.01024627685546875, 0.000560760498046875, 0.0113677978515625, 0.022174835205078125, 0.03298187255859375, 0.043788909912109375, 0.054595947265625, 0.06540298461914062, 0.07621002197265625, 0.08701705932617188, 0.0978240966796875, 0.10863113403320312, 0.11943817138671875, 0.13024520874023438, 0.14105224609375, 0.15185928344726562, 0.16266632080078125, 0.17347335815429688, 0.1842803955078125, 0.19508743286132812, 0.20589447021484375, 0.21670150756835938, 0.227508544921875, 0.23831558227539062, 0.24912261962890625, 0.2599296569824219, 0.2707366943359375, 0.2815437316894531, 0.29235076904296875, 0.3031578063964844, 0.31396484375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 7.0, 11.0, 6.0, 12.0, 12.0, 10.0, 17.0, 16.0, 19.0, 12.0, 12.0, 35.0, 41.0, 28.0, 29.0, 38.0, 35.0, 35.0, 45.0, 53.0, 46.0, 46.0, 48.0, 43.0, 42.0, 40.0, 39.0, 41.0, 24.0, 18.0, 26.0, 26.0, 19.0, 15.0, 8.0, 9.0, 11.0, 7.0, 8.0, 7.0, 2.0, 4.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.300537109375, -0.28987884521484375, -0.2792205810546875, -0.26856231689453125, -0.257904052734375, -0.24724578857421875, -0.2365875244140625, -0.22592926025390625, -0.21527099609375, -0.20461273193359375, -0.1939544677734375, -0.18329620361328125, -0.172637939453125, -0.16197967529296875, -0.1513214111328125, -0.14066314697265625, -0.1300048828125, -0.11934661865234375, -0.1086883544921875, -0.09803009033203125, -0.087371826171875, -0.07671356201171875, -0.0660552978515625, -0.05539703369140625, -0.04473876953125, -0.03408050537109375, -0.0234222412109375, -0.01276397705078125, -0.002105712890625, 0.00855255126953125, 0.0192108154296875, 0.02986907958984375, 0.04052734375, 0.05118560791015625, 0.0618438720703125, 0.07250213623046875, 0.083160400390625, 0.09381866455078125, 0.1044769287109375, 0.11513519287109375, 0.12579345703125, 0.13645172119140625, 0.1471099853515625, 0.15776824951171875, 0.168426513671875, 0.17908477783203125, 0.1897430419921875, 0.20040130615234375, 0.2110595703125, 0.22171783447265625, 0.2323760986328125, 0.24303436279296875, 0.253692626953125, 0.26435089111328125, 0.2750091552734375, 0.28566741943359375, 0.29632568359375, 0.30698394775390625, 0.3176422119140625, 0.32830047607421875, 0.338958740234375, 0.34961700439453125, 0.3602752685546875, 0.37093353271484375, 0.381591796875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 5.0, 6.0, 9.0, 10.0, 14.0, 32.0, 36.0, 48.0, 92.0, 148.0, 303.0, 550.0, 1312.0, 3616.0, 14653.0, 94680.0, 808089.0, 103258.0, 15268.0, 3852.0, 1318.0, 600.0, 270.0, 140.0, 101.0, 45.0, 38.0, 18.0, 12.0, 9.0, 7.0, 4.0, 6.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.158935546875, -0.1535511016845703, -0.14816665649414062, -0.14278221130371094, -0.13739776611328125, -0.13201332092285156, -0.12662887573242188, -0.12124443054199219, -0.1158599853515625, -0.11047554016113281, -0.10509109497070312, -0.09970664978027344, -0.09432220458984375, -0.08893775939941406, -0.08355331420898438, -0.07816886901855469, -0.072784423828125, -0.06739997863769531, -0.062015533447265625, -0.05663108825683594, -0.05124664306640625, -0.04586219787597656, -0.040477752685546875, -0.03509330749511719, -0.0297088623046875, -0.024324417114257812, -0.018939971923828125, -0.013555526733398438, -0.00817108154296875, -0.0027866363525390625, 0.002597808837890625, 0.007982254028320312, 0.01336669921875, 0.018751144409179688, 0.024135589599609375, 0.029520034790039062, 0.03490447998046875, 0.04028892517089844, 0.045673370361328125, 0.05105781555175781, 0.0564422607421875, 0.06182670593261719, 0.06721115112304688, 0.07259559631347656, 0.07798004150390625, 0.08336448669433594, 0.08874893188476562, 0.09413337707519531, 0.099517822265625, 0.10490226745605469, 0.11028671264648438, 0.11567115783691406, 0.12105560302734375, 0.12644004821777344, 0.13182449340820312, 0.1372089385986328, 0.1425933837890625, 0.1479778289794922, 0.15336227416992188, 0.15874671936035156, 0.16413116455078125, 0.16951560974121094, 0.17490005493164062, 0.1802845001220703, 0.1856689453125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 1.0, 2.0, 1.0, 4.0, 8.0, 9.0, 4.0, 4.0, 11.0, 6.0, 9.0, 13.0, 21.0, 22.0, 20.0, 36.0, 50.0, 65.0, 99.0, 112.0, 120.0, 93.0, 65.0, 47.0, 40.0, 27.0, 18.0, 19.0, 22.0, 9.0, 11.0, 12.0, 7.0, 4.0, 5.0, 3.0, 6.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9948692321777344e-05, -4.816707223653793e-05, -4.638545215129852e-05, -4.460383206605911e-05, -4.28222119808197e-05, -4.104059189558029e-05, -3.925897181034088e-05, -3.747735172510147e-05, -3.569573163986206e-05, -3.391411155462265e-05, -3.213249146938324e-05, -3.035087138414383e-05, -2.856925129890442e-05, -2.678763121366501e-05, -2.5006011128425598e-05, -2.3224391043186188e-05, -2.1442770957946777e-05, -1.9661150872707367e-05, -1.7879530787467957e-05, -1.6097910702228546e-05, -1.4316290616989136e-05, -1.2534670531749725e-05, -1.0753050446510315e-05, -8.971430361270905e-06, -7.189810276031494e-06, -5.408190190792084e-06, -3.6265701055526733e-06, -1.844950020313263e-06, -6.332993507385254e-08, 1.7182901501655579e-06, 3.4999102354049683e-06, 5.281530320644379e-06, 7.063150405883789e-06, 8.8447704911232e-06, 1.062639057636261e-05, 1.240801066160202e-05, 1.418963074684143e-05, 1.597125083208084e-05, 1.775287091732025e-05, 1.9534491002559662e-05, 2.1316111087799072e-05, 2.3097731173038483e-05, 2.4879351258277893e-05, 2.6660971343517303e-05, 2.8442591428756714e-05, 3.0224211513996124e-05, 3.2005831599235535e-05, 3.3787451684474945e-05, 3.5569071769714355e-05, 3.7350691854953766e-05, 3.9132311940193176e-05, 4.091393202543259e-05, 4.2695552110672e-05, 4.447717219591141e-05, 4.625879228115082e-05, 4.804041236639023e-05, 4.982203245162964e-05, 5.160365253686905e-05, 5.338527262210846e-05, 5.516689270734787e-05, 5.694851279258728e-05, 5.873013287782669e-05, 6.05117529630661e-05, 6.229337304830551e-05, 6.407499313354492e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 6.0, 6.0, 6.0, 12.0, 18.0, 23.0, 27.0, 40.0, 51.0, 45.0, 91.0, 107.0, 169.0, 210.0, 367.0, 553.0, 920.0, 1606.0, 3331.0, 8632.0, 26476.0, 112002.0, 679314.0, 161556.0, 33957.0, 10333.0, 4043.0, 1910.0, 913.0, 562.0, 383.0, 235.0, 168.0, 134.0, 85.0, 62.0, 55.0, 28.0, 23.0, 18.0, 26.0, 23.0, 8.0, 6.0, 4.0, 6.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.1300048828125, -0.12601661682128906, -0.12202835083007812, -0.11804008483886719, -0.11405181884765625, -0.11006355285644531, -0.10607528686523438, -0.10208702087402344, -0.0980987548828125, -0.09411048889160156, -0.09012222290039062, -0.08613395690917969, -0.08214569091796875, -0.07815742492675781, -0.07416915893554688, -0.07018089294433594, -0.066192626953125, -0.06220436096191406, -0.058216094970703125, -0.05422782897949219, -0.05023956298828125, -0.04625129699707031, -0.042263031005859375, -0.03827476501464844, -0.0342864990234375, -0.030298233032226562, -0.026309967041015625, -0.022321701049804688, -0.01833343505859375, -0.014345169067382812, -0.010356903076171875, -0.0063686370849609375, -0.00238037109375, 0.0016078948974609375, 0.005596160888671875, 0.009584426879882812, 0.01357269287109375, 0.017560958862304688, 0.021549224853515625, 0.025537490844726562, 0.0295257568359375, 0.03351402282714844, 0.037502288818359375, 0.04149055480957031, 0.04547882080078125, 0.04946708679199219, 0.053455352783203125, 0.05744361877441406, 0.061431884765625, 0.06542015075683594, 0.06940841674804688, 0.07339668273925781, 0.07738494873046875, 0.08137321472167969, 0.08536148071289062, 0.08934974670410156, 0.0933380126953125, 0.09732627868652344, 0.10131454467773438, 0.10530281066894531, 0.10929107666015625, 0.11327934265136719, 0.11726760864257812, 0.12125587463378906, 0.125244140625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 2.0, 3.0, 6.0, 1.0, 8.0, 5.0, 15.0, 9.0, 12.0, 19.0, 17.0, 13.0, 34.0, 30.0, 31.0, 60.0, 75.0, 81.0, 75.0, 76.0, 67.0, 56.0, 53.0, 33.0, 46.0, 28.0, 22.0, 21.0, 16.0, 13.0, 6.0, 11.0, 8.0, 9.0, 9.0, 4.0, 4.0, 3.0, 3.0, 2.0, 7.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.09539794921875, -0.09224319458007812, -0.08908843994140625, -0.08593368530273438, -0.0827789306640625, -0.07962417602539062, -0.07646942138671875, -0.07331466674804688, -0.070159912109375, -0.06700515747070312, -0.06385040283203125, -0.060695648193359375, -0.0575408935546875, -0.054386138916015625, -0.05123138427734375, -0.048076629638671875, -0.044921875, -0.041767120361328125, -0.03861236572265625, -0.035457611083984375, -0.0323028564453125, -0.029148101806640625, -0.02599334716796875, -0.022838592529296875, -0.019683837890625, -0.016529083251953125, -0.01337432861328125, -0.010219573974609375, -0.0070648193359375, -0.003910064697265625, -0.00075531005859375, 0.002399444580078125, 0.00555419921875, 0.008708953857421875, 0.01186370849609375, 0.015018463134765625, 0.0181732177734375, 0.021327972412109375, 0.02448272705078125, 0.027637481689453125, 0.030792236328125, 0.033946990966796875, 0.03710174560546875, 0.040256500244140625, 0.0434112548828125, 0.046566009521484375, 0.04972076416015625, 0.052875518798828125, 0.0560302734375, 0.059185028076171875, 0.06233978271484375, 0.06549453735351562, 0.0686492919921875, 0.07180404663085938, 0.07495880126953125, 0.07811355590820312, 0.081268310546875, 0.08442306518554688, 0.08757781982421875, 0.09073257446289062, 0.0938873291015625, 0.09704208374023438, 0.10019683837890625, 0.10335159301757812, 0.10650634765625]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 1.0, 1.0, 3.0, 6.0, 9.0, 9.0, 16.0, 46.0, 74.0, 125.0, 162.0, 200.0, 139.0, 100.0, 54.0, 24.0, 12.0, 7.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.766864061355591, -2.693016529083252, -2.619168996810913, -2.545321464538574, -2.4714739322662354, -2.3976263999938965, -2.3237788677215576, -2.2499313354492188, -2.17608380317688, -2.102236270904541, -2.028388738632202, -1.9545412063598633, -1.8806936740875244, -1.8068461418151855, -1.7329986095428467, -1.6591510772705078, -1.585303544998169, -1.51145601272583, -1.4376084804534912, -1.3637609481811523, -1.2899134159088135, -1.2160658836364746, -1.1422183513641357, -1.0683708190917969, -0.994523286819458, -0.9206757545471191, -0.8468282222747803, -0.7729806900024414, -0.6991331577301025, -0.6252856254577637, -0.5514380931854248, -0.47759056091308594, -0.40374279022216797, -0.3298952579498291, -0.25604772567749023, -0.18220019340515137, -0.1083526611328125, -0.03450512886047363, 0.039342403411865234, 0.1131899356842041, 0.18703746795654297, 0.26088500022888184, 0.3347325325012207, 0.40858006477355957, 0.48242759704589844, 0.5562751293182373, 0.6301226615905762, 0.703970193862915, 0.7778177261352539, 0.8516652584075928, 0.9255127906799316, 0.9993603229522705, 1.0732078552246094, 1.1470553874969482, 1.220902919769287, 1.294750452041626, 1.3685979843139648, 1.4424455165863037, 1.5162930488586426, 1.5901405811309814, 1.6639881134033203, 1.7378356456756592, 1.811683177947998, 1.885530710220337, 1.9593782424926758]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 4.0, 3.0, 9.0, 11.0, 7.0, 14.0, 16.0, 16.0, 17.0, 23.0, 25.0, 35.0, 37.0, 39.0, 35.0, 49.0, 56.0, 60.0, 52.0, 66.0, 57.0, 48.0, 45.0, 31.0, 30.0, 29.0, 34.0, 29.0, 22.0, 23.0, 14.0, 13.0, 11.0, 16.0, 8.0, 3.0, 5.0, 5.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.2354381084442139, -1.1894893646240234, -1.143540620803833, -1.097591757774353, -1.0516430139541626, -1.0056942701339722, -0.959745466709137, -0.9137966632843018, -0.8678479194641113, -0.8218991756439209, -0.7759503722190857, -0.7300015687942505, -0.6840528249740601, -0.6381040811538696, -0.5921552777290344, -0.5462064743041992, -0.5002577304840088, -0.45430895686149597, -0.40836018323898315, -0.36241140961647034, -0.3164626359939575, -0.2705138623714447, -0.22456508874893188, -0.17861631512641907, -0.13266754150390625, -0.08671876788139343, -0.040769994258880615, 0.005178779363632202, 0.05112755298614502, 0.09707632660865784, 0.14302510023117065, 0.18897387385368347, 0.2349226474761963, 0.2808714210987091, 0.3268201947212219, 0.37276896834373474, 0.41871774196624756, 0.4646665155887604, 0.5106152892112732, 0.5565640926361084, 0.6025128364562988, 0.6484615802764893, 0.6944103837013245, 0.7403591871261597, 0.7863079309463501, 0.8322566747665405, 0.8782054781913757, 0.9241542816162109, 0.9701030254364014, 1.0160517692565918, 1.0620005130767822, 1.1079493761062622, 1.1538981199264526, 1.199846863746643, 1.245795726776123, 1.2917444705963135, 1.337693214416504, 1.3836419582366943, 1.4295907020568848, 1.4755395650863647, 1.5214883089065552, 1.5674370527267456, 1.6133859157562256, 1.659334659576416, 1.7052834033966064]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 5.0, 5.0, 4.0, 5.0, 6.0, 5.0, 8.0, 14.0, 20.0, 21.0, 33.0, 45.0, 73.0, 77.0, 142.0, 153.0, 305.0, 1797.0, 4121819.0, 68403.0, 557.0, 236.0, 161.0, 102.0, 79.0, 60.0, 45.0, 29.0, 22.0, 13.0, 13.0, 11.0, 4.0, 6.0, 2.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.2275390625, -1.1932373046875, -1.158935546875, -1.1246337890625, -1.09033203125, -1.0560302734375, -1.021728515625, -0.9874267578125, -0.953125, -0.9188232421875, -0.884521484375, -0.8502197265625, -0.81591796875, -0.7816162109375, -0.747314453125, -0.7130126953125, -0.6787109375, -0.6444091796875, -0.610107421875, -0.5758056640625, -0.54150390625, -0.5072021484375, -0.472900390625, -0.4385986328125, -0.404296875, -0.3699951171875, -0.335693359375, -0.3013916015625, -0.26708984375, -0.2327880859375, -0.198486328125, -0.1641845703125, -0.1298828125, -0.0955810546875, -0.061279296875, -0.0269775390625, 0.00732421875, 0.0416259765625, 0.075927734375, 0.1102294921875, 0.14453125, 0.1788330078125, 0.213134765625, 0.2474365234375, 0.28173828125, 0.3160400390625, 0.350341796875, 0.3846435546875, 0.4189453125, 0.4532470703125, 0.487548828125, 0.5218505859375, 0.55615234375, 0.5904541015625, 0.624755859375, 0.6590576171875, 0.693359375, 0.7276611328125, 0.761962890625, 0.7962646484375, 0.83056640625, 0.8648681640625, 0.899169921875, 0.9334716796875, 0.9677734375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 3.0, 9.0, 6.0, 14.0, 30.0, 27.0, 32.0, 48.0, 60.0, 58.0, 57.0, 96.0, 71.0, 60.0, 82.0, 60.0, 56.0, 50.0, 44.0, 33.0, 28.0, 21.0, 17.0, 11.0, 6.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11785888671875, -0.11363697052001953, -0.10941505432128906, -0.1051931381225586, -0.10097122192382812, -0.09674930572509766, -0.09252738952636719, -0.08830547332763672, -0.08408355712890625, -0.07986164093017578, -0.07563972473144531, -0.07141780853271484, -0.06719589233398438, -0.0629739761352539, -0.05875205993652344, -0.05453014373779297, -0.0503082275390625, -0.04608631134033203, -0.04186439514160156, -0.037642478942871094, -0.033420562744140625, -0.029198646545410156, -0.024976730346679688, -0.02075481414794922, -0.01653289794921875, -0.012310981750488281, -0.008089065551757812, -0.0038671493530273438, 0.000354766845703125, 0.004576683044433594, 0.008798599243164062, 0.013020515441894531, 0.017242431640625, 0.02146434783935547, 0.025686264038085938, 0.029908180236816406, 0.034130096435546875, 0.038352012634277344, 0.04257392883300781, 0.04679584503173828, 0.05101776123046875, 0.05523967742919922, 0.05946159362792969, 0.06368350982666016, 0.06790542602539062, 0.0721273422241211, 0.07634925842285156, 0.08057117462158203, 0.0847930908203125, 0.08901500701904297, 0.09323692321777344, 0.0974588394165039, 0.10168075561523438, 0.10590267181396484, 0.11012458801269531, 0.11434650421142578, 0.11856842041015625, 0.12279033660888672, 0.1270122528076172, 0.13123416900634766, 0.13545608520507812, 0.1396780014038086, 0.14389991760253906, 0.14812183380126953, 0.15234375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 5.0, 6.0, 6.0, 4.0, 10.0, 25.0, 30.0, 27.0, 72.0, 119.0, 244.0, 555.0, 1195.0, 2764.0, 7052.0, 19437.0, 66526.0, 343802.0, 2165546.0, 1324593.0, 193160.0, 44469.0, 14321.0, 5551.0, 2384.0, 1196.0, 550.0, 277.0, 144.0, 87.0, 40.0, 27.0, 17.0, 13.0, 7.0, 12.0, 4.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1376953125, -0.13362598419189453, -0.12955665588378906, -0.1254873275756836, -0.12141799926757812, -0.11734867095947266, -0.11327934265136719, -0.10921001434326172, -0.10514068603515625, -0.10107135772705078, -0.09700202941894531, -0.09293270111083984, -0.08886337280273438, -0.0847940444946289, -0.08072471618652344, -0.07665538787841797, -0.0725860595703125, -0.06851673126220703, -0.06444740295410156, -0.060378074645996094, -0.056308746337890625, -0.052239418029785156, -0.04817008972167969, -0.04410076141357422, -0.04003143310546875, -0.03596210479736328, -0.03189277648925781, -0.027823448181152344, -0.023754119873046875, -0.019684791564941406, -0.015615463256835938, -0.011546134948730469, -0.007476806640625, -0.0034074783325195312, 0.0006618499755859375, 0.004731178283691406, 0.008800506591796875, 0.012869834899902344, 0.016939163208007812, 0.02100849151611328, 0.02507781982421875, 0.02914714813232422, 0.03321647644042969, 0.037285804748535156, 0.041355133056640625, 0.045424461364746094, 0.04949378967285156, 0.05356311798095703, 0.0576324462890625, 0.06170177459716797, 0.06577110290527344, 0.0698404312133789, 0.07390975952148438, 0.07797908782958984, 0.08204841613769531, 0.08611774444580078, 0.09018707275390625, 0.09425640106201172, 0.09832572937011719, 0.10239505767822266, 0.10646438598632812, 0.1105337142944336, 0.11460304260253906, 0.11867237091064453, 0.12274169921875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 6.0, 8.0, 4.0, 8.0, 9.0, 13.0, 13.0, 21.0, 22.0, 47.0, 45.0, 69.0, 86.0, 167.0, 224.0, 290.0, 372.0, 454.0, 495.0, 428.0, 330.0, 289.0, 182.0, 142.0, 101.0, 54.0, 41.0, 37.0, 31.0, 20.0, 17.0, 11.0, 9.0, 7.0, 4.0, 7.0, 3.0, 0.0, 4.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.11376953125, -0.10959625244140625, -0.1054229736328125, -0.10124969482421875, -0.097076416015625, -0.09290313720703125, -0.0887298583984375, -0.08455657958984375, -0.08038330078125, -0.07621002197265625, -0.0720367431640625, -0.06786346435546875, -0.063690185546875, -0.05951690673828125, -0.0553436279296875, -0.05117034912109375, -0.0469970703125, -0.04282379150390625, -0.0386505126953125, -0.03447723388671875, -0.030303955078125, -0.02613067626953125, -0.0219573974609375, -0.01778411865234375, -0.01361083984375, -0.00943756103515625, -0.0052642822265625, -0.00109100341796875, 0.003082275390625, 0.00725555419921875, 0.0114288330078125, 0.01560211181640625, 0.019775390625, 0.02394866943359375, 0.0281219482421875, 0.03229522705078125, 0.036468505859375, 0.04064178466796875, 0.0448150634765625, 0.04898834228515625, 0.05316162109375, 0.05733489990234375, 0.0615081787109375, 0.06568145751953125, 0.069854736328125, 0.07402801513671875, 0.0782012939453125, 0.08237457275390625, 0.0865478515625, 0.09072113037109375, 0.0948944091796875, 0.09906768798828125, 0.103240966796875, 0.10741424560546875, 0.1115875244140625, 0.11576080322265625, 0.11993408203125, 0.12410736083984375, 0.1282806396484375, 0.13245391845703125, 0.136627197265625, 0.14080047607421875, 0.1449737548828125, 0.14914703369140625, 0.1533203125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 5.0, 7.0, 9.0, 13.0, 42.0, 64.0, 134.0, 207.0, 208.0, 145.0, 97.0, 40.0, 9.0, 7.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.613504409790039, -2.549882650375366, -2.4862611293792725, -2.4226393699645996, -2.359017848968506, -2.295396089553833, -2.23177433013916, -2.1681528091430664, -2.1045310497283936, -2.0409092903137207, -1.977287769317627, -1.913666009902954, -1.8500443696975708, -1.7864227294921875, -1.7228009700775146, -1.6591793298721313, -1.595557689666748, -1.5319360494613647, -1.4683144092559814, -1.4046926498413086, -1.3410710096359253, -1.277449369430542, -1.2138276100158691, -1.1502059698104858, -1.0865843296051025, -1.0229626893997192, -0.9593409895896912, -0.8957192897796631, -0.8320976495742798, -0.7684760093688965, -0.7048543095588684, -0.6412326097488403, -0.5776112079620361, -0.5139895677566528, -0.45036786794662476, -0.38674619793891907, -0.3231245279312134, -0.2595028579235077, -0.195881187915802, -0.1322595179080963, -0.06863784790039062, -0.0050161778926849365, 0.05860549211502075, 0.12222716212272644, 0.18584883213043213, 0.24947050213813782, 0.3130921721458435, 0.3767138421535492, 0.4403355121612549, 0.5039571523666382, 0.5675788521766663, 0.6312005519866943, 0.6948221921920776, 0.7584438323974609, 0.822065532207489, 0.8856872320175171, 0.9493088722229004, 1.0129305124282837, 1.076552152633667, 1.1401739120483398, 1.2037955522537231, 1.2674171924591064, 1.3310389518737793, 1.3946605920791626, 1.458282232284546]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 4.0, 7.0, 9.0, 6.0, 7.0, 14.0, 18.0, 20.0, 24.0, 20.0, 28.0, 34.0, 28.0, 36.0, 29.0, 51.0, 50.0, 47.0, 48.0, 51.0, 46.0, 34.0, 47.0, 36.0, 40.0, 30.0, 37.0, 26.0, 25.0, 28.0, 20.0, 15.0, 13.0, 7.0, 8.0, 8.0, 13.0, 5.0, 11.0, 6.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.7177573442459106, -0.6952441334724426, -0.6727309226989746, -0.6502177119255066, -0.6277045011520386, -0.6051913499832153, -0.5826781392097473, -0.5601649284362793, -0.5376517176628113, -0.5151385068893433, -0.49262529611587524, -0.4701121151447296, -0.4475989043712616, -0.4250856935977936, -0.40257251262664795, -0.38005930185317993, -0.3575460910797119, -0.3350328803062439, -0.3125196695327759, -0.29000648856163025, -0.26749327778816223, -0.2449800670146942, -0.2224668711423874, -0.19995367527008057, -0.17744046449661255, -0.15492725372314453, -0.1324140578508377, -0.10990085452795029, -0.08738765120506287, -0.06487444788217545, -0.042361244559288025, -0.0198480486869812, 0.0026651620864868164, 0.025178365409374237, 0.04769156873226166, 0.07020477205514908, 0.0927179753780365, 0.11523117870092392, 0.13774438202381134, 0.16025757789611816, 0.18277078866958618, 0.2052839994430542, 0.22779719531536102, 0.25031039118766785, 0.27282360196113586, 0.2953368127346039, 0.3178499937057495, 0.34036320447921753, 0.36287641525268555, 0.38538962602615356, 0.4079028367996216, 0.4304160177707672, 0.45292922854423523, 0.47544243931770325, 0.4979556202888489, 0.5204688310623169, 0.5429820418357849, 0.5654952526092529, 0.588008463382721, 0.610521674156189, 0.6330348253250122, 0.6555480360984802, 0.6780612468719482, 0.7005744576454163, 0.7230876684188843]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 5.0, 2.0, 4.0, 4.0, 10.0, 7.0, 4.0, 17.0, 15.0, 27.0, 45.0, 56.0, 79.0, 136.0, 151.0, 279.0, 393.0, 669.0, 1089.0, 1976.0, 3579.0, 6751.0, 13780.0, 28169.0, 63055.0, 157015.0, 345626.0, 247458.0, 96519.0, 41372.0, 19308.0, 9534.0, 4945.0, 2748.0, 1383.0, 844.0, 499.0, 339.0, 221.0, 142.0, 104.0, 53.0, 36.0, 38.0, 23.0, 16.0, 10.0, 13.0, 4.0, 4.0, 6.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.130615234375, -0.12674427032470703, -0.12287330627441406, -0.1190023422241211, -0.11513137817382812, -0.11126041412353516, -0.10738945007324219, -0.10351848602294922, -0.09964752197265625, -0.09577655792236328, -0.09190559387207031, -0.08803462982177734, -0.08416366577148438, -0.0802927017211914, -0.07642173767089844, -0.07255077362060547, -0.0686798095703125, -0.06480884552001953, -0.06093788146972656, -0.057066917419433594, -0.053195953369140625, -0.049324989318847656, -0.04545402526855469, -0.04158306121826172, -0.03771209716796875, -0.03384113311767578, -0.029970169067382812, -0.026099205017089844, -0.022228240966796875, -0.018357276916503906, -0.014486312866210938, -0.010615348815917969, -0.006744384765625, -0.0028734207153320312, 0.0009975433349609375, 0.004868507385253906, 0.008739471435546875, 0.012610435485839844, 0.016481399536132812, 0.02035236358642578, 0.02422332763671875, 0.02809429168701172, 0.03196525573730469, 0.035836219787597656, 0.039707183837890625, 0.043578147888183594, 0.04744911193847656, 0.05132007598876953, 0.0551910400390625, 0.05906200408935547, 0.06293296813964844, 0.0668039321899414, 0.07067489624023438, 0.07454586029052734, 0.07841682434082031, 0.08228778839111328, 0.08615875244140625, 0.09002971649169922, 0.09390068054199219, 0.09777164459228516, 0.10164260864257812, 0.1055135726928711, 0.10938453674316406, 0.11325550079345703, 0.11712646484375]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 4.0, 8.0, 5.0, 8.0, 7.0, 15.0, 14.0, 35.0, 28.0, 23.0, 32.0, 39.0, 46.0, 49.0, 50.0, 31.0, 54.0, 64.0, 53.0, 72.0, 48.0, 58.0, 37.0, 39.0, 36.0, 31.0, 13.0, 23.0, 18.0, 13.0, 14.0, 16.0, 8.0, 3.0, 4.0, 2.0, 1.0, 1.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.11700439453125, -0.11380481719970703, -0.11060523986816406, -0.1074056625366211, -0.10420608520507812, -0.10100650787353516, -0.09780693054199219, -0.09460735321044922, -0.09140777587890625, -0.08820819854736328, -0.08500862121582031, -0.08180904388427734, -0.07860946655273438, -0.0754098892211914, -0.07221031188964844, -0.06901073455810547, -0.0658111572265625, -0.06261157989501953, -0.05941200256347656, -0.056212425231933594, -0.053012847900390625, -0.049813270568847656, -0.04661369323730469, -0.04341411590576172, -0.04021453857421875, -0.03701496124267578, -0.03381538391113281, -0.030615806579589844, -0.027416229248046875, -0.024216651916503906, -0.021017074584960938, -0.01781749725341797, -0.014617919921875, -0.011418342590332031, -0.008218765258789062, -0.005019187927246094, -0.001819610595703125, 0.0013799667358398438, 0.0045795440673828125, 0.007779121398925781, 0.01097869873046875, 0.014178276062011719, 0.017377853393554688, 0.020577430725097656, 0.023777008056640625, 0.026976585388183594, 0.030176162719726562, 0.03337574005126953, 0.0365753173828125, 0.03977489471435547, 0.04297447204589844, 0.046174049377441406, 0.049373626708984375, 0.052573204040527344, 0.05577278137207031, 0.05897235870361328, 0.06217193603515625, 0.06537151336669922, 0.06857109069824219, 0.07177066802978516, 0.07497024536132812, 0.0781698226928711, 0.08136940002441406, 0.08456897735595703, 0.0877685546875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 2.0, 3.0, 8.0, 5.0, 6.0, 14.0, 27.0, 43.0, 46.0, 66.0, 144.0, 231.0, 453.0, 882.0, 2547.0, 10080.0, 66635.0, 711132.0, 224392.0, 24197.0, 4825.0, 1498.0, 592.0, 301.0, 169.0, 76.0, 62.0, 31.0, 26.0, 15.0, 21.0, 8.0, 2.0, 4.0, 7.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3271484375, -0.3165092468261719, -0.30587005615234375, -0.2952308654785156, -0.2845916748046875, -0.2739524841308594, -0.26331329345703125, -0.2526741027832031, -0.242034912109375, -0.23139572143554688, -0.22075653076171875, -0.21011734008789062, -0.1994781494140625, -0.18883895874023438, -0.17819976806640625, -0.16756057739257812, -0.15692138671875, -0.14628219604492188, -0.13564300537109375, -0.12500381469726562, -0.1143646240234375, -0.10372543334960938, -0.09308624267578125, -0.08244705200195312, -0.071807861328125, -0.061168670654296875, -0.05052947998046875, -0.039890289306640625, -0.0292510986328125, -0.018611907958984375, -0.00797271728515625, 0.002666473388671875, 0.0133056640625, 0.023944854736328125, 0.03458404541015625, 0.045223236083984375, 0.0558624267578125, 0.06650161743164062, 0.07714080810546875, 0.08777999877929688, 0.098419189453125, 0.10905838012695312, 0.11969757080078125, 0.13033676147460938, 0.1409759521484375, 0.15161514282226562, 0.16225433349609375, 0.17289352416992188, 0.18353271484375, 0.19417190551757812, 0.20481109619140625, 0.21545028686523438, 0.2260894775390625, 0.23672866821289062, 0.24736785888671875, 0.2580070495605469, 0.268646240234375, 0.2792854309082031, 0.28992462158203125, 0.3005638122558594, 0.3112030029296875, 0.3218421936035156, 0.33248138427734375, 0.3431205749511719, 0.353759765625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 5.0, 12.0, 14.0, 13.0, 17.0, 18.0, 27.0, 29.0, 37.0, 37.0, 37.0, 49.0, 44.0, 60.0, 65.0, 54.0, 56.0, 36.0, 58.0, 48.0, 41.0, 30.0, 43.0, 29.0, 22.0, 27.0, 22.0, 21.0, 6.0, 10.0, 8.0, 8.0, 5.0, 6.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36962890625, -0.3577232360839844, -0.34581756591796875, -0.3339118957519531, -0.3220062255859375, -0.3101005554199219, -0.29819488525390625, -0.2862892150878906, -0.274383544921875, -0.2624778747558594, -0.25057220458984375, -0.23866653442382812, -0.2267608642578125, -0.21485519409179688, -0.20294952392578125, -0.19104385375976562, -0.17913818359375, -0.16723251342773438, -0.15532684326171875, -0.14342117309570312, -0.1315155029296875, -0.11960983276367188, -0.10770416259765625, -0.09579849243164062, -0.083892822265625, -0.07198715209960938, -0.06008148193359375, -0.048175811767578125, -0.0362701416015625, -0.024364471435546875, -0.01245880126953125, -0.000553131103515625, 0.0113525390625, 0.023258209228515625, 0.03516387939453125, 0.047069549560546875, 0.0589752197265625, 0.07088088989257812, 0.08278656005859375, 0.09469223022460938, 0.106597900390625, 0.11850357055664062, 0.13040924072265625, 0.14231491088867188, 0.1542205810546875, 0.16612625122070312, 0.17803192138671875, 0.18993759155273438, 0.20184326171875, 0.21374893188476562, 0.22565460205078125, 0.23756027221679688, 0.2494659423828125, 0.2613716125488281, 0.27327728271484375, 0.2851829528808594, 0.297088623046875, 0.3089942932128906, 0.32089996337890625, 0.3328056335449219, 0.3447113037109375, 0.3566169738769531, 0.36852264404296875, 0.3804283142089844, 0.392333984375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 4.0, 3.0, 3.0, 4.0, 4.0, 11.0, 10.0, 16.0, 29.0, 36.0, 57.0, 121.0, 242.0, 508.0, 1378.0, 5657.0, 43576.0, 768936.0, 207543.0, 16112.0, 2765.0, 823.0, 322.0, 157.0, 96.0, 44.0, 27.0, 14.0, 12.0, 16.0, 9.0, 4.0, 5.0, 1.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2080078125, -0.2014617919921875, -0.194915771484375, -0.1883697509765625, -0.18182373046875, -0.1752777099609375, -0.168731689453125, -0.1621856689453125, -0.1556396484375, -0.1490936279296875, -0.142547607421875, -0.1360015869140625, -0.12945556640625, -0.1229095458984375, -0.116363525390625, -0.1098175048828125, -0.103271484375, -0.0967254638671875, -0.090179443359375, -0.0836334228515625, -0.07708740234375, -0.0705413818359375, -0.063995361328125, -0.0574493408203125, -0.0509033203125, -0.0443572998046875, -0.037811279296875, -0.0312652587890625, -0.02471923828125, -0.0181732177734375, -0.011627197265625, -0.0050811767578125, 0.00146484375, 0.0080108642578125, 0.014556884765625, 0.0211029052734375, 0.02764892578125, 0.0341949462890625, 0.040740966796875, 0.0472869873046875, 0.0538330078125, 0.0603790283203125, 0.066925048828125, 0.0734710693359375, 0.08001708984375, 0.0865631103515625, 0.093109130859375, 0.0996551513671875, 0.106201171875, 0.1127471923828125, 0.119293212890625, 0.1258392333984375, 0.13238525390625, 0.1389312744140625, 0.145477294921875, 0.1520233154296875, 0.1585693359375, 0.1651153564453125, 0.171661376953125, 0.1782073974609375, 0.18475341796875, 0.1912994384765625, 0.197845458984375, 0.2043914794921875, 0.2109375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 1.0, 2.0, 7.0, 6.0, 10.0, 10.0, 9.0, 8.0, 21.0, 29.0, 40.0, 39.0, 57.0, 80.0, 94.0, 116.0, 89.0, 83.0, 79.0, 45.0, 30.0, 32.0, 26.0, 16.0, 17.0, 10.0, 5.0, 6.0, 6.0, 3.0, 3.0, 7.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-4.1604042053222656e-05, -4.024524241685867e-05, -3.888644278049469e-05, -3.752764314413071e-05, -3.6168843507766724e-05, -3.481004387140274e-05, -3.345124423503876e-05, -3.2092444598674774e-05, -3.073364496231079e-05, -2.9374845325946808e-05, -2.8016045689582825e-05, -2.665724605321884e-05, -2.529844641685486e-05, -2.3939646780490875e-05, -2.2580847144126892e-05, -2.122204750776291e-05, -1.9863247871398926e-05, -1.8504448235034943e-05, -1.714564859867096e-05, -1.5786848962306976e-05, -1.4428049325942993e-05, -1.306924968957901e-05, -1.1710450053215027e-05, -1.0351650416851044e-05, -8.99285078048706e-06, -7.634051144123077e-06, -6.275251507759094e-06, -4.916451871395111e-06, -3.557652235031128e-06, -2.1988525986671448e-06, -8.400529623031616e-07, 5.187466740608215e-07, 1.8775463104248047e-06, 3.236345946788788e-06, 4.595145583152771e-06, 5.953945219516754e-06, 7.312744855880737e-06, 8.67154449224472e-06, 1.0030344128608704e-05, 1.1389143764972687e-05, 1.274794340133667e-05, 1.4106743037700653e-05, 1.5465542674064636e-05, 1.682434231042862e-05, 1.8183141946792603e-05, 1.9541941583156586e-05, 2.090074121952057e-05, 2.2259540855884552e-05, 2.3618340492248535e-05, 2.497714012861252e-05, 2.63359397649765e-05, 2.7694739401340485e-05, 2.9053539037704468e-05, 3.041233867406845e-05, 3.1771138310432434e-05, 3.312993794679642e-05, 3.44887375831604e-05, 3.5847537219524384e-05, 3.720633685588837e-05, 3.856513649225235e-05, 3.992393612861633e-05, 4.1282735764980316e-05, 4.26415354013443e-05, 4.400033503770828e-05, 4.5359134674072266e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 3.0, 3.0, 4.0, 12.0, 9.0, 12.0, 26.0, 32.0, 37.0, 78.0, 122.0, 189.0, 291.0, 614.0, 1193.0, 3003.0, 8516.0, 31941.0, 221284.0, 674318.0, 81334.0, 16601.0, 4940.0, 1943.0, 905.0, 475.0, 258.0, 165.0, 63.0, 55.0, 50.0, 29.0, 16.0, 9.0, 3.0, 4.0, 5.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.136474609375, -0.13196563720703125, -0.1274566650390625, -0.12294769287109375, -0.118438720703125, -0.11392974853515625, -0.1094207763671875, -0.10491180419921875, -0.10040283203125, -0.09589385986328125, -0.0913848876953125, -0.08687591552734375, -0.082366943359375, -0.07785797119140625, -0.0733489990234375, -0.06884002685546875, -0.0643310546875, -0.05982208251953125, -0.0553131103515625, -0.05080413818359375, -0.046295166015625, -0.04178619384765625, -0.0372772216796875, -0.03276824951171875, -0.02825927734375, -0.02375030517578125, -0.0192413330078125, -0.01473236083984375, -0.010223388671875, -0.00571441650390625, -0.0012054443359375, 0.00330352783203125, 0.0078125, 0.01232147216796875, 0.0168304443359375, 0.02133941650390625, 0.025848388671875, 0.03035736083984375, 0.0348663330078125, 0.03937530517578125, 0.04388427734375, 0.04839324951171875, 0.0529022216796875, 0.05741119384765625, 0.061920166015625, 0.06642913818359375, 0.0709381103515625, 0.07544708251953125, 0.0799560546875, 0.08446502685546875, 0.0889739990234375, 0.09348297119140625, 0.097991943359375, 0.10250091552734375, 0.1070098876953125, 0.11151885986328125, 0.11602783203125, 0.12053680419921875, 0.1250457763671875, 0.12955474853515625, 0.134063720703125, 0.13857269287109375, 0.1430816650390625, 0.14759063720703125, 0.152099609375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 9.0, 1.0, 4.0, 3.0, 7.0, 4.0, 5.0, 8.0, 4.0, 11.0, 19.0, 22.0, 30.0, 36.0, 47.0, 66.0, 57.0, 61.0, 71.0, 62.0, 89.0, 57.0, 64.0, 48.0, 48.0, 28.0, 26.0, 20.0, 25.0, 12.0, 7.0, 10.0, 4.0, 8.0, 5.0, 5.0, 2.0, 1.0, 5.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.09112548828125, -0.08821392059326172, -0.08530235290527344, -0.08239078521728516, -0.07947921752929688, -0.0765676498413086, -0.07365608215332031, -0.07074451446533203, -0.06783294677734375, -0.06492137908935547, -0.06200981140136719, -0.059098243713378906, -0.056186676025390625, -0.053275108337402344, -0.05036354064941406, -0.04745197296142578, -0.0445404052734375, -0.04162883758544922, -0.03871726989746094, -0.035805702209472656, -0.032894134521484375, -0.029982566833496094, -0.027070999145507812, -0.02415943145751953, -0.02124786376953125, -0.01833629608154297, -0.015424728393554688, -0.012513160705566406, -0.009601593017578125, -0.006690025329589844, -0.0037784576416015625, -0.0008668899536132812, 0.002044677734375, 0.004956245422363281, 0.007867813110351562, 0.010779380798339844, 0.013690948486328125, 0.016602516174316406, 0.019514083862304688, 0.02242565155029297, 0.02533721923828125, 0.02824878692626953, 0.031160354614257812, 0.034071922302246094, 0.036983489990234375, 0.039895057678222656, 0.04280662536621094, 0.04571819305419922, 0.0486297607421875, 0.05154132843017578, 0.05445289611816406, 0.057364463806152344, 0.060276031494140625, 0.0631875991821289, 0.06609916687011719, 0.06901073455810547, 0.07192230224609375, 0.07483386993408203, 0.07774543762207031, 0.0806570053100586, 0.08356857299804688, 0.08648014068603516, 0.08939170837402344, 0.09230327606201172, 0.09521484375]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 6.0, 6.0, 23.0, 90.0, 148.0, 255.0, 231.0, 127.0, 59.0, 20.0, 12.0, 9.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.634068489074707, -3.545316457748413, -3.456564426422119, -3.3678126335144043, -3.2790606021881104, -3.1903085708618164, -3.1015565395355225, -3.0128045082092285, -2.9240527153015137, -2.8353006839752197, -2.746548652648926, -2.657796859741211, -2.569044828414917, -2.480292797088623, -2.391540765762329, -2.302788734436035, -2.2140369415283203, -2.1252849102020264, -2.0365328788757324, -1.947780966758728, -1.8590290546417236, -1.7702770233154297, -1.6815249919891357, -1.5927730798721313, -1.5040209293365479, -1.415268898010254, -1.3265169858932495, -1.2377649545669556, -1.1490130424499512, -1.0602610111236572, -0.9715090394020081, -0.8827570676803589, -0.7940051555633545, -0.7052531838417053, -0.6165012121200562, -0.5277491807937622, -0.4389972388744354, -0.35024526715278625, -0.2614932656288147, -0.17274129390716553, -0.08398932218551636, 0.004762656986713409, 0.09351463615894318, 0.18226662278175354, 0.2710185945034027, 0.3597705662250519, 0.44852256774902344, 0.5372745394706726, 0.6260265111923218, 0.714778482913971, 0.8035304546356201, 0.8922824859619141, 0.9810343980789185, 1.0697864294052124, 1.1585383415222168, 1.2472903728485107, 1.3360424041748047, 1.4247944355010986, 1.513546347618103, 1.602298378944397, 1.6910502910614014, 1.7798023223876953, 1.8685543537139893, 1.9573062658309937, 2.046058177947998]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 6.0, 3.0, 6.0, 9.0, 5.0, 7.0, 11.0, 6.0, 15.0, 10.0, 24.0, 19.0, 21.0, 21.0, 29.0, 27.0, 33.0, 34.0, 36.0, 43.0, 51.0, 47.0, 53.0, 62.0, 51.0, 46.0, 40.0, 35.0, 38.0, 31.0, 27.0, 27.0, 25.0, 21.0, 13.0, 13.0, 15.0, 11.0, 10.0, 6.0, 4.0, 7.0, 2.0, 4.0, 2.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2282485961914062, -1.1893563270568848, -1.1504640579223633, -1.1115717887878418, -1.0726795196533203, -1.0337872505187988, -0.9948949813842773, -0.9560027122497559, -0.9171104431152344, -0.8782181739807129, -0.8393259048461914, -0.8004336357116699, -0.7615413665771484, -0.722649097442627, -0.6837568283081055, -0.644864559173584, -0.6059723496437073, -0.5670800805091858, -0.5281878113746643, -0.4892955422401428, -0.45040327310562134, -0.41151100397109985, -0.37261876463890076, -0.3337264955043793, -0.2948342263698578, -0.2559419572353363, -0.21704968810081482, -0.17815743386745453, -0.13926516473293304, -0.10037289559841156, -0.06148064136505127, -0.022588372230529785, 0.0163038969039917, 0.055196162313222885, 0.09408842772245407, 0.13298068940639496, 0.17187295854091644, 0.21076522767543793, 0.24965748190879822, 0.2885497510433197, 0.3274420201778412, 0.36633428931236267, 0.40522655844688416, 0.44411879777908325, 0.48301106691360474, 0.5219033360481262, 0.5607956051826477, 0.5996878743171692, 0.6385801434516907, 0.6774724125862122, 0.7163646817207336, 0.7552569508552551, 0.7941492199897766, 0.8330414891242981, 0.8719336986541748, 0.9108259677886963, 0.9497182369232178, 0.9886105060577393, 1.0275027751922607, 1.0663950443267822, 1.1052873134613037, 1.1441795825958252, 1.1830718517303467, 1.2219641208648682, 1.2608563899993896]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 6.0, 6.0, 10.0, 11.0, 11.0, 23.0, 37.0, 54.0, 78.0, 128.0, 212.0, 312.0, 570.0, 1147.0, 2663.0, 6494.0, 22044.0, 104097.0, 841015.0, 2593734.0, 524577.0, 71769.0, 16198.0, 5080.0, 1962.0, 891.0, 424.0, 244.0, 145.0, 102.0, 63.0, 48.0, 32.0, 25.0, 10.0, 18.0, 12.0, 12.0, 3.0, 4.0, 6.0, 3.0, 2.0, 2.0, 4.0, 3.0, 0.0, 1.0, 4.0], "bins": [-0.1444091796875, -0.14021015167236328, -0.13601112365722656, -0.13181209564208984, -0.12761306762695312, -0.1234140396118164, -0.11921501159667969, -0.11501598358154297, -0.11081695556640625, -0.10661792755126953, -0.10241889953613281, -0.0982198715209961, -0.09402084350585938, -0.08982181549072266, -0.08562278747558594, -0.08142375946044922, -0.0772247314453125, -0.07302570343017578, -0.06882667541503906, -0.06462764739990234, -0.060428619384765625, -0.056229591369628906, -0.05203056335449219, -0.04783153533935547, -0.04363250732421875, -0.03943347930908203, -0.03523445129394531, -0.031035423278808594, -0.026836395263671875, -0.022637367248535156, -0.018438339233398438, -0.014239311218261719, -0.010040283203125, -0.005841255187988281, -0.0016422271728515625, 0.0025568008422851562, 0.006755828857421875, 0.010954856872558594, 0.015153884887695312, 0.01935291290283203, 0.02355194091796875, 0.02775096893310547, 0.03194999694824219, 0.036149024963378906, 0.040348052978515625, 0.044547080993652344, 0.04874610900878906, 0.05294513702392578, 0.0571441650390625, 0.06134319305419922, 0.06554222106933594, 0.06974124908447266, 0.07394027709960938, 0.0781393051147461, 0.08233833312988281, 0.08653736114501953, 0.09073638916015625, 0.09493541717529297, 0.09913444519042969, 0.1033334732055664, 0.10753250122070312, 0.11173152923583984, 0.11593055725097656, 0.12012958526611328, 0.12432861328125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 10.0, 7.0, 8.0, 5.0, 12.0, 18.0, 18.0, 23.0, 35.0, 39.0, 45.0, 48.0, 53.0, 50.0, 64.0, 56.0, 54.0, 61.0, 59.0, 61.0, 56.0, 36.0, 35.0, 35.0, 23.0, 17.0, 14.0, 22.0, 8.0, 11.0, 6.0, 5.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.11578369140625, -0.112579345703125, -0.109375, -0.106170654296875, -0.10296630859375, -0.099761962890625, -0.0965576171875, -0.093353271484375, -0.09014892578125, -0.086944580078125, -0.083740234375, -0.080535888671875, -0.07733154296875, -0.074127197265625, -0.0709228515625, -0.067718505859375, -0.06451416015625, -0.061309814453125, -0.05810546875, -0.054901123046875, -0.05169677734375, -0.048492431640625, -0.0452880859375, -0.042083740234375, -0.03887939453125, -0.035675048828125, -0.032470703125, -0.029266357421875, -0.02606201171875, -0.022857666015625, -0.0196533203125, -0.016448974609375, -0.01324462890625, -0.010040283203125, -0.0068359375, -0.003631591796875, -0.00042724609375, 0.002777099609375, 0.0059814453125, 0.009185791015625, 0.01239013671875, 0.015594482421875, 0.018798828125, 0.022003173828125, 0.02520751953125, 0.028411865234375, 0.0316162109375, 0.034820556640625, 0.03802490234375, 0.041229248046875, 0.04443359375, 0.047637939453125, 0.05084228515625, 0.054046630859375, 0.0572509765625, 0.060455322265625, 0.06365966796875, 0.066864013671875, 0.070068359375, 0.073272705078125, 0.07647705078125, 0.079681396484375, 0.0828857421875, 0.086090087890625, 0.08929443359375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 6.0, 8.0, 19.0, 15.0, 34.0, 33.0, 63.0, 105.0, 166.0, 320.0, 646.0, 1318.0, 2959.0, 7724.0, 23660.0, 88162.0, 520793.0, 2656185.0, 728538.0, 116259.0, 30151.0, 9977.0, 3833.0, 1607.0, 750.0, 391.0, 218.0, 121.0, 75.0, 46.0, 25.0, 20.0, 20.0, 9.0, 9.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1658935546875, -0.16123008728027344, -0.15656661987304688, -0.1519031524658203, -0.14723968505859375, -0.1425762176513672, -0.13791275024414062, -0.13324928283691406, -0.1285858154296875, -0.12392234802246094, -0.11925888061523438, -0.11459541320800781, -0.10993194580078125, -0.10526847839355469, -0.10060501098632812, -0.09594154357910156, -0.091278076171875, -0.08661460876464844, -0.08195114135742188, -0.07728767395019531, -0.07262420654296875, -0.06796073913574219, -0.06329727172851562, -0.05863380432128906, -0.0539703369140625, -0.04930686950683594, -0.044643402099609375, -0.03997993469238281, -0.03531646728515625, -0.030652999877929688, -0.025989532470703125, -0.021326065063476562, -0.01666259765625, -0.011999130249023438, -0.007335662841796875, -0.0026721954345703125, 0.00199127197265625, 0.0066547393798828125, 0.011318206787109375, 0.015981674194335938, 0.0206451416015625, 0.025308609008789062, 0.029972076416015625, 0.03463554382324219, 0.03929901123046875, 0.04396247863769531, 0.048625946044921875, 0.05328941345214844, 0.057952880859375, 0.06261634826660156, 0.06727981567382812, 0.07194328308105469, 0.07660675048828125, 0.08127021789550781, 0.08593368530273438, 0.09059715270996094, 0.0952606201171875, 0.09992408752441406, 0.10458755493164062, 0.10925102233886719, 0.11391448974609375, 0.11857795715332031, 0.12324142456054688, 0.12790489196777344, 0.132568359375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 5.0, 3.0, 4.0, 8.0, 12.0, 7.0, 16.0, 16.0, 23.0, 34.0, 44.0, 51.0, 68.0, 79.0, 149.0, 227.0, 285.0, 387.0, 475.0, 472.0, 446.0, 355.0, 265.0, 169.0, 98.0, 91.0, 67.0, 40.0, 46.0, 36.0, 17.0, 23.0, 14.0, 11.0, 8.0, 8.0, 5.0, 2.0, 3.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1693115234375, -0.16405105590820312, -0.15879058837890625, -0.15353012084960938, -0.1482696533203125, -0.14300918579101562, -0.13774871826171875, -0.13248825073242188, -0.127227783203125, -0.12196731567382812, -0.11670684814453125, -0.11144638061523438, -0.1061859130859375, -0.10092544555664062, -0.09566497802734375, -0.09040451049804688, -0.08514404296875, -0.07988357543945312, -0.07462310791015625, -0.06936264038085938, -0.0641021728515625, -0.058841705322265625, -0.05358123779296875, -0.048320770263671875, -0.043060302734375, -0.037799835205078125, -0.03253936767578125, -0.027278900146484375, -0.0220184326171875, -0.016757965087890625, -0.01149749755859375, -0.006237030029296875, -0.0009765625, 0.004283905029296875, 0.00954437255859375, 0.014804840087890625, 0.0200653076171875, 0.025325775146484375, 0.03058624267578125, 0.035846710205078125, 0.041107177734375, 0.046367645263671875, 0.05162811279296875, 0.056888580322265625, 0.0621490478515625, 0.06740951538085938, 0.07266998291015625, 0.07793045043945312, 0.08319091796875, 0.08845138549804688, 0.09371185302734375, 0.09897232055664062, 0.1042327880859375, 0.10949325561523438, 0.11475372314453125, 0.12001419067382812, 0.125274658203125, 0.13053512573242188, 0.13579559326171875, 0.14105606079101562, 0.1463165283203125, 0.15157699584960938, 0.15683746337890625, 0.16209793090820312, 0.1673583984375]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 13.0, 9.0, 28.0, 72.0, 129.0, 224.0, 231.0, 156.0, 80.0, 22.0, 14.0, 10.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.351358413696289, -2.2611982822418213, -2.1710381507873535, -2.0808780193328857, -1.9907177686691284, -1.9005576372146606, -1.8103973865509033, -1.7202372550964355, -1.6300771236419678, -1.5399169921875, -1.4497568607330322, -1.359596610069275, -1.2694364786148071, -1.1792763471603394, -1.089116096496582, -0.9989559650421143, -0.9087958335876465, -0.8186357021331787, -0.7284755110740662, -0.6383153200149536, -0.5481551885604858, -0.4579950273036957, -0.3678348660469055, -0.27767467498779297, -0.1875145435333252, -0.09735438227653503, -0.007194221019744873, 0.08296594023704529, 0.17312610149383545, 0.2632862627506256, 0.35344642400741577, 0.4436066150665283, 0.5337669849395752, 0.623927116394043, 0.7140873074531555, 0.8042474985122681, 0.8944076299667358, 0.9845677614212036, 1.074728012084961, 1.1648881435394287, 1.2550482749938965, 1.3452084064483643, 1.435368537902832, 1.5255287885665894, 1.6156889200210571, 1.705849051475525, 1.7960093021392822, 1.88616943359375, 1.9763295650482178, 2.0664896965026855, 2.1566498279571533, 2.246809959411621, 2.336970329284668, 2.4271304607391357, 2.5172905921936035, 2.6074507236480713, 2.697610855102539, 2.787770986557007, 2.8779311180114746, 2.9680912494659424, 3.05825138092041, 3.148411750793457, 3.238571882247925, 3.3287320137023926, 3.4188921451568604]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 2.0, 1.0, 5.0, 6.0, 10.0, 6.0, 12.0, 14.0, 19.0, 19.0, 21.0, 34.0, 34.0, 37.0, 36.0, 47.0, 45.0, 58.0, 58.0, 51.0, 51.0, 56.0, 41.0, 50.0, 38.0, 39.0, 42.0, 33.0, 28.0, 25.0, 19.0, 14.0, 10.0, 10.0, 8.0, 5.0, 5.0, 9.0, 4.0, 5.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.0525121688842773, -1.0177582502365112, -0.9830042123794556, -0.9482502937316895, -0.9134963154792786, -0.8787423372268677, -0.8439884185791016, -0.8092344403266907, -0.7744804620742798, -0.7397264838218689, -0.704972505569458, -0.6702185869216919, -0.635464608669281, -0.6007106304168701, -0.565956711769104, -0.5312027335166931, -0.4964487552642822, -0.46169477701187134, -0.42694082856178284, -0.39218688011169434, -0.35743290185928345, -0.32267892360687256, -0.28792497515678406, -0.25317102670669556, -0.21841704845428467, -0.18366308510303497, -0.14890912175178528, -0.11415515840053558, -0.07940119504928589, -0.044647231698036194, -0.009893268346786499, 0.024860695004463196, 0.05961453914642334, 0.09436850249767303, 0.12912246584892273, 0.16387642920017242, 0.19863039255142212, 0.23338435590267181, 0.2681383192539215, 0.30289226770401, 0.3376462459564209, 0.3724002242088318, 0.4071541726589203, 0.4419081211090088, 0.4766620993614197, 0.5114160776138306, 0.5461699962615967, 0.5809239745140076, 0.6156779527664185, 0.6504319310188293, 0.6851859092712402, 0.7199398279190063, 0.7546938061714172, 0.7894477844238281, 0.8242017030715942, 0.8589556813240051, 0.893709659576416, 0.9284636378288269, 0.9632176160812378, 0.9979715347290039, 1.0327255725860596, 1.0674794912338257, 1.1022334098815918, 1.1369874477386475, 1.1717413663864136]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 5.0, 6.0, 7.0, 8.0, 15.0, 13.0, 20.0, 41.0, 55.0, 75.0, 103.0, 176.0, 312.0, 472.0, 857.0, 1636.0, 3404.0, 7283.0, 16522.0, 38616.0, 95643.0, 234303.0, 349410.0, 175251.0, 70826.0, 29497.0, 12594.0, 5625.0, 2657.0, 1317.0, 715.0, 388.0, 230.0, 146.0, 81.0, 65.0, 51.0, 43.0, 29.0, 16.0, 13.0, 12.0, 4.0, 4.0, 5.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.14892578125, -0.14458847045898438, -0.14025115966796875, -0.13591384887695312, -0.1315765380859375, -0.12723922729492188, -0.12290191650390625, -0.11856460571289062, -0.114227294921875, -0.10988998413085938, -0.10555267333984375, -0.10121536254882812, -0.0968780517578125, -0.09254074096679688, -0.08820343017578125, -0.08386611938476562, -0.07952880859375, -0.07519149780273438, -0.07085418701171875, -0.06651687622070312, -0.0621795654296875, -0.057842254638671875, -0.05350494384765625, -0.049167633056640625, -0.044830322265625, -0.040493011474609375, -0.03615570068359375, -0.031818389892578125, -0.0274810791015625, -0.023143768310546875, -0.01880645751953125, -0.014469146728515625, -0.0101318359375, -0.005794525146484375, -0.00145721435546875, 0.002880096435546875, 0.0072174072265625, 0.011554718017578125, 0.01589202880859375, 0.020229339599609375, 0.024566650390625, 0.028903961181640625, 0.03324127197265625, 0.037578582763671875, 0.0419158935546875, 0.046253204345703125, 0.05059051513671875, 0.054927825927734375, 0.05926513671875, 0.06360244750976562, 0.06793975830078125, 0.07227706909179688, 0.0766143798828125, 0.08095169067382812, 0.08528900146484375, 0.08962631225585938, 0.093963623046875, 0.09830093383789062, 0.10263824462890625, 0.10697555541992188, 0.1113128662109375, 0.11565017700195312, 0.11998748779296875, 0.12432479858398438, 0.128662109375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 8.0, 3.0, 7.0, 5.0, 13.0, 15.0, 23.0, 19.0, 20.0, 32.0, 50.0, 51.0, 49.0, 50.0, 50.0, 55.0, 55.0, 75.0, 52.0, 57.0, 53.0, 43.0, 40.0, 38.0, 24.0, 27.0, 21.0, 17.0, 11.0, 10.0, 10.0, 8.0, 6.0, 4.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11474609375, -0.11144542694091797, -0.10814476013183594, -0.1048440933227539, -0.10154342651367188, -0.09824275970458984, -0.09494209289550781, -0.09164142608642578, -0.08834075927734375, -0.08504009246826172, -0.08173942565917969, -0.07843875885009766, -0.07513809204101562, -0.0718374252319336, -0.06853675842285156, -0.06523609161376953, -0.0619354248046875, -0.05863475799560547, -0.05533409118652344, -0.052033424377441406, -0.048732757568359375, -0.045432090759277344, -0.04213142395019531, -0.03883075714111328, -0.03553009033203125, -0.03222942352294922, -0.028928756713867188, -0.025628089904785156, -0.022327423095703125, -0.019026756286621094, -0.015726089477539062, -0.012425422668457031, -0.009124755859375, -0.005824089050292969, -0.0025234222412109375, 0.0007772445678710938, 0.004077911376953125, 0.007378578186035156, 0.010679244995117188, 0.013979911804199219, 0.01728057861328125, 0.02058124542236328, 0.023881912231445312, 0.027182579040527344, 0.030483245849609375, 0.033783912658691406, 0.03708457946777344, 0.04038524627685547, 0.0436859130859375, 0.04698657989501953, 0.05028724670410156, 0.053587913513183594, 0.056888580322265625, 0.060189247131347656, 0.06348991394042969, 0.06679058074951172, 0.07009124755859375, 0.07339191436767578, 0.07669258117675781, 0.07999324798583984, 0.08329391479492188, 0.0865945816040039, 0.08989524841308594, 0.09319591522216797, 0.09649658203125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 4.0, 3.0, 10.0, 13.0, 11.0, 18.0, 23.0, 23.0, 53.0, 61.0, 84.0, 113.0, 174.0, 241.0, 385.0, 564.0, 956.0, 1660.0, 3542.0, 10096.0, 49987.0, 432805.0, 478637.0, 50819.0, 10333.0, 3547.0, 1656.0, 924.0, 550.0, 378.0, 259.0, 179.0, 137.0, 92.0, 64.0, 36.0, 28.0, 24.0, 19.0, 17.0, 10.0, 7.0, 5.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.308349609375, -0.2984046936035156, -0.28845977783203125, -0.2785148620605469, -0.2685699462890625, -0.2586250305175781, -0.24868011474609375, -0.23873519897460938, -0.228790283203125, -0.21884536743164062, -0.20890045166015625, -0.19895553588867188, -0.1890106201171875, -0.17906570434570312, -0.16912078857421875, -0.15917587280273438, -0.14923095703125, -0.13928604125976562, -0.12934112548828125, -0.11939620971679688, -0.1094512939453125, -0.09950637817382812, -0.08956146240234375, -0.07961654663085938, -0.069671630859375, -0.059726715087890625, -0.04978179931640625, -0.039836883544921875, -0.0298919677734375, -0.019947052001953125, -0.01000213623046875, -5.7220458984375e-05, 0.0098876953125, 0.019832611083984375, 0.02977752685546875, 0.039722442626953125, 0.0496673583984375, 0.059612274169921875, 0.06955718994140625, 0.07950210571289062, 0.089447021484375, 0.09939193725585938, 0.10933685302734375, 0.11928176879882812, 0.1292266845703125, 0.13917160034179688, 0.14911651611328125, 0.15906143188476562, 0.16900634765625, 0.17895126342773438, 0.18889617919921875, 0.19884109497070312, 0.2087860107421875, 0.21873092651367188, 0.22867584228515625, 0.23862075805664062, 0.248565673828125, 0.2585105895996094, 0.26845550537109375, 0.2784004211425781, 0.2883453369140625, 0.2982902526855469, 0.30823516845703125, 0.3181800842285156, 0.328125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 5.0, 4.0, 2.0, 1.0, 4.0, 6.0, 4.0, 12.0, 9.0, 9.0, 11.0, 17.0, 21.0, 15.0, 15.0, 17.0, 23.0, 26.0, 26.0, 32.0, 41.0, 42.0, 33.0, 34.0, 39.0, 39.0, 56.0, 48.0, 54.0, 40.0, 43.0, 34.0, 24.0, 28.0, 28.0, 27.0, 29.0, 17.0, 15.0, 11.0, 13.0, 8.0, 6.0, 12.0, 6.0, 2.0, 7.0, 6.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0], "bins": [-0.342041015625, -0.33063507080078125, -0.3192291259765625, -0.30782318115234375, -0.296417236328125, -0.28501129150390625, -0.2736053466796875, -0.26219940185546875, -0.25079345703125, -0.23938751220703125, -0.2279815673828125, -0.21657562255859375, -0.205169677734375, -0.19376373291015625, -0.1823577880859375, -0.17095184326171875, -0.1595458984375, -0.14813995361328125, -0.1367340087890625, -0.12532806396484375, -0.113922119140625, -0.10251617431640625, -0.0911102294921875, -0.07970428466796875, -0.06829833984375, -0.05689239501953125, -0.0454864501953125, -0.03408050537109375, -0.022674560546875, -0.01126861572265625, 0.0001373291015625, 0.01154327392578125, 0.02294921875, 0.03435516357421875, 0.0457611083984375, 0.05716705322265625, 0.068572998046875, 0.07997894287109375, 0.0913848876953125, 0.10279083251953125, 0.11419677734375, 0.12560272216796875, 0.1370086669921875, 0.14841461181640625, 0.159820556640625, 0.17122650146484375, 0.1826324462890625, 0.19403839111328125, 0.2054443359375, 0.21685028076171875, 0.2282562255859375, 0.23966217041015625, 0.251068115234375, 0.26247406005859375, 0.2738800048828125, 0.28528594970703125, 0.29669189453125, 0.30809783935546875, 0.3195037841796875, 0.33090972900390625, 0.342315673828125, 0.35372161865234375, 0.3651275634765625, 0.37653350830078125, 0.387939453125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 8.0, 13.0, 14.0, 22.0, 41.0, 56.0, 98.0, 172.0, 238.0, 531.0, 1144.0, 3132.0, 12093.0, 75143.0, 765673.0, 160647.0, 21517.0, 4869.0, 1654.0, 665.0, 354.0, 185.0, 100.0, 62.0, 34.0, 28.0, 23.0, 16.0, 8.0, 7.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1427001953125, -0.1369171142578125, -0.131134033203125, -0.1253509521484375, -0.11956787109375, -0.1137847900390625, -0.108001708984375, -0.1022186279296875, -0.096435546875, -0.0906524658203125, -0.084869384765625, -0.0790863037109375, -0.07330322265625, -0.0675201416015625, -0.061737060546875, -0.0559539794921875, -0.0501708984375, -0.0443878173828125, -0.038604736328125, -0.0328216552734375, -0.02703857421875, -0.0212554931640625, -0.015472412109375, -0.0096893310546875, -0.00390625, 0.0018768310546875, 0.007659912109375, 0.0134429931640625, 0.01922607421875, 0.0250091552734375, 0.030792236328125, 0.0365753173828125, 0.0423583984375, 0.0481414794921875, 0.053924560546875, 0.0597076416015625, 0.06549072265625, 0.0712738037109375, 0.077056884765625, 0.0828399658203125, 0.088623046875, 0.0944061279296875, 0.100189208984375, 0.1059722900390625, 0.11175537109375, 0.1175384521484375, 0.123321533203125, 0.1291046142578125, 0.1348876953125, 0.1406707763671875, 0.146453857421875, 0.1522369384765625, 0.15802001953125, 0.1638031005859375, 0.169586181640625, 0.1753692626953125, 0.18115234375, 0.1869354248046875, 0.192718505859375, 0.1985015869140625, 0.20428466796875, 0.2100677490234375, 0.215850830078125, 0.2216339111328125, 0.2274169921875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 0.0, 4.0, 5.0, 4.0, 9.0, 10.0, 6.0, 13.0, 11.0, 20.0, 16.0, 13.0, 24.0, 30.0, 37.0, 30.0, 65.0, 74.0, 86.0, 96.0, 84.0, 65.0, 54.0, 35.0, 40.0, 26.0, 20.0, 15.0, 15.0, 14.0, 10.0, 13.0, 11.0, 12.0, 8.0, 6.0, 2.0, 7.0, 0.0, 2.0, 3.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.6253204345703125e-05, -4.467833787202835e-05, -4.310347139835358e-05, -4.15286049246788e-05, -3.995373845100403e-05, -3.8378871977329254e-05, -3.680400550365448e-05, -3.5229139029979706e-05, -3.365427255630493e-05, -3.207940608263016e-05, -3.0504539608955383e-05, -2.892967313528061e-05, -2.7354806661605835e-05, -2.577994018793106e-05, -2.4205073714256287e-05, -2.2630207240581512e-05, -2.1055340766906738e-05, -1.9480474293231964e-05, -1.790560781955719e-05, -1.6330741345882416e-05, -1.4755874872207642e-05, -1.3181008398532867e-05, -1.1606141924858093e-05, -1.0031275451183319e-05, -8.456408977508545e-06, -6.881542503833771e-06, -5.306676030158997e-06, -3.7318095564842224e-06, -2.1569430828094482e-06, -5.820766091346741e-07, 9.927898645401e-07, 2.5676563382148743e-06, 4.1425228118896484e-06, 5.717389285564423e-06, 7.292255759239197e-06, 8.867122232913971e-06, 1.0441988706588745e-05, 1.201685518026352e-05, 1.3591721653938293e-05, 1.5166588127613068e-05, 1.6741454601287842e-05, 1.8316321074962616e-05, 1.989118754863739e-05, 2.1466054022312164e-05, 2.304092049598694e-05, 2.4615786969661713e-05, 2.6190653443336487e-05, 2.776551991701126e-05, 2.9340386390686035e-05, 3.091525286436081e-05, 3.2490119338035583e-05, 3.406498581171036e-05, 3.563985228538513e-05, 3.7214718759059906e-05, 3.878958523273468e-05, 4.0364451706409454e-05, 4.193931818008423e-05, 4.3514184653759e-05, 4.508905112743378e-05, 4.666391760110855e-05, 4.8238784074783325e-05, 4.98136505484581e-05, 5.1388517022132874e-05, 5.296338349580765e-05, 5.453824996948242e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 8.0, 4.0, 9.0, 15.0, 22.0, 29.0, 42.0, 58.0, 71.0, 105.0, 145.0, 220.0, 361.0, 608.0, 1150.0, 1994.0, 4853.0, 13494.0, 49887.0, 337173.0, 554482.0, 58535.0, 14804.0, 5344.0, 2251.0, 1116.0, 614.0, 370.0, 237.0, 173.0, 111.0, 82.0, 52.0, 40.0, 34.0, 12.0, 13.0, 11.0, 7.0, 3.0, 1.0, 3.0, 7.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.1611328125, -0.1564006805419922, -0.15166854858398438, -0.14693641662597656, -0.14220428466796875, -0.13747215270996094, -0.13274002075195312, -0.1280078887939453, -0.1232757568359375, -0.11854362487792969, -0.11381149291992188, -0.10907936096191406, -0.10434722900390625, -0.09961509704589844, -0.09488296508789062, -0.09015083312988281, -0.085418701171875, -0.08068656921386719, -0.07595443725585938, -0.07122230529785156, -0.06649017333984375, -0.06175804138183594, -0.057025909423828125, -0.05229377746582031, -0.0475616455078125, -0.04282951354980469, -0.038097381591796875, -0.03336524963378906, -0.02863311767578125, -0.023900985717773438, -0.019168853759765625, -0.014436721801757812, -0.00970458984375, -0.0049724578857421875, -0.000240325927734375, 0.0044918060302734375, 0.00922393798828125, 0.013956069946289062, 0.018688201904296875, 0.023420333862304688, 0.0281524658203125, 0.03288459777832031, 0.037616729736328125, 0.04234886169433594, 0.04708099365234375, 0.05181312561035156, 0.056545257568359375, 0.06127738952636719, 0.066009521484375, 0.07074165344238281, 0.07547378540039062, 0.08020591735839844, 0.08493804931640625, 0.08967018127441406, 0.09440231323242188, 0.09913444519042969, 0.1038665771484375, 0.10859870910644531, 0.11333084106445312, 0.11806297302246094, 0.12279510498046875, 0.12752723693847656, 0.13225936889648438, 0.1369915008544922, 0.1417236328125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 3.0, 4.0, 5.0, 6.0, 7.0, 10.0, 17.0, 27.0, 34.0, 32.0, 32.0, 60.0, 115.0, 112.0, 123.0, 99.0, 64.0, 46.0, 57.0, 37.0, 23.0, 13.0, 20.0, 16.0, 10.0, 6.0, 9.0, 3.0, 3.0, 6.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1336669921875, -0.12853622436523438, -0.12340545654296875, -0.11827468872070312, -0.1131439208984375, -0.10801315307617188, -0.10288238525390625, -0.09775161743164062, -0.092620849609375, -0.08749008178710938, -0.08235931396484375, -0.07722854614257812, -0.0720977783203125, -0.06696701049804688, -0.06183624267578125, -0.056705474853515625, -0.05157470703125, -0.046443939208984375, -0.04131317138671875, -0.036182403564453125, -0.0310516357421875, -0.025920867919921875, -0.02079010009765625, -0.015659332275390625, -0.010528564453125, -0.005397796630859375, -0.00026702880859375, 0.004863739013671875, 0.0099945068359375, 0.015125274658203125, 0.02025604248046875, 0.025386810302734375, 0.030517578125, 0.035648345947265625, 0.04077911376953125, 0.045909881591796875, 0.0510406494140625, 0.056171417236328125, 0.06130218505859375, 0.06643295288085938, 0.071563720703125, 0.07669448852539062, 0.08182525634765625, 0.08695602416992188, 0.0920867919921875, 0.09721755981445312, 0.10234832763671875, 0.10747909545898438, 0.11260986328125, 0.11774063110351562, 0.12287139892578125, 0.12800216674804688, 0.1331329345703125, 0.13826370239257812, 0.14339447021484375, 0.14852523803710938, 0.153656005859375, 0.15878677368164062, 0.16391754150390625, 0.16904830932617188, 0.1741790771484375, 0.17930984497070312, 0.18444061279296875, 0.18957138061523438, 0.1947021484375]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 4.0, 8.0, 19.0, 52.0, 169.0, 413.0, 220.0, 76.0, 18.0, 5.0, 7.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.840893268585205, -2.6961872577667236, -2.551481008529663, -2.4067749977111816, -2.262068748474121, -2.1173627376556396, -1.9726567268371582, -1.8279505968093872, -1.6832444667816162, -1.5385383367538452, -1.3938322067260742, -1.2491261959075928, -1.1044200658798218, -0.9597139358520508, -0.8150078654289246, -0.6703017950057983, -0.5255956649780273, -0.38088956475257874, -0.23618346452713013, -0.09147736430168152, 0.05322873592376709, 0.19793486595153809, 0.3426409363746643, 0.4873470067977905, 0.6320531368255615, 0.7767592668533325, 0.9214653372764587, 1.066171407699585, 1.210877537727356, 1.355583667755127, 1.5002896785736084, 1.6449958086013794, 1.7897014617919922, 1.9344075918197632, 2.079113721847534, 2.2238197326660156, 2.368525981903076, 2.5132319927215576, 2.657938003540039, 2.8026442527770996, 2.947350263595581, 3.0920562744140625, 3.236762523651123, 3.3814685344696045, 3.526174545288086, 3.6708807945251465, 3.815586805343628, 3.9602928161621094, 4.10499906539917, 4.2497053146362305, 4.394411087036133, 4.539117336273193, 4.683823585510254, 4.828529357910156, 4.973235607147217, 5.117941856384277, 5.26264762878418, 5.40735387802124, 5.552059650421143, 5.696765899658203, 5.841472148895264, 5.986178398132324, 6.130884170532227, 6.275590419769287, 6.420296669006348]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 7.0, 5.0, 3.0, 3.0, 4.0, 11.0, 21.0, 10.0, 20.0, 19.0, 22.0, 26.0, 24.0, 37.0, 35.0, 28.0, 29.0, 41.0, 43.0, 70.0, 78.0, 74.0, 48.0, 37.0, 46.0, 27.0, 38.0, 30.0, 24.0, 21.0, 19.0, 11.0, 11.0, 11.0, 15.0, 11.0, 8.0, 5.0, 7.0, 4.0, 7.0, 5.0, 3.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.4916245937347412, -1.4426367282867432, -1.3936489820480347, -1.3446611166000366, -1.2956733703613281, -1.24668550491333, -1.197697639465332, -1.1487098932266235, -1.099722146987915, -1.050734281539917, -1.0017465353012085, -0.9527586698532104, -0.903770923614502, -0.8547830581665039, -0.8057952523231506, -0.7568074464797974, -0.7078195810317993, -0.658831775188446, -0.6098439693450928, -0.5608561038970947, -0.5118683576583862, -0.46288052201271057, -0.4138926863670349, -0.36490488052368164, -0.31591707468032837, -0.2669292688369751, -0.21794144809246063, -0.16895362734794617, -0.1199658215045929, -0.07097801566123962, -0.021990180015563965, 0.026997625827789307, 0.07598543167114258, 0.12497324496507645, 0.17396105825901031, 0.22294887900352478, 0.27193668484687805, 0.3209244906902313, 0.369912326335907, 0.41890013217926025, 0.4678879380226135, 0.5168757438659668, 0.5658635497093201, 0.6148513555526733, 0.6638392210006714, 0.7128269672393799, 0.7618148326873779, 0.8108026385307312, 0.8597904443740845, 0.9087782502174377, 0.957766056060791, 1.006753921508789, 1.0557416677474976, 1.1047295331954956, 1.153717279434204, 1.2027051448822021, 1.2516930103302002, 1.3006808757781982, 1.3496686220169067, 1.3986564874649048, 1.4476442337036133, 1.4966320991516113, 1.5456199645996094, 1.5946077108383179, 1.6435954570770264]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 6.0, 9.0, 10.0, 11.0, 26.0, 29.0, 41.0, 57.0, 100.0, 134.0, 217.0, 333.0, 601.0, 1181.0, 2630.0, 7385.0, 29440.0, 214711.0, 2266949.0, 1512942.0, 126368.0, 20720.0, 5857.0, 2195.0, 1059.0, 484.0, 286.0, 162.0, 110.0, 74.0, 53.0, 26.0, 20.0, 12.0, 12.0, 8.0, 5.0, 8.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1376953125, -0.13292884826660156, -0.12816238403320312, -0.12339591979980469, -0.11862945556640625, -0.11386299133300781, -0.10909652709960938, -0.10433006286621094, -0.0995635986328125, -0.09479713439941406, -0.09003067016601562, -0.08526420593261719, -0.08049774169921875, -0.07573127746582031, -0.07096481323242188, -0.06619834899902344, -0.061431884765625, -0.05666542053222656, -0.051898956298828125, -0.04713249206542969, -0.04236602783203125, -0.03759956359863281, -0.032833099365234375, -0.028066635131835938, -0.0233001708984375, -0.018533706665039062, -0.013767242431640625, -0.009000778198242188, -0.00423431396484375, 0.0005321502685546875, 0.005298614501953125, 0.010065078735351562, 0.01483154296875, 0.019598007202148438, 0.024364471435546875, 0.029130935668945312, 0.03389739990234375, 0.03866386413574219, 0.043430328369140625, 0.04819679260253906, 0.0529632568359375, 0.05772972106933594, 0.062496185302734375, 0.06726264953613281, 0.07202911376953125, 0.07679557800292969, 0.08156204223632812, 0.08632850646972656, 0.091094970703125, 0.09586143493652344, 0.10062789916992188, 0.10539436340332031, 0.11016082763671875, 0.11492729187011719, 0.11969375610351562, 0.12446022033691406, 0.1292266845703125, 0.13399314880371094, 0.13875961303710938, 0.1435260772705078, 0.14829254150390625, 0.1530590057373047, 0.15782546997070312, 0.16259193420410156, 0.1673583984375]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 4.0, 4.0, 10.0, 1.0, 9.0, 16.0, 18.0, 29.0, 25.0, 33.0, 45.0, 63.0, 47.0, 46.0, 53.0, 74.0, 59.0, 58.0, 55.0, 45.0, 48.0, 52.0, 27.0, 40.0, 27.0, 26.0, 22.0, 20.0, 10.0, 12.0, 6.0, 4.0, 11.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08721923828125, -0.0836782455444336, -0.08013725280761719, -0.07659626007080078, -0.07305526733398438, -0.06951427459716797, -0.06597328186035156, -0.062432289123535156, -0.05889129638671875, -0.055350303649902344, -0.05180931091308594, -0.04826831817626953, -0.044727325439453125, -0.04118633270263672, -0.03764533996582031, -0.034104347229003906, -0.0305633544921875, -0.027022361755371094, -0.023481369018554688, -0.01994037628173828, -0.016399383544921875, -0.012858390808105469, -0.009317398071289062, -0.005776405334472656, -0.00223541259765625, 0.0013055801391601562, 0.0048465728759765625, 0.008387565612792969, 0.011928558349609375, 0.015469551086425781, 0.019010543823242188, 0.022551536560058594, 0.026092529296875, 0.029633522033691406, 0.03317451477050781, 0.03671550750732422, 0.040256500244140625, 0.04379749298095703, 0.04733848571777344, 0.050879478454589844, 0.05442047119140625, 0.057961463928222656, 0.06150245666503906, 0.06504344940185547, 0.06858444213867188, 0.07212543487548828, 0.07566642761230469, 0.0792074203491211, 0.0827484130859375, 0.0862894058227539, 0.08983039855957031, 0.09337139129638672, 0.09691238403320312, 0.10045337677001953, 0.10399436950683594, 0.10753536224365234, 0.11107635498046875, 0.11461734771728516, 0.11815834045410156, 0.12169933319091797, 0.12524032592773438, 0.12878131866455078, 0.1323223114013672, 0.1358633041381836, 0.139404296875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 9.0, 16.0, 32.0, 38.0, 83.0, 200.0, 487.0, 1186.0, 3997.0, 24177.0, 504080.0, 3520922.0, 124241.0, 10932.0, 2335.0, 783.0, 321.0, 178.0, 99.0, 64.0, 37.0, 18.0, 16.0, 12.0, 5.0, 7.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.271484375, -0.26189422607421875, -0.2523040771484375, -0.24271392822265625, -0.233123779296875, -0.22353363037109375, -0.2139434814453125, -0.20435333251953125, -0.19476318359375, -0.18517303466796875, -0.1755828857421875, -0.16599273681640625, -0.156402587890625, -0.14681243896484375, -0.1372222900390625, -0.12763214111328125, -0.1180419921875, -0.10845184326171875, -0.0988616943359375, -0.08927154541015625, -0.079681396484375, -0.07009124755859375, -0.0605010986328125, -0.05091094970703125, -0.04132080078125, -0.03173065185546875, -0.0221405029296875, -0.01255035400390625, -0.002960205078125, 0.00662994384765625, 0.0162200927734375, 0.02581024169921875, 0.035400390625, 0.04499053955078125, 0.0545806884765625, 0.06417083740234375, 0.073760986328125, 0.08335113525390625, 0.0929412841796875, 0.10253143310546875, 0.11212158203125, 0.12171173095703125, 0.1313018798828125, 0.14089202880859375, 0.150482177734375, 0.16007232666015625, 0.1696624755859375, 0.17925262451171875, 0.1888427734375, 0.19843292236328125, 0.2080230712890625, 0.21761322021484375, 0.227203369140625, 0.23679351806640625, 0.2463836669921875, 0.25597381591796875, 0.26556396484375, 0.27515411376953125, 0.2847442626953125, 0.29433441162109375, 0.303924560546875, 0.31351470947265625, 0.3231048583984375, 0.33269500732421875, 0.34228515625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 6.0, 5.0, 10.0, 15.0, 15.0, 22.0, 44.0, 84.0, 124.0, 193.0, 323.0, 590.0, 804.0, 726.0, 455.0, 248.0, 148.0, 84.0, 62.0, 40.0, 18.0, 16.0, 11.0, 8.0, 5.0, 8.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2083740234375, -0.20058250427246094, -0.19279098510742188, -0.1849994659423828, -0.17720794677734375, -0.1694164276123047, -0.16162490844726562, -0.15383338928222656, -0.1460418701171875, -0.13825035095214844, -0.13045883178710938, -0.12266731262207031, -0.11487579345703125, -0.10708427429199219, -0.09929275512695312, -0.09150123596191406, -0.083709716796875, -0.07591819763183594, -0.06812667846679688, -0.06033515930175781, -0.05254364013671875, -0.04475212097167969, -0.036960601806640625, -0.029169082641601562, -0.0213775634765625, -0.013586044311523438, -0.005794525146484375, 0.0019969940185546875, 0.00978851318359375, 0.017580032348632812, 0.025371551513671875, 0.03316307067871094, 0.04095458984375, 0.04874610900878906, 0.056537628173828125, 0.06432914733886719, 0.07212066650390625, 0.07991218566894531, 0.08770370483398438, 0.09549522399902344, 0.1032867431640625, 0.11107826232910156, 0.11886978149414062, 0.1266613006591797, 0.13445281982421875, 0.1422443389892578, 0.15003585815429688, 0.15782737731933594, 0.165618896484375, 0.17341041564941406, 0.18120193481445312, 0.1889934539794922, 0.19678497314453125, 0.2045764923095703, 0.21236801147460938, 0.22015953063964844, 0.2279510498046875, 0.23574256896972656, 0.24353408813476562, 0.2513256072998047, 0.25911712646484375, 0.2669086456298828, 0.2747001647949219, 0.28249168395996094, 0.290283203125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 3.0, 0.0, 4.0, 5.0, 10.0, 13.0, 32.0, 131.0, 213.0, 291.0, 168.0, 83.0, 30.0, 9.0, 6.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.533990859985352, -4.431568622589111, -4.329146385192871, -4.226723670959473, -4.124301433563232, -4.021879196166992, -3.919456958770752, -3.8170347213745117, -3.7146122455596924, -3.612190008163452, -3.509767532348633, -3.4073452949523926, -3.3049230575561523, -3.202500581741333, -3.1000783443450928, -2.9976558685302734, -2.895233631134033, -2.792811393737793, -2.6903889179229736, -2.5879666805267334, -2.485544443130493, -2.383121967315674, -2.2806997299194336, -2.1782774925231934, -2.075855255126953, -1.9734328985214233, -1.871010661125183, -1.7685883045196533, -1.6661659479141235, -1.5637435913085938, -1.4613213539123535, -1.3588989973068237, -1.256476640701294, -1.1540542840957642, -1.051632046699524, -0.9492096900939941, -0.8467873334884644, -0.7443650364875793, -0.6419427394866943, -0.5395203828811646, -0.43709808588027954, -0.33467575907707214, -0.23225344717502594, -0.12983113527297974, -0.02740880846977234, 0.07501351833343506, 0.17743581533432007, 0.27985817193984985, 0.38228046894073486, 0.48470279574394226, 0.5871251225471497, 0.6895474195480347, 0.7919697761535645, 0.8943920731544495, 0.9968143701553345, 1.0992367267608643, 1.2016589641571045, 1.3040813207626343, 1.4065035581588745, 1.5089259147644043, 1.611348271369934, 1.7137706279754639, 1.816192865371704, 1.9186152219772339, 2.0210375785827637]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 5.0, 4.0, 6.0, 6.0, 7.0, 2.0, 5.0, 6.0, 23.0, 19.0, 30.0, 32.0, 52.0, 49.0, 48.0, 62.0, 58.0, 66.0, 76.0, 56.0, 67.0, 45.0, 47.0, 55.0, 33.0, 39.0, 19.0, 19.0, 17.0, 14.0, 7.0, 7.0, 12.0, 8.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0220189094543457, -0.9813469648361206, -0.9406750798225403, -0.9000031352043152, -0.8593312501907349, -0.8186593055725098, -0.7779873609542847, -0.7373154759407043, -0.696643590927124, -0.6559716463088989, -0.6152997612953186, -0.5746278166770935, -0.5339559316635132, -0.4932839870452881, -0.4526120722293854, -0.41194015741348267, -0.37126821279525757, -0.33059629797935486, -0.28992438316345215, -0.24925245344638824, -0.20858053863048553, -0.16790862381458282, -0.12723669409751892, -0.08656477928161621, -0.0458928644657135, -0.0052209459245204926, 0.035450972616672516, 0.07612289488315582, 0.11679480969905853, 0.15746672451496124, 0.19813865423202515, 0.23881056904792786, 0.27948248386383057, 0.3201543986797333, 0.360826313495636, 0.4014982581138611, 0.4421701431274414, 0.4828420877456665, 0.5235140323638916, 0.5641859173774719, 0.6048578023910522, 0.6455297470092773, 0.6862016320228577, 0.7268735766410828, 0.7675454616546631, 0.8082174062728882, 0.8488893508911133, 0.8895612359046936, 0.9302331805229187, 0.9709051251411438, 1.0115770101547241, 1.0522489547729492, 1.0929208993911743, 1.1335927248001099, 1.174264669418335, 1.21493661403656, 1.2556085586547852, 1.2962805032730103, 1.3369524478912354, 1.377624273300171, 1.418296217918396, 1.458968162536621, 1.4996401071548462, 1.5403120517730713, 1.5809838771820068]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 5.0, 7.0, 10.0, 18.0, 15.0, 17.0, 43.0, 64.0, 102.0, 154.0, 287.0, 506.0, 1089.0, 2501.0, 6664.0, 20055.0, 73360.0, 308557.0, 464328.0, 122482.0, 31865.0, 9749.0, 3510.0, 1562.0, 702.0, 340.0, 217.0, 118.0, 62.0, 51.0, 45.0, 15.0, 15.0, 8.0, 6.0, 5.0, 3.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.212158203125, -0.20556640625, -0.198974609375, -0.1923828125, -0.185791015625, -0.17919921875, -0.172607421875, -0.166015625, -0.159423828125, -0.15283203125, -0.146240234375, -0.1396484375, -0.133056640625, -0.12646484375, -0.119873046875, -0.11328125, -0.106689453125, -0.10009765625, -0.093505859375, -0.0869140625, -0.080322265625, -0.07373046875, -0.067138671875, -0.060546875, -0.053955078125, -0.04736328125, -0.040771484375, -0.0341796875, -0.027587890625, -0.02099609375, -0.014404296875, -0.0078125, -0.001220703125, 0.00537109375, 0.011962890625, 0.0185546875, 0.025146484375, 0.03173828125, 0.038330078125, 0.044921875, 0.051513671875, 0.05810546875, 0.064697265625, 0.0712890625, 0.077880859375, 0.08447265625, 0.091064453125, 0.09765625, 0.104248046875, 0.11083984375, 0.117431640625, 0.1240234375, 0.130615234375, 0.13720703125, 0.143798828125, 0.150390625, 0.156982421875, 0.16357421875, 0.170166015625, 0.1767578125, 0.183349609375, 0.18994140625, 0.196533203125, 0.203125, 0.209716796875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 7.0, 7.0, 7.0, 7.0, 14.0, 13.0, 22.0, 24.0, 17.0, 30.0, 28.0, 35.0, 45.0, 39.0, 46.0, 51.0, 43.0, 53.0, 53.0, 47.0, 37.0, 46.0, 43.0, 34.0, 42.0, 27.0, 28.0, 19.0, 21.0, 28.0, 22.0, 12.0, 18.0, 10.0, 4.0, 5.0, 5.0, 5.0, 3.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09765625, -0.0947275161743164, -0.09179878234863281, -0.08887004852294922, -0.08594131469726562, -0.08301258087158203, -0.08008384704589844, -0.07715511322021484, -0.07422637939453125, -0.07129764556884766, -0.06836891174316406, -0.06544017791748047, -0.06251144409179688, -0.05958271026611328, -0.05665397644042969, -0.053725242614746094, -0.0507965087890625, -0.047867774963378906, -0.04493904113769531, -0.04201030731201172, -0.039081573486328125, -0.03615283966064453, -0.03322410583496094, -0.030295372009277344, -0.02736663818359375, -0.024437904357910156, -0.021509170532226562, -0.01858043670654297, -0.015651702880859375, -0.012722969055175781, -0.009794235229492188, -0.006865501403808594, -0.003936767578125, -0.0010080337524414062, 0.0019207000732421875, 0.004849433898925781, 0.007778167724609375, 0.010706901550292969, 0.013635635375976562, 0.016564369201660156, 0.01949310302734375, 0.022421836853027344, 0.025350570678710938, 0.02827930450439453, 0.031208038330078125, 0.03413677215576172, 0.03706550598144531, 0.039994239807128906, 0.0429229736328125, 0.045851707458496094, 0.04878044128417969, 0.05170917510986328, 0.054637908935546875, 0.05756664276123047, 0.06049537658691406, 0.06342411041259766, 0.06635284423828125, 0.06928157806396484, 0.07221031188964844, 0.07513904571533203, 0.07806777954101562, 0.08099651336669922, 0.08392524719238281, 0.0868539810180664, 0.08978271484375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 8.0, 8.0, 12.0, 13.0, 24.0, 41.0, 103.0, 145.0, 330.0, 687.0, 1813.0, 7400.0, 97777.0, 890651.0, 42325.0, 4719.0, 1317.0, 595.0, 272.0, 132.0, 79.0, 38.0, 24.0, 25.0, 11.0, 4.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.79052734375, -0.7714195251464844, -0.7523117065429688, -0.7332038879394531, -0.7140960693359375, -0.6949882507324219, -0.6758804321289062, -0.6567726135253906, -0.637664794921875, -0.6185569763183594, -0.5994491577148438, -0.5803413391113281, -0.5612335205078125, -0.5421257019042969, -0.5230178833007812, -0.5039100646972656, -0.48480224609375, -0.4656944274902344, -0.44658660888671875, -0.4274787902832031, -0.4083709716796875, -0.3892631530761719, -0.37015533447265625, -0.3510475158691406, -0.331939697265625, -0.3128318786621094, -0.29372406005859375, -0.2746162414550781, -0.2555084228515625, -0.23640060424804688, -0.21729278564453125, -0.19818496704101562, -0.1790771484375, -0.15996932983398438, -0.14086151123046875, -0.12175369262695312, -0.1026458740234375, -0.08353805541992188, -0.06443023681640625, -0.045322418212890625, -0.026214599609375, -0.007106781005859375, 0.01200103759765625, 0.031108856201171875, 0.0502166748046875, 0.06932449340820312, 0.08843231201171875, 0.10754013061523438, 0.12664794921875, 0.14575576782226562, 0.16486358642578125, 0.18397140502929688, 0.2030792236328125, 0.22218704223632812, 0.24129486083984375, 0.2604026794433594, 0.279510498046875, 0.2986183166503906, 0.31772613525390625, 0.3368339538574219, 0.3559417724609375, 0.3750495910644531, 0.39415740966796875, 0.4132652282714844, 0.432373046875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 4.0, 3.0, 4.0, 3.0, 9.0, 7.0, 9.0, 14.0, 13.0, 20.0, 22.0, 17.0, 19.0, 21.0, 30.0, 31.0, 46.0, 42.0, 46.0, 40.0, 53.0, 43.0, 42.0, 44.0, 56.0, 43.0, 38.0, 28.0, 30.0, 33.0, 28.0, 24.0, 25.0, 21.0, 17.0, 15.0, 15.0, 7.0, 5.0, 9.0, 5.0, 9.0, 5.0, 7.0, 0.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.340087890625, -0.3293113708496094, -0.31853485107421875, -0.3077583312988281, -0.2969818115234375, -0.2862052917480469, -0.27542877197265625, -0.2646522521972656, -0.253875732421875, -0.24309921264648438, -0.23232269287109375, -0.22154617309570312, -0.2107696533203125, -0.19999313354492188, -0.18921661376953125, -0.17844009399414062, -0.16766357421875, -0.15688705444335938, -0.14611053466796875, -0.13533401489257812, -0.1245574951171875, -0.11378097534179688, -0.10300445556640625, -0.09222793579101562, -0.081451416015625, -0.07067489624023438, -0.05989837646484375, -0.049121856689453125, -0.0383453369140625, -0.027568817138671875, -0.01679229736328125, -0.006015777587890625, 0.0047607421875, 0.015537261962890625, 0.02631378173828125, 0.037090301513671875, 0.0478668212890625, 0.058643341064453125, 0.06941986083984375, 0.08019638061523438, 0.090972900390625, 0.10174942016601562, 0.11252593994140625, 0.12330245971679688, 0.1340789794921875, 0.14485549926757812, 0.15563201904296875, 0.16640853881835938, 0.17718505859375, 0.18796157836914062, 0.19873809814453125, 0.20951461791992188, 0.2202911376953125, 0.23106765747070312, 0.24184417724609375, 0.2526206970214844, 0.263397216796875, 0.2741737365722656, 0.28495025634765625, 0.2957267761230469, 0.3065032958984375, 0.3172798156738281, 0.32805633544921875, 0.3388328552246094, 0.349609375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 7.0, 2.0, 5.0, 9.0, 8.0, 12.0, 12.0, 21.0, 33.0, 41.0, 93.0, 124.0, 184.0, 319.0, 639.0, 1486.0, 4065.0, 15441.0, 81689.0, 811746.0, 106096.0, 18486.0, 4808.0, 1593.0, 705.0, 362.0, 196.0, 125.0, 85.0, 48.0, 26.0, 24.0, 15.0, 14.0, 13.0, 6.0, 3.0, 6.0, 3.0, 3.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.228271484375, -0.22146987915039062, -0.21466827392578125, -0.20786666870117188, -0.2010650634765625, -0.19426345825195312, -0.18746185302734375, -0.18066024780273438, -0.173858642578125, -0.16705703735351562, -0.16025543212890625, -0.15345382690429688, -0.1466522216796875, -0.13985061645507812, -0.13304901123046875, -0.12624740600585938, -0.11944580078125, -0.11264419555664062, -0.10584259033203125, -0.09904098510742188, -0.0922393798828125, -0.08543777465820312, -0.07863616943359375, -0.07183456420898438, -0.065032958984375, -0.058231353759765625, -0.05142974853515625, -0.044628143310546875, -0.0378265380859375, -0.031024932861328125, -0.02422332763671875, -0.017421722412109375, -0.0106201171875, -0.003818511962890625, 0.00298309326171875, 0.009784698486328125, 0.0165863037109375, 0.023387908935546875, 0.03018951416015625, 0.036991119384765625, 0.043792724609375, 0.050594329833984375, 0.05739593505859375, 0.06419754028320312, 0.0709991455078125, 0.07780075073242188, 0.08460235595703125, 0.09140396118164062, 0.09820556640625, 0.10500717163085938, 0.11180877685546875, 0.11861038208007812, 0.1254119873046875, 0.13221359252929688, 0.13901519775390625, 0.14581680297851562, 0.152618408203125, 0.15942001342773438, 0.16622161865234375, 0.17302322387695312, 0.1798248291015625, 0.18662643432617188, 0.19342803955078125, 0.20022964477539062, 0.20703125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 6.0, 7.0, 9.0, 6.0, 9.0, 6.0, 14.0, 8.0, 15.0, 22.0, 27.0, 34.0, 39.0, 66.0, 87.0, 107.0, 105.0, 99.0, 82.0, 63.0, 41.0, 30.0, 25.0, 18.0, 8.0, 12.0, 11.0, 6.0, 11.0, 6.0, 3.0, 5.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.0677528381347656e-05, -5.879346281290054e-05, -5.690939724445343e-05, -5.502533167600632e-05, -5.3141266107559204e-05, -5.125720053911209e-05, -4.937313497066498e-05, -4.7489069402217865e-05, -4.560500383377075e-05, -4.372093826532364e-05, -4.1836872696876526e-05, -3.995280712842941e-05, -3.80687415599823e-05, -3.618467599153519e-05, -3.4300610423088074e-05, -3.241654485464096e-05, -3.053247928619385e-05, -2.8648413717746735e-05, -2.676434814929962e-05, -2.488028258085251e-05, -2.2996217012405396e-05, -2.1112151443958282e-05, -1.922808587551117e-05, -1.7344020307064056e-05, -1.5459954738616943e-05, -1.357588917016983e-05, -1.1691823601722717e-05, -9.807758033275604e-06, -7.923692464828491e-06, -6.039626896381378e-06, -4.155561327934265e-06, -2.271495759487152e-06, -3.8743019104003906e-07, 1.496635377407074e-06, 3.380700945854187e-06, 5.2647665143013e-06, 7.148832082748413e-06, 9.032897651195526e-06, 1.091696321964264e-05, 1.2801028788089752e-05, 1.4685094356536865e-05, 1.6569159924983978e-05, 1.845322549343109e-05, 2.0337291061878204e-05, 2.2221356630325317e-05, 2.410542219877243e-05, 2.5989487767219543e-05, 2.7873553335666656e-05, 2.975761890411377e-05, 3.164168447256088e-05, 3.3525750041007996e-05, 3.540981560945511e-05, 3.729388117790222e-05, 3.9177946746349335e-05, 4.106201231479645e-05, 4.294607788324356e-05, 4.4830143451690674e-05, 4.671420902013779e-05, 4.85982745885849e-05, 5.048234015703201e-05, 5.2366405725479126e-05, 5.425047129392624e-05, 5.613453686237335e-05, 5.8018602430820465e-05, 5.990266799926758e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 7.0, 5.0, 5.0, 5.0, 5.0, 4.0, 13.0, 16.0, 22.0, 29.0, 29.0, 45.0, 79.0, 96.0, 130.0, 214.0, 326.0, 498.0, 910.0, 1807.0, 3885.0, 10291.0, 33712.0, 169403.0, 713610.0, 79435.0, 20973.0, 6896.0, 2760.0, 1278.0, 744.0, 449.0, 260.0, 161.0, 136.0, 86.0, 62.0, 55.0, 29.0, 23.0, 18.0, 10.0, 10.0, 8.0, 2.0, 6.0, 2.0, 4.0, 4.0, 0.0, 1.0, 5.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.161865234375, -0.15685462951660156, -0.15184402465820312, -0.1468334197998047, -0.14182281494140625, -0.1368122100830078, -0.13180160522460938, -0.12679100036621094, -0.1217803955078125, -0.11676979064941406, -0.11175918579101562, -0.10674858093261719, -0.10173797607421875, -0.09672737121582031, -0.09171676635742188, -0.08670616149902344, -0.081695556640625, -0.07668495178222656, -0.07167434692382812, -0.06666374206542969, -0.06165313720703125, -0.05664253234863281, -0.051631927490234375, -0.04662132263183594, -0.0416107177734375, -0.03660011291503906, -0.031589508056640625, -0.026578903198242188, -0.02156829833984375, -0.016557693481445312, -0.011547088623046875, -0.0065364837646484375, -0.00152587890625, 0.0034847259521484375, 0.008495330810546875, 0.013505935668945312, 0.01851654052734375, 0.023527145385742188, 0.028537750244140625, 0.03354835510253906, 0.0385589599609375, 0.04356956481933594, 0.048580169677734375, 0.05359077453613281, 0.05860137939453125, 0.06361198425292969, 0.06862258911132812, 0.07363319396972656, 0.078643798828125, 0.08365440368652344, 0.08866500854492188, 0.09367561340332031, 0.09868621826171875, 0.10369682312011719, 0.10870742797851562, 0.11371803283691406, 0.1187286376953125, 0.12373924255371094, 0.12874984741210938, 0.1337604522705078, 0.13877105712890625, 0.1437816619873047, 0.14879226684570312, 0.15380287170410156, 0.1588134765625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 5.0, 6.0, 0.0, 4.0, 8.0, 11.0, 7.0, 15.0, 14.0, 9.0, 12.0, 12.0, 23.0, 33.0, 37.0, 56.0, 69.0, 100.0, 106.0, 98.0, 88.0, 58.0, 45.0, 34.0, 28.0, 16.0, 15.0, 13.0, 11.0, 10.0, 11.0, 7.0, 9.0, 1.0, 1.0, 8.0, 4.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.11822509765625, -0.11449337005615234, -0.11076164245605469, -0.10702991485595703, -0.10329818725585938, -0.09956645965576172, -0.09583473205566406, -0.0921030044555664, -0.08837127685546875, -0.0846395492553711, -0.08090782165527344, -0.07717609405517578, -0.07344436645507812, -0.06971263885498047, -0.06598091125488281, -0.062249183654785156, -0.0585174560546875, -0.054785728454589844, -0.05105400085449219, -0.04732227325439453, -0.043590545654296875, -0.03985881805419922, -0.03612709045410156, -0.032395362854003906, -0.02866363525390625, -0.024931907653808594, -0.021200180053710938, -0.01746845245361328, -0.013736724853515625, -0.010004997253417969, -0.0062732696533203125, -0.0025415420532226562, 0.001190185546875, 0.004921913146972656, 0.008653640747070312, 0.012385368347167969, 0.016117095947265625, 0.01984882354736328, 0.023580551147460938, 0.027312278747558594, 0.03104400634765625, 0.034775733947753906, 0.03850746154785156, 0.04223918914794922, 0.045970916748046875, 0.04970264434814453, 0.05343437194824219, 0.057166099548339844, 0.0608978271484375, 0.06462955474853516, 0.06836128234863281, 0.07209300994873047, 0.07582473754882812, 0.07955646514892578, 0.08328819274902344, 0.0870199203491211, 0.09075164794921875, 0.0944833755493164, 0.09821510314941406, 0.10194683074951172, 0.10567855834960938, 0.10941028594970703, 0.11314201354980469, 0.11687374114990234, 0.12060546875]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 6.0, 11.0, 9.0, 27.0, 66.0, 121.0, 255.0, 250.0, 136.0, 49.0, 29.0, 9.0, 5.0, 7.0, 5.0, 3.0, 4.0, 3.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3943662643432617, -3.294478178024292, -3.194589853286743, -3.0947017669677734, -2.9948136806488037, -2.894925355911255, -2.795037269592285, -2.6951489448547363, -2.5952608585357666, -2.495372772216797, -2.395484447479248, -2.2955963611602783, -2.1957082748413086, -2.0958199501037598, -1.99593186378479, -1.8960436582565308, -1.796155571937561, -1.6962673664093018, -1.596379280090332, -1.4964910745620728, -1.3966028690338135, -1.2967147827148438, -1.1968265771865845, -1.0969383716583252, -0.9970502257347107, -0.8971620798110962, -0.7972738742828369, -0.6973857283592224, -0.5974975824356079, -0.49760937690734863, -0.39772123098373413, -0.29783302545547485, -0.19794487953186035, -0.09805671125650406, 0.0018314570188522339, 0.10171961784362793, 0.20160779356956482, 0.3014959692955017, 0.4013841152191162, 0.5012723207473755, 0.60116046667099, 0.7010486125946045, 0.8009368181228638, 0.9008249640464783, 1.0007131099700928, 1.100601315498352, 1.2004895210266113, 1.300377607345581, 1.4002658128738403, 1.5001540184020996, 1.6000421047210693, 1.6999303102493286, 1.799818515777588, 1.8997066020965576, 1.999594807624817, 2.099483013153076, 2.199371099472046, 2.2992591857910156, 2.3991475105285645, 2.499035596847534, 2.598923683166504, 2.6988120079040527, 2.7987000942230225, 2.898588180541992, 2.998476505279541]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 8.0, 10.0, 7.0, 10.0, 13.0, 9.0, 11.0, 17.0, 24.0, 20.0, 22.0, 22.0, 23.0, 34.0, 39.0, 43.0, 30.0, 63.0, 63.0, 81.0, 59.0, 53.0, 40.0, 36.0, 36.0, 28.0, 28.0, 32.0, 18.0, 24.0, 12.0, 17.0, 9.0, 11.0, 9.0, 11.0, 7.0, 7.0, 3.0, 6.0, 8.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3342461585998535, -1.2885558605194092, -1.2428655624389648, -1.1971752643585205, -1.1514849662780762, -1.1057946681976318, -1.0601043701171875, -1.0144140720367432, -0.9687238335609436, -0.9230335354804993, -0.8773432374000549, -0.8316529989242554, -0.785962700843811, -0.7402724027633667, -0.6945821046829224, -0.648891806602478, -0.6032015085220337, -0.5575112104415894, -0.511820912361145, -0.46613064408302307, -0.42044034600257874, -0.3747500479221344, -0.32905977964401245, -0.2833694815635681, -0.23767918348312378, -0.19198888540267944, -0.1462986022233963, -0.10060831904411316, -0.05491802096366882, -0.009227722883224487, 0.03646254539489746, 0.0821528434753418, 0.12784326076507568, 0.17353355884552002, 0.21922384202480316, 0.2649141252040863, 0.31060442328453064, 0.356294721364975, 0.4019849896430969, 0.44767528772354126, 0.4933655858039856, 0.5390558838844299, 0.5847461819648743, 0.6304364204406738, 0.6761267185211182, 0.7218170166015625, 0.7675073146820068, 0.8131976127624512, 0.8588879108428955, 0.9045782089233398, 0.9502685070037842, 0.9959588050842285, 1.0416491031646729, 1.0873394012451172, 1.1330296993255615, 1.1787199974060059, 1.2244102954864502, 1.2701005935668945, 1.3157908916473389, 1.3614811897277832, 1.4071714878082275, 1.4528617858886719, 1.4985520839691162, 1.5442423820495605, 1.5899325609207153]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 9.0, 6.0, 14.0, 12.0, 30.0, 29.0, 49.0, 105.0, 177.0, 351.0, 793.0, 2236.0, 11430.0, 282400.0, 3811292.0, 76453.0, 6439.0, 1486.0, 499.0, 234.0, 95.0, 52.0, 32.0, 15.0, 13.0, 8.0, 8.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.258544921875, -0.24792861938476562, -0.23731231689453125, -0.22669601440429688, -0.2160797119140625, -0.20546340942382812, -0.19484710693359375, -0.18423080444335938, -0.173614501953125, -0.16299819946289062, -0.15238189697265625, -0.14176559448242188, -0.1311492919921875, -0.12053298950195312, -0.10991668701171875, -0.09930038452148438, -0.08868408203125, -0.07806777954101562, -0.06745147705078125, -0.056835174560546875, -0.0462188720703125, -0.035602569580078125, -0.02498626708984375, -0.014369964599609375, -0.003753662109375, 0.006862640380859375, 0.01747894287109375, 0.028095245361328125, 0.0387115478515625, 0.049327850341796875, 0.05994415283203125, 0.07056045532226562, 0.0811767578125, 0.09179306030273438, 0.10240936279296875, 0.11302566528320312, 0.1236419677734375, 0.13425827026367188, 0.14487457275390625, 0.15549087524414062, 0.166107177734375, 0.17672348022460938, 0.18733978271484375, 0.19795608520507812, 0.2085723876953125, 0.21918869018554688, 0.22980499267578125, 0.24042129516601562, 0.25103759765625, 0.2616539001464844, 0.27227020263671875, 0.2828865051269531, 0.2935028076171875, 0.3041191101074219, 0.31473541259765625, 0.3253517150878906, 0.335968017578125, 0.3465843200683594, 0.35720062255859375, 0.3678169250488281, 0.3784332275390625, 0.3890495300292969, 0.39966583251953125, 0.4102821350097656, 0.4208984375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 6.0, 8.0, 12.0, 11.0, 24.0, 20.0, 18.0, 21.0, 25.0, 24.0, 45.0, 41.0, 38.0, 45.0, 48.0, 53.0, 46.0, 50.0, 62.0, 47.0, 36.0, 36.0, 35.0, 32.0, 50.0, 34.0, 28.0, 22.0, 19.0, 8.0, 10.0, 8.0, 13.0, 5.0, 6.0, 3.0, 1.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0843505859375, -0.08154010772705078, -0.07872962951660156, -0.07591915130615234, -0.07310867309570312, -0.0702981948852539, -0.06748771667480469, -0.06467723846435547, -0.06186676025390625, -0.05905628204345703, -0.05624580383300781, -0.053435325622558594, -0.050624847412109375, -0.047814369201660156, -0.04500389099121094, -0.04219341278076172, -0.0393829345703125, -0.03657245635986328, -0.03376197814941406, -0.030951499938964844, -0.028141021728515625, -0.025330543518066406, -0.022520065307617188, -0.01970958709716797, -0.01689910888671875, -0.014088630676269531, -0.011278152465820312, -0.008467674255371094, -0.005657196044921875, -0.0028467178344726562, -3.62396240234375e-05, 0.0027742385864257812, 0.005584716796875, 0.008395195007324219, 0.011205673217773438, 0.014016151428222656, 0.016826629638671875, 0.019637107849121094, 0.022447586059570312, 0.02525806427001953, 0.02806854248046875, 0.03087902069091797, 0.03368949890136719, 0.036499977111816406, 0.039310455322265625, 0.042120933532714844, 0.04493141174316406, 0.04774188995361328, 0.0505523681640625, 0.05336284637451172, 0.05617332458496094, 0.058983802795410156, 0.061794281005859375, 0.0646047592163086, 0.06741523742675781, 0.07022571563720703, 0.07303619384765625, 0.07584667205810547, 0.07865715026855469, 0.0814676284790039, 0.08427810668945312, 0.08708858489990234, 0.08989906311035156, 0.09270954132080078, 0.09552001953125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 4.0, 3.0, 3.0, 4.0, 11.0, 21.0, 26.0, 30.0, 51.0, 94.0, 152.0, 260.0, 515.0, 812.0, 1741.0, 3692.0, 10770.0, 93109.0, 3670113.0, 382404.0, 20198.0, 5350.0, 2249.0, 1157.0, 618.0, 374.0, 195.0, 128.0, 73.0, 34.0, 31.0, 17.0, 14.0, 12.0, 5.0, 3.0, 5.0, 2.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26318359375, -0.2529335021972656, -0.24268341064453125, -0.23243331909179688, -0.2221832275390625, -0.21193313598632812, -0.20168304443359375, -0.19143295288085938, -0.181182861328125, -0.17093276977539062, -0.16068267822265625, -0.15043258666992188, -0.1401824951171875, -0.12993240356445312, -0.11968231201171875, -0.10943222045898438, -0.09918212890625, -0.08893203735351562, -0.07868194580078125, -0.06843185424804688, -0.0581817626953125, -0.047931671142578125, -0.03768157958984375, -0.027431488037109375, -0.017181396484375, -0.006931304931640625, 0.00331878662109375, 0.013568878173828125, 0.0238189697265625, 0.034069061279296875, 0.04431915283203125, 0.054569244384765625, 0.0648193359375, 0.07506942749023438, 0.08531951904296875, 0.09556961059570312, 0.1058197021484375, 0.11606979370117188, 0.12631988525390625, 0.13656997680664062, 0.146820068359375, 0.15707015991210938, 0.16732025146484375, 0.17757034301757812, 0.1878204345703125, 0.19807052612304688, 0.20832061767578125, 0.21857070922851562, 0.22882080078125, 0.23907089233398438, 0.24932098388671875, 0.2595710754394531, 0.2698211669921875, 0.2800712585449219, 0.29032135009765625, 0.3005714416503906, 0.310821533203125, 0.3210716247558594, 0.33132171630859375, 0.3415718078613281, 0.3518218994140625, 0.3620719909667969, 0.37232208251953125, 0.3825721740722656, 0.392822265625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 5.0, 3.0, 7.0, 7.0, 10.0, 24.0, 42.0, 93.0, 183.0, 422.0, 866.0, 1094.0, 729.0, 282.0, 127.0, 76.0, 40.0, 18.0, 20.0, 7.0, 7.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.276123046875, -0.2663421630859375, -0.256561279296875, -0.2467803955078125, -0.23699951171875, -0.2272186279296875, -0.217437744140625, -0.2076568603515625, -0.1978759765625, -0.1880950927734375, -0.178314208984375, -0.1685333251953125, -0.15875244140625, -0.1489715576171875, -0.139190673828125, -0.1294097900390625, -0.11962890625, -0.1098480224609375, -0.100067138671875, -0.0902862548828125, -0.08050537109375, -0.0707244873046875, -0.060943603515625, -0.0511627197265625, -0.0413818359375, -0.0316009521484375, -0.021820068359375, -0.0120391845703125, -0.00225830078125, 0.0075225830078125, 0.017303466796875, 0.0270843505859375, 0.036865234375, 0.0466461181640625, 0.056427001953125, 0.0662078857421875, 0.07598876953125, 0.0857696533203125, 0.095550537109375, 0.1053314208984375, 0.1151123046875, 0.1248931884765625, 0.134674072265625, 0.1444549560546875, 0.15423583984375, 0.1640167236328125, 0.173797607421875, 0.1835784912109375, 0.193359375, 0.2031402587890625, 0.212921142578125, 0.2227020263671875, 0.23248291015625, 0.2422637939453125, 0.252044677734375, 0.2618255615234375, 0.2716064453125, 0.2813873291015625, 0.291168212890625, 0.3009490966796875, 0.31072998046875, 0.3205108642578125, 0.330291748046875, 0.3400726318359375, 0.349853515625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 3.0, 7.0, 12.0, 24.0, 45.0, 104.0, 191.0, 275.0, 172.0, 95.0, 29.0, 21.0, 1.0, 3.0, 5.0, 3.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9455642700195312, -1.8582165241241455, -1.7708687782287598, -1.683521032333374, -1.5961732864379883, -1.5088255405426025, -1.4214777946472168, -1.334130048751831, -1.2467823028564453, -1.1594345569610596, -1.0720868110656738, -0.9847390651702881, -0.8973913192749023, -0.8100435733795166, -0.7226957678794861, -0.6353480219841003, -0.5480002164840698, -0.4606524705886841, -0.37330472469329834, -0.2859569489955902, -0.19860920310020447, -0.11126145720481873, -0.023913681507110596, 0.06343406438827515, 0.1507818102836609, 0.23812955617904663, 0.3254773020744324, 0.4128250777721405, 0.5001728534698486, 0.5875205993652344, 0.6748683452606201, 0.7622160911560059, 0.8495638370513916, 0.9369115829467773, 1.024259328842163, 1.1116070747375488, 1.1989548206329346, 1.2863025665283203, 1.373650312423706, 1.4609980583190918, 1.5483458042144775, 1.6356935501098633, 1.723041296005249, 1.8103890419006348, 1.8977367877960205, 1.9850845336914062, 2.072432279586792, 2.1597800254821777, 2.2471280097961426, 2.3344757556915283, 2.421823501586914, 2.5091712474823, 2.5965189933776855, 2.6838667392730713, 2.771214485168457, 2.8585622310638428, 2.9459099769592285, 3.0332577228546143, 3.12060546875, 3.2079532146453857, 3.2953009605407715, 3.3826487064361572, 3.469996452331543, 3.5573441982269287, 3.6446919441223145]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 6.0, 8.0, 10.0, 26.0, 34.0, 43.0, 49.0, 67.0, 66.0, 81.0, 81.0, 98.0, 76.0, 82.0, 68.0, 57.0, 51.0, 38.0, 22.0, 15.0, 14.0, 7.0, 5.0, 3.0, 0.0, 1.0, 1.0], "bins": [-2.4637389183044434, -2.413572072982788, -2.363405227661133, -2.3132386207580566, -2.2630717754364014, -2.212904930114746, -2.16273832321167, -2.1125714778900146, -2.0624046325683594, -2.012237787246704, -1.9620710611343384, -1.9119043350219727, -1.8617374897003174, -1.811570644378662, -1.7614039182662964, -1.7112371921539307, -1.6610703468322754, -1.6109035015106201, -1.5607367753982544, -1.5105700492858887, -1.4604032039642334, -1.4102363586425781, -1.3600696325302124, -1.3099029064178467, -1.2597360610961914, -1.2095692157745361, -1.1594024896621704, -1.1092357635498047, -1.0590689182281494, -1.0089020729064941, -0.9587353467941284, -0.9085685610771179, -0.8584018349647522, -0.8082350492477417, -0.7580682635307312, -0.7079014778137207, -0.6577346920967102, -0.6075679063796997, -0.5574011206626892, -0.5072343349456787, -0.4570675492286682, -0.4069007635116577, -0.3567339777946472, -0.3065671920776367, -0.2564004063606262, -0.20623362064361572, -0.15606683492660522, -0.10590004920959473, -0.05573326349258423, -0.0055664777755737305, 0.04460030794143677, 0.09476709365844727, 0.14493387937545776, 0.19510066509246826, 0.24526745080947876, 0.29543423652648926, 0.34560102224349976, 0.39576780796051025, 0.44593459367752075, 0.49610137939453125, 0.5462681651115417, 0.5964349508285522, 0.6466017365455627, 0.6967685222625732, 0.7469353079795837]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 2.0, 1.0, 3.0, 4.0, 13.0, 11.0, 22.0, 32.0, 65.0, 87.0, 186.0, 470.0, 1615.0, 8281.0, 94634.0, 788254.0, 141041.0, 10720.0, 2026.0, 610.0, 201.0, 111.0, 54.0, 47.0, 28.0, 16.0, 7.0, 6.0, 6.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.294921875, -0.28338623046875, -0.2718505859375, -0.26031494140625, -0.248779296875, -0.23724365234375, -0.2257080078125, -0.21417236328125, -0.20263671875, -0.19110107421875, -0.1795654296875, -0.16802978515625, -0.156494140625, -0.14495849609375, -0.1334228515625, -0.12188720703125, -0.1103515625, -0.09881591796875, -0.0872802734375, -0.07574462890625, -0.064208984375, -0.05267333984375, -0.0411376953125, -0.02960205078125, -0.01806640625, -0.00653076171875, 0.0050048828125, 0.01654052734375, 0.028076171875, 0.03961181640625, 0.0511474609375, 0.06268310546875, 0.07421875, 0.08575439453125, 0.0972900390625, 0.10882568359375, 0.120361328125, 0.13189697265625, 0.1434326171875, 0.15496826171875, 0.16650390625, 0.17803955078125, 0.1895751953125, 0.20111083984375, 0.212646484375, 0.22418212890625, 0.2357177734375, 0.24725341796875, 0.2587890625, 0.27032470703125, 0.2818603515625, 0.29339599609375, 0.304931640625, 0.31646728515625, 0.3280029296875, 0.33953857421875, 0.35107421875, 0.36260986328125, 0.3741455078125, 0.38568115234375, 0.397216796875, 0.40875244140625, 0.4202880859375, 0.43182373046875, 0.443359375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 6.0, 5.0, 10.0, 13.0, 15.0, 9.0, 17.0, 18.0, 32.0, 46.0, 49.0, 62.0, 65.0, 50.0, 52.0, 76.0, 57.0, 49.0, 58.0, 51.0, 43.0, 54.0, 27.0, 36.0, 28.0, 24.0, 16.0, 9.0, 12.0, 9.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.1597900390625, -0.15606021881103516, -0.1523303985595703, -0.14860057830810547, -0.14487075805664062, -0.14114093780517578, -0.13741111755371094, -0.1336812973022461, -0.12995147705078125, -0.1262216567993164, -0.12249183654785156, -0.11876201629638672, -0.11503219604492188, -0.11130237579345703, -0.10757255554199219, -0.10384273529052734, -0.1001129150390625, -0.09638309478759766, -0.09265327453613281, -0.08892345428466797, -0.08519363403320312, -0.08146381378173828, -0.07773399353027344, -0.0740041732788086, -0.07027435302734375, -0.0665445327758789, -0.06281471252441406, -0.05908489227294922, -0.055355072021484375, -0.05162525177001953, -0.04789543151855469, -0.044165611267089844, -0.040435791015625, -0.036705970764160156, -0.03297615051269531, -0.02924633026123047, -0.025516510009765625, -0.02178668975830078, -0.018056869506835938, -0.014327049255371094, -0.01059722900390625, -0.006867408752441406, -0.0031375885009765625, 0.0005922317504882812, 0.004322052001953125, 0.008051872253417969, 0.011781692504882812, 0.015511512756347656, 0.0192413330078125, 0.022971153259277344, 0.026700973510742188, 0.03043079376220703, 0.034160614013671875, 0.03789043426513672, 0.04162025451660156, 0.045350074768066406, 0.04907989501953125, 0.052809715270996094, 0.05653953552246094, 0.06026935577392578, 0.06399917602539062, 0.06772899627685547, 0.07145881652832031, 0.07518863677978516, 0.07891845703125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 5.0, 4.0, 3.0, 11.0, 14.0, 16.0, 30.0, 35.0, 66.0, 93.0, 153.0, 253.0, 456.0, 1142.0, 3221.0, 11831.0, 68412.0, 634255.0, 280606.0, 36612.0, 7340.0, 2223.0, 794.0, 392.0, 194.0, 132.0, 95.0, 42.0, 41.0, 22.0, 24.0, 14.0, 10.0, 5.0, 2.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2349853515625, -0.2271099090576172, -0.21923446655273438, -0.21135902404785156, -0.20348358154296875, -0.19560813903808594, -0.18773269653320312, -0.1798572540283203, -0.1719818115234375, -0.1641063690185547, -0.15623092651367188, -0.14835548400878906, -0.14048004150390625, -0.13260459899902344, -0.12472915649414062, -0.11685371398925781, -0.108978271484375, -0.10110282897949219, -0.09322738647460938, -0.08535194396972656, -0.07747650146484375, -0.06960105895996094, -0.061725616455078125, -0.05385017395019531, -0.0459747314453125, -0.03809928894042969, -0.030223846435546875, -0.022348403930664062, -0.01447296142578125, -0.0065975189208984375, 0.001277923583984375, 0.009153366088867188, 0.01702880859375, 0.024904251098632812, 0.032779693603515625, 0.04065513610839844, 0.04853057861328125, 0.05640602111816406, 0.06428146362304688, 0.07215690612792969, 0.0800323486328125, 0.08790779113769531, 0.09578323364257812, 0.10365867614746094, 0.11153411865234375, 0.11940956115722656, 0.12728500366210938, 0.1351604461669922, 0.143035888671875, 0.1509113311767578, 0.15878677368164062, 0.16666221618652344, 0.17453765869140625, 0.18241310119628906, 0.19028854370117188, 0.1981639862060547, 0.2060394287109375, 0.2139148712158203, 0.22179031372070312, 0.22966575622558594, 0.23754119873046875, 0.24541664123535156, 0.2532920837402344, 0.2611675262451172, 0.26904296875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 7.0, 8.0, 6.0, 10.0, 10.0, 13.0, 16.0, 17.0, 20.0, 25.0, 28.0, 30.0, 48.0, 35.0, 54.0, 41.0, 57.0, 56.0, 65.0, 62.0, 40.0, 51.0, 51.0, 40.0, 39.0, 34.0, 21.0, 26.0, 20.0, 17.0, 12.0, 10.0, 10.0, 4.0, 5.0, 3.0, 1.0, 5.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.367919921875, -0.3560981750488281, -0.34427642822265625, -0.3324546813964844, -0.3206329345703125, -0.3088111877441406, -0.29698944091796875, -0.2851676940917969, -0.273345947265625, -0.2615242004394531, -0.24970245361328125, -0.23788070678710938, -0.2260589599609375, -0.21423721313476562, -0.20241546630859375, -0.19059371948242188, -0.17877197265625, -0.16695022583007812, -0.15512847900390625, -0.14330673217773438, -0.1314849853515625, -0.11966323852539062, -0.10784149169921875, -0.09601974487304688, -0.084197998046875, -0.07237625122070312, -0.06055450439453125, -0.048732757568359375, -0.0369110107421875, -0.025089263916015625, -0.01326751708984375, -0.001445770263671875, 0.0103759765625, 0.022197723388671875, 0.03401947021484375, 0.045841217041015625, 0.0576629638671875, 0.06948471069335938, 0.08130645751953125, 0.09312820434570312, 0.104949951171875, 0.11677169799804688, 0.12859344482421875, 0.14041519165039062, 0.1522369384765625, 0.16405868530273438, 0.17588043212890625, 0.18770217895507812, 0.19952392578125, 0.21134567260742188, 0.22316741943359375, 0.23498916625976562, 0.2468109130859375, 0.2586326599121094, 0.27045440673828125, 0.2822761535644531, 0.294097900390625, 0.3059196472167969, 0.31774139404296875, 0.3295631408691406, 0.3413848876953125, 0.3532066345214844, 0.36502838134765625, 0.3768501281738281, 0.388671875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 2.0, 8.0, 7.0, 7.0, 7.0, 20.0, 26.0, 41.0, 69.0, 115.0, 245.0, 433.0, 970.0, 2297.0, 6391.0, 22950.0, 125836.0, 725951.0, 128760.0, 23352.0, 6696.0, 2351.0, 1015.0, 446.0, 241.0, 122.0, 62.0, 47.0, 39.0, 9.0, 13.0, 7.0, 7.0, 4.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10992431640625, -0.1066436767578125, -0.103363037109375, -0.1000823974609375, -0.0968017578125, -0.0935211181640625, -0.090240478515625, -0.0869598388671875, -0.08367919921875, -0.0803985595703125, -0.077117919921875, -0.0738372802734375, -0.070556640625, -0.0672760009765625, -0.063995361328125, -0.0607147216796875, -0.05743408203125, -0.0541534423828125, -0.050872802734375, -0.0475921630859375, -0.0443115234375, -0.0410308837890625, -0.037750244140625, -0.0344696044921875, -0.03118896484375, -0.0279083251953125, -0.024627685546875, -0.0213470458984375, -0.01806640625, -0.0147857666015625, -0.011505126953125, -0.0082244873046875, -0.00494384765625, -0.0016632080078125, 0.001617431640625, 0.0048980712890625, 0.0081787109375, 0.0114593505859375, 0.014739990234375, 0.0180206298828125, 0.02130126953125, 0.0245819091796875, 0.027862548828125, 0.0311431884765625, 0.034423828125, 0.0377044677734375, 0.040985107421875, 0.0442657470703125, 0.04754638671875, 0.0508270263671875, 0.054107666015625, 0.0573883056640625, 0.0606689453125, 0.0639495849609375, 0.067230224609375, 0.0705108642578125, 0.07379150390625, 0.0770721435546875, 0.080352783203125, 0.0836334228515625, 0.0869140625, 0.0901947021484375, 0.093475341796875, 0.0967559814453125, 0.10003662109375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 6.0, 20.0, 12.0, 25.0, 39.0, 66.0, 105.0, 129.0, 156.0, 136.0, 120.0, 57.0, 54.0, 24.0, 16.0, 10.0, 10.0, 2.0, 5.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.269050598144531e-05, -5.0838105380535126e-05, -4.898570477962494e-05, -4.713330417871475e-05, -4.5280903577804565e-05, -4.342850297689438e-05, -4.157610237598419e-05, -3.9723701775074005e-05, -3.787130117416382e-05, -3.601890057325363e-05, -3.4166499972343445e-05, -3.231409937143326e-05, -3.046169877052307e-05, -2.8609298169612885e-05, -2.6756897568702698e-05, -2.490449696779251e-05, -2.3052096366882324e-05, -2.1199695765972137e-05, -1.934729516506195e-05, -1.7494894564151764e-05, -1.5642493963241577e-05, -1.379009336233139e-05, -1.1937692761421204e-05, -1.0085292160511017e-05, -8.23289155960083e-06, -6.380490958690643e-06, -4.5280903577804565e-06, -2.6756897568702698e-06, -8.23289155960083e-07, 1.0291114449501038e-06, 2.8815120458602905e-06, 4.733912646770477e-06, 6.586313247680664e-06, 8.43871384859085e-06, 1.0291114449501038e-05, 1.2143515050411224e-05, 1.3995915651321411e-05, 1.5848316252231598e-05, 1.7700716853141785e-05, 1.955311745405197e-05, 2.1405518054962158e-05, 2.3257918655872345e-05, 2.5110319256782532e-05, 2.696271985769272e-05, 2.8815120458602905e-05, 3.066752105951309e-05, 3.251992166042328e-05, 3.4372322261333466e-05, 3.622472286224365e-05, 3.807712346315384e-05, 3.9929524064064026e-05, 4.178192466497421e-05, 4.36343252658844e-05, 4.5486725866794586e-05, 4.733912646770477e-05, 4.919152706861496e-05, 5.1043927669525146e-05, 5.289632827043533e-05, 5.474872887134552e-05, 5.660112947225571e-05, 5.8453530073165894e-05, 6.030593067407608e-05, 6.215833127498627e-05, 6.401073187589645e-05, 6.586313247680664e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 8.0, 7.0, 4.0, 6.0, 8.0, 18.0, 25.0, 29.0, 55.0, 79.0, 139.0, 230.0, 405.0, 784.0, 1538.0, 3454.0, 8135.0, 22376.0, 80776.0, 539000.0, 297651.0, 62281.0, 18505.0, 7097.0, 2972.0, 1349.0, 730.0, 367.0, 199.0, 105.0, 70.0, 38.0, 29.0, 19.0, 26.0, 8.0, 13.0, 3.0, 7.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0718994140625, -0.06932353973388672, -0.06674766540527344, -0.06417179107666016, -0.061595916748046875, -0.059020042419433594, -0.05644416809082031, -0.05386829376220703, -0.05129241943359375, -0.04871654510498047, -0.04614067077636719, -0.043564796447753906, -0.040988922119140625, -0.038413047790527344, -0.03583717346191406, -0.03326129913330078, -0.0306854248046875, -0.02810955047607422, -0.025533676147460938, -0.022957801818847656, -0.020381927490234375, -0.017806053161621094, -0.015230178833007812, -0.012654304504394531, -0.01007843017578125, -0.007502555847167969, -0.0049266815185546875, -0.0023508071899414062, 0.000225067138671875, 0.0028009414672851562, 0.0053768157958984375, 0.007952690124511719, 0.010528564453125, 0.013104438781738281, 0.015680313110351562, 0.018256187438964844, 0.020832061767578125, 0.023407936096191406, 0.025983810424804688, 0.02855968475341797, 0.03113555908203125, 0.03371143341064453, 0.03628730773925781, 0.038863182067871094, 0.041439056396484375, 0.044014930725097656, 0.04659080505371094, 0.04916667938232422, 0.0517425537109375, 0.05431842803955078, 0.05689430236816406, 0.059470176696777344, 0.062046051025390625, 0.0646219253540039, 0.06719779968261719, 0.06977367401123047, 0.07234954833984375, 0.07492542266845703, 0.07750129699707031, 0.0800771713256836, 0.08265304565429688, 0.08522891998291016, 0.08780479431152344, 0.09038066864013672, 0.09295654296875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 5.0, 7.0, 15.0, 11.0, 10.0, 23.0, 27.0, 34.0, 40.0, 63.0, 90.0, 81.0, 93.0, 88.0, 92.0, 69.0, 69.0, 44.0, 35.0, 23.0, 12.0, 20.0, 11.0, 9.0, 10.0, 3.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.10260009765625, -0.09984207153320312, -0.09708404541015625, -0.09432601928710938, -0.0915679931640625, -0.08880996704101562, -0.08605194091796875, -0.08329391479492188, -0.080535888671875, -0.07777786254882812, -0.07501983642578125, -0.07226181030273438, -0.0695037841796875, -0.06674575805664062, -0.06398773193359375, -0.061229705810546875, -0.0584716796875, -0.055713653564453125, -0.05295562744140625, -0.050197601318359375, -0.0474395751953125, -0.044681549072265625, -0.04192352294921875, -0.039165496826171875, -0.036407470703125, -0.033649444580078125, -0.03089141845703125, -0.028133392333984375, -0.0253753662109375, -0.022617340087890625, -0.01985931396484375, -0.017101287841796875, -0.01434326171875, -0.011585235595703125, -0.00882720947265625, -0.006069183349609375, -0.0033111572265625, -0.000553131103515625, 0.00220489501953125, 0.004962921142578125, 0.007720947265625, 0.010478973388671875, 0.01323699951171875, 0.015995025634765625, 0.0187530517578125, 0.021511077880859375, 0.02426910400390625, 0.027027130126953125, 0.02978515625, 0.032543182373046875, 0.03530120849609375, 0.038059234619140625, 0.0408172607421875, 0.043575286865234375, 0.04633331298828125, 0.049091339111328125, 0.051849365234375, 0.054607391357421875, 0.05736541748046875, 0.060123443603515625, 0.0628814697265625, 0.06563949584960938, 0.06839752197265625, 0.07115554809570312, 0.07391357421875]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 2.0, 3.0, 10.0, 9.0, 23.0, 38.0, 73.0, 114.0, 265.0, 270.0, 102.0, 53.0, 14.0, 6.0, 9.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.4403464794158936, -2.3665807247161865, -2.2928147315979004, -2.2190489768981934, -2.1452829837799072, -2.0715172290802, -1.9977513551712036, -1.923985481262207, -1.8502196073532104, -1.7764537334442139, -1.7026878595352173, -1.6289219856262207, -1.5551562309265137, -1.4813902378082275, -1.4076244831085205, -1.333858609199524, -1.2600927352905273, -1.1863268613815308, -1.1125609874725342, -1.0387951135635376, -0.9650292992591858, -0.8912634253501892, -0.8174976110458374, -0.7437317371368408, -0.6699658632278442, -0.5961999893188477, -0.5224341154098511, -0.44866830110549927, -0.3749024271965027, -0.3011365532875061, -0.2273707091808319, -0.15360486507415771, -0.07983922958374023, -0.006073370575904846, 0.06769248843193054, 0.14145834743976593, 0.21522420644760132, 0.2889900803565979, 0.3627559244632721, 0.4365217685699463, 0.5102876424789429, 0.5840535163879395, 0.657819390296936, 0.7315852046012878, 0.8053510785102844, 0.879116952419281, 0.9528827667236328, 1.0266486406326294, 1.100414514541626, 1.1741803884506226, 1.2479462623596191, 1.3217121362686157, 1.3954780101776123, 1.4692437648773193, 1.543009638786316, 1.6167755126953125, 1.690541386604309, 1.7643072605133057, 1.8380731344223022, 1.9118390083312988, 1.9856047630310059, 2.059370756149292, 2.133136510848999, 2.206902503967285, 2.280668258666992]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 4.0, 5.0, 7.0, 4.0, 15.0, 20.0, 16.0, 19.0, 16.0, 26.0, 33.0, 26.0, 47.0, 28.0, 41.0, 67.0, 92.0, 81.0, 86.0, 65.0, 51.0, 43.0, 41.0, 38.0, 23.0, 23.0, 17.0, 21.0, 11.0, 10.0, 8.0, 10.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2091469764709473, -1.1628299951553345, -1.1165128946304321, -1.0701959133148193, -1.0238789319992065, -0.977561891078949, -0.9312448501586914, -0.8849278688430786, -0.8386108875274658, -0.7922938466072083, -0.7459768652915955, -0.6996598243713379, -0.6533428430557251, -0.6070258021354675, -0.56070876121521, -0.5143917798995972, -0.4680747389793396, -0.4217577278614044, -0.37544071674346924, -0.32912367582321167, -0.2828066945075989, -0.2364896684885025, -0.19017264246940613, -0.14385563135147095, -0.09753862023353577, -0.05122160539031029, -0.004904590547084808, 0.04141242802143097, 0.08772943913936615, 0.13404645025730133, 0.1803634762763977, 0.22668048739433289, 0.27299749851226807, 0.31931450963020325, 0.3656315207481384, 0.411948561668396, 0.4582655429840088, 0.5045825839042664, 0.5508996248245239, 0.5972166061401367, 0.6435335874557495, 0.6898506283760071, 0.7361676096916199, 0.7824846506118774, 0.8288016319274902, 0.8751186728477478, 0.9214357137680054, 0.9677526950836182, 1.0140697956085205, 1.0603867769241333, 1.1067038774490356, 1.1530208587646484, 1.1993378400802612, 1.245654821395874, 1.2919719219207764, 1.3382889032363892, 1.384605884552002, 1.4309228658676147, 1.477239966392517, 1.5235569477081299, 1.5698739290237427, 1.6161909103393555, 1.6625080108642578, 1.7088249921798706, 1.7551419734954834]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 3.0, 3.0, 4.0, 4.0, 10.0, 6.0, 7.0, 15.0, 7.0, 17.0, 31.0, 51.0, 48.0, 77.0, 114.0, 220.0, 414.0, 775.0, 2008.0, 7420.0, 57410.0, 1864168.0, 2180270.0, 66696.0, 9591.0, 2803.0, 1091.0, 506.0, 212.0, 136.0, 70.0, 41.0, 21.0, 14.0, 8.0, 5.0, 5.0, 3.0, 0.0, 2.0, 2.0], "bins": [-0.32666015625, -0.31940460205078125, -0.3121490478515625, -0.30489349365234375, -0.297637939453125, -0.29038238525390625, -0.2831268310546875, -0.27587127685546875, -0.26861572265625, -0.26136016845703125, -0.2541046142578125, -0.24684906005859375, -0.239593505859375, -0.23233795166015625, -0.2250823974609375, -0.21782684326171875, -0.2105712890625, -0.20331573486328125, -0.1960601806640625, -0.18880462646484375, -0.181549072265625, -0.17429351806640625, -0.1670379638671875, -0.15978240966796875, -0.15252685546875, -0.14527130126953125, -0.1380157470703125, -0.13076019287109375, -0.123504638671875, -0.11624908447265625, -0.1089935302734375, -0.10173797607421875, -0.094482421875, -0.08722686767578125, -0.0799713134765625, -0.07271575927734375, -0.065460205078125, -0.05820465087890625, -0.0509490966796875, -0.04369354248046875, -0.03643798828125, -0.02918243408203125, -0.0219268798828125, -0.01467132568359375, -0.007415771484375, -0.00016021728515625, 0.0070953369140625, 0.01435089111328125, 0.0216064453125, 0.02886199951171875, 0.0361175537109375, 0.04337310791015625, 0.050628662109375, 0.05788421630859375, 0.0651397705078125, 0.07239532470703125, 0.07965087890625, 0.08690643310546875, 0.0941619873046875, 0.10141754150390625, 0.108673095703125, 0.11592864990234375, 0.1231842041015625, 0.13043975830078125, 0.1376953125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 7.0, 11.0, 16.0, 22.0, 32.0, 48.0, 68.0, 69.0, 91.0, 76.0, 78.0, 71.0, 86.0, 75.0, 63.0, 56.0, 38.0, 28.0, 19.0, 18.0, 14.0, 5.0, 5.0, 5.0, 3.0, 1.0, 1.0, 2.0], "bins": [-0.2362060546875, -0.23117351531982422, -0.22614097595214844, -0.22110843658447266, -0.21607589721679688, -0.2110433578491211, -0.2060108184814453, -0.20097827911376953, -0.19594573974609375, -0.19091320037841797, -0.1858806610107422, -0.1808481216430664, -0.17581558227539062, -0.17078304290771484, -0.16575050354003906, -0.16071796417236328, -0.1556854248046875, -0.15065288543701172, -0.14562034606933594, -0.14058780670166016, -0.13555526733398438, -0.1305227279663086, -0.1254901885986328, -0.12045764923095703, -0.11542510986328125, -0.11039257049560547, -0.10536003112792969, -0.1003274917602539, -0.09529495239257812, -0.09026241302490234, -0.08522987365722656, -0.08019733428955078, -0.075164794921875, -0.07013225555419922, -0.06509971618652344, -0.060067176818847656, -0.055034637451171875, -0.050002098083496094, -0.04496955871582031, -0.03993701934814453, -0.03490447998046875, -0.02987194061279297, -0.024839401245117188, -0.019806861877441406, -0.014774322509765625, -0.009741783142089844, -0.0047092437744140625, 0.00032329559326171875, 0.0053558349609375, 0.010388374328613281, 0.015420913696289062, 0.020453453063964844, 0.025485992431640625, 0.030518531799316406, 0.03555107116699219, 0.04058361053466797, 0.04561614990234375, 0.05064868927001953, 0.05568122863769531, 0.060713768005371094, 0.06574630737304688, 0.07077884674072266, 0.07581138610839844, 0.08084392547607422, 0.08587646484375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 10.0, 13.0, 20.0, 40.0, 113.0, 302.0, 1043.0, 7490.0, 1690503.0, 2484820.0, 8248.0, 1069.0, 381.0, 121.0, 59.0, 24.0, 16.0, 7.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5166015625, -0.49880218505859375, -0.4810028076171875, -0.46320343017578125, -0.445404052734375, -0.42760467529296875, -0.4098052978515625, -0.39200592041015625, -0.37420654296875, -0.35640716552734375, -0.3386077880859375, -0.32080841064453125, -0.303009033203125, -0.28520965576171875, -0.2674102783203125, -0.24961090087890625, -0.2318115234375, -0.21401214599609375, -0.1962127685546875, -0.17841339111328125, -0.160614013671875, -0.14281463623046875, -0.1250152587890625, -0.10721588134765625, -0.08941650390625, -0.07161712646484375, -0.0538177490234375, -0.03601837158203125, -0.018218994140625, -0.00041961669921875, 0.0173797607421875, 0.03517913818359375, 0.052978515625, 0.07077789306640625, 0.0885772705078125, 0.10637664794921875, 0.124176025390625, 0.14197540283203125, 0.1597747802734375, 0.17757415771484375, 0.19537353515625, 0.21317291259765625, 0.2309722900390625, 0.24877166748046875, 0.266571044921875, 0.28437042236328125, 0.3021697998046875, 0.31996917724609375, 0.3377685546875, 0.35556793212890625, 0.3733673095703125, 0.39116668701171875, 0.408966064453125, 0.42676544189453125, 0.4445648193359375, 0.46236419677734375, 0.48016357421875, 0.49796295166015625, 0.5157623291015625, 0.5335617065429688, 0.551361083984375, 0.5691604614257812, 0.5869598388671875, 0.6047592163085938, 0.62255859375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 4.0, 0.0, 1.0, 3.0, 7.0, 4.0, 10.0, 12.0, 24.0, 35.0, 66.0, 114.0, 195.0, 358.0, 636.0, 924.0, 727.0, 421.0, 221.0, 124.0, 81.0, 48.0, 28.0, 7.0, 8.0, 7.0, 7.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.216796875, -0.2092132568359375, -0.201629638671875, -0.1940460205078125, -0.18646240234375, -0.1788787841796875, -0.171295166015625, -0.1637115478515625, -0.1561279296875, -0.1485443115234375, -0.140960693359375, -0.1333770751953125, -0.12579345703125, -0.1182098388671875, -0.110626220703125, -0.1030426025390625, -0.095458984375, -0.0878753662109375, -0.080291748046875, -0.0727081298828125, -0.06512451171875, -0.0575408935546875, -0.049957275390625, -0.0423736572265625, -0.0347900390625, -0.0272064208984375, -0.019622802734375, -0.0120391845703125, -0.00445556640625, 0.0031280517578125, 0.010711669921875, 0.0182952880859375, 0.02587890625, 0.0334625244140625, 0.041046142578125, 0.0486297607421875, 0.05621337890625, 0.0637969970703125, 0.071380615234375, 0.0789642333984375, 0.0865478515625, 0.0941314697265625, 0.101715087890625, 0.1092987060546875, 0.11688232421875, 0.1244659423828125, 0.132049560546875, 0.1396331787109375, 0.147216796875, 0.1548004150390625, 0.162384033203125, 0.1699676513671875, 0.17755126953125, 0.1851348876953125, 0.192718505859375, 0.2003021240234375, 0.2078857421875, 0.2154693603515625, 0.223052978515625, 0.2306365966796875, 0.23822021484375, 0.2458038330078125, 0.253387451171875, 0.2609710693359375, 0.2685546875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 10.0, 15.0, 34.0, 77.0, 168.0, 204.0, 209.0, 131.0, 82.0, 38.0, 14.0, 8.0, 5.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6589196920394897, -1.5832395553588867, -1.5075592994689941, -1.4318791627883911, -1.356199026107788, -1.2805187702178955, -1.2048386335372925, -1.1291584968566895, -1.0534782409667969, -0.9777980446815491, -0.9021178483963013, -0.8264377117156982, -0.7507575154304504, -0.6750773191452026, -0.5993971824645996, -0.5237169861793518, -0.448036789894104, -0.3723565936088562, -0.2966764271259308, -0.22099624574184418, -0.14531606435775757, -0.06963586807250977, 0.006044298410415649, 0.08172446489334106, 0.15740466117858887, 0.23308484256267548, 0.3087650239467621, 0.3844451904296875, 0.4601253867149353, 0.5358055830001831, 0.6114857196807861, 0.6871659159660339, 0.7628459930419922, 0.83852618932724, 0.9142063856124878, 0.9898865222930908, 1.0655667781829834, 1.1412469148635864, 1.2169270515441895, 1.292607307434082, 1.368287444114685, 1.443967580795288, 1.5196478366851807, 1.5953279733657837, 1.6710081100463867, 1.7466883659362793, 1.8223685026168823, 1.8980486392974854, 1.973728895187378, 2.0494091510772705, 2.125089168548584, 2.2007694244384766, 2.276449680328369, 2.3521299362182617, 2.427809953689575, 2.5034902095794678, 2.5791702270507812, 2.654850482940674, 2.7305305004119873, 2.80621075630188, 2.8818910121917725, 2.957571029663086, 3.0332512855529785, 3.108931541442871, 3.1846117973327637]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 3.0, 2.0, 6.0, 8.0, 15.0, 14.0, 19.0, 19.0, 23.0, 29.0, 32.0, 45.0, 55.0, 58.0, 54.0, 59.0, 65.0, 62.0, 54.0, 51.0, 52.0, 49.0, 38.0, 31.0, 34.0, 25.0, 20.0, 15.0, 21.0, 13.0, 8.0, 7.0, 8.0, 1.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.320117712020874, -1.2880189418792725, -1.2559202909469604, -1.2238215208053589, -1.1917227506637573, -1.1596240997314453, -1.1275253295898438, -1.0954265594482422, -1.0633279085159302, -1.0312291383743286, -0.9991304278373718, -0.967031717300415, -0.9349330067634583, -0.9028342962265015, -0.8707355260848999, -0.8386368155479431, -0.8065380454063416, -0.7744393348693848, -0.7423405647277832, -0.7102418541908264, -0.6781431436538696, -0.6460443735122681, -0.6139456629753113, -0.5818469524383545, -0.5497481822967529, -0.5176494717597961, -0.48555073142051697, -0.4534519910812378, -0.421353280544281, -0.38925454020500183, -0.35715579986572266, -0.32505708932876587, -0.29295843839645386, -0.2608596980571747, -0.2287609875202179, -0.19666224718093872, -0.16456352174282074, -0.13246479630470276, -0.10036605596542358, -0.0682673305273056, -0.03616860508918762, -0.004069875925779343, 0.028028853237628937, 0.060127586126327515, 0.0922263115644455, 0.12432503700256348, 0.15642377734184265, 0.18852250277996063, 0.2206212282180786, 0.2527199685573578, 0.2848186790943146, 0.31691741943359375, 0.34901612997055054, 0.3811148703098297, 0.4132136106491089, 0.4453123211860657, 0.47741106152534485, 0.509509801864624, 0.5416085124015808, 0.5737072229385376, 0.6058059930801392, 0.637904703617096, 0.6700034141540527, 0.7021021842956543, 0.7342008948326111]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 9.0, 5.0, 4.0, 5.0, 12.0, 19.0, 40.0, 46.0, 131.0, 299.0, 1068.0, 6229.0, 75211.0, 850993.0, 104888.0, 7644.0, 1317.0, 363.0, 136.0, 63.0, 34.0, 9.0, 13.0, 7.0, 3.0, 6.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.49560546875, -0.48274993896484375, -0.4698944091796875, -0.45703887939453125, -0.444183349609375, -0.43132781982421875, -0.4184722900390625, -0.40561676025390625, -0.39276123046875, -0.37990570068359375, -0.3670501708984375, -0.35419464111328125, -0.341339111328125, -0.32848358154296875, -0.3156280517578125, -0.30277252197265625, -0.2899169921875, -0.27706146240234375, -0.2642059326171875, -0.25135040283203125, -0.238494873046875, -0.22563934326171875, -0.2127838134765625, -0.19992828369140625, -0.18707275390625, -0.17421722412109375, -0.1613616943359375, -0.14850616455078125, -0.135650634765625, -0.12279510498046875, -0.1099395751953125, -0.09708404541015625, -0.084228515625, -0.07137298583984375, -0.0585174560546875, -0.04566192626953125, -0.032806396484375, -0.01995086669921875, -0.0070953369140625, 0.00576019287109375, 0.01861572265625, 0.03147125244140625, 0.0443267822265625, 0.05718231201171875, 0.070037841796875, 0.08289337158203125, 0.0957489013671875, 0.10860443115234375, 0.1214599609375, 0.13431549072265625, 0.1471710205078125, 0.16002655029296875, 0.172882080078125, 0.18573760986328125, 0.1985931396484375, 0.21144866943359375, 0.22430419921875, 0.23715972900390625, 0.2500152587890625, 0.26287078857421875, 0.275726318359375, 0.28858184814453125, 0.3014373779296875, 0.31429290771484375, 0.3271484375]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 2.0, 6.0, 10.0, 7.0, 20.0, 14.0, 14.0, 19.0, 23.0, 39.0, 31.0, 27.0, 46.0, 48.0, 44.0, 59.0, 51.0, 51.0, 42.0, 55.0, 60.0, 45.0, 44.0, 38.0, 39.0, 27.0, 25.0, 19.0, 21.0, 16.0, 14.0, 8.0, 5.0, 9.0, 5.0, 7.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0933837890625, -0.09024906158447266, -0.08711433410644531, -0.08397960662841797, -0.08084487915039062, -0.07771015167236328, -0.07457542419433594, -0.0714406967163086, -0.06830596923828125, -0.0651712417602539, -0.06203651428222656, -0.05890178680419922, -0.055767059326171875, -0.05263233184814453, -0.04949760437011719, -0.046362876892089844, -0.0432281494140625, -0.040093421936035156, -0.03695869445800781, -0.03382396697998047, -0.030689239501953125, -0.02755451202392578, -0.024419784545898438, -0.021285057067871094, -0.01815032958984375, -0.015015602111816406, -0.011880874633789062, -0.008746147155761719, -0.005611419677734375, -0.0024766921997070312, 0.0006580352783203125, 0.0037927627563476562, 0.006927490234375, 0.010062217712402344, 0.013196945190429688, 0.01633167266845703, 0.019466400146484375, 0.02260112762451172, 0.025735855102539062, 0.028870582580566406, 0.03200531005859375, 0.035140037536621094, 0.03827476501464844, 0.04140949249267578, 0.044544219970703125, 0.04767894744873047, 0.05081367492675781, 0.053948402404785156, 0.0570831298828125, 0.060217857360839844, 0.06335258483886719, 0.06648731231689453, 0.06962203979492188, 0.07275676727294922, 0.07589149475097656, 0.0790262222290039, 0.08216094970703125, 0.0852956771850586, 0.08843040466308594, 0.09156513214111328, 0.09469985961914062, 0.09783458709716797, 0.10096931457519531, 0.10410404205322266, 0.10723876953125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 4.0, 2.0, 7.0, 5.0, 7.0, 7.0, 17.0, 16.0, 22.0, 19.0, 33.0, 56.0, 77.0, 110.0, 160.0, 284.0, 473.0, 926.0, 2067.0, 6125.0, 25215.0, 191789.0, 725978.0, 75005.0, 13197.0, 3770.0, 1430.0, 654.0, 375.0, 212.0, 167.0, 86.0, 92.0, 44.0, 38.0, 22.0, 16.0, 16.0, 10.0, 7.0, 2.0, 6.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.281494140625, -0.273284912109375, -0.26507568359375, -0.256866455078125, -0.2486572265625, -0.240447998046875, -0.23223876953125, -0.224029541015625, -0.2158203125, -0.207611083984375, -0.19940185546875, -0.191192626953125, -0.1829833984375, -0.174774169921875, -0.16656494140625, -0.158355712890625, -0.150146484375, -0.141937255859375, -0.13372802734375, -0.125518798828125, -0.1173095703125, -0.109100341796875, -0.10089111328125, -0.092681884765625, -0.08447265625, -0.076263427734375, -0.06805419921875, -0.059844970703125, -0.0516357421875, -0.043426513671875, -0.03521728515625, -0.027008056640625, -0.018798828125, -0.010589599609375, -0.00238037109375, 0.005828857421875, 0.0140380859375, 0.022247314453125, 0.03045654296875, 0.038665771484375, 0.046875, 0.055084228515625, 0.06329345703125, 0.071502685546875, 0.0797119140625, 0.087921142578125, 0.09613037109375, 0.104339599609375, 0.112548828125, 0.120758056640625, 0.12896728515625, 0.137176513671875, 0.1453857421875, 0.153594970703125, 0.16180419921875, 0.170013427734375, 0.17822265625, 0.186431884765625, 0.19464111328125, 0.202850341796875, 0.2110595703125, 0.219268798828125, 0.22747802734375, 0.235687255859375, 0.243896484375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 0.0, 4.0, 0.0, 8.0, 6.0, 2.0, 11.0, 9.0, 15.0, 16.0, 20.0, 22.0, 28.0, 39.0, 34.0, 35.0, 41.0, 46.0, 55.0, 62.0, 54.0, 60.0, 46.0, 53.0, 62.0, 39.0, 35.0, 38.0, 32.0, 24.0, 27.0, 22.0, 14.0, 11.0, 8.0, 7.0, 9.0, 3.0, 3.0, 6.0, 4.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.298828125, -0.2868461608886719, -0.27486419677734375, -0.2628822326660156, -0.2509002685546875, -0.23891830444335938, -0.22693634033203125, -0.21495437622070312, -0.202972412109375, -0.19099044799804688, -0.17900848388671875, -0.16702651977539062, -0.1550445556640625, -0.14306259155273438, -0.13108062744140625, -0.11909866333007812, -0.10711669921875, -0.09513473510742188, -0.08315277099609375, -0.07117080688476562, -0.0591888427734375, -0.047206878662109375, -0.03522491455078125, -0.023242950439453125, -0.011260986328125, 0.000720977783203125, 0.01270294189453125, 0.024684906005859375, 0.0366668701171875, 0.048648834228515625, 0.06063079833984375, 0.07261276245117188, 0.0845947265625, 0.09657669067382812, 0.10855865478515625, 0.12054061889648438, 0.1325225830078125, 0.14450454711914062, 0.15648651123046875, 0.16846847534179688, 0.180450439453125, 0.19243240356445312, 0.20441436767578125, 0.21639633178710938, 0.2283782958984375, 0.24036026000976562, 0.25234222412109375, 0.2643241882324219, 0.27630615234375, 0.2882881164550781, 0.30027008056640625, 0.3122520446777344, 0.3242340087890625, 0.3362159729003906, 0.34819793701171875, 0.3601799011230469, 0.372161865234375, 0.3841438293457031, 0.39612579345703125, 0.4081077575683594, 0.4200897216796875, 0.4320716857910156, 0.44405364990234375, 0.4560356140136719, 0.468017578125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 8.0, 1.0, 8.0, 5.0, 17.0, 17.0, 23.0, 32.0, 37.0, 64.0, 95.0, 146.0, 224.0, 395.0, 644.0, 1057.0, 2016.0, 4227.0, 8899.0, 21752.0, 64411.0, 525434.0, 319633.0, 61061.0, 20955.0, 8573.0, 4120.0, 2067.0, 1036.0, 554.0, 381.0, 205.0, 142.0, 104.0, 64.0, 35.0, 34.0, 17.0, 15.0, 8.0, 8.0, 7.0, 8.0, 6.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0], "bins": [-0.07098388671875, -0.0688314437866211, -0.06667900085449219, -0.06452655792236328, -0.062374114990234375, -0.06022167205810547, -0.05806922912597656, -0.055916786193847656, -0.05376434326171875, -0.051611900329589844, -0.04945945739746094, -0.04730701446533203, -0.045154571533203125, -0.04300212860107422, -0.04084968566894531, -0.038697242736816406, -0.0365447998046875, -0.034392356872558594, -0.03223991394042969, -0.03008747100830078, -0.027935028076171875, -0.02578258514404297, -0.023630142211914062, -0.021477699279785156, -0.01932525634765625, -0.017172813415527344, -0.015020370483398438, -0.012867927551269531, -0.010715484619140625, -0.008563041687011719, -0.0064105987548828125, -0.004258155822753906, -0.002105712890625, 4.673004150390625e-05, 0.0021991729736328125, 0.004351615905761719, 0.006504058837890625, 0.008656501770019531, 0.010808944702148438, 0.012961387634277344, 0.01511383056640625, 0.017266273498535156, 0.019418716430664062, 0.02157115936279297, 0.023723602294921875, 0.02587604522705078, 0.028028488159179688, 0.030180931091308594, 0.0323333740234375, 0.034485816955566406, 0.03663825988769531, 0.03879070281982422, 0.040943145751953125, 0.04309558868408203, 0.04524803161621094, 0.047400474548339844, 0.04955291748046875, 0.051705360412597656, 0.05385780334472656, 0.05601024627685547, 0.058162689208984375, 0.06031513214111328, 0.06246757507324219, 0.0646200180053711, 0.0667724609375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 4.0, 4.0, 10.0, 8.0, 8.0, 18.0, 16.0, 19.0, 21.0, 39.0, 72.0, 93.0, 112.0, 123.0, 128.0, 86.0, 71.0, 43.0, 35.0, 15.0, 14.0, 22.0, 9.0, 9.0, 3.0, 3.0, 4.0, 4.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.676248550415039e-05, -2.552475780248642e-05, -2.428703010082245e-05, -2.3049302399158478e-05, -2.1811574697494507e-05, -2.0573846995830536e-05, -1.9336119294166565e-05, -1.8098391592502594e-05, -1.6860663890838623e-05, -1.5622936189174652e-05, -1.4385208487510681e-05, -1.314748078584671e-05, -1.190975308418274e-05, -1.0672025382518768e-05, -9.434297680854797e-06, -8.196569979190826e-06, -6.9588422775268555e-06, -5.7211145758628845e-06, -4.4833868741989136e-06, -3.2456591725349426e-06, -2.0079314708709717e-06, -7.702037692070007e-07, 4.675239324569702e-07, 1.7052516341209412e-06, 2.942979335784912e-06, 4.180707037448883e-06, 5.418434739112854e-06, 6.656162440776825e-06, 7.893890142440796e-06, 9.131617844104767e-06, 1.0369345545768738e-05, 1.1607073247432709e-05, 1.284480094909668e-05, 1.408252865076065e-05, 1.532025635242462e-05, 1.6557984054088593e-05, 1.7795711755752563e-05, 1.9033439457416534e-05, 2.0271167159080505e-05, 2.1508894860744476e-05, 2.2746622562408447e-05, 2.3984350264072418e-05, 2.522207796573639e-05, 2.645980566740036e-05, 2.769753336906433e-05, 2.8935261070728302e-05, 3.0172988772392273e-05, 3.1410716474056244e-05, 3.2648444175720215e-05, 3.3886171877384186e-05, 3.512389957904816e-05, 3.636162728071213e-05, 3.75993549823761e-05, 3.883708268404007e-05, 4.007481038570404e-05, 4.131253808736801e-05, 4.255026578903198e-05, 4.378799349069595e-05, 4.5025721192359924e-05, 4.6263448894023895e-05, 4.7501176595687866e-05, 4.873890429735184e-05, 4.997663199901581e-05, 5.121435970067978e-05, 5.245208740234375e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 6.0, 7.0, 9.0, 16.0, 15.0, 14.0, 30.0, 35.0, 65.0, 76.0, 143.0, 193.0, 329.0, 558.0, 1085.0, 2109.0, 4849.0, 12477.0, 37230.0, 173778.0, 688083.0, 88275.0, 23494.0, 8364.0, 3569.0, 1680.0, 798.0, 474.0, 248.0, 180.0, 120.0, 88.0, 47.0, 37.0, 23.0, 19.0, 6.0, 6.0, 9.0, 6.0, 4.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0706787109375, -0.06809043884277344, -0.06550216674804688, -0.06291389465332031, -0.06032562255859375, -0.05773735046386719, -0.055149078369140625, -0.05256080627441406, -0.0499725341796875, -0.04738426208496094, -0.044795989990234375, -0.04220771789550781, -0.03961944580078125, -0.03703117370605469, -0.034442901611328125, -0.03185462951660156, -0.029266357421875, -0.026678085327148438, -0.024089813232421875, -0.021501541137695312, -0.01891326904296875, -0.016324996948242188, -0.013736724853515625, -0.011148452758789062, -0.0085601806640625, -0.0059719085693359375, -0.003383636474609375, -0.0007953643798828125, 0.00179290771484375, 0.0043811798095703125, 0.006969451904296875, 0.009557723999023438, 0.01214599609375, 0.014734268188476562, 0.017322540283203125, 0.019910812377929688, 0.02249908447265625, 0.025087356567382812, 0.027675628662109375, 0.030263900756835938, 0.0328521728515625, 0.03544044494628906, 0.038028717041015625, 0.04061698913574219, 0.04320526123046875, 0.04579353332519531, 0.048381805419921875, 0.05097007751464844, 0.053558349609375, 0.05614662170410156, 0.058734893798828125, 0.06132316589355469, 0.06391143798828125, 0.06649971008300781, 0.06908798217773438, 0.07167625427246094, 0.0742645263671875, 0.07685279846191406, 0.07944107055664062, 0.08202934265136719, 0.08461761474609375, 0.08720588684082031, 0.08979415893554688, 0.09238243103027344, 0.094970703125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 2.0, 9.0, 5.0, 6.0, 8.0, 12.0, 9.0, 11.0, 15.0, 33.0, 40.0, 56.0, 94.0, 117.0, 130.0, 109.0, 86.0, 68.0, 41.0, 35.0, 21.0, 21.0, 15.0, 10.0, 16.0, 7.0, 4.0, 8.0, 0.0, 4.0, 2.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0802001953125, -0.0773019790649414, -0.07440376281738281, -0.07150554656982422, -0.06860733032226562, -0.06570911407470703, -0.06281089782714844, -0.059912681579589844, -0.05701446533203125, -0.054116249084472656, -0.05121803283691406, -0.04831981658935547, -0.045421600341796875, -0.04252338409423828, -0.03962516784667969, -0.036726951599121094, -0.0338287353515625, -0.030930519104003906, -0.028032302856445312, -0.02513408660888672, -0.022235870361328125, -0.01933765411376953, -0.016439437866210938, -0.013541221618652344, -0.01064300537109375, -0.007744789123535156, -0.0048465728759765625, -0.0019483566284179688, 0.000949859619140625, 0.0038480758666992188, 0.0067462921142578125, 0.009644508361816406, 0.012542724609375, 0.015440940856933594, 0.018339157104492188, 0.02123737335205078, 0.024135589599609375, 0.02703380584716797, 0.029932022094726562, 0.032830238342285156, 0.03572845458984375, 0.038626670837402344, 0.04152488708496094, 0.04442310333251953, 0.047321319580078125, 0.05021953582763672, 0.05311775207519531, 0.056015968322753906, 0.0589141845703125, 0.061812400817871094, 0.06471061706542969, 0.06760883331298828, 0.07050704956054688, 0.07340526580810547, 0.07630348205566406, 0.07920169830322266, 0.08209991455078125, 0.08499813079833984, 0.08789634704589844, 0.09079456329345703, 0.09369277954101562, 0.09659099578857422, 0.09948921203613281, 0.1023874282836914, 0.10528564453125]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 7.0, 10.0, 15.0, 32.0, 41.0, 66.0, 94.0, 213.0, 187.0, 101.0, 72.0, 57.0, 40.0, 17.0, 8.0, 6.0, 6.0, 4.0, 4.0, 3.0, 0.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6782475709915161, -1.6288036108016968, -1.5793596506118774, -1.5299155712127686, -1.4804716110229492, -1.4310276508331299, -1.3815836906433105, -1.3321397304534912, -1.2826957702636719, -1.2332518100738525, -1.1838078498840332, -1.1343638896942139, -1.084919810295105, -1.0354758501052856, -0.9860318899154663, -0.936587929725647, -0.8871438503265381, -0.8376998901367188, -0.7882558703422546, -0.7388119101524353, -0.6893678903579712, -0.6399239301681519, -0.5904799699783325, -0.5410360097885132, -0.4915919899940491, -0.44214800000190735, -0.3927040100097656, -0.3432600498199463, -0.29381605982780457, -0.24437206983566284, -0.1949281096458435, -0.14548411965370178, -0.09604001045227051, -0.04659602791070938, 0.0028479546308517456, 0.052291929721832275, 0.101735919713974, 0.15117990970611572, 0.20062386989593506, 0.2500678598880768, 0.2995118498802185, 0.34895583987236023, 0.39839982986450195, 0.4478437900543213, 0.497287780046463, 0.5467317700386047, 0.5961757302284241, 0.6456197500228882, 0.6950637102127075, 0.7445076704025269, 0.793951690196991, 0.8433956503868103, 0.8928396701812744, 0.9422836303710938, 0.9917275905609131, 1.0411715507507324, 1.0906155109405518, 1.140059471130371, 1.1895034313201904, 1.2389473915100098, 1.2883914709091187, 1.337835431098938, 1.3872793912887573, 1.4367233514785767, 1.4861674308776855]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 3.0, 6.0, 15.0, 10.0, 12.0, 9.0, 10.0, 21.0, 18.0, 20.0, 26.0, 20.0, 27.0, 25.0, 45.0, 47.0, 70.0, 86.0, 100.0, 84.0, 65.0, 38.0, 26.0, 32.0, 34.0, 16.0, 20.0, 23.0, 17.0, 15.0, 9.0, 13.0, 10.0, 1.0, 14.0, 6.0, 7.0, 2.0, 1.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.564016580581665, -1.519797921180725, -1.4755792617797852, -1.4313606023788452, -1.3871419429779053, -1.3429231643676758, -1.2987046241760254, -1.254485845565796, -1.210267186164856, -1.166048526763916, -1.121829867362976, -1.0776112079620361, -1.0333925485610962, -0.9891738295555115, -0.9449551701545715, -0.9007364511489868, -0.8565178513526917, -0.8122991919517517, -0.7680805325508118, -0.723861813545227, -0.6796431541442871, -0.6354244947433472, -0.5912058353424072, -0.5469871759414673, -0.5027685165405273, -0.4585498571395874, -0.4143311679363251, -0.37011250853538513, -0.3258938193321228, -0.28167515993118286, -0.23745650053024292, -0.1932378113269806, -0.14901912212371826, -0.10480044782161713, -0.06058178097009659, -0.01636311411857605, 0.027855560183525085, 0.07207423448562622, 0.11629289388656616, 0.1605115830898285, 0.20473024249076843, 0.24894891679286957, 0.2931675910949707, 0.33738625049591064, 0.3816049098968506, 0.4258235991001129, 0.47004225850105286, 0.5142609477043152, 0.5584796071052551, 0.6026982665061951, 0.646916925907135, 0.6911356449127197, 0.7353543043136597, 0.7795729637145996, 0.8237916231155396, 0.8680102825164795, 0.9122289419174194, 0.9564476013183594, 1.0006662607192993, 1.0448849201202393, 1.0891035795211792, 1.1333222389221191, 1.1775410175323486, 1.2217596769332886, 1.2659783363342285]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 8.0, 11.0, 14.0, 22.0, 39.0, 92.0, 184.0, 449.0, 1273.0, 6011.0, 117420.0, 3826947.0, 231498.0, 8156.0, 1408.0, 429.0, 151.0, 64.0, 31.0, 19.0, 23.0, 9.0, 9.0, 6.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.255126953125, -0.24382400512695312, -0.23252105712890625, -0.22121810913085938, -0.2099151611328125, -0.19861221313476562, -0.18730926513671875, -0.17600631713867188, -0.164703369140625, -0.15340042114257812, -0.14209747314453125, -0.13079452514648438, -0.1194915771484375, -0.10818862915039062, -0.09688568115234375, -0.08558273315429688, -0.07427978515625, -0.06297683715820312, -0.05167388916015625, -0.040370941162109375, -0.0290679931640625, -0.017765045166015625, -0.00646209716796875, 0.004840850830078125, 0.016143798828125, 0.027446746826171875, 0.03874969482421875, 0.050052642822265625, 0.0613555908203125, 0.07265853881835938, 0.08396148681640625, 0.09526443481445312, 0.1065673828125, 0.11787033081054688, 0.12917327880859375, 0.14047622680664062, 0.1517791748046875, 0.16308212280273438, 0.17438507080078125, 0.18568801879882812, 0.196990966796875, 0.20829391479492188, 0.21959686279296875, 0.23089981079101562, 0.2422027587890625, 0.2535057067871094, 0.26480865478515625, 0.2761116027832031, 0.28741455078125, 0.2987174987792969, 0.31002044677734375, 0.3213233947753906, 0.3326263427734375, 0.3439292907714844, 0.35523223876953125, 0.3665351867675781, 0.377838134765625, 0.3891410827636719, 0.40044403076171875, 0.4117469787597656, 0.4230499267578125, 0.4343528747558594, 0.44565582275390625, 0.4569587707519531, 0.46826171875]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 4.0, 1.0, 5.0, 3.0, 7.0, 9.0, 9.0, 12.0, 17.0, 20.0, 21.0, 31.0, 25.0, 31.0, 32.0, 29.0, 40.0, 37.0, 56.0, 44.0, 51.0, 54.0, 50.0, 46.0, 47.0, 38.0, 37.0, 48.0, 35.0, 20.0, 20.0, 23.0, 23.0, 13.0, 12.0, 10.0, 13.0, 12.0, 7.0, 2.0, 2.0, 1.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.08782958984375, -0.08502006530761719, -0.08221054077148438, -0.07940101623535156, -0.07659149169921875, -0.07378196716308594, -0.07097244262695312, -0.06816291809082031, -0.0653533935546875, -0.06254386901855469, -0.059734344482421875, -0.05692481994628906, -0.05411529541015625, -0.05130577087402344, -0.048496246337890625, -0.04568672180175781, -0.042877197265625, -0.04006767272949219, -0.037258148193359375, -0.03444862365722656, -0.03163909912109375, -0.028829574584960938, -0.026020050048828125, -0.023210525512695312, -0.0204010009765625, -0.017591476440429688, -0.014781951904296875, -0.011972427368164062, -0.00916290283203125, -0.0063533782958984375, -0.003543853759765625, -0.0007343292236328125, 0.0020751953125, 0.0048847198486328125, 0.007694244384765625, 0.010503768920898438, 0.01331329345703125, 0.016122817993164062, 0.018932342529296875, 0.021741867065429688, 0.0245513916015625, 0.027360916137695312, 0.030170440673828125, 0.03297996520996094, 0.03578948974609375, 0.03859901428222656, 0.041408538818359375, 0.04421806335449219, 0.047027587890625, 0.04983711242675781, 0.052646636962890625, 0.05545616149902344, 0.05826568603515625, 0.06107521057128906, 0.06388473510742188, 0.06669425964355469, 0.0695037841796875, 0.07231330871582031, 0.07512283325195312, 0.07793235778808594, 0.08074188232421875, 0.08355140686035156, 0.08636093139648438, 0.08917045593261719, 0.09197998046875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 5.0, 4.0, 7.0, 9.0, 18.0, 37.0, 67.0, 138.0, 273.0, 663.0, 2253.0, 16449.0, 958523.0, 3176525.0, 34515.0, 3193.0, 871.0, 363.0, 176.0, 86.0, 34.0, 28.0, 19.0, 12.0, 6.0, 5.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5205078125, -0.5081520080566406, -0.49579620361328125, -0.4834403991699219, -0.4710845947265625, -0.4587287902832031, -0.44637298583984375, -0.4340171813964844, -0.421661376953125, -0.4093055725097656, -0.39694976806640625, -0.3845939636230469, -0.3722381591796875, -0.3598823547363281, -0.34752655029296875, -0.3351707458496094, -0.32281494140625, -0.3104591369628906, -0.29810333251953125, -0.2857475280761719, -0.2733917236328125, -0.2610359191894531, -0.24868011474609375, -0.23632431030273438, -0.223968505859375, -0.21161270141601562, -0.19925689697265625, -0.18690109252929688, -0.1745452880859375, -0.16218948364257812, -0.14983367919921875, -0.13747787475585938, -0.1251220703125, -0.11276626586914062, -0.10041046142578125, -0.08805465698242188, -0.0756988525390625, -0.06334304809570312, -0.05098724365234375, -0.038631439208984375, -0.026275634765625, -0.013919830322265625, -0.00156402587890625, 0.010791778564453125, 0.0231475830078125, 0.035503387451171875, 0.04785919189453125, 0.060214996337890625, 0.07257080078125, 0.08492660522460938, 0.09728240966796875, 0.10963821411132812, 0.1219940185546875, 0.13434982299804688, 0.14670562744140625, 0.15906143188476562, 0.171417236328125, 0.18377304077148438, 0.19612884521484375, 0.20848464965820312, 0.2208404541015625, 0.23319625854492188, 0.24555206298828125, 0.2579078674316406, 0.270263671875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 4.0, 2.0, 8.0, 10.0, 4.0, 11.0, 17.0, 23.0, 28.0, 63.0, 77.0, 88.0, 148.0, 214.0, 297.0, 481.0, 578.0, 613.0, 422.0, 325.0, 211.0, 158.0, 82.0, 59.0, 44.0, 31.0, 19.0, 15.0, 12.0, 9.0, 7.0, 3.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.174072265625, -0.1682415008544922, -0.16241073608398438, -0.15657997131347656, -0.15074920654296875, -0.14491844177246094, -0.13908767700195312, -0.1332569122314453, -0.1274261474609375, -0.12159538269042969, -0.11576461791992188, -0.10993385314941406, -0.10410308837890625, -0.09827232360839844, -0.09244155883789062, -0.08661079406738281, -0.080780029296875, -0.07494926452636719, -0.06911849975585938, -0.06328773498535156, -0.05745697021484375, -0.05162620544433594, -0.045795440673828125, -0.03996467590332031, -0.0341339111328125, -0.028303146362304688, -0.022472381591796875, -0.016641616821289062, -0.01081085205078125, -0.0049800872802734375, 0.000850677490234375, 0.0066814422607421875, 0.01251220703125, 0.018342971801757812, 0.024173736572265625, 0.030004501342773438, 0.03583526611328125, 0.04166603088378906, 0.047496795654296875, 0.05332756042480469, 0.0591583251953125, 0.06498908996582031, 0.07081985473632812, 0.07665061950683594, 0.08248138427734375, 0.08831214904785156, 0.09414291381835938, 0.09997367858886719, 0.105804443359375, 0.11163520812988281, 0.11746597290039062, 0.12329673767089844, 0.12912750244140625, 0.13495826721191406, 0.14078903198242188, 0.1466197967529297, 0.1524505615234375, 0.1582813262939453, 0.16411209106445312, 0.16994285583496094, 0.17577362060546875, 0.18160438537597656, 0.18743515014648438, 0.1932659149169922, 0.1990966796875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 2.0, 15.0, 17.0, 20.0, 54.0, 100.0, 168.0, 190.0, 188.0, 112.0, 55.0, 35.0, 23.0, 9.0, 9.0, 3.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5186384916305542, -1.4484360218048096, -1.3782334327697754, -1.3080308437347412, -1.2378283739089966, -1.167625904083252, -1.0974233150482178, -1.0272207260131836, -0.957018256187439, -0.8868157267570496, -0.8166131973266602, -0.7464106678962708, -0.6762081384658813, -0.6060056090354919, -0.5358030796051025, -0.46560055017471313, -0.39539802074432373, -0.3251954913139343, -0.2549929618835449, -0.18479043245315552, -0.11458790302276611, -0.04438537359237671, 0.025817155838012695, 0.0960196852684021, 0.1662222146987915, 0.2364247441291809, 0.3066272735595703, 0.3768298029899597, 0.4470323324203491, 0.5172348618507385, 0.5874373912811279, 0.6576399207115173, 0.7278423309326172, 0.7980448603630066, 0.868247389793396, 0.9384499192237854, 1.0086524486541748, 1.078855037689209, 1.1490575075149536, 1.2192599773406982, 1.2894625663757324, 1.3596651554107666, 1.4298676252365112, 1.5000700950622559, 1.57027268409729, 1.6404752731323242, 1.7106777429580688, 1.7808802127838135, 1.8510828018188477, 1.9212853908538818, 1.9914878606796265, 2.061690330505371, 2.1318929195404053, 2.2020955085754395, 2.2722978591918945, 2.3425004482269287, 2.412703037261963, 2.482905626296997, 2.5531082153320312, 2.6233105659484863, 2.6935131549835205, 2.7637157440185547, 2.8339180946350098, 2.904120683670044, 2.974323272705078]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 3.0, 2.0, 4.0, 6.0, 9.0, 12.0, 12.0, 17.0, 19.0, 29.0, 27.0, 36.0, 32.0, 27.0, 41.0, 50.0, 44.0, 56.0, 42.0, 60.0, 40.0, 32.0, 41.0, 58.0, 49.0, 44.0, 31.0, 31.0, 23.0, 25.0, 18.0, 19.0, 19.0, 11.0, 9.0, 9.0, 6.0, 4.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1407835483551025, -1.1096351146697998, -1.0784865617752075, -1.0473381280899048, -1.016189694404602, -0.9850411415100098, -0.953892707824707, -0.9227442145347595, -0.891595721244812, -0.8604472279548645, -0.8292987942695618, -0.7981503009796143, -0.7670018076896667, -0.7358533143997192, -0.7047048807144165, -0.673556387424469, -0.6424079537391663, -0.6112594604492188, -0.580111026763916, -0.5489625334739685, -0.517814040184021, -0.4866655766963959, -0.45551711320877075, -0.42436861991882324, -0.3932201564311981, -0.362071692943573, -0.3309231996536255, -0.29977473616600037, -0.26862627267837524, -0.23747777938842773, -0.2063293159008026, -0.1751808375120163, -0.14403241872787476, -0.11288394033908844, -0.08173546940088272, -0.050586998462677, -0.019438520073890686, 0.01170995831489563, 0.04285842180252075, 0.07400690019130707, 0.10515537858009338, 0.1363038569688797, 0.16745233535766602, 0.19860079884529114, 0.22974927723407745, 0.26089775562286377, 0.2920462191104889, 0.323194682598114, 0.3543431758880615, 0.38549163937568665, 0.41664013266563416, 0.4477885961532593, 0.4789370894432068, 0.5100855827331543, 0.541234016418457, 0.5723825097084045, 0.603531002998352, 0.6346794962882996, 0.6658279299736023, 0.6969764232635498, 0.7281249165534973, 0.7592734098434448, 0.7904218435287476, 0.8215703368186951, 0.8527187705039978]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 8.0, 5.0, 6.0, 15.0, 19.0, 21.0, 36.0, 71.0, 155.0, 204.0, 452.0, 901.0, 2527.0, 8611.0, 38434.0, 234516.0, 606068.0, 124657.0, 23025.0, 5648.0, 1715.0, 730.0, 323.0, 156.0, 87.0, 49.0, 33.0, 25.0, 15.0, 16.0, 9.0, 6.0, 4.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2086181640625, -0.2009868621826172, -0.19335556030273438, -0.18572425842285156, -0.17809295654296875, -0.17046165466308594, -0.16283035278320312, -0.1551990509033203, -0.1475677490234375, -0.1399364471435547, -0.13230514526367188, -0.12467384338378906, -0.11704254150390625, -0.10941123962402344, -0.10177993774414062, -0.09414863586425781, -0.086517333984375, -0.07888603210449219, -0.07125473022460938, -0.06362342834472656, -0.05599212646484375, -0.04836082458496094, -0.040729522705078125, -0.03309822082519531, -0.0254669189453125, -0.017835617065429688, -0.010204315185546875, -0.0025730133056640625, 0.00505828857421875, 0.012689590454101562, 0.020320892333984375, 0.027952194213867188, 0.03558349609375, 0.04321479797363281, 0.050846099853515625, 0.05847740173339844, 0.06610870361328125, 0.07374000549316406, 0.08137130737304688, 0.08900260925292969, 0.0966339111328125, 0.10426521301269531, 0.11189651489257812, 0.11952781677246094, 0.12715911865234375, 0.13479042053222656, 0.14242172241210938, 0.1500530242919922, 0.157684326171875, 0.1653156280517578, 0.17294692993164062, 0.18057823181152344, 0.18820953369140625, 0.19584083557128906, 0.20347213745117188, 0.2111034393310547, 0.2187347412109375, 0.2263660430908203, 0.23399734497070312, 0.24162864685058594, 0.24925994873046875, 0.25689125061035156, 0.2645225524902344, 0.2721538543701172, 0.27978515625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 4.0, 2.0, 5.0, 9.0, 3.0, 16.0, 21.0, 29.0, 35.0, 34.0, 36.0, 50.0, 58.0, 57.0, 62.0, 48.0, 61.0, 60.0, 59.0, 54.0, 56.0, 32.0, 37.0, 36.0, 32.0, 23.0, 21.0, 18.0, 17.0, 8.0, 9.0, 4.0, 5.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14453125, -0.140777587890625, -0.13702392578125, -0.133270263671875, -0.1295166015625, -0.125762939453125, -0.12200927734375, -0.118255615234375, -0.114501953125, -0.110748291015625, -0.10699462890625, -0.103240966796875, -0.0994873046875, -0.095733642578125, -0.09197998046875, -0.088226318359375, -0.08447265625, -0.080718994140625, -0.07696533203125, -0.073211669921875, -0.0694580078125, -0.065704345703125, -0.06195068359375, -0.058197021484375, -0.054443359375, -0.050689697265625, -0.04693603515625, -0.043182373046875, -0.0394287109375, -0.035675048828125, -0.03192138671875, -0.028167724609375, -0.0244140625, -0.020660400390625, -0.01690673828125, -0.013153076171875, -0.0093994140625, -0.005645751953125, -0.00189208984375, 0.001861572265625, 0.005615234375, 0.009368896484375, 0.01312255859375, 0.016876220703125, 0.0206298828125, 0.024383544921875, 0.02813720703125, 0.031890869140625, 0.03564453125, 0.039398193359375, 0.04315185546875, 0.046905517578125, 0.0506591796875, 0.054412841796875, 0.05816650390625, 0.061920166015625, 0.065673828125, 0.069427490234375, 0.07318115234375, 0.076934814453125, 0.0806884765625, 0.084442138671875, 0.08819580078125, 0.091949462890625, 0.095703125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 8.0, 6.0, 10.0, 14.0, 13.0, 15.0, 28.0, 50.0, 54.0, 91.0, 160.0, 212.0, 336.0, 615.0, 1237.0, 3186.0, 10714.0, 59256.0, 740058.0, 197988.0, 24418.0, 5780.0, 2016.0, 938.0, 486.0, 274.0, 176.0, 138.0, 77.0, 58.0, 36.0, 24.0, 26.0, 14.0, 14.0, 5.0, 7.0, 5.0, 2.0, 2.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.260009765625, -0.25127410888671875, -0.2425384521484375, -0.23380279541015625, -0.225067138671875, -0.21633148193359375, -0.2075958251953125, -0.19886016845703125, -0.19012451171875, -0.18138885498046875, -0.1726531982421875, -0.16391754150390625, -0.155181884765625, -0.14644622802734375, -0.1377105712890625, -0.12897491455078125, -0.1202392578125, -0.11150360107421875, -0.1027679443359375, -0.09403228759765625, -0.085296630859375, -0.07656097412109375, -0.0678253173828125, -0.05908966064453125, -0.05035400390625, -0.04161834716796875, -0.0328826904296875, -0.02414703369140625, -0.015411376953125, -0.00667572021484375, 0.0020599365234375, 0.01079559326171875, 0.01953125, 0.02826690673828125, 0.0370025634765625, 0.04573822021484375, 0.054473876953125, 0.06320953369140625, 0.0719451904296875, 0.08068084716796875, 0.08941650390625, 0.09815216064453125, 0.1068878173828125, 0.11562347412109375, 0.124359130859375, 0.13309478759765625, 0.1418304443359375, 0.15056610107421875, 0.1593017578125, 0.16803741455078125, 0.1767730712890625, 0.18550872802734375, 0.194244384765625, 0.20298004150390625, 0.2117156982421875, 0.22045135498046875, 0.22918701171875, 0.23792266845703125, 0.2466583251953125, 0.25539398193359375, 0.264129638671875, 0.27286529541015625, 0.2816009521484375, 0.29033660888671875, 0.299072265625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 2.0, 3.0, 7.0, 7.0, 10.0, 12.0, 21.0, 24.0, 33.0, 32.0, 36.0, 37.0, 46.0, 62.0, 47.0, 54.0, 59.0, 55.0, 59.0, 56.0, 55.0, 47.0, 39.0, 32.0, 29.0, 32.0, 21.0, 14.0, 12.0, 8.0, 13.0, 9.0, 4.0, 9.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.38623046875, -0.3740234375, -0.36181640625, -0.349609375, -0.33740234375, -0.3251953125, -0.31298828125, -0.30078125, -0.28857421875, -0.2763671875, -0.26416015625, -0.251953125, -0.23974609375, -0.2275390625, -0.21533203125, -0.203125, -0.19091796875, -0.1787109375, -0.16650390625, -0.154296875, -0.14208984375, -0.1298828125, -0.11767578125, -0.10546875, -0.09326171875, -0.0810546875, -0.06884765625, -0.056640625, -0.04443359375, -0.0322265625, -0.02001953125, -0.0078125, 0.00439453125, 0.0166015625, 0.02880859375, 0.041015625, 0.05322265625, 0.0654296875, 0.07763671875, 0.08984375, 0.10205078125, 0.1142578125, 0.12646484375, 0.138671875, 0.15087890625, 0.1630859375, 0.17529296875, 0.1875, 0.19970703125, 0.2119140625, 0.22412109375, 0.236328125, 0.24853515625, 0.2607421875, 0.27294921875, 0.28515625, 0.29736328125, 0.3095703125, 0.32177734375, 0.333984375, 0.34619140625, 0.3583984375, 0.37060546875, 0.3828125, 0.39501953125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 3.0, 4.0, 8.0, 6.0, 6.0, 9.0, 9.0, 22.0, 22.0, 26.0, 45.0, 51.0, 101.0, 151.0, 251.0, 452.0, 959.0, 2283.0, 7002.0, 26717.0, 185233.0, 755189.0, 52134.0, 11471.0, 3495.0, 1388.0, 610.0, 329.0, 180.0, 119.0, 60.0, 59.0, 37.0, 26.0, 22.0, 14.0, 13.0, 11.0, 4.0, 9.0, 4.0, 7.0, 4.0, 0.0, 4.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0], "bins": [-0.11676025390625, -0.11324405670166016, -0.10972785949707031, -0.10621166229248047, -0.10269546508789062, -0.09917926788330078, -0.09566307067871094, -0.0921468734741211, -0.08863067626953125, -0.0851144790649414, -0.08159828186035156, -0.07808208465576172, -0.07456588745117188, -0.07104969024658203, -0.06753349304199219, -0.06401729583740234, -0.0605010986328125, -0.056984901428222656, -0.05346870422363281, -0.04995250701904297, -0.046436309814453125, -0.04292011260986328, -0.03940391540527344, -0.035887718200683594, -0.03237152099609375, -0.028855323791503906, -0.025339126586914062, -0.02182292938232422, -0.018306732177734375, -0.014790534973144531, -0.011274337768554688, -0.007758140563964844, -0.004241943359375, -0.0007257461547851562, 0.0027904510498046875, 0.006306648254394531, 0.009822845458984375, 0.013339042663574219, 0.016855239868164062, 0.020371437072753906, 0.02388763427734375, 0.027403831481933594, 0.030920028686523438, 0.03443622589111328, 0.037952423095703125, 0.04146862030029297, 0.04498481750488281, 0.048501014709472656, 0.0520172119140625, 0.055533409118652344, 0.05904960632324219, 0.06256580352783203, 0.06608200073242188, 0.06959819793701172, 0.07311439514160156, 0.0766305923461914, 0.08014678955078125, 0.0836629867553711, 0.08717918395996094, 0.09069538116455078, 0.09421157836914062, 0.09772777557373047, 0.10124397277832031, 0.10476016998291016, 0.1082763671875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 3.0, 3.0, 7.0, 8.0, 6.0, 11.0, 20.0, 25.0, 27.0, 43.0, 68.0, 77.0, 101.0, 102.0, 124.0, 81.0, 68.0, 63.0, 45.0, 32.0, 17.0, 18.0, 9.0, 3.0, 14.0, 5.0, 7.0, 2.0, 7.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4332275390625e-05, -3.3146701753139496e-05, -3.196112811565399e-05, -3.077555447816849e-05, -2.9589980840682983e-05, -2.840440720319748e-05, -2.7218833565711975e-05, -2.603325992822647e-05, -2.4847686290740967e-05, -2.3662112653255463e-05, -2.247653901576996e-05, -2.1290965378284454e-05, -2.010539174079895e-05, -1.8919818103313446e-05, -1.7734244465827942e-05, -1.6548670828342438e-05, -1.5363097190856934e-05, -1.417752355337143e-05, -1.2991949915885925e-05, -1.1806376278400421e-05, -1.0620802640914917e-05, -9.435229003429413e-06, -8.249655365943909e-06, -7.0640817284584045e-06, -5.8785080909729e-06, -4.692934453487396e-06, -3.507360816001892e-06, -2.321787178516388e-06, -1.1362135410308838e-06, 4.936009645462036e-08, 1.2349337339401245e-06, 2.4205073714256287e-06, 3.606081008911133e-06, 4.791654646396637e-06, 5.977228283882141e-06, 7.162801921367645e-06, 8.34837555885315e-06, 9.533949196338654e-06, 1.0719522833824158e-05, 1.1905096471309662e-05, 1.3090670108795166e-05, 1.427624374628067e-05, 1.5461817383766174e-05, 1.664739102125168e-05, 1.7832964658737183e-05, 1.9018538296222687e-05, 2.020411193370819e-05, 2.1389685571193695e-05, 2.25752592086792e-05, 2.3760832846164703e-05, 2.4946406483650208e-05, 2.613198012113571e-05, 2.7317553758621216e-05, 2.850312739610672e-05, 2.9688701033592224e-05, 3.087427467107773e-05, 3.205984830856323e-05, 3.3245421946048737e-05, 3.443099558353424e-05, 3.5616569221019745e-05, 3.680214285850525e-05, 3.798771649599075e-05, 3.917329013347626e-05, 4.035886377096176e-05, 4.1544437408447266e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 3.0, 10.0, 10.0, 21.0, 29.0, 47.0, 67.0, 96.0, 167.0, 307.0, 564.0, 1171.0, 2967.0, 9546.0, 40143.0, 360013.0, 575910.0, 41927.0, 9913.0, 3095.0, 1190.0, 568.0, 308.0, 173.0, 104.0, 66.0, 44.0, 31.0, 20.0, 16.0, 8.0, 6.0, 6.0, 6.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11328125, -0.10984992980957031, -0.10641860961914062, -0.10298728942871094, -0.09955596923828125, -0.09612464904785156, -0.09269332885742188, -0.08926200866699219, -0.0858306884765625, -0.08239936828613281, -0.07896804809570312, -0.07553672790527344, -0.07210540771484375, -0.06867408752441406, -0.06524276733398438, -0.06181144714355469, -0.058380126953125, -0.05494880676269531, -0.051517486572265625, -0.04808616638183594, -0.04465484619140625, -0.04122352600097656, -0.037792205810546875, -0.03436088562011719, -0.0309295654296875, -0.027498245239257812, -0.024066925048828125, -0.020635604858398438, -0.01720428466796875, -0.013772964477539062, -0.010341644287109375, -0.0069103240966796875, -0.00347900390625, -4.76837158203125e-05, 0.003383636474609375, 0.0068149566650390625, 0.01024627685546875, 0.013677597045898438, 0.017108917236328125, 0.020540237426757812, 0.0239715576171875, 0.027402877807617188, 0.030834197998046875, 0.03426551818847656, 0.03769683837890625, 0.04112815856933594, 0.044559478759765625, 0.04799079895019531, 0.051422119140625, 0.05485343933105469, 0.058284759521484375, 0.06171607971191406, 0.06514739990234375, 0.06857872009277344, 0.07201004028320312, 0.07544136047363281, 0.0788726806640625, 0.08230400085449219, 0.08573532104492188, 0.08916664123535156, 0.09259796142578125, 0.09602928161621094, 0.09946060180664062, 0.10289192199707031, 0.1063232421875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 5.0, 5.0, 4.0, 9.0, 7.0, 10.0, 12.0, 14.0, 17.0, 33.0, 42.0, 51.0, 57.0, 67.0, 100.0, 131.0, 90.0, 81.0, 61.0, 39.0, 28.0, 22.0, 18.0, 21.0, 25.0, 10.0, 8.0, 9.0, 5.0, 4.0, 9.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.10821533203125, -0.10547161102294922, -0.10272789001464844, -0.09998416900634766, -0.09724044799804688, -0.0944967269897461, -0.09175300598144531, -0.08900928497314453, -0.08626556396484375, -0.08352184295654297, -0.08077812194824219, -0.0780344009399414, -0.07529067993164062, -0.07254695892333984, -0.06980323791503906, -0.06705951690673828, -0.0643157958984375, -0.06157207489013672, -0.05882835388183594, -0.056084632873535156, -0.053340911865234375, -0.050597190856933594, -0.04785346984863281, -0.04510974884033203, -0.04236602783203125, -0.03962230682373047, -0.03687858581542969, -0.034134864807128906, -0.031391143798828125, -0.028647422790527344, -0.025903701782226562, -0.02315998077392578, -0.020416259765625, -0.01767253875732422, -0.014928817749023438, -0.012185096740722656, -0.009441375732421875, -0.006697654724121094, -0.0039539337158203125, -0.0012102127075195312, 0.00153350830078125, 0.004277229309082031, 0.0070209503173828125, 0.009764671325683594, 0.012508392333984375, 0.015252113342285156, 0.017995834350585938, 0.02073955535888672, 0.0234832763671875, 0.02622699737548828, 0.028970718383789062, 0.031714439392089844, 0.034458160400390625, 0.037201881408691406, 0.03994560241699219, 0.04268932342529297, 0.04543304443359375, 0.04817676544189453, 0.05092048645019531, 0.053664207458496094, 0.056407928466796875, 0.059151649475097656, 0.06189537048339844, 0.06463909149169922, 0.0673828125]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 19.0, 83.0, 317.0, 482.0, 71.0, 12.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.450579643249512, -6.266711235046387, -6.0828423500061035, -5.8989739418029785, -5.715105056762695, -5.53123664855957, -5.347367763519287, -5.163499355316162, -4.979630470275879, -4.795762062072754, -4.611893177032471, -4.428024768829346, -4.2441558837890625, -4.0602874755859375, -3.8764185905456543, -3.6925501823425293, -3.508681535720825, -3.324812889099121, -3.140944242477417, -2.957075595855713, -2.773206949234009, -2.5893383026123047, -2.4054698944091797, -2.2216010093688965, -2.0377326011657715, -1.8538639545440674, -1.6699953079223633, -1.4861266613006592, -1.302258014678955, -1.118389368057251, -0.9345208406448364, -0.7506521940231323, -0.5667834281921387, -0.38291478157043457, -0.19904616475105286, -0.015177547931671143, 0.16869109869003296, 0.35255974531173706, 0.5364283323287964, 0.7202969789505005, 0.9041656255722046, 1.0880342721939087, 1.2719029188156128, 1.4557714462280273, 1.6396400928497314, 1.8235087394714355, 2.0073773860931396, 2.1912460327148438, 2.375114679336548, 2.558983325958252, 2.742851972579956, 2.92672061920166, 3.1105892658233643, 3.2944579124450684, 3.4783263206481934, 3.6621952056884766, 3.8460636138916016, 4.029932022094727, 4.21380090713501, 4.397669315338135, 4.581538200378418, 4.765406608581543, 4.949275493621826, 5.133143901824951, 5.317012786865234]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 5.0, 5.0, 5.0, 5.0, 6.0, 4.0, 9.0, 9.0, 9.0, 14.0, 12.0, 12.0, 16.0, 25.0, 18.0, 23.0, 12.0, 20.0, 38.0, 24.0, 42.0, 58.0, 82.0, 97.0, 103.0, 55.0, 31.0, 26.0, 25.0, 23.0, 17.0, 15.0, 31.0, 20.0, 20.0, 6.0, 16.0, 5.0, 13.0, 11.0, 7.0, 9.0, 9.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0], "bins": [-1.3335986137390137, -1.293694257736206, -1.2537897825241089, -1.2138853073120117, -1.173980951309204, -1.1340765953063965, -1.0941721200942993, -1.0542676448822021, -1.0143632888793945, -0.9744588732719421, -0.9345544576644897, -0.8946500420570374, -0.854745626449585, -0.8148412108421326, -0.7749367952346802, -0.7350323796272278, -0.6951279640197754, -0.655223548412323, -0.6153191328048706, -0.5754147171974182, -0.5355103015899658, -0.4956058859825134, -0.45570147037506104, -0.41579705476760864, -0.37589263916015625, -0.33598822355270386, -0.29608380794525146, -0.2561793923377991, -0.21627497673034668, -0.1763705611228943, -0.1364661455154419, -0.0965617299079895, -0.05665719509124756, -0.016752779483795166, 0.023151636123657227, 0.06305605173110962, 0.10296046733856201, 0.1428648829460144, 0.1827692985534668, 0.2226737141609192, 0.2625781297683716, 0.302482545375824, 0.34238696098327637, 0.38229137659072876, 0.42219579219818115, 0.46210020780563354, 0.5020046234130859, 0.5419090390205383, 0.5818134546279907, 0.6217178702354431, 0.6616222858428955, 0.7015267014503479, 0.7414311170578003, 0.7813355326652527, 0.8212399482727051, 0.8611443638801575, 0.9010487794876099, 0.9409531950950623, 0.9808576107025146, 1.0207619667053223, 1.0606664419174194, 1.1005709171295166, 1.1404752731323242, 1.1803796291351318, 1.220284104347229]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 4.0, 6.0, 9.0, 5.0, 14.0, 10.0, 21.0, 28.0, 47.0, 79.0, 118.0, 220.0, 449.0, 1042.0, 2538.0, 7073.0, 30959.0, 294358.0, 2829473.0, 942927.0, 67004.0, 11899.0, 3382.0, 1339.0, 552.0, 301.0, 150.0, 90.0, 56.0, 34.0, 22.0, 18.0, 14.0, 7.0, 5.0, 5.0, 7.0, 6.0, 3.0, 1.0, 2.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.256591796875, -0.2473297119140625, -0.238067626953125, -0.2288055419921875, -0.21954345703125, -0.2102813720703125, -0.201019287109375, -0.1917572021484375, -0.1824951171875, -0.1732330322265625, -0.163970947265625, -0.1547088623046875, -0.14544677734375, -0.1361846923828125, -0.126922607421875, -0.1176605224609375, -0.1083984375, -0.0991363525390625, -0.089874267578125, -0.0806121826171875, -0.07135009765625, -0.0620880126953125, -0.052825927734375, -0.0435638427734375, -0.0343017578125, -0.0250396728515625, -0.015777587890625, -0.0065155029296875, 0.00274658203125, 0.0120086669921875, 0.021270751953125, 0.0305328369140625, 0.039794921875, 0.0490570068359375, 0.058319091796875, 0.0675811767578125, 0.07684326171875, 0.0861053466796875, 0.095367431640625, 0.1046295166015625, 0.1138916015625, 0.1231536865234375, 0.132415771484375, 0.1416778564453125, 0.15093994140625, 0.1602020263671875, 0.169464111328125, 0.1787261962890625, 0.18798828125, 0.1972503662109375, 0.206512451171875, 0.2157745361328125, 0.22503662109375, 0.2342987060546875, 0.243560791015625, 0.2528228759765625, 0.2620849609375, 0.2713470458984375, 0.280609130859375, 0.2898712158203125, 0.29913330078125, 0.3083953857421875, 0.317657470703125, 0.3269195556640625, 0.336181640625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 5.0, 4.0, 5.0, 4.0, 16.0, 11.0, 20.0, 23.0, 27.0, 45.0, 46.0, 49.0, 57.0, 69.0, 65.0, 79.0, 61.0, 67.0, 50.0, 62.0, 50.0, 41.0, 32.0, 32.0, 24.0, 22.0, 15.0, 9.0, 6.0, 4.0, 6.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1160888671875, -0.11193084716796875, -0.1077728271484375, -0.10361480712890625, -0.099456787109375, -0.09529876708984375, -0.0911407470703125, -0.08698272705078125, -0.08282470703125, -0.07866668701171875, -0.0745086669921875, -0.07035064697265625, -0.066192626953125, -0.06203460693359375, -0.0578765869140625, -0.05371856689453125, -0.049560546875, -0.04540252685546875, -0.0412445068359375, -0.03708648681640625, -0.032928466796875, -0.02877044677734375, -0.0246124267578125, -0.02045440673828125, -0.01629638671875, -0.01213836669921875, -0.0079803466796875, -0.00382232666015625, 0.000335693359375, 0.00449371337890625, 0.0086517333984375, 0.01280975341796875, 0.0169677734375, 0.02112579345703125, 0.0252838134765625, 0.02944183349609375, 0.033599853515625, 0.03775787353515625, 0.0419158935546875, 0.04607391357421875, 0.05023193359375, 0.05438995361328125, 0.0585479736328125, 0.06270599365234375, 0.066864013671875, 0.07102203369140625, 0.0751800537109375, 0.07933807373046875, 0.08349609375, 0.08765411376953125, 0.0918121337890625, 0.09597015380859375, 0.100128173828125, 0.10428619384765625, 0.1084442138671875, 0.11260223388671875, 0.11676025390625, 0.12091827392578125, 0.1250762939453125, 0.12923431396484375, 0.133392333984375, 0.13755035400390625, 0.1417083740234375, 0.14586639404296875, 0.1500244140625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 6.0, 4.0, 4.0, 8.0, 7.0, 20.0, 35.0, 70.0, 147.0, 388.0, 913.0, 3120.0, 49243.0, 4121428.0, 15346.0, 2204.0, 734.0, 284.0, 152.0, 73.0, 30.0, 20.0, 17.0, 4.0, 2.0, 2.0, 5.0, 3.0, 5.0, 0.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1884765625, -1.146575927734375, -1.10467529296875, -1.062774658203125, -1.0208740234375, -0.978973388671875, -0.93707275390625, -0.895172119140625, -0.853271484375, -0.811370849609375, -0.76947021484375, -0.727569580078125, -0.6856689453125, -0.643768310546875, -0.60186767578125, -0.559967041015625, -0.51806640625, -0.476165771484375, -0.43426513671875, -0.392364501953125, -0.3504638671875, -0.308563232421875, -0.26666259765625, -0.224761962890625, -0.182861328125, -0.140960693359375, -0.09906005859375, -0.057159423828125, -0.0152587890625, 0.026641845703125, 0.06854248046875, 0.110443115234375, 0.15234375, 0.194244384765625, 0.23614501953125, 0.278045654296875, 0.3199462890625, 0.361846923828125, 0.40374755859375, 0.445648193359375, 0.487548828125, 0.529449462890625, 0.57135009765625, 0.613250732421875, 0.6551513671875, 0.697052001953125, 0.73895263671875, 0.780853271484375, 0.82275390625, 0.864654541015625, 0.90655517578125, 0.948455810546875, 0.9903564453125, 1.032257080078125, 1.07415771484375, 1.116058349609375, 1.157958984375, 1.199859619140625, 1.24176025390625, 1.283660888671875, 1.3255615234375, 1.367462158203125, 1.40936279296875, 1.451263427734375, 1.4931640625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 17.0, 25.0, 40.0, 76.0, 137.0, 291.0, 546.0, 925.0, 921.0, 508.0, 272.0, 112.0, 78.0, 45.0, 29.0, 17.0, 8.0, 9.0, 5.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50341796875, -0.48471832275390625, -0.4660186767578125, -0.44731903076171875, -0.428619384765625, -0.40991973876953125, -0.3912200927734375, -0.37252044677734375, -0.35382080078125, -0.33512115478515625, -0.3164215087890625, -0.29772186279296875, -0.279022216796875, -0.26032257080078125, -0.2416229248046875, -0.22292327880859375, -0.2042236328125, -0.18552398681640625, -0.1668243408203125, -0.14812469482421875, -0.129425048828125, -0.11072540283203125, -0.0920257568359375, -0.07332611083984375, -0.05462646484375, -0.03592681884765625, -0.0172271728515625, 0.00147247314453125, 0.020172119140625, 0.03887176513671875, 0.0575714111328125, 0.07627105712890625, 0.094970703125, 0.11367034912109375, 0.1323699951171875, 0.15106964111328125, 0.169769287109375, 0.18846893310546875, 0.2071685791015625, 0.22586822509765625, 0.24456787109375, 0.26326751708984375, 0.2819671630859375, 0.30066680908203125, 0.319366455078125, 0.33806610107421875, 0.3567657470703125, 0.37546539306640625, 0.3941650390625, 0.41286468505859375, 0.4315643310546875, 0.45026397705078125, 0.468963623046875, 0.48766326904296875, 0.5063629150390625, 0.5250625610351562, 0.54376220703125, 0.5624618530273438, 0.5811614990234375, 0.5998611450195312, 0.618560791015625, 0.6372604370117188, 0.6559600830078125, 0.6746597290039062, 0.693359375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 4.0, 5.0, 7.0, 7.0, 16.0, 20.0, 47.0, 77.0, 118.0, 198.0, 157.0, 132.0, 72.0, 37.0, 26.0, 16.0, 8.0, 8.0, 10.0, 4.0, 5.0, 3.0, 4.0, 3.0, 3.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.406118392944336, -4.267202377319336, -4.128286838531494, -3.989370822906494, -3.850454807281494, -3.7115390300750732, -3.5726232528686523, -3.4337072372436523, -3.2947914600372314, -3.1558756828308105, -3.0169596672058105, -2.8780438899993896, -2.7391281127929688, -2.6002120971679688, -2.461296319961548, -2.322380542755127, -2.183464527130127, -2.044548749923706, -1.905632734298706, -1.7667169570922852, -1.6278010606765747, -1.4888851642608643, -1.3499693870544434, -1.211053490638733, -1.0721375942230225, -0.933221697807312, -0.7943058609962463, -0.6553900241851807, -0.5164741277694702, -0.37755823135375977, -0.2386423945426941, -0.09972655773162842, 0.039189815521240234, 0.1781056821346283, 0.31702154874801636, 0.4559374153614044, 0.5948532819747925, 0.7337691783905029, 0.8726850152015686, 1.0116008520126343, 1.1505167484283447, 1.2894326448440552, 1.4283485412597656, 1.5672643184661865, 1.706180214881897, 1.8450961112976074, 1.9840118885040283, 2.122927665710449, 2.261843681335449, 2.40075945854187, 2.53967547416687, 2.678591251373291, 2.817507266998291, 2.956423044204712, 3.095338821411133, 3.234254837036133, 3.3731706142425537, 3.5120863914489746, 3.6510024070739746, 3.7899181842803955, 3.9288339614868164, 4.067749977111816, 4.206665992736816, 4.345581531524658, 4.484497547149658]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 5.0, 1.0, 7.0, 11.0, 17.0, 13.0, 23.0, 45.0, 37.0, 42.0, 69.0, 71.0, 89.0, 86.0, 110.0, 84.0, 73.0, 54.0, 48.0, 38.0, 23.0, 20.0, 10.0, 9.0, 3.0, 4.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.6779420375823975, -3.5676016807556152, -3.457261323928833, -3.346920967102051, -3.2365806102752686, -3.1262402534484863, -3.015900135040283, -2.905559539794922, -2.7952194213867188, -2.6848790645599365, -2.5745387077331543, -2.464198350906372, -2.35385799407959, -2.2435176372528076, -2.1331772804260254, -2.0228371620178223, -1.912496566772461, -1.8021562099456787, -1.6918158531188965, -1.5814754962921143, -1.471135139465332, -1.3607947826385498, -1.2504545450210571, -1.140114188194275, -1.0297738313674927, -0.9194334745407104, -0.8090931177139282, -0.6987528204917908, -0.5884124636650085, -0.4780721068382263, -0.36773180961608887, -0.25739145278930664, -0.1470508575439453, -0.03671051561832428, 0.07362982630729675, 0.1839701533317566, 0.2943105101585388, 0.40465086698532104, 0.5149911642074585, 0.6253315210342407, 0.735671877861023, 0.8460122346878052, 0.9563525915145874, 1.06669282913208, 1.1770331859588623, 1.2873735427856445, 1.3977138996124268, 1.508054256439209, 1.6183946132659912, 1.7287349700927734, 1.8390753269195557, 1.949415683746338, 2.05975604057312, 2.1700963973999023, 2.2804365158081055, 2.390777111053467, 2.50111722946167, 2.611457586288452, 2.7217979431152344, 2.8321382999420166, 2.942478656768799, 3.052819013595581, 3.1631593704223633, 3.2734994888305664, 3.3838400840759277]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 3.0, 0.0, 3.0, 5.0, 4.0, 16.0, 18.0, 22.0, 25.0, 49.0, 91.0, 165.0, 248.0, 503.0, 1212.0, 3409.0, 12143.0, 78253.0, 738597.0, 184522.0, 20966.0, 5061.0, 1801.0, 686.0, 294.0, 187.0, 98.0, 56.0, 31.0, 26.0, 16.0, 15.0, 12.0, 3.0, 2.0, 7.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.319580078125, -0.30843353271484375, -0.2972869873046875, -0.28614044189453125, -0.274993896484375, -0.26384735107421875, -0.2527008056640625, -0.24155426025390625, -0.23040771484375, -0.21926116943359375, -0.2081146240234375, -0.19696807861328125, -0.185821533203125, -0.17467498779296875, -0.1635284423828125, -0.15238189697265625, -0.1412353515625, -0.13008880615234375, -0.1189422607421875, -0.10779571533203125, -0.096649169921875, -0.08550262451171875, -0.0743560791015625, -0.06320953369140625, -0.05206298828125, -0.04091644287109375, -0.0297698974609375, -0.01862335205078125, -0.007476806640625, 0.00366973876953125, 0.0148162841796875, 0.02596282958984375, 0.037109375, 0.04825592041015625, 0.0594024658203125, 0.07054901123046875, 0.081695556640625, 0.09284210205078125, 0.1039886474609375, 0.11513519287109375, 0.12628173828125, 0.13742828369140625, 0.1485748291015625, 0.15972137451171875, 0.170867919921875, 0.18201446533203125, 0.1931610107421875, 0.20430755615234375, 0.2154541015625, 0.22660064697265625, 0.2377471923828125, 0.24889373779296875, 0.260040283203125, 0.27118682861328125, 0.2823333740234375, 0.29347991943359375, 0.30462646484375, 0.31577301025390625, 0.3269195556640625, 0.33806610107421875, 0.349212646484375, 0.36035919189453125, 0.3715057373046875, 0.38265228271484375, 0.393798828125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 3.0, 1.0, 1.0, 5.0, 4.0, 5.0, 13.0, 20.0, 30.0, 33.0, 42.0, 58.0, 72.0, 71.0, 76.0, 69.0, 100.0, 82.0, 71.0, 70.0, 52.0, 27.0, 30.0, 19.0, 20.0, 12.0, 5.0, 6.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2015380859375, -0.19476699829101562, -0.18799591064453125, -0.18122482299804688, -0.1744537353515625, -0.16768264770507812, -0.16091156005859375, -0.15414047241210938, -0.147369384765625, -0.14059829711914062, -0.13382720947265625, -0.12705612182617188, -0.1202850341796875, -0.11351394653320312, -0.10674285888671875, -0.09997177124023438, -0.09320068359375, -0.08642959594726562, -0.07965850830078125, -0.07288742065429688, -0.0661163330078125, -0.059345245361328125, -0.05257415771484375, -0.045803070068359375, -0.039031982421875, -0.032260894775390625, -0.02548980712890625, -0.018718719482421875, -0.0119476318359375, -0.005176544189453125, 0.00159454345703125, 0.008365631103515625, 0.01513671875, 0.021907806396484375, 0.02867889404296875, 0.035449981689453125, 0.0422210693359375, 0.048992156982421875, 0.05576324462890625, 0.06253433227539062, 0.069305419921875, 0.07607650756835938, 0.08284759521484375, 0.08961868286132812, 0.0963897705078125, 0.10316085815429688, 0.10993194580078125, 0.11670303344726562, 0.12347412109375, 0.13024520874023438, 0.13701629638671875, 0.14378738403320312, 0.1505584716796875, 0.15732955932617188, 0.16410064697265625, 0.17087173461914062, 0.177642822265625, 0.18441390991210938, 0.19118499755859375, 0.19795608520507812, 0.2047271728515625, 0.21149826049804688, 0.21826934814453125, 0.22504043579101562, 0.2318115234375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 6.0, 7.0, 8.0, 10.0, 5.0, 13.0, 23.0, 23.0, 37.0, 40.0, 64.0, 86.0, 118.0, 180.0, 338.0, 629.0, 1695.0, 5969.0, 41641.0, 871731.0, 111030.0, 10570.0, 2408.0, 873.0, 410.0, 211.0, 135.0, 85.0, 43.0, 50.0, 33.0, 24.0, 13.0, 9.0, 15.0, 6.0, 5.0, 4.0, 5.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.3701171875, -0.3600273132324219, -0.34993743896484375, -0.3398475646972656, -0.3297576904296875, -0.3196678161621094, -0.30957794189453125, -0.2994880676269531, -0.289398193359375, -0.2793083190917969, -0.26921844482421875, -0.2591285705566406, -0.2490386962890625, -0.23894882202148438, -0.22885894775390625, -0.21876907348632812, -0.20867919921875, -0.19858932495117188, -0.18849945068359375, -0.17840957641601562, -0.1683197021484375, -0.15822982788085938, -0.14813995361328125, -0.13805007934570312, -0.127960205078125, -0.11787033081054688, -0.10778045654296875, -0.09769058227539062, -0.0876007080078125, -0.07751083374023438, -0.06742095947265625, -0.057331085205078125, -0.0472412109375, -0.037151336669921875, -0.02706146240234375, -0.016971588134765625, -0.0068817138671875, 0.003208160400390625, 0.01329803466796875, 0.023387908935546875, 0.033477783203125, 0.043567657470703125, 0.05365753173828125, 0.06374740600585938, 0.0738372802734375, 0.08392715454101562, 0.09401702880859375, 0.10410690307617188, 0.11419677734375, 0.12428665161132812, 0.13437652587890625, 0.14446640014648438, 0.1545562744140625, 0.16464614868164062, 0.17473602294921875, 0.18482589721679688, 0.194915771484375, 0.20500564575195312, 0.21509552001953125, 0.22518539428710938, 0.2352752685546875, 0.24536514282226562, 0.25545501708984375, 0.2655448913574219, 0.275634765625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 5.0, 6.0, 8.0, 9.0, 10.0, 12.0, 20.0, 28.0, 28.0, 28.0, 38.0, 40.0, 52.0, 84.0, 89.0, 98.0, 93.0, 79.0, 57.0, 47.0, 29.0, 24.0, 19.0, 22.0, 20.0, 17.0, 9.0, 7.0, 8.0, 7.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.8486328125, -0.827789306640625, -0.80694580078125, -0.786102294921875, -0.7652587890625, -0.744415283203125, -0.72357177734375, -0.702728271484375, -0.681884765625, -0.661041259765625, -0.64019775390625, -0.619354248046875, -0.5985107421875, -0.577667236328125, -0.55682373046875, -0.535980224609375, -0.51513671875, -0.494293212890625, -0.47344970703125, -0.452606201171875, -0.4317626953125, -0.410919189453125, -0.39007568359375, -0.369232177734375, -0.348388671875, -0.327545166015625, -0.30670166015625, -0.285858154296875, -0.2650146484375, -0.244171142578125, -0.22332763671875, -0.202484130859375, -0.181640625, -0.160797119140625, -0.13995361328125, -0.119110107421875, -0.0982666015625, -0.077423095703125, -0.05657958984375, -0.035736083984375, -0.014892578125, 0.005950927734375, 0.02679443359375, 0.047637939453125, 0.0684814453125, 0.089324951171875, 0.11016845703125, 0.131011962890625, 0.15185546875, 0.172698974609375, 0.19354248046875, 0.214385986328125, 0.2352294921875, 0.256072998046875, 0.27691650390625, 0.297760009765625, 0.318603515625, 0.339447021484375, 0.36029052734375, 0.381134033203125, 0.4019775390625, 0.422821044921875, 0.44366455078125, 0.464508056640625, 0.4853515625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 5.0, 3.0, 2.0, 7.0, 6.0, 6.0, 9.0, 17.0, 16.0, 23.0, 39.0, 63.0, 90.0, 142.0, 252.0, 529.0, 1108.0, 2760.0, 8171.0, 35201.0, 833650.0, 139401.0, 18042.0, 5194.0, 1968.0, 842.0, 403.0, 226.0, 131.0, 79.0, 60.0, 30.0, 21.0, 18.0, 19.0, 6.0, 1.0, 7.0, 9.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0740966796875, -0.07213640213012695, -0.0701761245727539, -0.06821584701538086, -0.06625556945800781, -0.06429529190063477, -0.06233501434326172, -0.06037473678588867, -0.058414459228515625, -0.05645418167114258, -0.05449390411376953, -0.052533626556396484, -0.05057334899902344, -0.04861307144165039, -0.046652793884277344, -0.0446925163269043, -0.04273223876953125, -0.0407719612121582, -0.038811683654785156, -0.03685140609741211, -0.03489112854003906, -0.032930850982666016, -0.03097057342529297, -0.029010295867919922, -0.027050018310546875, -0.025089740753173828, -0.02312946319580078, -0.021169185638427734, -0.019208908081054688, -0.01724863052368164, -0.015288352966308594, -0.013328075408935547, -0.0113677978515625, -0.009407520294189453, -0.007447242736816406, -0.005486965179443359, -0.0035266876220703125, -0.0015664100646972656, 0.00039386749267578125, 0.002354145050048828, 0.004314422607421875, 0.006274700164794922, 0.008234977722167969, 0.010195255279541016, 0.012155532836914062, 0.01411581039428711, 0.016076087951660156, 0.018036365509033203, 0.01999664306640625, 0.021956920623779297, 0.023917198181152344, 0.02587747573852539, 0.027837753295898438, 0.029798030853271484, 0.03175830841064453, 0.03371858596801758, 0.035678863525390625, 0.03763914108276367, 0.03959941864013672, 0.041559696197509766, 0.04351997375488281, 0.04548025131225586, 0.047440528869628906, 0.04940080642700195, 0.051361083984375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 6.0, 7.0, 2.0, 4.0, 7.0, 9.0, 11.0, 13.0, 11.0, 23.0, 30.0, 42.0, 47.0, 46.0, 75.0, 100.0, 109.0, 78.0, 73.0, 63.0, 56.0, 53.0, 30.0, 13.0, 17.0, 15.0, 13.0, 9.0, 8.0, 4.0, 3.0, 8.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6166439056396484e-05, -2.5323592126369476e-05, -2.4480745196342468e-05, -2.363789826631546e-05, -2.2795051336288452e-05, -2.1952204406261444e-05, -2.1109357476234436e-05, -2.0266510546207428e-05, -1.942366361618042e-05, -1.8580816686153412e-05, -1.7737969756126404e-05, -1.6895122826099396e-05, -1.6052275896072388e-05, -1.520942896604538e-05, -1.4366582036018372e-05, -1.3523735105991364e-05, -1.2680888175964355e-05, -1.1838041245937347e-05, -1.099519431591034e-05, -1.0152347385883331e-05, -9.309500455856323e-06, -8.466653525829315e-06, -7.623806595802307e-06, -6.780959665775299e-06, -5.938112735748291e-06, -5.095265805721283e-06, -4.252418875694275e-06, -3.409571945667267e-06, -2.566725015640259e-06, -1.7238780856132507e-06, -8.810311555862427e-07, -3.818422555923462e-08, 8.046627044677734e-07, 1.6475096344947815e-06, 2.4903565645217896e-06, 3.3332034945487976e-06, 4.176050424575806e-06, 5.018897354602814e-06, 5.861744284629822e-06, 6.70459121465683e-06, 7.547438144683838e-06, 8.390285074710846e-06, 9.233132004737854e-06, 1.0075978934764862e-05, 1.091882586479187e-05, 1.1761672794818878e-05, 1.2604519724845886e-05, 1.3447366654872894e-05, 1.4290213584899902e-05, 1.513306051492691e-05, 1.597590744495392e-05, 1.6818754374980927e-05, 1.7661601305007935e-05, 1.8504448235034943e-05, 1.934729516506195e-05, 2.019014209508896e-05, 2.1032989025115967e-05, 2.1875835955142975e-05, 2.2718682885169983e-05, 2.356152981519699e-05, 2.4404376745224e-05, 2.5247223675251007e-05, 2.6090070605278015e-05, 2.6932917535305023e-05, 2.777576446533203e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 3.0, 4.0, 4.0, 13.0, 19.0, 14.0, 20.0, 42.0, 63.0, 84.0, 133.0, 180.0, 354.0, 569.0, 1082.0, 2085.0, 4539.0, 11174.0, 33435.0, 206948.0, 713746.0, 47890.0, 14635.0, 5699.0, 2644.0, 1335.0, 705.0, 414.0, 251.0, 147.0, 91.0, 73.0, 46.0, 26.0, 35.0, 17.0, 11.0, 11.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.041229248046875, -0.039813995361328125, -0.03839874267578125, -0.036983489990234375, -0.0355682373046875, -0.034152984619140625, -0.03273773193359375, -0.031322479248046875, -0.0299072265625, -0.028491973876953125, -0.02707672119140625, -0.025661468505859375, -0.0242462158203125, -0.022830963134765625, -0.02141571044921875, -0.020000457763671875, -0.018585205078125, -0.017169952392578125, -0.01575469970703125, -0.014339447021484375, -0.0129241943359375, -0.011508941650390625, -0.01009368896484375, -0.008678436279296875, -0.00726318359375, -0.005847930908203125, -0.00443267822265625, -0.003017425537109375, -0.0016021728515625, -0.000186920166015625, 0.00122833251953125, 0.002643585205078125, 0.004058837890625, 0.005474090576171875, 0.00688934326171875, 0.008304595947265625, 0.0097198486328125, 0.011135101318359375, 0.01255035400390625, 0.013965606689453125, 0.015380859375, 0.016796112060546875, 0.01821136474609375, 0.019626617431640625, 0.0210418701171875, 0.022457122802734375, 0.02387237548828125, 0.025287628173828125, 0.026702880859375, 0.028118133544921875, 0.02953338623046875, 0.030948638916015625, 0.0323638916015625, 0.033779144287109375, 0.03519439697265625, 0.036609649658203125, 0.03802490234375, 0.039440155029296875, 0.04085540771484375, 0.042270660400390625, 0.0436859130859375, 0.045101165771484375, 0.04651641845703125, 0.047931671142578125, 0.049346923828125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 3.0, 2.0, 9.0, 10.0, 6.0, 7.0, 17.0, 14.0, 18.0, 22.0, 27.0, 40.0, 57.0, 65.0, 92.0, 131.0, 90.0, 85.0, 70.0, 50.0, 35.0, 27.0, 21.0, 21.0, 17.0, 10.0, 9.0, 8.0, 7.0, 9.0, 3.0, 5.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05010986328125, -0.04842948913574219, -0.046749114990234375, -0.04506874084472656, -0.04338836669921875, -0.04170799255371094, -0.040027618408203125, -0.03834724426269531, -0.0366668701171875, -0.03498649597167969, -0.033306121826171875, -0.03162574768066406, -0.02994537353515625, -0.028264999389648438, -0.026584625244140625, -0.024904251098632812, -0.023223876953125, -0.021543502807617188, -0.019863128662109375, -0.018182754516601562, -0.01650238037109375, -0.014822006225585938, -0.013141632080078125, -0.011461257934570312, -0.0097808837890625, -0.008100509643554688, -0.006420135498046875, -0.0047397613525390625, -0.00305938720703125, -0.0013790130615234375, 0.000301361083984375, 0.0019817352294921875, 0.003662109375, 0.0053424835205078125, 0.007022857666015625, 0.008703231811523438, 0.01038360595703125, 0.012063980102539062, 0.013744354248046875, 0.015424728393554688, 0.0171051025390625, 0.018785476684570312, 0.020465850830078125, 0.022146224975585938, 0.02382659912109375, 0.025506973266601562, 0.027187347412109375, 0.028867721557617188, 0.030548095703125, 0.03222846984863281, 0.033908843994140625, 0.03558921813964844, 0.03726959228515625, 0.03894996643066406, 0.040630340576171875, 0.04231071472167969, 0.0439910888671875, 0.04567146301269531, 0.047351837158203125, 0.04903221130371094, 0.05071258544921875, 0.05239295959472656, 0.054073333740234375, 0.05575370788574219, 0.05743408203125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 5.0, 9.0, 17.0, 26.0, 44.0, 89.0, 398.0, 248.0, 96.0, 27.0, 14.0, 12.0, 6.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7262933254241943, -2.6408090591430664, -2.5553250312805176, -2.4698407649993896, -2.3843564987182617, -2.298872470855713, -2.213388204574585, -2.127903938293457, -2.042419910430908, -1.9569357633590698, -1.871451497077942, -1.7859673500061035, -1.7004830837249756, -1.6149989366531372, -1.5295147895812988, -1.444030523300171, -1.358546257019043, -1.2730621099472046, -1.1875778436660767, -1.1020936965942383, -1.0166094303131104, -0.931125283241272, -0.8456411361694336, -0.7601569294929504, -0.6746727228164673, -0.5891885161399841, -0.503704309463501, -0.4182201623916626, -0.33273595571517944, -0.2472517490386963, -0.1617676019668579, -0.07628339529037476, 0.0092010498046875, 0.09468524158000946, 0.18016943335533142, 0.2656536102294922, 0.35113781690597534, 0.4366220235824585, 0.5221061706542969, 0.60759037733078, 0.6930745840072632, 0.7785587906837463, 0.8640429973602295, 0.9495271444320679, 1.0350112915039062, 1.1204955577850342, 1.2059797048568726, 1.291463851928711, 1.3769481182098389, 1.4624322652816772, 1.5479165315628052, 1.6334006786346436, 1.7188849449157715, 1.8043690919876099, 1.8898532390594482, 1.9753375053405762, 2.060821533203125, 2.146305799484253, 2.2317898273468018, 2.3172740936279297, 2.4027583599090576, 2.4882426261901855, 2.5737266540527344, 2.6592109203338623, 2.7446951866149902]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 3.0, 7.0, 14.0, 14.0, 10.0, 21.0, 18.0, 24.0, 30.0, 21.0, 56.0, 98.0, 292.0, 123.0, 55.0, 34.0, 29.0, 27.0, 35.0, 19.0, 26.0, 16.0, 7.0, 5.0, 1.0, 3.0, 6.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-2.7694602012634277, -2.7011349201202393, -2.632809638977051, -2.5644843578338623, -2.496159076690674, -2.4278337955474854, -2.359508514404297, -2.2911832332611084, -2.22285795211792, -2.1545326709747314, -2.086207389831543, -2.0178821086883545, -1.949556827545166, -1.8812315464019775, -1.812906265258789, -1.7445809841156006, -1.6762555837631226, -1.607930302619934, -1.5396050214767456, -1.4712797403335571, -1.4029544591903687, -1.3346291780471802, -1.2663037776947021, -1.1979784965515137, -1.1296532154083252, -1.0613279342651367, -0.9930026531219482, -0.9246773719787598, -0.8563520908355713, -0.7880268096923828, -0.7197014689445496, -0.6513761878013611, -0.5830509662628174, -0.5147256851196289, -0.44640040397644043, -0.37807509303092957, -0.3097498118877411, -0.2414245307445526, -0.17309921979904175, -0.10477393865585327, -0.036448657512664795, 0.03187663108110428, 0.10020191967487335, 0.16852721571922302, 0.2368524968624115, 0.3051777780056, 0.37350308895111084, 0.4418283700942993, 0.5101536512374878, 0.5784789323806763, 0.6468042135238647, 0.7151294946670532, 0.7834547758102417, 0.8517800569534302, 0.9201053977012634, 0.9884306788444519, 1.0567560195922852, 1.1250813007354736, 1.193406581878662, 1.2617318630218506, 1.330057144165039, 1.3983824253082275, 1.466707706451416, 1.5350329875946045, 1.603358268737793]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 3.0, 2.0, 6.0, 7.0, 15.0, 18.0, 22.0, 23.0, 44.0, 38.0, 54.0, 63.0, 220.0, 159.0, 74.0, 57.0, 36.0, 46.0, 24.0, 20.0, 26.0, 16.0, 3.0, 11.0, 7.0, 6.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1494140625, -0.14316940307617188, -0.13692474365234375, -0.13068008422851562, -0.1244354248046875, -0.11819076538085938, -0.11194610595703125, -0.10570144653320312, -0.099456787109375, -0.09321212768554688, -0.08696746826171875, -0.08072280883789062, -0.0744781494140625, -0.06823348999023438, -0.06198883056640625, -0.055744171142578125, -0.04949951171875, -0.043254852294921875, -0.03701019287109375, -0.030765533447265625, -0.0245208740234375, -0.018276214599609375, -0.01203155517578125, -0.005786895751953125, 0.000457763671875, 0.006702423095703125, 0.01294708251953125, 0.019191741943359375, 0.0254364013671875, 0.031681060791015625, 0.03792572021484375, 0.044170379638671875, 0.0504150390625, 0.056659698486328125, 0.06290435791015625, 0.06914901733398438, 0.0753936767578125, 0.08163833618164062, 0.08788299560546875, 0.09412765502929688, 0.100372314453125, 0.10661697387695312, 0.11286163330078125, 0.11910629272460938, 0.1253509521484375, 0.13159561157226562, 0.13784027099609375, 0.14408493041992188, 0.15032958984375, 0.15657424926757812, 0.16281890869140625, 0.16906356811523438, 0.1753082275390625, 0.18155288696289062, 0.18779754638671875, 0.19404220581054688, 0.200286865234375, 0.20653152465820312, 0.21277618408203125, 0.21902084350585938, 0.2252655029296875, 0.23151016235351562, 0.23775482177734375, 0.24399948120117188, 0.250244140625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 8.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 7.0, 9.0, 5.0, 8.0, 13.0, 29.0, 42.0, 78.0, 96.0, 255.0, 985.0, 7980.0, 8365612.0, 11657.0, 1196.0, 279.0, 133.0, 81.0, 46.0, 16.0, 4.0, 8.0, 10.0, 3.0, 6.0, 5.0, 3.0, 4.0, 5.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5400357246398926, -2.4705750942230225, -2.4011144638061523, -2.3316540718078613, -2.262193441390991, -2.192732810974121, -2.12327241897583, -2.05381178855896, -1.9843511581420898, -1.9148905277252197, -1.8454300165176392, -1.7759695053100586, -1.7065088748931885, -1.6370482444763184, -1.5675877332687378, -1.4981272220611572, -1.428666591644287, -1.359205961227417, -1.2897454500198364, -1.2202849388122559, -1.1508243083953857, -1.0813636779785156, -1.011903166770935, -0.9424425959587097, -0.8729820251464844, -0.803521454334259, -0.7340608835220337, -0.6646003127098083, -0.595139741897583, -0.5256791710853577, -0.4562186002731323, -0.386758029460907, -0.31729745864868164, -0.2478368878364563, -0.17837631702423096, -0.10891574621200562, -0.03945517539978027, 0.03000539541244507, 0.09946596622467041, 0.16892653703689575, 0.2383871078491211, 0.30784767866134644, 0.3773082494735718, 0.4467688202857971, 0.5162293910980225, 0.5856899619102478, 0.6551505327224731, 0.7246111035346985, 0.7940716743469238, 0.8635322451591492, 0.9329928159713745, 1.002453327178955, 1.0719139575958252, 1.1413745880126953, 1.2108350992202759, 1.2802956104278564, 1.3497562408447266, 1.4192168712615967, 1.4886773824691772, 1.5581378936767578, 1.627598524093628, 1.697059154510498, 1.7665196657180786, 1.8359801769256592, 1.9054408073425293]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 2.0, 5.0, 4.0, 4.0, 2.0, 2.0, 6.0, 6.0, 6.0, 3.0, 12.0, 3.0, 4.0, 5.0, 2.0, 3.0, 5.0, 3.0, 5.0, 4.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.945923328399658, -3.8382351398468018, -3.7305469512939453, -3.622858762741089, -3.5151705741882324, -3.407482385635376, -3.2997941970825195, -3.192105770111084, -3.0844178199768066, -2.97672963142395, -2.8690414428710938, -2.7613532543182373, -2.653665065765381, -2.5459768772125244, -2.438288688659668, -2.3306002616882324, -2.222912073135376, -2.1152238845825195, -2.007535696029663, -1.8998475074768066, -1.7921593189239502, -1.6844711303710938, -1.5767828226089478, -1.4690946340560913, -1.3614064455032349, -1.2537182569503784, -1.146030068397522, -1.038341760635376, -0.9306536316871643, -0.8229654431343079, -0.7152771949768066, -0.6075890064239502, -0.49990105628967285, -0.3922128677368164, -0.2845246493816376, -0.17683643102645874, -0.0691482424736023, 0.03853994607925415, 0.14622819423675537, 0.2539163827896118, 0.36160457134246826, 0.4692927598953247, 0.5769809484481812, 0.6846691966056824, 0.7923573851585388, 0.9000455737113953, 1.0077338218688965, 1.115422010421753, 1.2231101989746094, 1.3307983875274658, 1.4384865760803223, 1.5461747646331787, 1.6538629531860352, 1.7615511417388916, 1.8692394495010376, 1.976927638053894, 2.084615707397461, 2.1923038959503174, 2.299992084503174, 2.4076802730560303, 2.5153684616088867, 2.623056650161743, 2.7307448387145996, 2.838433265686035, 2.9461214542388916]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 4.0, 6.0, 7.0, 11.0, 20.0, 16.0, 34.0, 44.0, 59.0, 64.0, 88.0, 89.0, 97.0, 107.0, 94.0, 60.0, 50.0, 35.0, 26.0, 29.0, 12.0, 12.0, 9.0, 12.0, 5.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08526611328125, -0.08197498321533203, -0.07868385314941406, -0.0753927230834961, -0.07210159301757812, -0.06881046295166016, -0.06551933288574219, -0.06222820281982422, -0.05893707275390625, -0.05564594268798828, -0.05235481262207031, -0.049063682556152344, -0.045772552490234375, -0.042481422424316406, -0.03919029235839844, -0.03589916229248047, -0.0326080322265625, -0.02931690216064453, -0.026025772094726562, -0.022734642028808594, -0.019443511962890625, -0.016152381896972656, -0.012861251831054688, -0.009570121765136719, -0.00627899169921875, -0.0029878616333007812, 0.0003032684326171875, 0.0035943984985351562, 0.006885528564453125, 0.010176658630371094, 0.013467788696289062, 0.01675891876220703, 0.020050048828125, 0.02334117889404297, 0.026632308959960938, 0.029923439025878906, 0.033214569091796875, 0.036505699157714844, 0.03979682922363281, 0.04308795928955078, 0.04637908935546875, 0.04967021942138672, 0.05296134948730469, 0.056252479553222656, 0.059543609619140625, 0.0628347396850586, 0.06612586975097656, 0.06941699981689453, 0.0727081298828125, 0.07599925994873047, 0.07929039001464844, 0.0825815200805664, 0.08587265014648438, 0.08916378021240234, 0.09245491027832031, 0.09574604034423828, 0.09903717041015625, 0.10232830047607422, 0.10561943054199219, 0.10891056060791016, 0.11220169067382812, 0.1154928207397461, 0.11878395080566406, 0.12207508087158203, 0.1253662109375]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 0.0, 2.0, 1.0, 6.0, 9.0, 4.0, 10.0, 22.0, 27.0, 47.0, 45.0, 97.0, 119.0, 210.0, 306.0, 469.0, 873.0, 1436.0, 2692.0, 5425.0, 11095.0, 24335.0, 55575.0, 120951.0, 151844.0, 81525.0, 35437.0, 16000.0, 7386.0, 3687.0, 1905.0, 1056.0, 571.0, 382.0, 241.0, 132.0, 111.0, 80.0, 49.0, 27.0, 21.0, 21.0, 10.0, 10.0, 12.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.75634765625, -0.7342529296875, -0.712158203125, -0.6900634765625, -0.66796875, -0.6458740234375, -0.623779296875, -0.6016845703125, -0.57958984375, -0.5574951171875, -0.535400390625, -0.5133056640625, -0.4912109375, -0.4691162109375, -0.447021484375, -0.4249267578125, -0.40283203125, -0.3807373046875, -0.358642578125, -0.3365478515625, -0.314453125, -0.2923583984375, -0.270263671875, -0.2481689453125, -0.22607421875, -0.2039794921875, -0.181884765625, -0.1597900390625, -0.1376953125, -0.1156005859375, -0.093505859375, -0.0714111328125, -0.04931640625, -0.0272216796875, -0.005126953125, 0.0169677734375, 0.0390625, 0.0611572265625, 0.083251953125, 0.1053466796875, 0.12744140625, 0.1495361328125, 0.171630859375, 0.1937255859375, 0.2158203125, 0.2379150390625, 0.260009765625, 0.2821044921875, 0.30419921875, 0.3262939453125, 0.348388671875, 0.3704833984375, 0.392578125, 0.4146728515625, 0.436767578125, 0.4588623046875, 0.48095703125, 0.5030517578125, 0.525146484375, 0.5472412109375, 0.5693359375, 0.5914306640625, 0.613525390625, 0.6356201171875, 0.65771484375]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 5.0, 6.0, 8.0, 5.0, 14.0, 12.0, 24.0, 21.0, 26.0, 29.0, 39.0, 60.0, 53.0, 69.0, 84.0, 62.0, 80.0, 68.0, 81.0, 57.0, 43.0, 40.0, 31.0, 25.0, 13.0, 12.0, 11.0, 13.0, 3.0, 3.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.2122802734375, -0.20678329467773438, -0.20128631591796875, -0.19578933715820312, -0.1902923583984375, -0.18479537963867188, -0.17929840087890625, -0.17380142211914062, -0.168304443359375, -0.16280746459960938, -0.15731048583984375, -0.15181350708007812, -0.1463165283203125, -0.14081954956054688, -0.13532257080078125, -0.12982559204101562, -0.12432861328125, -0.11883163452148438, -0.11333465576171875, -0.10783767700195312, -0.1023406982421875, -0.09684371948242188, -0.09134674072265625, -0.08584976196289062, -0.080352783203125, -0.07485580444335938, -0.06935882568359375, -0.06386184692382812, -0.0583648681640625, -0.052867889404296875, -0.04737091064453125, -0.041873931884765625, -0.036376953125, -0.030879974365234375, -0.02538299560546875, -0.019886016845703125, -0.0143890380859375, -0.008892059326171875, -0.00339508056640625, 0.002101898193359375, 0.007598876953125, 0.013095855712890625, 0.01859283447265625, 0.024089813232421875, 0.0295867919921875, 0.035083770751953125, 0.04058074951171875, 0.046077728271484375, 0.05157470703125, 0.057071685791015625, 0.06256866455078125, 0.06806564331054688, 0.0735626220703125, 0.07905960083007812, 0.08455657958984375, 0.09005355834960938, 0.095550537109375, 0.10104751586914062, 0.10654449462890625, 0.11204147338867188, 0.1175384521484375, 0.12303543090820312, 0.12853240966796875, 0.13402938842773438, 0.1395263671875]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 7.0, 4.0, 18.0, 23.0, 41.0, 84.0, 93.0, 90.0, 56.0, 25.0, 12.0, 8.0, 10.0, 6.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8905225992202759, -0.8457006216049194, -0.8008787035942078, -0.7560567855834961, -0.7112348079681396, -0.6664128303527832, -0.6215909123420715, -0.5767689943313599, -0.5319470167160034, -0.48712506890296936, -0.4423031210899353, -0.39748117327690125, -0.3526592254638672, -0.30783727765083313, -0.2630153298377991, -0.21819338202476501, -0.17337143421173096, -0.1285494863986969, -0.08372753858566284, -0.038905590772628784, 0.0059163570404052734, 0.05073830485343933, 0.09556025266647339, 0.14038220047950745, 0.1852041482925415, 0.23002609610557556, 0.2748480439186096, 0.3196699917316437, 0.36449193954467773, 0.4093138873577118, 0.45413583517074585, 0.4989577829837799, 0.5437796115875244, 0.5886015892028809, 0.6334235072135925, 0.6782454252243042, 0.7230674028396606, 0.7678893804550171, 0.8127112984657288, 0.8575332164764404, 0.9023551940917969, 0.9471771717071533, 0.991999089717865, 1.0368210077285767, 1.081642985343933, 1.1264649629592896, 1.1712868213653564, 1.216108798980713, 1.2609307765960693, 1.3057527542114258, 1.3505747318267822, 1.3953965902328491, 1.4402185678482056, 1.485040545463562, 1.529862403869629, 1.5746843814849854, 1.6195063591003418, 1.6643283367156982, 1.7091503143310547, 1.7539721727371216, 1.798794150352478, 1.8436161279678345, 1.8884379863739014, 1.9332599639892578, 1.9780819416046143]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 3.0, 0.0, 4.0, 3.0, 3.0, 10.0, 7.0, 6.0, 6.0, 16.0, 31.0, 25.0, 41.0, 48.0, 43.0, 48.0, 34.0, 35.0, 30.0, 16.0, 16.0, 10.0, 7.0, 11.0, 3.0, 3.0, 1.0, 1.0, 5.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.5323032736778259, -0.5148088335990906, -0.49731433391571045, -0.4798198640346527, -0.46232539415359497, -0.4448309540748596, -0.4273364841938019, -0.40984201431274414, -0.3923475444316864, -0.37485307455062866, -0.3573586046695709, -0.3398641347885132, -0.32236969470977783, -0.3048751950263977, -0.28738075494766235, -0.2698862850666046, -0.2523918151855469, -0.23489734530448914, -0.2174028754234314, -0.19990842044353485, -0.1824139505624771, -0.16491948068141937, -0.14742502570152283, -0.1299305558204651, -0.11243608593940735, -0.09494161605834961, -0.07744715362787247, -0.059952687472105026, -0.042458221316337585, -0.024963751435279846, -0.007469289004802704, 0.010025173425674438, 0.027519702911376953, 0.045014169067144394, 0.06250863522291183, 0.08000309765338898, 0.09749756753444672, 0.11499203741550446, 0.132486492395401, 0.14998096227645874, 0.16747543215751648, 0.18496990203857422, 0.20246437191963196, 0.2199588268995285, 0.23745329678058624, 0.2549477815628052, 0.2724422216415405, 0.28993669152259827, 0.307431161403656, 0.32492563128471375, 0.3424201011657715, 0.3599145710468292, 0.37740904092788696, 0.3949034810066223, 0.41239795088768005, 0.4298924207687378, 0.44738689064979553, 0.46488136053085327, 0.482375830411911, 0.49987030029296875, 0.5173647403717041, 0.5348592400550842, 0.5523536801338196, 0.5698481798171997, 0.5873426198959351]}, "train/train_runtime": 5009.4893, "train/train_samples_per_second": 5.697, "train/train_steps_per_second": 0.178, "train/total_flos": 0.0, "train/train_loss": 4.8473983449786235} \ No newline at end of file +{"train/loss": 3.0179, "train/learning_rate": 4.591836734693877e-06, "train/epoch": 1.0, "train/global_step": 892, "_runtime": 5869, "_timestamp": 1647534505, "_step": 893, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 7.0, 197.0, 544.0, 249.0, 18.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7681227922439575, -1.2875614166259766, -0.8070001006126404, -0.3264387845993042, 0.15412259101867676, 0.6346839666366577, 1.1152452230453491, 1.5958067178726196, 2.0763678550720215, 2.556929111480713, 3.0374906063079834, 3.518051862716675, 3.9986133575439453, 4.479174613952637, 4.959735870361328, 5.4402971267700195, 5.920858860015869, 6.4014201164245605, 6.881981372833252, 7.362543106079102, 7.843104362487793, 8.323665618896484, 8.804226875305176, 9.284788131713867, 9.765349388122559, 10.24591064453125, 10.726471900939941, 11.207033157348633, 11.687594413757324, 12.168155670166016, 12.648717880249023, 13.129279136657715, 13.60983943939209, 14.090400695800781, 14.570961952209473, 15.051523208618164, 15.532084465026855, 16.012645721435547, 16.493207931518555, 16.97376823425293, 17.454330444335938, 17.934892654418945, 18.41545295715332, 18.896015167236328, 19.376575469970703, 19.85713768005371, 20.337697982788086, 20.818260192871094, 21.29882049560547, 21.779382705688477, 22.25994300842285, 22.74050521850586, 23.221065521240234, 23.701627731323242, 24.182188034057617, 24.662750244140625, 25.143312454223633, 25.62387466430664, 26.104434967041016, 26.584997177124023, 27.0655574798584, 27.546119689941406, 28.02667999267578, 28.50724220275879, 28.987802505493164]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 6.0, 3.0, 6.0, 9.0, 12.0, 18.0, 16.0, 11.0, 20.0, 17.0, 22.0, 32.0, 28.0, 26.0, 34.0, 36.0, 33.0, 41.0, 41.0, 39.0, 33.0, 39.0, 41.0, 41.0, 46.0, 30.0, 40.0, 37.0, 27.0, 40.0, 25.0, 22.0, 20.0, 14.0, 19.0, 15.0, 20.0, 7.0, 12.0, 8.0, 5.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.695791721343994, -3.598155975341797, -3.5005202293395996, -3.4028844833374023, -3.305248737335205, -3.207612991333008, -3.1099772453308105, -3.012341260910034, -2.914705514907837, -2.8170697689056396, -2.7194340229034424, -2.621798276901245, -2.524162530899048, -2.4265265464782715, -2.328890800476074, -2.231255054473877, -2.1336193084716797, -2.0359835624694824, -1.9383478164672852, -1.840712070465088, -1.743076205253601, -1.6454404592514038, -1.5478047132492065, -1.4501688480377197, -1.3525333404541016, -1.2548975944519043, -1.157261848449707, -1.0596261024475098, -0.961990237236023, -0.8643544912338257, -0.7667187452316284, -0.6690829396247864, -0.5714471340179443, -0.4738113582134247, -0.37617558240890503, -0.27853983640670776, -0.1809040606021881, -0.08326828479766846, 0.014367461204528809, 0.11200326681137085, 0.20963901281356812, 0.30727478861808777, 0.4049105644226074, 0.5025463104248047, 0.600182056427002, 0.697817862033844, 0.7954536080360413, 0.8930894136428833, 0.9907251596450806, 1.0883609056472778, 1.185996651649475, 1.283632516860962, 1.3812682628631592, 1.4789040088653564, 1.5765397548675537, 1.674175500869751, 1.7718112468719482, 1.8694469928741455, 1.9670827388763428, 2.06471848487854, 2.1623542308807373, 2.2599902153015137, 2.357625961303711, 2.455261707305908, 2.5528974533081055]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 1.0, 5.0, 4.0, 7.0, 10.0, 11.0, 32.0, 34.0, 54.0, 72.0, 103.0, 147.0, 290.0, 423.0, 776.0, 1480.0, 2667.0, 5174.0, 10941.0, 24908.0, 57350.0, 134043.0, 304513.0, 687304.0, 1346694.0, 903490.0, 398829.0, 175166.0, 76072.0, 33459.0, 15167.0, 7155.0, 3531.0, 1914.0, 1015.0, 551.0, 325.0, 192.0, 120.0, 83.0, 52.0, 32.0, 18.0, 25.0, 21.0, 12.0, 4.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.310546875, -2.241943359375, -2.17333984375, -2.104736328125, -2.0361328125, -1.967529296875, -1.89892578125, -1.830322265625, -1.76171875, -1.693115234375, -1.62451171875, -1.555908203125, -1.4873046875, -1.418701171875, -1.35009765625, -1.281494140625, -1.212890625, -1.144287109375, -1.07568359375, -1.007080078125, -0.9384765625, -0.869873046875, -0.80126953125, -0.732666015625, -0.6640625, -0.595458984375, -0.52685546875, -0.458251953125, -0.3896484375, -0.321044921875, -0.25244140625, -0.183837890625, -0.115234375, -0.046630859375, 0.02197265625, 0.090576171875, 0.1591796875, 0.227783203125, 0.29638671875, 0.364990234375, 0.43359375, 0.502197265625, 0.57080078125, 0.639404296875, 0.7080078125, 0.776611328125, 0.84521484375, 0.913818359375, 0.982421875, 1.051025390625, 1.11962890625, 1.188232421875, 1.2568359375, 1.325439453125, 1.39404296875, 1.462646484375, 1.53125, 1.599853515625, 1.66845703125, 1.737060546875, 1.8056640625, 1.874267578125, 1.94287109375, 2.011474609375, 2.080078125]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 1.0, 6.0, 6.0, 5.0, 10.0, 6.0, 16.0, 12.0, 17.0, 24.0, 24.0, 31.0, 24.0, 29.0, 35.0, 41.0, 30.0, 33.0, 51.0, 40.0, 38.0, 44.0, 40.0, 58.0, 32.0, 42.0, 34.0, 29.0, 29.0, 24.0, 24.0, 28.0, 27.0, 21.0, 21.0, 10.0, 16.0, 9.0, 8.0, 10.0, 5.0, 4.0, 6.0, 4.0, 1.0, 0.0, 2.0, 2.0], "bins": [-4.015625, -3.90777587890625, -3.7999267578125, -3.69207763671875, -3.584228515625, -3.47637939453125, -3.3685302734375, -3.26068115234375, -3.15283203125, -3.04498291015625, -2.9371337890625, -2.82928466796875, -2.721435546875, -2.61358642578125, -2.5057373046875, -2.39788818359375, -2.2900390625, -2.18218994140625, -2.0743408203125, -1.96649169921875, -1.858642578125, -1.75079345703125, -1.6429443359375, -1.53509521484375, -1.42724609375, -1.31939697265625, -1.2115478515625, -1.10369873046875, -0.995849609375, -0.88800048828125, -0.7801513671875, -0.67230224609375, -0.564453125, -0.45660400390625, -0.3487548828125, -0.24090576171875, -0.133056640625, -0.02520751953125, 0.0826416015625, 0.19049072265625, 0.29833984375, 0.40618896484375, 0.5140380859375, 0.62188720703125, 0.729736328125, 0.83758544921875, 0.9454345703125, 1.05328369140625, 1.1611328125, 1.26898193359375, 1.3768310546875, 1.48468017578125, 1.592529296875, 1.70037841796875, 1.8082275390625, 1.91607666015625, 2.02392578125, 2.13177490234375, 2.2396240234375, 2.34747314453125, 2.455322265625, 2.56317138671875, 2.6710205078125, 2.77886962890625, 2.88671875]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 2.0, 8.0, 12.0, 17.0, 16.0, 45.0, 124.0, 382.0, 56488.0, 4136465.0, 432.0, 150.0, 67.0, 32.0, 27.0, 8.0, 7.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.9375, -72.6748046875, -68.412109375, -64.1494140625, -59.88671875, -55.6240234375, -51.361328125, -47.0986328125, -42.8359375, -38.5732421875, -34.310546875, -30.0478515625, -25.78515625, -21.5224609375, -17.259765625, -12.9970703125, -8.734375, -4.4716796875, -0.208984375, 4.0537109375, 8.31640625, 12.5791015625, 16.841796875, 21.1044921875, 25.3671875, 29.6298828125, 33.892578125, 38.1552734375, 42.41796875, 46.6806640625, 50.943359375, 55.2060546875, 59.46875, 63.7314453125, 67.994140625, 72.2568359375, 76.51953125, 80.7822265625, 85.044921875, 89.3076171875, 93.5703125, 97.8330078125, 102.095703125, 106.3583984375, 110.62109375, 114.8837890625, 119.146484375, 123.4091796875, 127.671875, 131.9345703125, 136.197265625, 140.4599609375, 144.72265625, 148.9853515625, 153.248046875, 157.5107421875, 161.7734375, 166.0361328125, 170.298828125, 174.5615234375, 178.82421875, 183.0869140625, 187.349609375, 191.6123046875, 195.875]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 6.0, 5.0, 14.0, 18.0, 15.0, 43.0, 95.0, 195.0, 549.0, 1536.0, 966.0, 303.0, 156.0, 71.0, 37.0, 29.0, 16.0, 10.0, 7.0, 6.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.849609375, -1.7603759765625, -1.671142578125, -1.5819091796875, -1.49267578125, -1.4034423828125, -1.314208984375, -1.2249755859375, -1.1357421875, -1.0465087890625, -0.957275390625, -0.8680419921875, -0.77880859375, -0.6895751953125, -0.600341796875, -0.5111083984375, -0.421875, -0.3326416015625, -0.243408203125, -0.1541748046875, -0.06494140625, 0.0242919921875, 0.113525390625, 0.2027587890625, 0.2919921875, 0.3812255859375, 0.470458984375, 0.5596923828125, 0.64892578125, 0.7381591796875, 0.827392578125, 0.9166259765625, 1.005859375, 1.0950927734375, 1.184326171875, 1.2735595703125, 1.36279296875, 1.4520263671875, 1.541259765625, 1.6304931640625, 1.7197265625, 1.8089599609375, 1.898193359375, 1.9874267578125, 2.07666015625, 2.1658935546875, 2.255126953125, 2.3443603515625, 2.43359375, 2.5228271484375, 2.612060546875, 2.7012939453125, 2.79052734375, 2.8797607421875, 2.968994140625, 3.0582275390625, 3.1474609375, 3.2366943359375, 3.325927734375, 3.4151611328125, 3.50439453125, 3.5936279296875, 3.682861328125, 3.7720947265625, 3.861328125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 10.0, 14.0, 21.0, 20.0, 36.0, 48.0, 63.0, 82.0, 89.0, 90.0, 117.0, 94.0, 98.0, 61.0, 49.0, 40.0, 23.0, 19.0, 13.0, 7.0, 7.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.2791056632995605, -6.09200382232666, -5.90490198135376, -5.717800140380859, -5.530697822570801, -5.3435959815979, -5.156494140625, -4.9693922996521, -4.782290458679199, -4.595188617706299, -4.408086776733398, -4.220984935760498, -4.033883094787598, -3.846781015396118, -3.6596789360046387, -3.4725770950317383, -3.285475254058838, -3.0983734130859375, -2.911271572113037, -2.7241694927215576, -2.5370676517486572, -2.349965810775757, -2.1628637313842773, -1.975761890411377, -1.7886600494384766, -1.6015582084655762, -1.4144562482833862, -1.2273542881011963, -1.040252447128296, -0.8531505465507507, -0.6660486459732056, -0.4789466857910156, -0.29184436798095703, -0.10474246740341187, 0.0823594331741333, 0.26946133375167847, 0.45656323432922363, 0.6436651349067688, 0.830767035484314, 1.017868995666504, 1.2049708366394043, 1.3920726776123047, 1.5791746377944946, 1.7662765979766846, 1.953378438949585, 2.1404802799224854, 2.327582359313965, 2.5146842002868652, 2.7017860412597656, 2.888887882232666, 3.0759897232055664, 3.263091802597046, 3.4501936435699463, 3.6372954845428467, 3.824397563934326, 4.011499404907227, 4.198601245880127, 4.385703086853027, 4.572804927825928, 4.759906768798828, 4.947009086608887, 5.134110927581787, 5.3212127685546875, 5.508314609527588, 5.695416450500488]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 4.0, 2.0, 4.0, 6.0, 11.0, 14.0, 7.0, 14.0, 18.0, 18.0, 21.0, 22.0, 34.0, 24.0, 32.0, 38.0, 28.0, 39.0, 37.0, 41.0, 44.0, 43.0, 46.0, 39.0, 44.0, 33.0, 37.0, 34.0, 41.0, 32.0, 38.0, 27.0, 30.0, 18.0, 9.0, 20.0, 11.0, 9.0, 13.0, 3.0, 4.0, 7.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0], "bins": [-3.8008768558502197, -3.698765754699707, -3.5966548919677734, -3.49454402923584, -3.392432928085327, -3.2903218269348145, -3.188210964202881, -3.0861001014709473, -2.9839890003204346, -2.881877899169922, -2.7797670364379883, -2.6776561737060547, -2.575545072555542, -2.4734339714050293, -2.3713231086730957, -2.269212245941162, -2.1671011447906494, -2.0649900436401367, -1.9628791809082031, -1.86076819896698, -1.7586572170257568, -1.6565462350845337, -1.5544352531433105, -1.4523242712020874, -1.3502132892608643, -1.2481023073196411, -1.145991325378418, -1.0438803434371948, -0.9417693614959717, -0.8396583795547485, -0.7375473976135254, -0.6354364156723022, -0.5333254337310791, -0.43121445178985596, -0.3291034698486328, -0.22699248790740967, -0.12488150596618652, -0.02277052402496338, 0.07934045791625977, 0.1814514398574829, 0.28356242179870605, 0.3856734037399292, 0.48778438568115234, 0.5898953676223755, 0.6920063495635986, 0.7941173315048218, 0.8962283134460449, 0.9983392953872681, 1.1004502773284912, 1.2025612592697144, 1.3046722412109375, 1.4067832231521606, 1.5088942050933838, 1.611005187034607, 1.71311616897583, 1.8152271509170532, 1.9173381328582764, 2.019449234008789, 2.1215600967407227, 2.2236709594726562, 2.325782060623169, 2.4278931617736816, 2.5300040245056152, 2.632114887237549, 2.7342259883880615]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 3.0, 5.0, 5.0, 8.0, 8.0, 16.0, 16.0, 31.0, 44.0, 62.0, 85.0, 117.0, 196.0, 305.0, 547.0, 863.0, 1654.0, 3220.0, 5935.0, 11773.0, 23152.0, 44878.0, 84487.0, 142148.0, 198286.0, 200993.0, 145669.0, 86844.0, 47050.0, 24402.0, 12192.0, 6203.0, 3253.0, 1693.0, 940.0, 559.0, 307.0, 201.0, 111.0, 82.0, 48.0, 47.0, 39.0, 29.0, 13.0, 12.0, 10.0, 6.0, 3.0, 1.0, 5.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.6669921875, -0.6431961059570312, -0.6194000244140625, -0.5956039428710938, -0.571807861328125, -0.5480117797851562, -0.5242156982421875, -0.5004196166992188, -0.47662353515625, -0.45282745361328125, -0.4290313720703125, -0.40523529052734375, -0.381439208984375, -0.35764312744140625, -0.3338470458984375, -0.31005096435546875, -0.2862548828125, -0.26245880126953125, -0.2386627197265625, -0.21486663818359375, -0.191070556640625, -0.16727447509765625, -0.1434783935546875, -0.11968231201171875, -0.09588623046875, -0.07209014892578125, -0.0482940673828125, -0.02449798583984375, -0.000701904296875, 0.02309417724609375, 0.0468902587890625, 0.07068634033203125, 0.094482421875, 0.11827850341796875, 0.1420745849609375, 0.16587066650390625, 0.189666748046875, 0.21346282958984375, 0.2372589111328125, 0.26105499267578125, 0.28485107421875, 0.30864715576171875, 0.3324432373046875, 0.35623931884765625, 0.380035400390625, 0.40383148193359375, 0.4276275634765625, 0.45142364501953125, 0.4752197265625, 0.49901580810546875, 0.5228118896484375, 0.5466079711914062, 0.570404052734375, 0.5942001342773438, 0.6179962158203125, 0.6417922973632812, 0.66558837890625, 0.6893844604492188, 0.7131805419921875, 0.7369766235351562, 0.760772705078125, 0.7845687866210938, 0.8083648681640625, 0.8321609497070312, 0.85595703125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 5.0, 5.0, 5.0, 2.0, 6.0, 8.0, 7.0, 15.0, 9.0, 24.0, 16.0, 15.0, 26.0, 32.0, 29.0, 33.0, 27.0, 37.0, 42.0, 51.0, 36.0, 53.0, 42.0, 40.0, 46.0, 38.0, 46.0, 40.0, 38.0, 32.0, 33.0, 22.0, 28.0, 22.0, 23.0, 12.0, 15.0, 15.0, 7.0, 7.0, 3.0, 5.0, 1.0, 2.0, 2.0, 3.0, 4.0, 0.0, 0.0, 2.0], "bins": [-2.826171875, -2.748443603515625, -2.67071533203125, -2.592987060546875, -2.5152587890625, -2.437530517578125, -2.35980224609375, -2.282073974609375, -2.204345703125, -2.126617431640625, -2.04888916015625, -1.971160888671875, -1.8934326171875, -1.815704345703125, -1.73797607421875, -1.660247802734375, -1.58251953125, -1.504791259765625, -1.42706298828125, -1.349334716796875, -1.2716064453125, -1.193878173828125, -1.11614990234375, -1.038421630859375, -0.960693359375, -0.882965087890625, -0.80523681640625, -0.727508544921875, -0.6497802734375, -0.572052001953125, -0.49432373046875, -0.416595458984375, -0.3388671875, -0.261138916015625, -0.18341064453125, -0.105682373046875, -0.0279541015625, 0.049774169921875, 0.12750244140625, 0.205230712890625, 0.282958984375, 0.360687255859375, 0.43841552734375, 0.516143798828125, 0.5938720703125, 0.671600341796875, 0.74932861328125, 0.827056884765625, 0.90478515625, 0.982513427734375, 1.06024169921875, 1.137969970703125, 1.2156982421875, 1.293426513671875, 1.37115478515625, 1.448883056640625, 1.526611328125, 1.604339599609375, 1.68206787109375, 1.759796142578125, 1.8375244140625, 1.915252685546875, 1.99298095703125, 2.070709228515625, 2.1484375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 6.0, 5.0, 8.0, 7.0, 12.0, 10.0, 19.0, 40.0, 56.0, 94.0, 160.0, 246.0, 442.0, 1065.0, 2335.0, 5992.0, 16914.0, 52296.0, 154361.0, 318471.0, 297061.0, 131855.0, 43532.0, 14557.0, 5102.0, 2034.0, 896.0, 426.0, 223.0, 118.0, 64.0, 53.0, 30.0, 26.0, 16.0, 8.0, 6.0, 3.0, 1.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0283203125, -0.998870849609375, -0.96942138671875, -0.939971923828125, -0.9105224609375, -0.881072998046875, -0.85162353515625, -0.822174072265625, -0.792724609375, -0.763275146484375, -0.73382568359375, -0.704376220703125, -0.6749267578125, -0.645477294921875, -0.61602783203125, -0.586578369140625, -0.55712890625, -0.527679443359375, -0.49822998046875, -0.468780517578125, -0.4393310546875, -0.409881591796875, -0.38043212890625, -0.350982666015625, -0.321533203125, -0.292083740234375, -0.26263427734375, -0.233184814453125, -0.2037353515625, -0.174285888671875, -0.14483642578125, -0.115386962890625, -0.0859375, -0.056488037109375, -0.02703857421875, 0.002410888671875, 0.0318603515625, 0.061309814453125, 0.09075927734375, 0.120208740234375, 0.149658203125, 0.179107666015625, 0.20855712890625, 0.238006591796875, 0.2674560546875, 0.296905517578125, 0.32635498046875, 0.355804443359375, 0.38525390625, 0.414703369140625, 0.44415283203125, 0.473602294921875, 0.5030517578125, 0.532501220703125, 0.56195068359375, 0.591400146484375, 0.620849609375, 0.650299072265625, 0.67974853515625, 0.709197998046875, 0.7386474609375, 0.768096923828125, 0.79754638671875, 0.826995849609375, 0.8564453125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 13.0, 6.0, 11.0, 29.0, 23.0, 23.0, 26.0, 35.0, 39.0, 51.0, 58.0, 62.0, 55.0, 57.0, 50.0, 62.0, 49.0, 60.0, 51.0, 44.0, 40.0, 37.0, 25.0, 22.0, 13.0, 15.0, 15.0, 11.0, 5.0, 4.0, 5.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.3203125, -7.11517333984375, -6.9100341796875, -6.70489501953125, -6.499755859375, -6.29461669921875, -6.0894775390625, -5.88433837890625, -5.67919921875, -5.47406005859375, -5.2689208984375, -5.06378173828125, -4.858642578125, -4.65350341796875, -4.4483642578125, -4.24322509765625, -4.0380859375, -3.83294677734375, -3.6278076171875, -3.42266845703125, -3.217529296875, -3.01239013671875, -2.8072509765625, -2.60211181640625, -2.39697265625, -2.19183349609375, -1.9866943359375, -1.78155517578125, -1.576416015625, -1.37127685546875, -1.1661376953125, -0.96099853515625, -0.755859375, -0.55072021484375, -0.3455810546875, -0.14044189453125, 0.064697265625, 0.26983642578125, 0.4749755859375, 0.68011474609375, 0.88525390625, 1.09039306640625, 1.2955322265625, 1.50067138671875, 1.705810546875, 1.91094970703125, 2.1160888671875, 2.32122802734375, 2.5263671875, 2.73150634765625, 2.9366455078125, 3.14178466796875, 3.346923828125, 3.55206298828125, 3.7572021484375, 3.96234130859375, 4.16748046875, 4.37261962890625, 4.5777587890625, 4.78289794921875, 4.988037109375, 5.19317626953125, 5.3983154296875, 5.60345458984375, 5.80859375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 7.0, 11.0, 10.0, 8.0, 20.0, 21.0, 36.0, 42.0, 81.0, 109.0, 185.0, 397.0, 710.0, 1601.0, 3501.0, 8691.0, 24165.0, 89788.0, 413188.0, 385531.0, 82533.0, 22962.0, 8336.0, 3359.0, 1584.0, 724.0, 396.0, 262.0, 104.0, 59.0, 43.0, 31.0, 20.0, 8.0, 15.0, 9.0, 9.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2322998046875, -0.22525405883789062, -0.21820831298828125, -0.21116256713867188, -0.2041168212890625, -0.19707107543945312, -0.19002532958984375, -0.18297958374023438, -0.175933837890625, -0.16888809204101562, -0.16184234619140625, -0.15479660034179688, -0.1477508544921875, -0.14070510864257812, -0.13365936279296875, -0.12661361694335938, -0.11956787109375, -0.11252212524414062, -0.10547637939453125, -0.09843063354492188, -0.0913848876953125, -0.08433914184570312, -0.07729339599609375, -0.07024765014648438, -0.063201904296875, -0.056156158447265625, -0.04911041259765625, -0.042064666748046875, -0.0350189208984375, -0.027973175048828125, -0.02092742919921875, -0.013881683349609375, -0.0068359375, 0.000209808349609375, 0.00725555419921875, 0.014301300048828125, 0.0213470458984375, 0.028392791748046875, 0.03543853759765625, 0.042484283447265625, 0.049530029296875, 0.056575775146484375, 0.06362152099609375, 0.07066726684570312, 0.0777130126953125, 0.08475875854492188, 0.09180450439453125, 0.09885025024414062, 0.10589599609375, 0.11294174194335938, 0.11998748779296875, 0.12703323364257812, 0.1340789794921875, 0.14112472534179688, 0.14817047119140625, 0.15521621704101562, 0.162261962890625, 0.16930770874023438, 0.17635345458984375, 0.18339920043945312, 0.1904449462890625, 0.19749069213867188, 0.20453643798828125, 0.21158218383789062, 0.2186279296875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 3.0, 4.0, 6.0, 9.0, 9.0, 17.0, 22.0, 32.0, 53.0, 84.0, 158.0, 150.0, 151.0, 120.0, 71.0, 38.0, 34.0, 14.0, 7.0, 7.0, 5.0, 6.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002765655517578125, -0.0002690330147743225, -0.0002615004777908325, -0.00025396794080734253, -0.00024643540382385254, -0.00023890286684036255, -0.00023137032985687256, -0.00022383779287338257, -0.00021630525588989258, -0.0002087727189064026, -0.0002012401819229126, -0.0001937076449394226, -0.00018617510795593262, -0.00017864257097244263, -0.00017111003398895264, -0.00016357749700546265, -0.00015604496002197266, -0.00014851242303848267, -0.00014097988605499268, -0.00013344734907150269, -0.0001259148120880127, -0.0001183822751045227, -0.00011084973812103271, -0.00010331720113754272, -9.578466415405273e-05, -8.825212717056274e-05, -8.071959018707275e-05, -7.318705320358276e-05, -6.565451622009277e-05, -5.812197923660278e-05, -5.058944225311279e-05, -4.30569052696228e-05, -3.552436828613281e-05, -2.7991831302642822e-05, -2.0459294319152832e-05, -1.2926757335662842e-05, -5.3942203521728516e-06, 2.1383166313171387e-06, 9.670853614807129e-06, 1.720339059829712e-05, 2.473592758178711e-05, 3.22684645652771e-05, 3.980100154876709e-05, 4.733353853225708e-05, 5.486607551574707e-05, 6.239861249923706e-05, 6.993114948272705e-05, 7.746368646621704e-05, 8.499622344970703e-05, 9.252876043319702e-05, 0.00010006129741668701, 0.000107593834400177, 0.00011512637138366699, 0.00012265890836715698, 0.00013019144535064697, 0.00013772398233413696, 0.00014525651931762695, 0.00015278905630111694, 0.00016032159328460693, 0.00016785413026809692, 0.00017538666725158691, 0.0001829192042350769, 0.0001904517412185669, 0.00019798427820205688, 0.00020551681518554688]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 8.0, 5.0, 6.0, 7.0, 22.0, 24.0, 37.0, 52.0, 119.0, 196.0, 900.0, 45684.0, 990458.0, 10126.0, 514.0, 141.0, 86.0, 56.0, 36.0, 24.0, 12.0, 11.0, 9.0, 6.0, 4.0, 2.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2705078125, -1.22998046875, -1.189453125, -1.14892578125, -1.1083984375, -1.06787109375, -1.02734375, -0.98681640625, -0.9462890625, -0.90576171875, -0.865234375, -0.82470703125, -0.7841796875, -0.74365234375, -0.703125, -0.66259765625, -0.6220703125, -0.58154296875, -0.541015625, -0.50048828125, -0.4599609375, -0.41943359375, -0.37890625, -0.33837890625, -0.2978515625, -0.25732421875, -0.216796875, -0.17626953125, -0.1357421875, -0.09521484375, -0.0546875, -0.01416015625, 0.0263671875, 0.06689453125, 0.107421875, 0.14794921875, 0.1884765625, 0.22900390625, 0.26953125, 0.31005859375, 0.3505859375, 0.39111328125, 0.431640625, 0.47216796875, 0.5126953125, 0.55322265625, 0.59375, 0.63427734375, 0.6748046875, 0.71533203125, 0.755859375, 0.79638671875, 0.8369140625, 0.87744140625, 0.91796875, 0.95849609375, 0.9990234375, 1.03955078125, 1.080078125, 1.12060546875, 1.1611328125, 1.20166015625, 1.2421875, 1.28271484375, 1.3232421875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 5.0, 7.0, 5.0, 9.0, 20.0, 20.0, 40.0, 41.0, 71.0, 81.0, 89.0, 106.0, 98.0, 92.0, 84.0, 68.0, 50.0, 38.0, 24.0, 17.0, 11.0, 9.0, 4.0, 1.0, 3.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.092529296875, -0.0892171859741211, -0.08590507507324219, -0.08259296417236328, -0.07928085327148438, -0.07596874237060547, -0.07265663146972656, -0.06934452056884766, -0.06603240966796875, -0.06272029876708984, -0.05940818786621094, -0.05609607696533203, -0.052783966064453125, -0.04947185516357422, -0.04615974426269531, -0.042847633361816406, -0.0395355224609375, -0.036223411560058594, -0.03291130065917969, -0.02959918975830078, -0.026287078857421875, -0.02297496795654297, -0.019662857055664062, -0.016350746154785156, -0.01303863525390625, -0.009726524353027344, -0.0064144134521484375, -0.0031023025512695312, 0.000209808349609375, 0.0035219192504882812, 0.0068340301513671875, 0.010146141052246094, 0.013458251953125, 0.016770362854003906, 0.020082473754882812, 0.02339458465576172, 0.026706695556640625, 0.03001880645751953, 0.03333091735839844, 0.036643028259277344, 0.03995513916015625, 0.043267250061035156, 0.04657936096191406, 0.04989147186279297, 0.053203582763671875, 0.05651569366455078, 0.05982780456542969, 0.0631399154663086, 0.0664520263671875, 0.0697641372680664, 0.07307624816894531, 0.07638835906982422, 0.07970046997070312, 0.08301258087158203, 0.08632469177246094, 0.08963680267333984, 0.09294891357421875, 0.09626102447509766, 0.09957313537597656, 0.10288524627685547, 0.10619735717773438, 0.10950946807861328, 0.11282157897949219, 0.1161336898803711, 0.11944580078125]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 13.0, 35.0, 104.0, 206.0, 306.0, 213.0, 91.0, 25.0, 10.0, 5.0, 3.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.611790418624878, -3.234570026397705, -2.8573496341705322, -2.4801292419433594, -2.1029086112976074, -1.7256883382797241, -1.3484678268432617, -0.9712474346160889, -0.594027042388916, -0.21680662035942078, 0.16041380167007446, 0.5376342535018921, 0.9148546457290649, 1.2920750379562378, 1.6692955493927002, 2.046515941619873, 2.423736333847046, 2.8009567260742188, 3.1781771183013916, 3.5553975105285645, 3.9326181411743164, 4.30983829498291, 4.687058925628662, 5.064279556274414, 5.441499710083008, 5.81872034072876, 6.1959404945373535, 6.5731611251831055, 6.950381278991699, 7.327601909637451, 7.704822540283203, 8.082042694091797, 8.459263801574707, 8.8364839553833, 9.213705062866211, 9.590925216674805, 9.968145370483398, 10.345365524291992, 10.722586631774902, 11.099806785583496, 11.47702693939209, 11.854247093200684, 12.231468200683594, 12.608688354492188, 12.985908508300781, 13.363128662109375, 13.740349769592285, 14.117569923400879, 14.494791030883789, 14.872011184692383, 15.249232292175293, 15.626452445983887, 16.003673553466797, 16.38089370727539, 16.758113861083984, 17.135334014892578, 17.512554168701172, 17.889774322509766, 18.26699447631836, 18.644214630126953, 19.02143669128418, 19.398656845092773, 19.775876998901367, 20.15309715270996, 20.530317306518555]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 6.0, 6.0, 3.0, 12.0, 10.0, 12.0, 15.0, 21.0, 19.0, 24.0, 32.0, 35.0, 31.0, 30.0, 31.0, 39.0, 45.0, 50.0, 54.0, 31.0, 53.0, 36.0, 51.0, 37.0, 40.0, 43.0, 37.0, 34.0, 31.0, 23.0, 14.0, 23.0, 16.0, 14.0, 11.0, 8.0, 5.0, 3.0, 9.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0], "bins": [-2.843140125274658, -2.7669174671173096, -2.69069504737854, -2.6144723892211914, -2.538249969482422, -2.4620273113250732, -2.3858048915863037, -2.309582233428955, -2.2333598136901855, -2.157137155532837, -2.0809147357940674, -2.0046920776367188, -1.9284696578979492, -1.8522469997406006, -1.7760244607925415, -1.6998019218444824, -1.6235792636871338, -1.5473567247390747, -1.4711341857910156, -1.3949116468429565, -1.3186891078948975, -1.2424664497375488, -1.1662439107894897, -1.0900213718414307, -1.0137988328933716, -0.9375762939453125, -0.8613537549972534, -0.7851311564445496, -0.7089086174964905, -0.6326860785484314, -0.5564634799957275, -0.48024094104766846, -0.4040184020996094, -0.3277958631515503, -0.2515732944011688, -0.17535074055194855, -0.09912818670272827, -0.02290564775466919, 0.05331692099571228, 0.12953948974609375, 0.20576202869415283, 0.2819845676422119, 0.3582071363925934, 0.43442970514297485, 0.5106522440910339, 0.586874783039093, 0.6630973815917969, 0.739319920539856, 0.815542459487915, 0.8917649984359741, 0.9679875373840332, 1.0442100763320923, 1.1204326152801514, 1.1966552734375, 1.272877812385559, 1.3491003513336182, 1.4253228902816772, 1.5015454292297363, 1.5777679681777954, 1.6539905071258545, 1.7302131652832031, 1.8064355850219727, 1.8826582431793213, 1.9588807821273804, 2.0351033210754395]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 7.0, 2.0, 11.0, 15.0, 15.0, 34.0, 39.0, 83.0, 121.0, 171.0, 359.0, 604.0, 1162.0, 2069.0, 3968.0, 8068.0, 19325.0, 53139.0, 179875.0, 443132.0, 228104.0, 66000.0, 22863.0, 9596.0, 4541.0, 2301.0, 1261.0, 680.0, 421.0, 260.0, 115.0, 74.0, 45.0, 29.0, 32.0, 15.0, 12.0, 9.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.091796875, -1.0522308349609375, -1.012664794921875, -0.9730987548828125, -0.93353271484375, -0.8939666748046875, -0.854400634765625, -0.8148345947265625, -0.7752685546875, -0.7357025146484375, -0.696136474609375, -0.6565704345703125, -0.61700439453125, -0.5774383544921875, -0.537872314453125, -0.4983062744140625, -0.458740234375, -0.4191741943359375, -0.379608154296875, -0.3400421142578125, -0.30047607421875, -0.2609100341796875, -0.221343994140625, -0.1817779541015625, -0.1422119140625, -0.1026458740234375, -0.063079833984375, -0.0235137939453125, 0.01605224609375, 0.0556182861328125, 0.095184326171875, 0.1347503662109375, 0.17431640625, 0.2138824462890625, 0.253448486328125, 0.2930145263671875, 0.33258056640625, 0.3721466064453125, 0.411712646484375, 0.4512786865234375, 0.4908447265625, 0.5304107666015625, 0.569976806640625, 0.6095428466796875, 0.64910888671875, 0.6886749267578125, 0.728240966796875, 0.7678070068359375, 0.807373046875, 0.8469390869140625, 0.886505126953125, 0.9260711669921875, 0.96563720703125, 1.0052032470703125, 1.044769287109375, 1.0843353271484375, 1.1239013671875, 1.1634674072265625, 1.203033447265625, 1.2425994873046875, 1.28216552734375, 1.3217315673828125, 1.361297607421875, 1.4008636474609375, 1.4404296875]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 3.0, 2.0, 3.0, 2.0, 2.0, 5.0, 8.0, 4.0, 7.0, 11.0, 17.0, 16.0, 21.0, 25.0, 26.0, 30.0, 40.0, 33.0, 37.0, 35.0, 40.0, 39.0, 50.0, 42.0, 57.0, 47.0, 53.0, 39.0, 48.0, 35.0, 37.0, 27.0, 39.0, 22.0, 16.0, 19.0, 13.0, 12.0, 7.0, 11.0, 7.0, 6.0, 3.0, 5.0, 5.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.2421875, -6.05816650390625, -5.8741455078125, -5.69012451171875, -5.506103515625, -5.32208251953125, -5.1380615234375, -4.95404052734375, -4.77001953125, -4.58599853515625, -4.4019775390625, -4.21795654296875, -4.033935546875, -3.84991455078125, -3.6658935546875, -3.48187255859375, -3.2978515625, -3.11383056640625, -2.9298095703125, -2.74578857421875, -2.561767578125, -2.37774658203125, -2.1937255859375, -2.00970458984375, -1.82568359375, -1.64166259765625, -1.4576416015625, -1.27362060546875, -1.089599609375, -0.90557861328125, -0.7215576171875, -0.53753662109375, -0.353515625, -0.16949462890625, 0.0145263671875, 0.19854736328125, 0.382568359375, 0.56658935546875, 0.7506103515625, 0.93463134765625, 1.11865234375, 1.30267333984375, 1.4866943359375, 1.67071533203125, 1.854736328125, 2.03875732421875, 2.2227783203125, 2.40679931640625, 2.5908203125, 2.77484130859375, 2.9588623046875, 3.14288330078125, 3.326904296875, 3.51092529296875, 3.6949462890625, 3.87896728515625, 4.06298828125, 4.24700927734375, 4.4310302734375, 4.61505126953125, 4.799072265625, 4.98309326171875, 5.1671142578125, 5.35113525390625, 5.53515625]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 2.0, 2.0, 4.0, 6.0, 2.0, 6.0, 10.0, 15.0, 17.0, 26.0, 36.0, 64.0, 82.0, 115.0, 159.0, 376.0, 960.0, 8576.0, 668770.0, 361629.0, 5908.0, 871.0, 346.0, 202.0, 114.0, 79.0, 55.0, 35.0, 25.0, 11.0, 7.0, 7.0, 8.0, 8.0, 3.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.11328125, -5.92767333984375, -5.7420654296875, -5.55645751953125, -5.370849609375, -5.18524169921875, -4.9996337890625, -4.81402587890625, -4.62841796875, -4.44281005859375, -4.2572021484375, -4.07159423828125, -3.885986328125, -3.70037841796875, -3.5147705078125, -3.32916259765625, -3.1435546875, -2.95794677734375, -2.7723388671875, -2.58673095703125, -2.401123046875, -2.21551513671875, -2.0299072265625, -1.84429931640625, -1.65869140625, -1.47308349609375, -1.2874755859375, -1.10186767578125, -0.916259765625, -0.73065185546875, -0.5450439453125, -0.35943603515625, -0.173828125, 0.01177978515625, 0.1973876953125, 0.38299560546875, 0.568603515625, 0.75421142578125, 0.9398193359375, 1.12542724609375, 1.31103515625, 1.49664306640625, 1.6822509765625, 1.86785888671875, 2.053466796875, 2.23907470703125, 2.4246826171875, 2.61029052734375, 2.7958984375, 2.98150634765625, 3.1671142578125, 3.35272216796875, 3.538330078125, 3.72393798828125, 3.9095458984375, 4.09515380859375, 4.28076171875, 4.46636962890625, 4.6519775390625, 4.83758544921875, 5.023193359375, 5.20880126953125, 5.3944091796875, 5.58001708984375, 5.765625]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 6.0, 1.0, 2.0, 3.0, 3.0, 4.0, 4.0, 6.0, 9.0, 12.0, 14.0, 7.0, 9.0, 19.0, 20.0, 25.0, 30.0, 25.0, 34.0, 31.0, 24.0, 47.0, 42.0, 39.0, 45.0, 41.0, 48.0, 43.0, 56.0, 45.0, 37.0, 37.0, 24.0, 32.0, 28.0, 28.0, 29.0, 19.0, 12.0, 11.0, 11.0, 13.0, 7.0, 9.0, 8.0, 4.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.35546875, -5.17584228515625, -4.9962158203125, -4.81658935546875, -4.636962890625, -4.45733642578125, -4.2777099609375, -4.09808349609375, -3.91845703125, -3.73883056640625, -3.5592041015625, -3.37957763671875, -3.199951171875, -3.02032470703125, -2.8406982421875, -2.66107177734375, -2.4814453125, -2.30181884765625, -2.1221923828125, -1.94256591796875, -1.762939453125, -1.58331298828125, -1.4036865234375, -1.22406005859375, -1.04443359375, -0.86480712890625, -0.6851806640625, -0.50555419921875, -0.325927734375, -0.14630126953125, 0.0333251953125, 0.21295166015625, 0.392578125, 0.57220458984375, 0.7518310546875, 0.93145751953125, 1.111083984375, 1.29071044921875, 1.4703369140625, 1.64996337890625, 1.82958984375, 2.00921630859375, 2.1888427734375, 2.36846923828125, 2.548095703125, 2.72772216796875, 2.9073486328125, 3.08697509765625, 3.2666015625, 3.44622802734375, 3.6258544921875, 3.80548095703125, 3.985107421875, 4.16473388671875, 4.3443603515625, 4.52398681640625, 4.70361328125, 4.88323974609375, 5.0628662109375, 5.24249267578125, 5.422119140625, 5.60174560546875, 5.7813720703125, 5.96099853515625, 6.140625]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 6.0, 2.0, 6.0, 9.0, 5.0, 10.0, 14.0, 29.0, 34.0, 64.0, 137.0, 278.0, 1103.0, 7395.0, 601973.0, 429093.0, 6751.0, 1081.0, 292.0, 111.0, 61.0, 33.0, 19.0, 20.0, 6.0, 12.0, 4.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6162109375, -1.565673828125, -1.51513671875, -1.464599609375, -1.4140625, -1.363525390625, -1.31298828125, -1.262451171875, -1.2119140625, -1.161376953125, -1.11083984375, -1.060302734375, -1.009765625, -0.959228515625, -0.90869140625, -0.858154296875, -0.8076171875, -0.757080078125, -0.70654296875, -0.656005859375, -0.60546875, -0.554931640625, -0.50439453125, -0.453857421875, -0.4033203125, -0.352783203125, -0.30224609375, -0.251708984375, -0.201171875, -0.150634765625, -0.10009765625, -0.049560546875, 0.0009765625, 0.051513671875, 0.10205078125, 0.152587890625, 0.203125, 0.253662109375, 0.30419921875, 0.354736328125, 0.4052734375, 0.455810546875, 0.50634765625, 0.556884765625, 0.607421875, 0.657958984375, 0.70849609375, 0.759033203125, 0.8095703125, 0.860107421875, 0.91064453125, 0.961181640625, 1.01171875, 1.062255859375, 1.11279296875, 1.163330078125, 1.2138671875, 1.264404296875, 1.31494140625, 1.365478515625, 1.416015625, 1.466552734375, 1.51708984375, 1.567626953125, 1.6181640625]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 9.0, 7.0, 11.0, 11.0, 14.0, 32.0, 32.0, 50.0, 77.0, 109.0, 211.0, 141.0, 86.0, 50.0, 47.0, 24.0, 22.0, 22.0, 13.0, 9.0, 7.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012445449829101562, -0.00012076832354068756, -0.0001170821487903595, -0.00011339597404003143, -0.00010970979928970337, -0.0001060236245393753, -0.00010233744978904724, -9.865127503871918e-05, -9.496510028839111e-05, -9.127892553806305e-05, -8.759275078773499e-05, -8.390657603740692e-05, -8.022040128707886e-05, -7.65342265367508e-05, -7.284805178642273e-05, -6.916187703609467e-05, -6.54757022857666e-05, -6.178952753543854e-05, -5.8103352785110474e-05, -5.441717803478241e-05, -5.0731003284454346e-05, -4.704482853412628e-05, -4.335865378379822e-05, -3.9672479033470154e-05, -3.598630428314209e-05, -3.2300129532814026e-05, -2.8613954782485962e-05, -2.4927780032157898e-05, -2.1241605281829834e-05, -1.755543053150177e-05, -1.3869255781173706e-05, -1.0183081030845642e-05, -6.496906280517578e-06, -2.810731530189514e-06, 8.754432201385498e-07, 4.561617970466614e-06, 8.247792720794678e-06, 1.1933967471122742e-05, 1.5620142221450806e-05, 1.930631697177887e-05, 2.2992491722106934e-05, 2.6678666472434998e-05, 3.036484122276306e-05, 3.4051015973091125e-05, 3.773719072341919e-05, 4.1423365473747253e-05, 4.510954022407532e-05, 4.879571497440338e-05, 5.2481889724731445e-05, 5.616806447505951e-05, 5.985423922538757e-05, 6.354041397571564e-05, 6.72265887260437e-05, 7.091276347637177e-05, 7.459893822669983e-05, 7.828511297702789e-05, 8.197128772735596e-05, 8.565746247768402e-05, 8.934363722801208e-05, 9.302981197834015e-05, 9.671598672866821e-05, 0.00010040216147899628, 0.00010408833622932434, 0.0001077745109796524, 0.00011146068572998047]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 9.0, 10.0, 16.0, 21.0, 26.0, 21.0, 49.0, 100.0, 277.0, 1200.0, 12226.0, 927862.0, 102317.0, 3451.0, 542.0, 171.0, 86.0, 64.0, 23.0, 28.0, 13.0, 12.0, 8.0, 2.0, 3.0, 6.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7314453125, -1.6732635498046875, -1.615081787109375, -1.5569000244140625, -1.49871826171875, -1.4405364990234375, -1.382354736328125, -1.3241729736328125, -1.2659912109375, -1.2078094482421875, -1.149627685546875, -1.0914459228515625, -1.03326416015625, -0.9750823974609375, -0.916900634765625, -0.8587188720703125, -0.800537109375, -0.7423553466796875, -0.684173583984375, -0.6259918212890625, -0.56781005859375, -0.5096282958984375, -0.451446533203125, -0.3932647705078125, -0.3350830078125, -0.2769012451171875, -0.218719482421875, -0.1605377197265625, -0.10235595703125, -0.0441741943359375, 0.014007568359375, 0.0721893310546875, 0.13037109375, 0.1885528564453125, 0.246734619140625, 0.3049163818359375, 0.36309814453125, 0.4212799072265625, 0.479461669921875, 0.5376434326171875, 0.5958251953125, 0.6540069580078125, 0.712188720703125, 0.7703704833984375, 0.82855224609375, 0.8867340087890625, 0.944915771484375, 1.0030975341796875, 1.061279296875, 1.1194610595703125, 1.177642822265625, 1.2358245849609375, 1.29400634765625, 1.3521881103515625, 1.410369873046875, 1.4685516357421875, 1.5267333984375, 1.5849151611328125, 1.643096923828125, 1.7012786865234375, 1.75946044921875, 1.8176422119140625, 1.875823974609375, 1.9340057373046875, 1.9921875]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 3.0, 8.0, 8.0, 6.0, 5.0, 23.0, 16.0, 27.0, 21.0, 47.0, 89.0, 129.0, 216.0, 125.0, 70.0, 72.0, 40.0, 35.0, 17.0, 10.0, 8.0, 9.0, 3.0, 7.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.304443359375, -0.2941169738769531, -0.28379058837890625, -0.2734642028808594, -0.2631378173828125, -0.2528114318847656, -0.24248504638671875, -0.23215866088867188, -0.221832275390625, -0.21150588989257812, -0.20117950439453125, -0.19085311889648438, -0.1805267333984375, -0.17020034790039062, -0.15987396240234375, -0.14954757690429688, -0.13922119140625, -0.12889480590820312, -0.11856842041015625, -0.10824203491210938, -0.0979156494140625, -0.08758926391601562, -0.07726287841796875, -0.06693649291992188, -0.056610107421875, -0.046283721923828125, -0.03595733642578125, -0.025630950927734375, -0.0153045654296875, -0.004978179931640625, 0.00534820556640625, 0.015674591064453125, 0.0260009765625, 0.036327362060546875, 0.04665374755859375, 0.056980133056640625, 0.0673065185546875, 0.07763290405273438, 0.08795928955078125, 0.09828567504882812, 0.108612060546875, 0.11893844604492188, 0.12926483154296875, 0.13959121704101562, 0.1499176025390625, 0.16024398803710938, 0.17057037353515625, 0.18089675903320312, 0.19122314453125, 0.20154953002929688, 0.21187591552734375, 0.22220230102539062, 0.2325286865234375, 0.24285507202148438, 0.25318145751953125, 0.2635078430175781, 0.273834228515625, 0.2841606140136719, 0.29448699951171875, 0.3048133850097656, 0.3151397705078125, 0.3254661560058594, 0.33579254150390625, 0.3461189270019531, 0.3564453125]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 5.0, 34.0, 204.0, 427.0, 274.0, 56.0, 14.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.37736177444458, -3.449653148651123, -2.521944761276245, -1.5942363739013672, -0.6665277481079102, 0.2611808776855469, 1.1888890266418457, 2.1165976524353027, 3.0443062782287598, 3.972014904022217, 4.899723052978516, 5.827431678771973, 6.75514030456543, 7.682848930358887, 8.610557556152344, 9.538265228271484, 10.465974807739258, 11.393683433532715, 12.321392059326172, 13.249099731445312, 14.176809310913086, 15.104516983032227, 16.0322265625, 16.95993423461914, 17.88764190673828, 18.815349578857422, 19.743059158325195, 20.670766830444336, 21.59847640991211, 22.52618408203125, 23.45389175415039, 24.381601333618164, 25.309310913085938, 26.237018585205078, 27.16472816467285, 28.092435836791992, 29.020145416259766, 29.947853088378906, 30.875560760498047, 31.80327033996582, 32.730979919433594, 33.658687591552734, 34.586395263671875, 35.51410675048828, 36.44181442260742, 37.36952209472656, 38.2972297668457, 39.224937438964844, 40.15264892578125, 41.08035659790039, 42.00806427001953, 42.93577575683594, 43.86348342895508, 44.79119110107422, 45.71889877319336, 46.6466064453125, 47.57431411743164, 48.50202178955078, 49.42972946166992, 50.35744094848633, 51.28514862060547, 52.21285629272461, 53.14056396484375, 54.068275451660156, 54.9959831237793]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 8.0, 4.0, 8.0, 11.0, 11.0, 10.0, 15.0, 14.0, 11.0, 24.0, 17.0, 27.0, 30.0, 34.0, 40.0, 26.0, 53.0, 31.0, 41.0, 49.0, 54.0, 46.0, 36.0, 38.0, 32.0, 34.0, 38.0, 29.0, 30.0, 28.0, 25.0, 28.0, 22.0, 21.0, 16.0, 15.0, 7.0, 14.0, 4.0, 5.0, 4.0, 4.0, 3.0, 1.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.70509147644043, -8.427559852600098, -8.150028228759766, -7.87249755859375, -7.594965934753418, -7.317434310913086, -7.039903163909912, -6.762372016906738, -6.484840393066406, -6.207308769226074, -5.9297776222229, -5.652246475219727, -5.3747148513793945, -5.0971832275390625, -4.819652080535889, -4.542120933532715, -4.264589309692383, -3.98705792427063, -3.709526538848877, -3.431995153427124, -3.154463768005371, -2.876932382583618, -2.5994009971618652, -2.3218696117401123, -2.0443382263183594, -1.7668068408966064, -1.4892754554748535, -1.2117440700531006, -0.9342126846313477, -0.6566812992095947, -0.3791499137878418, -0.10161852836608887, 0.17591381072998047, 0.4534451961517334, 0.7309765815734863, 1.0085079669952393, 1.2860393524169922, 1.5635707378387451, 1.841102123260498, 2.118633508682251, 2.396164894104004, 2.673696279525757, 2.9512276649475098, 3.2287590503692627, 3.5062904357910156, 3.7838218212127686, 4.0613532066345215, 4.338884353637695, 4.616415977478027, 4.893947601318359, 5.171478748321533, 5.449009895324707, 5.726541519165039, 6.004073143005371, 6.281604290008545, 6.559135437011719, 6.836667060852051, 7.114198684692383, 7.391729831695557, 7.6692609786987305, 7.9467926025390625, 8.224324226379395, 8.501855850219727, 8.779386520385742, 9.056918144226074]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 4.0, 6.0, 14.0, 18.0, 27.0, 28.0, 54.0, 59.0, 76.0, 118.0, 281.0, 536.0, 1331.0, 4135.0, 16444.0, 91558.0, 704441.0, 2459042.0, 780703.0, 109008.0, 19449.0, 4562.0, 1305.0, 511.0, 240.0, 118.0, 68.0, 44.0, 23.0, 27.0, 16.0, 13.0, 9.0, 4.0, 4.0, 4.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.07421875, -3.95623779296875, -3.8382568359375, -3.72027587890625, -3.602294921875, -3.48431396484375, -3.3663330078125, -3.24835205078125, -3.13037109375, -3.01239013671875, -2.8944091796875, -2.77642822265625, -2.658447265625, -2.54046630859375, -2.4224853515625, -2.30450439453125, -2.1865234375, -2.06854248046875, -1.9505615234375, -1.83258056640625, -1.714599609375, -1.59661865234375, -1.4786376953125, -1.36065673828125, -1.24267578125, -1.12469482421875, -1.0067138671875, -0.88873291015625, -0.770751953125, -0.65277099609375, -0.5347900390625, -0.41680908203125, -0.298828125, -0.18084716796875, -0.0628662109375, 0.05511474609375, 0.173095703125, 0.29107666015625, 0.4090576171875, 0.52703857421875, 0.64501953125, 0.76300048828125, 0.8809814453125, 0.99896240234375, 1.116943359375, 1.23492431640625, 1.3529052734375, 1.47088623046875, 1.5888671875, 1.70684814453125, 1.8248291015625, 1.94281005859375, 2.060791015625, 2.17877197265625, 2.2967529296875, 2.41473388671875, 2.53271484375, 2.65069580078125, 2.7686767578125, 2.88665771484375, 3.004638671875, 3.12261962890625, 3.2406005859375, 3.35858154296875, 3.4765625]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 4.0, 10.0, 9.0, 7.0, 18.0, 28.0, 26.0, 36.0, 38.0, 50.0, 49.0, 77.0, 52.0, 56.0, 50.0, 66.0, 52.0, 58.0, 55.0, 52.0, 50.0, 35.0, 40.0, 24.0, 17.0, 10.0, 9.0, 7.0, 6.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.71484375, -2.612274169921875, -2.50970458984375, -2.407135009765625, -2.3045654296875, -2.201995849609375, -2.09942626953125, -1.996856689453125, -1.894287109375, -1.791717529296875, -1.68914794921875, -1.586578369140625, -1.4840087890625, -1.381439208984375, -1.27886962890625, -1.176300048828125, -1.07373046875, -0.971160888671875, -0.86859130859375, -0.766021728515625, -0.6634521484375, -0.560882568359375, -0.45831298828125, -0.355743408203125, -0.253173828125, -0.150604248046875, -0.04803466796875, 0.054534912109375, 0.1571044921875, 0.259674072265625, 0.36224365234375, 0.464813232421875, 0.5673828125, 0.669952392578125, 0.77252197265625, 0.875091552734375, 0.9776611328125, 1.080230712890625, 1.18280029296875, 1.285369873046875, 1.387939453125, 1.490509033203125, 1.59307861328125, 1.695648193359375, 1.7982177734375, 1.900787353515625, 2.00335693359375, 2.105926513671875, 2.20849609375, 2.311065673828125, 2.41363525390625, 2.516204833984375, 2.6187744140625, 2.721343994140625, 2.82391357421875, 2.926483154296875, 3.029052734375, 3.131622314453125, 3.23419189453125, 3.336761474609375, 3.4393310546875, 3.541900634765625, 3.64447021484375, 3.747039794921875, 3.849609375]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 2.0, 11.0, 14.0, 24.0, 61.0, 169.0, 612.0, 2090622.0, 2101885.0, 637.0, 134.0, 53.0, 22.0, 9.0, 7.0, 5.0, 5.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-28.125, -26.953125, -25.78125, -24.609375, -23.4375, -22.265625, -21.09375, -19.921875, -18.75, -17.578125, -16.40625, -15.234375, -14.0625, -12.890625, -11.71875, -10.546875, -9.375, -8.203125, -7.03125, -5.859375, -4.6875, -3.515625, -2.34375, -1.171875, 0.0, 1.171875, 2.34375, 3.515625, 4.6875, 5.859375, 7.03125, 8.203125, 9.375, 10.546875, 11.71875, 12.890625, 14.0625, 15.234375, 16.40625, 17.578125, 18.75, 19.921875, 21.09375, 22.265625, 23.4375, 24.609375, 25.78125, 26.953125, 28.125, 29.296875, 30.46875, 31.640625, 32.8125, 33.984375, 35.15625, 36.328125, 37.5, 38.671875, 39.84375, 41.015625, 42.1875, 43.359375, 44.53125, 45.703125, 46.875]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 7.0, 1.0, 7.0, 8.0, 5.0, 11.0, 13.0, 16.0, 18.0, 43.0, 42.0, 57.0, 88.0, 114.0, 165.0, 271.0, 377.0, 556.0, 627.0, 487.0, 402.0, 227.0, 161.0, 105.0, 91.0, 45.0, 35.0, 27.0, 25.0, 18.0, 9.0, 10.0, 4.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0576171875, -1.0249176025390625, -0.992218017578125, -0.9595184326171875, -0.92681884765625, -0.8941192626953125, -0.861419677734375, -0.8287200927734375, -0.7960205078125, -0.7633209228515625, -0.730621337890625, -0.6979217529296875, -0.66522216796875, -0.6325225830078125, -0.599822998046875, -0.5671234130859375, -0.534423828125, -0.5017242431640625, -0.469024658203125, -0.4363250732421875, -0.40362548828125, -0.3709259033203125, -0.338226318359375, -0.3055267333984375, -0.2728271484375, -0.2401275634765625, -0.207427978515625, -0.1747283935546875, -0.14202880859375, -0.1093292236328125, -0.076629638671875, -0.0439300537109375, -0.01123046875, 0.0214691162109375, 0.054168701171875, 0.0868682861328125, 0.11956787109375, 0.1522674560546875, 0.184967041015625, 0.2176666259765625, 0.2503662109375, 0.2830657958984375, 0.315765380859375, 0.3484649658203125, 0.38116455078125, 0.4138641357421875, 0.446563720703125, 0.4792633056640625, 0.511962890625, 0.5446624755859375, 0.577362060546875, 0.6100616455078125, 0.64276123046875, 0.6754608154296875, 0.708160400390625, 0.7408599853515625, 0.7735595703125, 0.8062591552734375, 0.838958740234375, 0.8716583251953125, 0.90435791015625, 0.9370574951171875, 0.969757080078125, 1.0024566650390625, 1.03515625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 5.0, 14.0, 28.0, 103.0, 193.0, 288.0, 213.0, 98.0, 33.0, 24.0, 7.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.553400754928589, -3.146216869354248, -2.7390329837799072, -2.3318490982055664, -1.924665093421936, -1.5174810886383057, -1.1102972030639648, -0.703113317489624, -0.2959294319152832, 0.11125448346138, 0.5184383988380432, 0.9256223440170288, 1.3328062295913696, 1.739990234375, 2.147174119949341, 2.5543580055236816, 2.9615418910980225, 3.3687257766723633, 3.775909662246704, 4.183093547821045, 4.590277671813965, 4.997461318969727, 5.4046454429626465, 5.811829566955566, 6.219013214111328, 6.626197338104248, 7.03338098526001, 7.44056510925293, 7.847748756408691, 8.254932403564453, 8.662117004394531, 9.069300651550293, 9.476485252380371, 9.883668899536133, 10.290853500366211, 10.698037147521973, 11.105220794677734, 11.512405395507812, 11.919589042663574, 12.326772689819336, 12.733956336975098, 13.14113998413086, 13.548324584960938, 13.9555082321167, 14.362691879272461, 14.769876480102539, 15.1770601272583, 15.584243774414062, 15.99142837524414, 16.39861297607422, 16.805795669555664, 17.212980270385742, 17.62016487121582, 18.027347564697266, 18.434532165527344, 18.841716766357422, 19.248899459838867, 19.656084060668945, 20.06326675415039, 20.47045135498047, 20.877635955810547, 21.284818649291992, 21.69200325012207, 22.099185943603516, 22.506370544433594]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 3.0, 5.0, 6.0, 7.0, 16.0, 14.0, 16.0, 29.0, 31.0, 38.0, 35.0, 44.0, 40.0, 56.0, 42.0, 57.0, 52.0, 62.0, 55.0, 50.0, 48.0, 43.0, 37.0, 49.0, 42.0, 30.0, 21.0, 23.0, 15.0, 9.0, 12.0, 11.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.143270254135132, -3.042898654937744, -2.9425268173217773, -2.8421552181243896, -2.741783380508423, -2.641411781311035, -2.5410399436950684, -2.4406683444976807, -2.340296745300293, -2.2399251461029053, -2.1395533084869385, -2.039181709289551, -1.938809871673584, -1.8384382724761963, -1.738066554069519, -1.6376948356628418, -1.537322998046875, -1.4369512796401978, -1.3365795612335205, -1.2362079620361328, -1.135836124420166, -1.0354645252227783, -0.9350928068161011, -0.8347210884094238, -0.7343493700027466, -0.6339776515960693, -0.5336059331893921, -0.4332342743873596, -0.3328625559806824, -0.23249083757400513, -0.13211917877197266, -0.03174746036529541, 0.06862449645996094, 0.168996199965477, 0.26936790347099304, 0.3697395920753479, 0.47011131048202515, 0.5704830288887024, 0.6708546876907349, 0.7712264060974121, 0.8715981245040894, 0.9719698429107666, 1.0723415613174438, 1.172713279724121, 1.2730848789215088, 1.3734567165374756, 1.4738283157348633, 1.5742000341415405, 1.6745717525482178, 1.774943470954895, 1.8753151893615723, 1.97568678855896, 2.0760586261749268, 2.1764302253723145, 2.2768020629882812, 2.377173662185669, 2.4775452613830566, 2.5779168605804443, 2.678288698196411, 2.778660297393799, 2.8790321350097656, 2.9794037342071533, 3.079775333404541, 3.180147171020508, 3.2805190086364746]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 4.0, 7.0, 16.0, 13.0, 11.0, 22.0, 32.0, 63.0, 70.0, 118.0, 169.0, 282.0, 463.0, 649.0, 1184.0, 1940.0, 3796.0, 7961.0, 19335.0, 52353.0, 142193.0, 291052.0, 292237.0, 144393.0, 53563.0, 19604.0, 8102.0, 3891.0, 2028.0, 1108.0, 687.0, 418.0, 244.0, 193.0, 118.0, 80.0, 51.0, 34.0, 22.0, 15.0, 7.0, 9.0, 6.0, 4.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.87158203125, -0.8451766967773438, -0.8187713623046875, -0.7923660278320312, -0.765960693359375, -0.7395553588867188, -0.7131500244140625, -0.6867446899414062, -0.66033935546875, -0.6339340209960938, -0.6075286865234375, -0.5811233520507812, -0.554718017578125, -0.5283126831054688, -0.5019073486328125, -0.47550201416015625, -0.4490966796875, -0.42269134521484375, -0.3962860107421875, -0.36988067626953125, -0.343475341796875, -0.31707000732421875, -0.2906646728515625, -0.26425933837890625, -0.23785400390625, -0.21144866943359375, -0.1850433349609375, -0.15863800048828125, -0.132232666015625, -0.10582733154296875, -0.0794219970703125, -0.05301666259765625, -0.026611328125, -0.00020599365234375, 0.0261993408203125, 0.05260467529296875, 0.079010009765625, 0.10541534423828125, 0.1318206787109375, 0.15822601318359375, 0.18463134765625, 0.21103668212890625, 0.2374420166015625, 0.26384735107421875, 0.290252685546875, 0.31665802001953125, 0.3430633544921875, 0.36946868896484375, 0.3958740234375, 0.42227935791015625, 0.4486846923828125, 0.47509002685546875, 0.501495361328125, 0.5279006958007812, 0.5543060302734375, 0.5807113647460938, 0.60711669921875, 0.6335220336914062, 0.6599273681640625, 0.6863327026367188, 0.712738037109375, 0.7391433715820312, 0.7655487060546875, 0.7919540405273438, 0.818359375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 6.0, 7.0, 5.0, 12.0, 15.0, 16.0, 15.0, 24.0, 26.0, 35.0, 25.0, 47.0, 44.0, 42.0, 59.0, 53.0, 49.0, 55.0, 49.0, 51.0, 53.0, 42.0, 49.0, 44.0, 35.0, 35.0, 31.0, 24.0, 12.0, 11.0, 12.0, 5.0, 5.0, 7.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.322265625, -2.2398681640625, -2.157470703125, -2.0750732421875, -1.99267578125, -1.9102783203125, -1.827880859375, -1.7454833984375, -1.6630859375, -1.5806884765625, -1.498291015625, -1.4158935546875, -1.33349609375, -1.2510986328125, -1.168701171875, -1.0863037109375, -1.00390625, -0.9215087890625, -0.839111328125, -0.7567138671875, -0.67431640625, -0.5919189453125, -0.509521484375, -0.4271240234375, -0.3447265625, -0.2623291015625, -0.179931640625, -0.0975341796875, -0.01513671875, 0.0672607421875, 0.149658203125, 0.2320556640625, 0.314453125, 0.3968505859375, 0.479248046875, 0.5616455078125, 0.64404296875, 0.7264404296875, 0.808837890625, 0.8912353515625, 0.9736328125, 1.0560302734375, 1.138427734375, 1.2208251953125, 1.30322265625, 1.3856201171875, 1.468017578125, 1.5504150390625, 1.6328125, 1.7152099609375, 1.797607421875, 1.8800048828125, 1.96240234375, 2.0447998046875, 2.127197265625, 2.2095947265625, 2.2919921875, 2.3743896484375, 2.456787109375, 2.5391845703125, 2.62158203125, 2.7039794921875, 2.786376953125, 2.8687744140625, 2.951171875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 5.0, 6.0, 1.0, 7.0, 6.0, 14.0, 20.0, 18.0, 30.0, 45.0, 85.0, 123.0, 231.0, 430.0, 904.0, 2060.0, 5436.0, 16222.0, 51515.0, 161870.0, 338766.0, 295215.0, 119677.0, 36978.0, 11551.0, 4085.0, 1640.0, 733.0, 381.0, 194.0, 109.0, 72.0, 42.0, 30.0, 18.0, 13.0, 5.0, 5.0, 5.0, 6.0, 5.0, 1.0, 4.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.86962890625, -0.8466567993164062, -0.8236846923828125, -0.8007125854492188, -0.777740478515625, -0.7547683715820312, -0.7317962646484375, -0.7088241577148438, -0.68585205078125, -0.6628799438476562, -0.6399078369140625, -0.6169357299804688, -0.593963623046875, -0.5709915161132812, -0.5480194091796875, -0.5250473022460938, -0.5020751953125, -0.47910308837890625, -0.4561309814453125, -0.43315887451171875, -0.410186767578125, -0.38721466064453125, -0.3642425537109375, -0.34127044677734375, -0.31829833984375, -0.29532623291015625, -0.2723541259765625, -0.24938201904296875, -0.226409912109375, -0.20343780517578125, -0.1804656982421875, -0.15749359130859375, -0.134521484375, -0.11154937744140625, -0.0885772705078125, -0.06560516357421875, -0.042633056640625, -0.01966094970703125, 0.0033111572265625, 0.02628326416015625, 0.04925537109375, 0.07222747802734375, 0.0951995849609375, 0.11817169189453125, 0.141143798828125, 0.16411590576171875, 0.1870880126953125, 0.21006011962890625, 0.2330322265625, 0.25600433349609375, 0.2789764404296875, 0.30194854736328125, 0.324920654296875, 0.34789276123046875, 0.3708648681640625, 0.39383697509765625, 0.41680908203125, 0.43978118896484375, 0.4627532958984375, 0.48572540283203125, 0.508697509765625, 0.5316696166992188, 0.5546417236328125, 0.5776138305664062, 0.6005859375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 7.0, 7.0, 6.0, 10.0, 10.0, 9.0, 9.0, 10.0, 13.0, 23.0, 24.0, 26.0, 19.0, 28.0, 22.0, 24.0, 32.0, 42.0, 48.0, 49.0, 27.0, 34.0, 52.0, 41.0, 38.0, 42.0, 39.0, 27.0, 40.0, 27.0, 24.0, 33.0, 24.0, 23.0, 19.0, 16.0, 15.0, 9.0, 7.0, 15.0, 9.0, 7.0, 6.0, 2.0, 3.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.51953125, -3.406707763671875, -3.29388427734375, -3.181060791015625, -3.0682373046875, -2.955413818359375, -2.84259033203125, -2.729766845703125, -2.616943359375, -2.504119873046875, -2.39129638671875, -2.278472900390625, -2.1656494140625, -2.052825927734375, -1.94000244140625, -1.827178955078125, -1.71435546875, -1.601531982421875, -1.48870849609375, -1.375885009765625, -1.2630615234375, -1.150238037109375, -1.03741455078125, -0.924591064453125, -0.811767578125, -0.698944091796875, -0.58612060546875, -0.473297119140625, -0.3604736328125, -0.247650146484375, -0.13482666015625, -0.022003173828125, 0.0908203125, 0.203643798828125, 0.31646728515625, 0.429290771484375, 0.5421142578125, 0.654937744140625, 0.76776123046875, 0.880584716796875, 0.993408203125, 1.106231689453125, 1.21905517578125, 1.331878662109375, 1.4447021484375, 1.557525634765625, 1.67034912109375, 1.783172607421875, 1.89599609375, 2.008819580078125, 2.12164306640625, 2.234466552734375, 2.3472900390625, 2.460113525390625, 2.57293701171875, 2.685760498046875, 2.798583984375, 2.911407470703125, 3.02423095703125, 3.137054443359375, 3.2498779296875, 3.362701416015625, 3.47552490234375, 3.588348388671875, 3.701171875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 5.0, 7.0, 8.0, 9.0, 15.0, 17.0, 34.0, 42.0, 50.0, 114.0, 141.0, 244.0, 410.0, 715.0, 1420.0, 2844.0, 6438.0, 15754.0, 44853.0, 185088.0, 520004.0, 195037.0, 46393.0, 16110.0, 6573.0, 3003.0, 1388.0, 733.0, 410.0, 248.0, 157.0, 79.0, 61.0, 51.0, 25.0, 19.0, 15.0, 10.0, 11.0, 6.0, 7.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.11376953125, -0.10991477966308594, -0.10606002807617188, -0.10220527648925781, -0.09835052490234375, -0.09449577331542969, -0.09064102172851562, -0.08678627014160156, -0.0829315185546875, -0.07907676696777344, -0.07522201538085938, -0.07136726379394531, -0.06751251220703125, -0.06365776062011719, -0.059803009033203125, -0.05594825744628906, -0.052093505859375, -0.04823875427246094, -0.044384002685546875, -0.04052925109863281, -0.03667449951171875, -0.03281974792480469, -0.028964996337890625, -0.025110244750976562, -0.0212554931640625, -0.017400741577148438, -0.013545989990234375, -0.009691238403320312, -0.00583648681640625, -0.0019817352294921875, 0.001873016357421875, 0.0057277679443359375, 0.00958251953125, 0.013437271118164062, 0.017292022705078125, 0.021146774291992188, 0.02500152587890625, 0.028856277465820312, 0.032711029052734375, 0.03656578063964844, 0.0404205322265625, 0.04427528381347656, 0.048130035400390625, 0.05198478698730469, 0.05583953857421875, 0.05969429016113281, 0.06354904174804688, 0.06740379333496094, 0.071258544921875, 0.07511329650878906, 0.07896804809570312, 0.08282279968261719, 0.08667755126953125, 0.09053230285644531, 0.09438705444335938, 0.09824180603027344, 0.1020965576171875, 0.10595130920410156, 0.10980606079101562, 0.11366081237792969, 0.11751556396484375, 0.12137031555175781, 0.12522506713867188, 0.12907981872558594, 0.1329345703125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 6.0, 5.0, 4.0, 11.0, 5.0, 14.0, 16.0, 16.0, 41.0, 44.0, 72.0, 86.0, 104.0, 129.0, 109.0, 110.0, 74.0, 44.0, 29.0, 15.0, 16.0, 8.0, 7.0, 4.0, 13.0, 3.0, 3.0, 4.0, 7.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00011736154556274414, -0.00011422205716371536, -0.00011108256876468658, -0.0001079430803656578, -0.00010480359196662903, -0.00010166410356760025, -9.852461516857147e-05, -9.53851267695427e-05, -9.224563837051392e-05, -8.910614997148514e-05, -8.596666157245636e-05, -8.282717317342758e-05, -7.96876847743988e-05, -7.654819637537003e-05, -7.340870797634125e-05, -7.026921957731247e-05, -6.712973117828369e-05, -6.399024277925491e-05, -6.0850754380226135e-05, -5.771126598119736e-05, -5.457177758216858e-05, -5.14322891831398e-05, -4.829280078411102e-05, -4.5153312385082245e-05, -4.201382398605347e-05, -3.887433558702469e-05, -3.573484718799591e-05, -3.259535878896713e-05, -2.9455870389938354e-05, -2.6316381990909576e-05, -2.31768935918808e-05, -2.003740519285202e-05, -1.6897916793823242e-05, -1.3758428394794464e-05, -1.0618939995765686e-05, -7.479451596736908e-06, -4.33996319770813e-06, -1.2004747986793518e-06, 1.9390136003494263e-06, 5.078501999378204e-06, 8.217990398406982e-06, 1.135747879743576e-05, 1.4496967196464539e-05, 1.7636455595493317e-05, 2.0775943994522095e-05, 2.3915432393550873e-05, 2.705492079257965e-05, 3.019440919160843e-05, 3.333389759063721e-05, 3.6473385989665985e-05, 3.961287438869476e-05, 4.275236278772354e-05, 4.589185118675232e-05, 4.90313395857811e-05, 5.2170827984809875e-05, 5.5310316383838654e-05, 5.844980478286743e-05, 6.158929318189621e-05, 6.472878158092499e-05, 6.786826997995377e-05, 7.100775837898254e-05, 7.414724677801132e-05, 7.72867351770401e-05, 8.042622357606888e-05, 8.356571197509766e-05]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 4.0, 3.0, 4.0, 2.0, 4.0, 10.0, 9.0, 10.0, 20.0, 18.0, 21.0, 39.0, 43.0, 94.0, 148.0, 281.0, 647.0, 1826.0, 6149.0, 38443.0, 799355.0, 182994.0, 13325.0, 3094.0, 1087.0, 429.0, 207.0, 101.0, 50.0, 37.0, 28.0, 23.0, 10.0, 8.0, 4.0, 8.0, 4.0, 4.0, 5.0, 3.0, 2.0, 0.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.31689453125, -0.30504608154296875, -0.2931976318359375, -0.28134918212890625, -0.269500732421875, -0.25765228271484375, -0.2458038330078125, -0.23395538330078125, -0.22210693359375, -0.21025848388671875, -0.1984100341796875, -0.18656158447265625, -0.174713134765625, -0.16286468505859375, -0.1510162353515625, -0.13916778564453125, -0.1273193359375, -0.11547088623046875, -0.1036224365234375, -0.09177398681640625, -0.079925537109375, -0.06807708740234375, -0.0562286376953125, -0.04438018798828125, -0.03253173828125, -0.02068328857421875, -0.0088348388671875, 0.00301361083984375, 0.014862060546875, 0.02671051025390625, 0.0385589599609375, 0.05040740966796875, 0.062255859375, 0.07410430908203125, 0.0859527587890625, 0.09780120849609375, 0.109649658203125, 0.12149810791015625, 0.1333465576171875, 0.14519500732421875, 0.15704345703125, 0.16889190673828125, 0.1807403564453125, 0.19258880615234375, 0.204437255859375, 0.21628570556640625, 0.2281341552734375, 0.23998260498046875, 0.2518310546875, 0.26367950439453125, 0.2755279541015625, 0.28737640380859375, 0.299224853515625, 0.31107330322265625, 0.3229217529296875, 0.33477020263671875, 0.34661865234375, 0.35846710205078125, 0.3703155517578125, 0.38216400146484375, 0.394012451171875, 0.40586090087890625, 0.4177093505859375, 0.42955780029296875, 0.44140625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 6.0, 7.0, 6.0, 4.0, 6.0, 11.0, 3.0, 11.0, 13.0, 20.0, 16.0, 35.0, 37.0, 64.0, 82.0, 110.0, 136.0, 103.0, 78.0, 52.0, 52.0, 20.0, 28.0, 23.0, 9.0, 14.0, 10.0, 6.0, 6.0, 3.0, 10.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.05810546875, -0.056204795837402344, -0.05430412292480469, -0.05240345001220703, -0.050502777099609375, -0.04860210418701172, -0.04670143127441406, -0.044800758361816406, -0.04290008544921875, -0.040999412536621094, -0.03909873962402344, -0.03719806671142578, -0.035297393798828125, -0.03339672088623047, -0.03149604797363281, -0.029595375061035156, -0.0276947021484375, -0.025794029235839844, -0.023893356323242188, -0.02199268341064453, -0.020092010498046875, -0.01819133758544922, -0.016290664672851562, -0.014389991760253906, -0.01248931884765625, -0.010588645935058594, -0.008687973022460938, -0.006787300109863281, -0.004886627197265625, -0.0029859542846679688, -0.0010852813720703125, 0.0008153915405273438, 0.002716064453125, 0.004616737365722656, 0.0065174102783203125, 0.008418083190917969, 0.010318756103515625, 0.012219429016113281, 0.014120101928710938, 0.016020774841308594, 0.01792144775390625, 0.019822120666503906, 0.021722793579101562, 0.02362346649169922, 0.025524139404296875, 0.02742481231689453, 0.029325485229492188, 0.031226158142089844, 0.0331268310546875, 0.035027503967285156, 0.03692817687988281, 0.03882884979248047, 0.040729522705078125, 0.04263019561767578, 0.04453086853027344, 0.046431541442871094, 0.04833221435546875, 0.050232887268066406, 0.05213356018066406, 0.05403423309326172, 0.055934906005859375, 0.05783557891845703, 0.05973625183105469, 0.061636924743652344, 0.06353759765625]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 4.0, 17.0, 59.0, 192.0, 311.0, 281.0, 90.0, 30.0, 14.0, 8.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.294938802719116, -2.0025463104248047, -1.7101539373397827, -1.4177615642547607, -1.1253690719604492, -0.8329765796661377, -0.5405842065811157, -0.24819183349609375, 0.04420065879821777, 0.3365930914878845, 0.6289855241775513, 0.921377956867218, 1.2137703895568848, 1.5061628818511963, 1.7985552549362183, 2.0909476280212402, 2.3833401203155518, 2.6757326126098633, 2.9681248664855957, 3.2605173587799072, 3.5529098510742188, 3.8453023433685303, 4.137694835662842, 4.430087089538574, 4.722479820251465, 5.014872074127197, 5.307264804840088, 5.59965705871582, 5.892049789428711, 6.184442043304443, 6.476834297180176, 6.769227027893066, 7.061618804931641, 7.354011058807373, 7.646403789520264, 7.938796043395996, 8.231188774108887, 8.523580551147461, 8.815973281860352, 9.108366012573242, 9.400758743286133, 9.693151473999023, 9.985543251037598, 10.277935981750488, 10.570328712463379, 10.862720489501953, 11.155113220214844, 11.447505950927734, 11.739897727966309, 12.0322904586792, 12.324682235717773, 12.617074966430664, 12.909467697143555, 13.201860427856445, 13.49425220489502, 13.78664493560791, 14.079036712646484, 14.371429443359375, 14.66382122039795, 14.95621395111084, 15.24860668182373, 15.540998458862305, 15.833391189575195, 16.125783920288086, 16.418176651000977]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 6.0, 5.0, 7.0, 14.0, 19.0, 20.0, 15.0, 22.0, 38.0, 37.0, 58.0, 43.0, 44.0, 50.0, 64.0, 46.0, 71.0, 68.0, 61.0, 58.0, 45.0, 34.0, 37.0, 37.0, 29.0, 15.0, 21.0, 12.0, 8.0, 11.0, 5.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.471536636352539, -2.3857316970825195, -2.299926519393921, -2.2141215801239014, -2.128316640853882, -2.042511463165283, -1.9567065238952637, -1.8709015846252441, -1.785096526145935, -1.699291467666626, -1.6134865283966064, -1.5276814699172974, -1.4418764114379883, -1.3560714721679688, -1.2702664136886597, -1.1844613552093506, -1.098656415939331, -1.012851357460022, -0.9270464181900024, -0.8412413597106934, -0.755436360836029, -0.6696313619613647, -0.5838263034820557, -0.49802130460739136, -0.41221630573272705, -0.32641130685806274, -0.24060627818107605, -0.15480124950408936, -0.06899625062942505, 0.016808748245239258, 0.10261380672454834, 0.18841880559921265, 0.27422404289245605, 0.36002904176712036, 0.44583407044410706, 0.5316390991210938, 0.6174440979957581, 0.7032490968704224, 0.7890541553497314, 0.8748591542243958, 0.9606641530990601, 1.0464692115783691, 1.1322741508483887, 1.2180792093276978, 1.3038842678070068, 1.3896892070770264, 1.4754942655563354, 1.5612993240356445, 1.647104263305664, 1.7329093217849731, 1.8187142610549927, 1.9045193195343018, 1.9903242588043213, 2.07612943649292, 2.1619343757629395, 2.247739315032959, 2.3335442543029785, 2.419349193572998, 2.5051543712615967, 2.590959310531616, 2.6767642498016357, 2.7625694274902344, 2.848374366760254, 2.9341793060302734, 3.019984483718872]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 2.0, 8.0, 8.0, 12.0, 18.0, 29.0, 43.0, 65.0, 97.0, 162.0, 267.0, 436.0, 841.0, 1612.0, 2903.0, 5764.0, 12090.0, 26409.0, 64647.0, 181539.0, 445215.0, 187727.0, 66555.0, 27205.0, 12460.0, 5908.0, 2929.0, 1571.0, 848.0, 441.0, 306.0, 162.0, 83.0, 58.0, 51.0, 29.0, 19.0, 14.0, 8.0, 3.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.203125, -1.1609344482421875, -1.118743896484375, -1.0765533447265625, -1.03436279296875, -0.9921722412109375, -0.949981689453125, -0.9077911376953125, -0.8656005859375, -0.8234100341796875, -0.781219482421875, -0.7390289306640625, -0.69683837890625, -0.6546478271484375, -0.612457275390625, -0.5702667236328125, -0.528076171875, -0.4858856201171875, -0.443695068359375, -0.4015045166015625, -0.35931396484375, -0.3171234130859375, -0.274932861328125, -0.2327423095703125, -0.1905517578125, -0.1483612060546875, -0.106170654296875, -0.0639801025390625, -0.02178955078125, 0.0204010009765625, 0.062591552734375, 0.1047821044921875, 0.14697265625, 0.1891632080078125, 0.231353759765625, 0.2735443115234375, 0.31573486328125, 0.3579254150390625, 0.400115966796875, 0.4423065185546875, 0.4844970703125, 0.5266876220703125, 0.568878173828125, 0.6110687255859375, 0.65325927734375, 0.6954498291015625, 0.737640380859375, 0.7798309326171875, 0.822021484375, 0.8642120361328125, 0.906402587890625, 0.9485931396484375, 0.99078369140625, 1.0329742431640625, 1.075164794921875, 1.1173553466796875, 1.1595458984375, 1.2017364501953125, 1.243927001953125, 1.2861175537109375, 1.32830810546875, 1.3704986572265625, 1.412689208984375, 1.4548797607421875, 1.4970703125]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 8.0, 7.0, 9.0, 12.0, 12.0, 10.0, 19.0, 14.0, 27.0, 19.0, 19.0, 39.0, 30.0, 37.0, 42.0, 56.0, 38.0, 38.0, 56.0, 47.0, 47.0, 41.0, 50.0, 45.0, 33.0, 31.0, 39.0, 33.0, 20.0, 24.0, 22.0, 13.0, 14.0, 13.0, 7.0, 7.0, 8.0, 8.0, 5.0, 0.0, 6.0, 0.0, 2.0, 1.0], "bins": [-4.671875, -4.55169677734375, -4.4315185546875, -4.31134033203125, -4.191162109375, -4.07098388671875, -3.9508056640625, -3.83062744140625, -3.71044921875, -3.59027099609375, -3.4700927734375, -3.34991455078125, -3.229736328125, -3.10955810546875, -2.9893798828125, -2.86920166015625, -2.7490234375, -2.62884521484375, -2.5086669921875, -2.38848876953125, -2.268310546875, -2.14813232421875, -2.0279541015625, -1.90777587890625, -1.78759765625, -1.66741943359375, -1.5472412109375, -1.42706298828125, -1.306884765625, -1.18670654296875, -1.0665283203125, -0.94635009765625, -0.826171875, -0.70599365234375, -0.5858154296875, -0.46563720703125, -0.345458984375, -0.22528076171875, -0.1051025390625, 0.01507568359375, 0.13525390625, 0.25543212890625, 0.3756103515625, 0.49578857421875, 0.615966796875, 0.73614501953125, 0.8563232421875, 0.97650146484375, 1.0966796875, 1.21685791015625, 1.3370361328125, 1.45721435546875, 1.577392578125, 1.69757080078125, 1.8177490234375, 1.93792724609375, 2.05810546875, 2.17828369140625, 2.2984619140625, 2.41864013671875, 2.538818359375, 2.65899658203125, 2.7791748046875, 2.89935302734375, 3.01953125]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 4.0, 4.0, 4.0, 8.0, 6.0, 11.0, 10.0, 13.0, 23.0, 19.0, 24.0, 27.0, 42.0, 38.0, 57.0, 75.0, 84.0, 102.0, 196.0, 489.0, 9610.0, 1025015.0, 11389.0, 539.0, 187.0, 108.0, 86.0, 66.0, 66.0, 54.0, 35.0, 38.0, 19.0, 26.0, 10.0, 17.0, 12.0, 6.0, 7.0, 8.0, 7.0, 2.0, 5.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.328125, -9.9659423828125, -9.603759765625, -9.2415771484375, -8.87939453125, -8.5172119140625, -8.155029296875, -7.7928466796875, -7.4306640625, -7.0684814453125, -6.706298828125, -6.3441162109375, -5.98193359375, -5.6197509765625, -5.257568359375, -4.8953857421875, -4.533203125, -4.1710205078125, -3.808837890625, -3.4466552734375, -3.08447265625, -2.7222900390625, -2.360107421875, -1.9979248046875, -1.6357421875, -1.2735595703125, -0.911376953125, -0.5491943359375, -0.18701171875, 0.1751708984375, 0.537353515625, 0.8995361328125, 1.26171875, 1.6239013671875, 1.986083984375, 2.3482666015625, 2.71044921875, 3.0726318359375, 3.434814453125, 3.7969970703125, 4.1591796875, 4.5213623046875, 4.883544921875, 5.2457275390625, 5.60791015625, 5.9700927734375, 6.332275390625, 6.6944580078125, 7.056640625, 7.4188232421875, 7.781005859375, 8.1431884765625, 8.50537109375, 8.8675537109375, 9.229736328125, 9.5919189453125, 9.9541015625, 10.3162841796875, 10.678466796875, 11.0406494140625, 11.40283203125, 11.7650146484375, 12.127197265625, 12.4893798828125, 12.8515625]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 5.0, 5.0, 4.0, 10.0, 13.0, 10.0, 14.0, 21.0, 20.0, 16.0, 23.0, 33.0, 34.0, 37.0, 37.0, 50.0, 60.0, 52.0, 58.0, 50.0, 54.0, 51.0, 41.0, 43.0, 30.0, 34.0, 38.0, 36.0, 19.0, 20.0, 15.0, 18.0, 8.0, 12.0, 2.0, 5.0, 9.0, 4.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.46484375, -4.32501220703125, -4.1851806640625, -4.04534912109375, -3.905517578125, -3.76568603515625, -3.6258544921875, -3.48602294921875, -3.34619140625, -3.20635986328125, -3.0665283203125, -2.92669677734375, -2.786865234375, -2.64703369140625, -2.5072021484375, -2.36737060546875, -2.2275390625, -2.08770751953125, -1.9478759765625, -1.80804443359375, -1.668212890625, -1.52838134765625, -1.3885498046875, -1.24871826171875, -1.10888671875, -0.96905517578125, -0.8292236328125, -0.68939208984375, -0.549560546875, -0.40972900390625, -0.2698974609375, -0.13006591796875, 0.009765625, 0.14959716796875, 0.2894287109375, 0.42926025390625, 0.569091796875, 0.70892333984375, 0.8487548828125, 0.98858642578125, 1.12841796875, 1.26824951171875, 1.4080810546875, 1.54791259765625, 1.687744140625, 1.82757568359375, 1.9674072265625, 2.10723876953125, 2.2470703125, 2.38690185546875, 2.5267333984375, 2.66656494140625, 2.806396484375, 2.94622802734375, 3.0860595703125, 3.22589111328125, 3.36572265625, 3.50555419921875, 3.6453857421875, 3.78521728515625, 3.925048828125, 4.06488037109375, 4.2047119140625, 4.34454345703125, 4.484375]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 5.0, 5.0, 7.0, 9.0, 12.0, 15.0, 25.0, 29.0, 53.0, 81.0, 249.0, 2563.0, 898443.0, 145313.0, 1307.0, 185.0, 91.0, 50.0, 22.0, 40.0, 14.0, 10.0, 8.0, 3.0, 5.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.41015625, -3.2833251953125, -3.156494140625, -3.0296630859375, -2.90283203125, -2.7760009765625, -2.649169921875, -2.5223388671875, -2.3955078125, -2.2686767578125, -2.141845703125, -2.0150146484375, -1.88818359375, -1.7613525390625, -1.634521484375, -1.5076904296875, -1.380859375, -1.2540283203125, -1.127197265625, -1.0003662109375, -0.87353515625, -0.7467041015625, -0.619873046875, -0.4930419921875, -0.3662109375, -0.2393798828125, -0.112548828125, 0.0142822265625, 0.14111328125, 0.2679443359375, 0.394775390625, 0.5216064453125, 0.6484375, 0.7752685546875, 0.902099609375, 1.0289306640625, 1.15576171875, 1.2825927734375, 1.409423828125, 1.5362548828125, 1.6630859375, 1.7899169921875, 1.916748046875, 2.0435791015625, 2.17041015625, 2.2972412109375, 2.424072265625, 2.5509033203125, 2.677734375, 2.8045654296875, 2.931396484375, 3.0582275390625, 3.18505859375, 3.3118896484375, 3.438720703125, 3.5655517578125, 3.6923828125, 3.8192138671875, 3.946044921875, 4.0728759765625, 4.19970703125, 4.3265380859375, 4.453369140625, 4.5802001953125, 4.70703125]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 5.0, 6.0, 2.0, 6.0, 15.0, 17.0, 26.0, 38.0, 44.0, 89.0, 148.0, 197.0, 152.0, 85.0, 49.0, 36.0, 33.0, 8.0, 12.0, 9.0, 9.0, 4.0, 1.0, 3.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011819601058959961, -0.0001129666343331337, -0.00010773725807666779, -0.00010250788182020187, -9.727850556373596e-05, -9.204912930727005e-05, -8.681975305080414e-05, -8.159037679433823e-05, -7.636100053787231e-05, -7.11316242814064e-05, -6.590224802494049e-05, -6.067287176847458e-05, -5.544349551200867e-05, -5.0214119255542755e-05, -4.498474299907684e-05, -3.975536674261093e-05, -3.452599048614502e-05, -2.9296614229679108e-05, -2.4067237973213196e-05, -1.8837861716747284e-05, -1.3608485460281372e-05, -8.37910920381546e-06, -3.1497329473495483e-06, 2.0796433091163635e-06, 7.309019565582275e-06, 1.2538395822048187e-05, 1.77677720785141e-05, 2.299714833498001e-05, 2.8226524591445923e-05, 3.3455900847911835e-05, 3.8685277104377747e-05, 4.391465336084366e-05, 4.914402961730957e-05, 5.437340587377548e-05, 5.9602782130241394e-05, 6.48321583867073e-05, 7.006153464317322e-05, 7.529091089963913e-05, 8.052028715610504e-05, 8.574966341257095e-05, 9.097903966903687e-05, 9.620841592550278e-05, 0.00010143779218196869, 0.0001066671684384346, 0.00011189654469490051, 0.00011712592095136642, 0.00012235529720783234, 0.00012758467346429825, 0.00013281404972076416, 0.00013804342597723007, 0.00014327280223369598, 0.0001485021784901619, 0.0001537315547466278, 0.00015896093100309372, 0.00016419030725955963, 0.00016941968351602554, 0.00017464905977249146, 0.00017987843602895737, 0.00018510781228542328, 0.0001903371885418892, 0.0001955665647983551, 0.00020079594105482101, 0.00020602531731128693, 0.00021125469356775284, 0.00021648406982421875]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 3.0, 5.0, 5.0, 5.0, 6.0, 5.0, 14.0, 13.0, 19.0, 25.0, 40.0, 50.0, 91.0, 255.0, 1350.0, 42319.0, 989789.0, 13329.0, 809.0, 172.0, 67.0, 52.0, 33.0, 21.0, 24.0, 14.0, 8.0, 12.0, 3.0, 4.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.455078125, -2.368560791015625, -2.28204345703125, -2.195526123046875, -2.1090087890625, -2.022491455078125, -1.93597412109375, -1.849456787109375, -1.762939453125, -1.676422119140625, -1.58990478515625, -1.503387451171875, -1.4168701171875, -1.330352783203125, -1.24383544921875, -1.157318115234375, -1.07080078125, -0.984283447265625, -0.89776611328125, -0.811248779296875, -0.7247314453125, -0.638214111328125, -0.55169677734375, -0.465179443359375, -0.378662109375, -0.292144775390625, -0.20562744140625, -0.119110107421875, -0.0325927734375, 0.053924560546875, 0.14044189453125, 0.226959228515625, 0.3134765625, 0.399993896484375, 0.48651123046875, 0.573028564453125, 0.6595458984375, 0.746063232421875, 0.83258056640625, 0.919097900390625, 1.005615234375, 1.092132568359375, 1.17864990234375, 1.265167236328125, 1.3516845703125, 1.438201904296875, 1.52471923828125, 1.611236572265625, 1.69775390625, 1.784271240234375, 1.87078857421875, 1.957305908203125, 2.0438232421875, 2.130340576171875, 2.21685791015625, 2.303375244140625, 2.389892578125, 2.476409912109375, 2.56292724609375, 2.649444580078125, 2.7359619140625, 2.822479248046875, 2.90899658203125, 2.995513916015625, 3.08203125]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 2.0, 3.0, 4.0, 8.0, 2.0, 8.0, 16.0, 24.0, 21.0, 41.0, 53.0, 86.0, 119.0, 199.0, 125.0, 76.0, 59.0, 48.0, 29.0, 16.0, 15.0, 11.0, 12.0, 8.0, 6.0, 7.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.387939453125, -0.3763618469238281, -0.36478424072265625, -0.3532066345214844, -0.3416290283203125, -0.3300514221191406, -0.31847381591796875, -0.3068962097167969, -0.295318603515625, -0.2837409973144531, -0.27216339111328125, -0.2605857849121094, -0.2490081787109375, -0.23743057250976562, -0.22585296630859375, -0.21427536010742188, -0.20269775390625, -0.19112014770507812, -0.17954254150390625, -0.16796493530273438, -0.1563873291015625, -0.14480972290039062, -0.13323211669921875, -0.12165451049804688, -0.110076904296875, -0.09849929809570312, -0.08692169189453125, -0.07534408569335938, -0.0637664794921875, -0.052188873291015625, -0.04061126708984375, -0.029033660888671875, -0.0174560546875, -0.005878448486328125, 0.00569915771484375, 0.017276763916015625, 0.0288543701171875, 0.040431976318359375, 0.05200958251953125, 0.06358718872070312, 0.075164794921875, 0.08674240112304688, 0.09832000732421875, 0.10989761352539062, 0.1214752197265625, 0.13305282592773438, 0.14463043212890625, 0.15620803833007812, 0.16778564453125, 0.17936325073242188, 0.19094085693359375, 0.20251846313476562, 0.2140960693359375, 0.22567367553710938, 0.23725128173828125, 0.24882888793945312, 0.260406494140625, 0.2719841003417969, 0.28356170654296875, 0.2951393127441406, 0.3067169189453125, 0.3182945251464844, 0.32987213134765625, 0.3414497375488281, 0.35302734375]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 4.0, 6.0, 7.0, 12.0, 81.0, 226.0, 306.0, 231.0, 95.0, 29.0, 14.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.233728885650635, -3.685295581817627, -3.13686203956604, -2.588428497314453, -2.0399951934814453, -1.4915618896484375, -0.9431283473968506, -0.39469480514526367, 0.15373849868774414, 0.7021719217300415, 1.2506053447723389, 1.7990387678146362, 2.3474721908569336, 2.8959054946899414, 3.4443390369415283, 3.9927725791931152, 4.541205883026123, 5.089639186859131, 5.638072967529297, 6.186506271362305, 6.7349395751953125, 7.28337287902832, 7.831806182861328, 8.380239486694336, 8.928672790527344, 9.477106094360352, 10.02553939819336, 10.573972702026367, 11.122406005859375, 11.670839309692383, 12.219273567199707, 12.767706871032715, 13.316139221191406, 13.864572525024414, 14.413005828857422, 14.96143913269043, 15.509872436523438, 16.058305740356445, 16.606739044189453, 17.155174255371094, 17.70360565185547, 18.252038955688477, 18.800472259521484, 19.348905563354492, 19.8973388671875, 20.445772171020508, 20.994205474853516, 21.542640686035156, 22.091073989868164, 22.639507293701172, 23.18794059753418, 23.736373901367188, 24.284807205200195, 24.833240509033203, 25.38167381286621, 25.93010711669922, 26.47854232788086, 27.026975631713867, 27.575408935546875, 28.123842239379883, 28.67227554321289, 29.2207088470459, 29.769142150878906, 30.317577362060547, 30.866008758544922]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 4.0, 3.0, 3.0, 5.0, 4.0, 10.0, 5.0, 9.0, 9.0, 10.0, 13.0, 7.0, 20.0, 27.0, 18.0, 23.0, 29.0, 34.0, 33.0, 38.0, 40.0, 36.0, 30.0, 34.0, 38.0, 55.0, 37.0, 36.0, 44.0, 31.0, 34.0, 40.0, 27.0, 24.0, 23.0, 20.0, 17.0, 24.0, 20.0, 13.0, 16.0, 12.0, 5.0, 7.0, 9.0, 9.0, 5.0, 8.0, 2.0, 4.0, 3.0, 3.0, 1.0, 3.0], "bins": [-5.967244625091553, -5.800583839416504, -5.633923530578613, -5.4672627449035645, -5.300602436065674, -5.133941650390625, -4.967281341552734, -4.8006205558776855, -4.633959770202637, -4.467298984527588, -4.300638675689697, -4.133977890014648, -3.9673173427581787, -3.800656795501709, -3.6339962482452393, -3.4673357009887695, -3.3006751537323, -3.13401460647583, -2.9673540592193604, -2.8006935119628906, -2.634032726287842, -2.467372179031372, -2.3007116317749023, -2.1340508460998535, -1.9673904180526733, -1.8007298707962036, -1.6340692043304443, -1.4674086570739746, -1.3007481098175049, -1.1340874433517456, -0.9674268960952759, -0.8007662296295166, -0.6341056823730469, -0.4674450755119324, -0.30078449845314026, -0.13412392139434814, 0.03253668546676636, 0.19919729232788086, 0.3658578395843506, 0.5325185060501099, 0.6991790533065796, 0.8658396601676941, 1.0325002670288086, 1.1991608142852783, 1.365821361541748, 1.5324820280075073, 1.699142575263977, 1.8658032417297363, 2.032463788986206, 2.199124336242676, 2.3657848834991455, 2.5324454307556152, 2.699106216430664, 2.865766763687134, 3.0324273109436035, 3.1990880966186523, 3.365748405456543, 3.5324089527130127, 3.6990694999694824, 3.8657302856445312, 4.032390594482422, 4.199051380157471, 4.3657121658325195, 4.53237247467041, 4.699033260345459]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 5.0, 4.0, 7.0, 6.0, 16.0, 17.0, 28.0, 19.0, 39.0, 50.0, 76.0, 58.0, 111.0, 156.0, 284.0, 510.0, 1038.0, 2408.0, 6598.0, 23983.0, 126021.0, 798007.0, 2269360.0, 795141.0, 131666.0, 26974.0, 7144.0, 2432.0, 937.0, 437.0, 250.0, 158.0, 84.0, 54.0, 49.0, 27.0, 32.0, 17.0, 17.0, 12.0, 13.0, 14.0, 6.0, 4.0, 3.0, 4.0, 5.0, 2.0, 3.0, 0.0, 2.0, 1.0], "bins": [-3.455078125, -3.354949951171875, -3.25482177734375, -3.154693603515625, -3.0545654296875, -2.954437255859375, -2.85430908203125, -2.754180908203125, -2.654052734375, -2.553924560546875, -2.45379638671875, -2.353668212890625, -2.2535400390625, -2.153411865234375, -2.05328369140625, -1.953155517578125, -1.85302734375, -1.752899169921875, -1.65277099609375, -1.552642822265625, -1.4525146484375, -1.352386474609375, -1.25225830078125, -1.152130126953125, -1.052001953125, -0.951873779296875, -0.85174560546875, -0.751617431640625, -0.6514892578125, -0.551361083984375, -0.45123291015625, -0.351104736328125, -0.2509765625, -0.150848388671875, -0.05072021484375, 0.049407958984375, 0.1495361328125, 0.249664306640625, 0.34979248046875, 0.449920654296875, 0.550048828125, 0.650177001953125, 0.75030517578125, 0.850433349609375, 0.9505615234375, 1.050689697265625, 1.15081787109375, 1.250946044921875, 1.35107421875, 1.451202392578125, 1.55133056640625, 1.651458740234375, 1.7515869140625, 1.851715087890625, 1.95184326171875, 2.051971435546875, 2.152099609375, 2.252227783203125, 2.35235595703125, 2.452484130859375, 2.5526123046875, 2.652740478515625, 2.75286865234375, 2.852996826171875, 2.953125]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 3.0, 6.0, 5.0, 8.0, 14.0, 19.0, 22.0, 29.0, 35.0, 49.0, 47.0, 74.0, 68.0, 64.0, 87.0, 75.0, 61.0, 66.0, 45.0, 48.0, 50.0, 30.0, 24.0, 24.0, 15.0, 11.0, 17.0, 8.0, 4.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.283203125, -2.186981201171875, -2.09075927734375, -1.994537353515625, -1.8983154296875, -1.802093505859375, -1.70587158203125, -1.609649658203125, -1.513427734375, -1.417205810546875, -1.32098388671875, -1.224761962890625, -1.1285400390625, -1.032318115234375, -0.93609619140625, -0.839874267578125, -0.74365234375, -0.647430419921875, -0.55120849609375, -0.454986572265625, -0.3587646484375, -0.262542724609375, -0.16632080078125, -0.070098876953125, 0.026123046875, 0.122344970703125, 0.21856689453125, 0.314788818359375, 0.4110107421875, 0.507232666015625, 0.60345458984375, 0.699676513671875, 0.7958984375, 0.892120361328125, 0.98834228515625, 1.084564208984375, 1.1807861328125, 1.277008056640625, 1.37322998046875, 1.469451904296875, 1.565673828125, 1.661895751953125, 1.75811767578125, 1.854339599609375, 1.9505615234375, 2.046783447265625, 2.14300537109375, 2.239227294921875, 2.33544921875, 2.431671142578125, 2.52789306640625, 2.624114990234375, 2.7203369140625, 2.816558837890625, 2.91278076171875, 3.009002685546875, 3.105224609375, 3.201446533203125, 3.29766845703125, 3.393890380859375, 3.4901123046875, 3.586334228515625, 3.68255615234375, 3.778778076171875, 3.875]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 8.0, 0.0, 5.0, 8.0, 30.0, 38.0, 86.0, 144.0, 327.0, 900.0, 10572.0, 4126105.0, 53915.0, 1292.0, 429.0, 224.0, 80.0, 50.0, 19.0, 13.0, 7.0, 10.0, 8.0, 1.0, 3.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.28125, -17.7955322265625, -17.309814453125, -16.8240966796875, -16.33837890625, -15.8526611328125, -15.366943359375, -14.8812255859375, -14.3955078125, -13.9097900390625, -13.424072265625, -12.9383544921875, -12.45263671875, -11.9669189453125, -11.481201171875, -10.9954833984375, -10.509765625, -10.0240478515625, -9.538330078125, -9.0526123046875, -8.56689453125, -8.0811767578125, -7.595458984375, -7.1097412109375, -6.6240234375, -6.1383056640625, -5.652587890625, -5.1668701171875, -4.68115234375, -4.1954345703125, -3.709716796875, -3.2239990234375, -2.73828125, -2.2525634765625, -1.766845703125, -1.2811279296875, -0.79541015625, -0.3096923828125, 0.176025390625, 0.6617431640625, 1.1474609375, 1.6331787109375, 2.118896484375, 2.6046142578125, 3.09033203125, 3.5760498046875, 4.061767578125, 4.5474853515625, 5.033203125, 5.5189208984375, 6.004638671875, 6.4903564453125, 6.97607421875, 7.4617919921875, 7.947509765625, 8.4332275390625, 8.9189453125, 9.4046630859375, 9.890380859375, 10.3760986328125, 10.86181640625, 11.3475341796875, 11.833251953125, 12.3189697265625, 12.8046875]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 5.0, 6.0, 6.0, 14.0, 13.0, 21.0, 27.0, 45.0, 62.0, 100.0, 122.0, 175.0, 259.0, 347.0, 458.0, 548.0, 512.0, 406.0, 265.0, 204.0, 148.0, 89.0, 77.0, 55.0, 40.0, 26.0, 11.0, 4.0, 8.0, 6.0, 3.0, 3.0, 5.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.205078125, -1.1721267700195312, -1.1391754150390625, -1.1062240600585938, -1.073272705078125, -1.0403213500976562, -1.0073699951171875, -0.9744186401367188, -0.94146728515625, -0.9085159301757812, -0.8755645751953125, -0.8426132202148438, -0.809661865234375, -0.7767105102539062, -0.7437591552734375, -0.7108078002929688, -0.6778564453125, -0.6449050903320312, -0.6119537353515625, -0.5790023803710938, -0.546051025390625, -0.5130996704101562, -0.4801483154296875, -0.44719696044921875, -0.41424560546875, -0.38129425048828125, -0.3483428955078125, -0.31539154052734375, -0.282440185546875, -0.24948883056640625, -0.2165374755859375, -0.18358612060546875, -0.150634765625, -0.11768341064453125, -0.0847320556640625, -0.05178070068359375, -0.018829345703125, 0.01412200927734375, 0.0470733642578125, 0.08002471923828125, 0.11297607421875, 0.14592742919921875, 0.1788787841796875, 0.21183013916015625, 0.244781494140625, 0.27773284912109375, 0.3106842041015625, 0.34363555908203125, 0.3765869140625, 0.40953826904296875, 0.4424896240234375, 0.47544097900390625, 0.508392333984375, 0.5413436889648438, 0.5742950439453125, 0.6072463989257812, 0.64019775390625, 0.6731491088867188, 0.7061004638671875, 0.7390518188476562, 0.772003173828125, 0.8049545288085938, 0.8379058837890625, 0.8708572387695312, 0.90380859375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 7.0, 14.0, 30.0, 59.0, 82.0, 117.0, 147.0, 165.0, 131.0, 93.0, 65.0, 41.0, 19.0, 10.0, 8.0, 10.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9344077110290527, -3.730466604232788, -3.5265254974365234, -3.3225841522216797, -3.118643045425415, -2.9147019386291504, -2.7107605934143066, -2.506819486618042, -2.3028783798217773, -2.0989372730255127, -1.8949960470199585, -1.6910548210144043, -1.4871137142181396, -1.283172607421875, -1.0792313814163208, -0.8752901554107666, -0.671349048614502, -0.46740788221359253, -0.2634667158126831, -0.05952554941177368, 0.14441561698913574, 0.3483567237854004, 0.5522979497909546, 0.7562391757965088, 0.9601802825927734, 1.164121389389038, 1.3680626153945923, 1.5720038414001465, 1.7759449481964111, 1.9798860549926758, 2.1838274002075195, 2.387768507003784, 2.591710090637207, 2.7956511974334717, 2.9995923042297363, 3.20353364944458, 3.4074747562408447, 3.6114158630371094, 3.815357208251953, 4.019298553466797, 4.223239421844482, 4.427180767059326, 4.631121635437012, 4.8350629806518555, 5.039004325866699, 5.242945194244385, 5.4468865394592285, 5.650827407836914, 5.854768753051758, 6.058710098266602, 6.262650966644287, 6.466592311859131, 6.670533180236816, 6.87447452545166, 7.078415870666504, 7.282357215881348, 7.486298084259033, 7.690239429473877, 7.8941802978515625, 8.098121643066406, 8.30206298828125, 8.506004333496094, 8.709944725036621, 8.913886070251465, 9.117827415466309]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 5.0, 7.0, 7.0, 7.0, 17.0, 14.0, 15.0, 24.0, 21.0, 28.0, 38.0, 39.0, 48.0, 42.0, 61.0, 60.0, 45.0, 61.0, 72.0, 66.0, 54.0, 54.0, 37.0, 29.0, 40.0, 25.0, 18.0, 18.0, 16.0, 9.0, 13.0, 9.0, 3.0, 8.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7118377685546875, -2.6209635734558105, -2.5300893783569336, -2.4392151832580566, -2.3483409881591797, -2.2574665546417236, -2.1665923595428467, -2.0757181644439697, -1.9848439693450928, -1.8939697742462158, -1.8030955791473389, -1.7122212648391724, -1.6213470697402954, -1.5304728746414185, -1.439598560333252, -1.348724365234375, -1.257850170135498, -1.166975975036621, -1.0761017799377441, -0.9852274656295776, -0.8943532705307007, -0.8034790754318237, -0.712604820728302, -0.6217305660247803, -0.5308563709259033, -0.439982146024704, -0.34910792112350464, -0.2582336962223053, -0.16735947132110596, -0.07648524641990662, 0.014388978481292725, 0.10526323318481445, 0.1961374282836914, 0.28701165318489075, 0.3778858780860901, 0.46876010298728943, 0.5596343278884888, 0.6505085229873657, 0.7413827776908875, 0.8322570323944092, 0.9231312274932861, 1.014005422592163, 1.10487961769104, 1.1957539319992065, 1.2866281270980835, 1.3775023221969604, 1.468376636505127, 1.559250831604004, 1.6501250267028809, 1.7409992218017578, 1.8318734169006348, 1.9227477312088013, 2.0136218070983887, 2.1044962406158447, 2.1953704357147217, 2.2862446308135986, 2.3771188259124756, 2.4679930210113525, 2.5588672161102295, 2.6497414112091064, 2.7406158447265625, 2.8314900398254395, 2.9223642349243164, 3.0132384300231934, 3.1041126251220703]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 4.0, 11.0, 12.0, 15.0, 21.0, 32.0, 59.0, 100.0, 156.0, 304.0, 662.0, 1435.0, 3791.0, 13629.0, 76827.0, 427060.0, 427376.0, 76790.0, 13568.0, 3760.0, 1502.0, 681.0, 323.0, 191.0, 94.0, 58.0, 38.0, 16.0, 10.0, 10.0, 7.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.03125, -1.0017852783203125, -0.972320556640625, -0.9428558349609375, -0.91339111328125, -0.8839263916015625, -0.854461669921875, -0.8249969482421875, -0.7955322265625, -0.7660675048828125, -0.736602783203125, -0.7071380615234375, -0.67767333984375, -0.6482086181640625, -0.618743896484375, -0.5892791748046875, -0.559814453125, -0.5303497314453125, -0.500885009765625, -0.4714202880859375, -0.44195556640625, -0.4124908447265625, -0.383026123046875, -0.3535614013671875, -0.3240966796875, -0.2946319580078125, -0.265167236328125, -0.2357025146484375, -0.20623779296875, -0.1767730712890625, -0.147308349609375, -0.1178436279296875, -0.08837890625, -0.0589141845703125, -0.029449462890625, 1.52587890625e-05, 0.02947998046875, 0.0589447021484375, 0.088409423828125, 0.1178741455078125, 0.1473388671875, 0.1768035888671875, 0.206268310546875, 0.2357330322265625, 0.26519775390625, 0.2946624755859375, 0.324127197265625, 0.3535919189453125, 0.383056640625, 0.4125213623046875, 0.441986083984375, 0.4714508056640625, 0.50091552734375, 0.5303802490234375, 0.559844970703125, 0.5893096923828125, 0.6187744140625, 0.6482391357421875, 0.677703857421875, 0.7071685791015625, 0.73663330078125, 0.7660980224609375, 0.795562744140625, 0.8250274658203125, 0.8544921875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 3.0, 13.0, 19.0, 15.0, 26.0, 28.0, 36.0, 44.0, 59.0, 77.0, 74.0, 102.0, 74.0, 78.0, 78.0, 60.0, 64.0, 41.0, 30.0, 27.0, 15.0, 20.0, 11.0, 7.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.255859375, -2.178436279296875, -2.10101318359375, -2.023590087890625, -1.9461669921875, -1.868743896484375, -1.79132080078125, -1.713897705078125, -1.636474609375, -1.559051513671875, -1.48162841796875, -1.404205322265625, -1.3267822265625, -1.249359130859375, -1.17193603515625, -1.094512939453125, -1.01708984375, -0.939666748046875, -0.86224365234375, -0.784820556640625, -0.7073974609375, -0.629974365234375, -0.55255126953125, -0.475128173828125, -0.397705078125, -0.320281982421875, -0.24285888671875, -0.165435791015625, -0.0880126953125, -0.010589599609375, 0.06683349609375, 0.144256591796875, 0.2216796875, 0.299102783203125, 0.37652587890625, 0.453948974609375, 0.5313720703125, 0.608795166015625, 0.68621826171875, 0.763641357421875, 0.841064453125, 0.918487548828125, 0.99591064453125, 1.073333740234375, 1.1507568359375, 1.228179931640625, 1.30560302734375, 1.383026123046875, 1.46044921875, 1.537872314453125, 1.61529541015625, 1.692718505859375, 1.7701416015625, 1.847564697265625, 1.92498779296875, 2.002410888671875, 2.079833984375, 2.157257080078125, 2.23468017578125, 2.312103271484375, 2.3895263671875, 2.466949462890625, 2.54437255859375, 2.621795654296875, 2.69921875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 10.0, 5.0, 10.0, 13.0, 16.0, 21.0, 27.0, 55.0, 87.0, 130.0, 206.0, 398.0, 758.0, 1451.0, 3058.0, 6839.0, 16519.0, 41291.0, 97446.0, 198379.0, 274444.0, 214882.0, 111151.0, 47042.0, 19337.0, 7933.0, 3465.0, 1672.0, 793.0, 413.0, 253.0, 155.0, 96.0, 62.0, 40.0, 23.0, 24.0, 13.0, 18.0, 6.0, 4.0, 2.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.307373046875, -0.297637939453125, -0.28790283203125, -0.278167724609375, -0.2684326171875, -0.258697509765625, -0.24896240234375, -0.239227294921875, -0.2294921875, -0.219757080078125, -0.21002197265625, -0.200286865234375, -0.1905517578125, -0.180816650390625, -0.17108154296875, -0.161346435546875, -0.151611328125, -0.141876220703125, -0.13214111328125, -0.122406005859375, -0.1126708984375, -0.102935791015625, -0.09320068359375, -0.083465576171875, -0.07373046875, -0.063995361328125, -0.05426025390625, -0.044525146484375, -0.0347900390625, -0.025054931640625, -0.01531982421875, -0.005584716796875, 0.004150390625, 0.013885498046875, 0.02362060546875, 0.033355712890625, 0.0430908203125, 0.052825927734375, 0.06256103515625, 0.072296142578125, 0.08203125, 0.091766357421875, 0.10150146484375, 0.111236572265625, 0.1209716796875, 0.130706787109375, 0.14044189453125, 0.150177001953125, 0.159912109375, 0.169647216796875, 0.17938232421875, 0.189117431640625, 0.1988525390625, 0.208587646484375, 0.21832275390625, 0.228057861328125, 0.23779296875, 0.247528076171875, 0.25726318359375, 0.266998291015625, 0.2767333984375, 0.286468505859375, 0.29620361328125, 0.305938720703125, 0.315673828125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 2.0, 4.0, 3.0, 4.0, 11.0, 10.0, 8.0, 5.0, 14.0, 19.0, 21.0, 25.0, 28.0, 37.0, 28.0, 46.0, 44.0, 47.0, 35.0, 62.0, 53.0, 47.0, 55.0, 54.0, 44.0, 52.0, 31.0, 31.0, 32.0, 19.0, 22.0, 26.0, 16.0, 13.0, 13.0, 15.0, 9.0, 4.0, 6.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-2.673828125, -2.595855712890625, -2.51788330078125, -2.439910888671875, -2.3619384765625, -2.283966064453125, -2.20599365234375, -2.128021240234375, -2.050048828125, -1.972076416015625, -1.89410400390625, -1.816131591796875, -1.7381591796875, -1.660186767578125, -1.58221435546875, -1.504241943359375, -1.42626953125, -1.348297119140625, -1.27032470703125, -1.192352294921875, -1.1143798828125, -1.036407470703125, -0.95843505859375, -0.880462646484375, -0.802490234375, -0.724517822265625, -0.64654541015625, -0.568572998046875, -0.4906005859375, -0.412628173828125, -0.33465576171875, -0.256683349609375, -0.1787109375, -0.100738525390625, -0.02276611328125, 0.055206298828125, 0.1331787109375, 0.211151123046875, 0.28912353515625, 0.367095947265625, 0.445068359375, 0.523040771484375, 0.60101318359375, 0.678985595703125, 0.7569580078125, 0.834930419921875, 0.91290283203125, 0.990875244140625, 1.06884765625, 1.146820068359375, 1.22479248046875, 1.302764892578125, 1.3807373046875, 1.458709716796875, 1.53668212890625, 1.614654541015625, 1.692626953125, 1.770599365234375, 1.84857177734375, 1.926544189453125, 2.0045166015625, 2.082489013671875, 2.16046142578125, 2.238433837890625, 2.31640625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 2.0, 9.0, 10.0, 18.0, 22.0, 26.0, 56.0, 84.0, 110.0, 157.0, 325.0, 488.0, 1006.0, 1799.0, 3497.0, 7378.0, 15551.0, 35507.0, 86277.0, 217336.0, 339222.0, 199765.0, 78693.0, 32786.0, 14606.0, 6668.0, 3276.0, 1631.0, 925.0, 526.0, 284.0, 176.0, 123.0, 67.0, 51.0, 28.0, 21.0, 15.0, 13.0, 11.0, 8.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.050537109375, -0.04882097244262695, -0.047104835510253906, -0.04538869857788086, -0.04367256164550781, -0.041956424713134766, -0.04024028778076172, -0.03852415084838867, -0.036808013916015625, -0.03509187698364258, -0.03337574005126953, -0.031659603118896484, -0.029943466186523438, -0.02822732925415039, -0.026511192321777344, -0.024795055389404297, -0.02307891845703125, -0.021362781524658203, -0.019646644592285156, -0.01793050765991211, -0.016214370727539062, -0.014498233795166016, -0.012782096862792969, -0.011065959930419922, -0.009349822998046875, -0.007633686065673828, -0.005917549133300781, -0.004201412200927734, -0.0024852752685546875, -0.0007691383361816406, 0.0009469985961914062, 0.002663135528564453, 0.0043792724609375, 0.006095409393310547, 0.007811546325683594, 0.00952768325805664, 0.011243820190429688, 0.012959957122802734, 0.014676094055175781, 0.016392230987548828, 0.018108367919921875, 0.019824504852294922, 0.02154064178466797, 0.023256778717041016, 0.024972915649414062, 0.02668905258178711, 0.028405189514160156, 0.030121326446533203, 0.03183746337890625, 0.0335536003112793, 0.035269737243652344, 0.03698587417602539, 0.03870201110839844, 0.040418148040771484, 0.04213428497314453, 0.04385042190551758, 0.045566558837890625, 0.04728269577026367, 0.04899883270263672, 0.050714969635009766, 0.05243110656738281, 0.05414724349975586, 0.055863380432128906, 0.05757951736450195, 0.059295654296875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 8.0, 11.0, 13.0, 30.0, 55.0, 98.0, 203.0, 233.0, 162.0, 96.0, 57.0, 25.0, 8.0, 8.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.6862831115722656e-05, -5.2304938435554504e-05, -4.774704575538635e-05, -4.31891530752182e-05, -3.863126039505005e-05, -3.40733677148819e-05, -2.9515475034713745e-05, -2.4957582354545593e-05, -2.039968967437744e-05, -1.584179699420929e-05, -1.1283904314041138e-05, -6.726011633872986e-06, -2.168118953704834e-06, 2.389773726463318e-06, 6.94766640663147e-06, 1.1505559086799622e-05, 1.6063451766967773e-05, 2.0621344447135925e-05, 2.5179237127304077e-05, 2.973712980747223e-05, 3.429502248764038e-05, 3.885291516780853e-05, 4.3410807847976685e-05, 4.7968700528144836e-05, 5.252659320831299e-05, 5.708448588848114e-05, 6.164237856864929e-05, 6.620027124881744e-05, 7.07581639289856e-05, 7.531605660915375e-05, 7.98739492893219e-05, 8.443184196949005e-05, 8.89897346496582e-05, 9.354762732982635e-05, 9.810552000999451e-05, 0.00010266341269016266, 0.00010722130537033081, 0.00011177919805049896, 0.00011633709073066711, 0.00012089498341083527, 0.00012545287609100342, 0.00013001076877117157, 0.00013456866145133972, 0.00013912655413150787, 0.00014368444681167603, 0.00014824233949184418, 0.00015280023217201233, 0.00015735812485218048, 0.00016191601753234863, 0.00016647391021251678, 0.00017103180289268494, 0.0001755896955728531, 0.00018014758825302124, 0.0001847054809331894, 0.00018926337361335754, 0.0001938212662935257, 0.00019837915897369385, 0.000202937051653862, 0.00020749494433403015, 0.0002120528370141983, 0.00021661072969436646, 0.0002211686223745346, 0.00022572651505470276, 0.0002302844077348709, 0.00023484230041503906]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 7.0, 6.0, 14.0, 26.0, 26.0, 51.0, 71.0, 123.0, 251.0, 726.0, 2582.0, 12766.0, 91581.0, 684731.0, 223572.0, 25615.0, 4479.0, 1143.0, 384.0, 181.0, 93.0, 47.0, 25.0, 18.0, 15.0, 10.0, 6.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1683349609375, -0.1630229949951172, -0.15771102905273438, -0.15239906311035156, -0.14708709716796875, -0.14177513122558594, -0.13646316528320312, -0.1311511993408203, -0.1258392333984375, -0.12052726745605469, -0.11521530151367188, -0.10990333557128906, -0.10459136962890625, -0.09927940368652344, -0.09396743774414062, -0.08865547180175781, -0.083343505859375, -0.07803153991699219, -0.07271957397460938, -0.06740760803222656, -0.06209564208984375, -0.05678367614746094, -0.051471710205078125, -0.04615974426269531, -0.0408477783203125, -0.03553581237792969, -0.030223846435546875, -0.024911880493164062, -0.01959991455078125, -0.014287948608398438, -0.008975982666015625, -0.0036640167236328125, 0.00164794921875, 0.0069599151611328125, 0.012271881103515625, 0.017583847045898438, 0.02289581298828125, 0.028207778930664062, 0.033519744873046875, 0.03883171081542969, 0.0441436767578125, 0.04945564270019531, 0.054767608642578125, 0.06007957458496094, 0.06539154052734375, 0.07070350646972656, 0.07601547241210938, 0.08132743835449219, 0.086639404296875, 0.09195137023925781, 0.09726333618164062, 0.10257530212402344, 0.10788726806640625, 0.11319923400878906, 0.11851119995117188, 0.12382316589355469, 0.1291351318359375, 0.1344470977783203, 0.13975906372070312, 0.14507102966308594, 0.15038299560546875, 0.15569496154785156, 0.16100692749023438, 0.1663188934326172, 0.171630859375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 6.0, 11.0, 10.0, 13.0, 15.0, 21.0, 17.0, 24.0, 31.0, 41.0, 59.0, 71.0, 85.0, 95.0, 83.0, 83.0, 81.0, 58.0, 42.0, 31.0, 23.0, 21.0, 25.0, 10.0, 16.0, 3.0, 9.0, 8.0, 4.0, 4.0, 3.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.018829345703125, -0.01824045181274414, -0.01765155792236328, -0.017062664031982422, -0.016473770141601562, -0.015884876251220703, -0.015295982360839844, -0.014707088470458984, -0.014118194580078125, -0.013529300689697266, -0.012940406799316406, -0.012351512908935547, -0.011762619018554688, -0.011173725128173828, -0.010584831237792969, -0.00999593734741211, -0.00940704345703125, -0.00881814956665039, -0.008229255676269531, -0.007640361785888672, -0.0070514678955078125, -0.006462574005126953, -0.005873680114746094, -0.005284786224365234, -0.004695892333984375, -0.004106998443603516, -0.0035181045532226562, -0.002929210662841797, -0.0023403167724609375, -0.0017514228820800781, -0.0011625289916992188, -0.0005736351013183594, 1.52587890625e-05, 0.0006041526794433594, 0.0011930465698242188, 0.0017819404602050781, 0.0023708343505859375, 0.002959728240966797, 0.0035486221313476562, 0.004137516021728516, 0.004726409912109375, 0.005315303802490234, 0.005904197692871094, 0.006493091583251953, 0.0070819854736328125, 0.007670879364013672, 0.008259773254394531, 0.00884866714477539, 0.00943756103515625, 0.01002645492553711, 0.010615348815917969, 0.011204242706298828, 0.011793136596679688, 0.012382030487060547, 0.012970924377441406, 0.013559818267822266, 0.014148712158203125, 0.014737606048583984, 0.015326499938964844, 0.015915393829345703, 0.016504287719726562, 0.017093181610107422, 0.01768207550048828, 0.01827096939086914, 0.01885986328125]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 6.0, 6.0, 17.0, 23.0, 66.0, 114.0, 165.0, 195.0, 174.0, 109.0, 58.0, 33.0, 13.0, 12.0, 4.0, 3.0, 8.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1353538036346436, -2.9968111515045166, -2.8582684993743896, -2.7197258472442627, -2.581183433532715, -2.442640781402588, -2.304098129272461, -2.165555477142334, -2.027012825012207, -1.88847017288208, -1.7499275207519531, -1.6113849878311157, -1.4728423357009888, -1.3342996835708618, -1.1957571506500244, -1.0572144985198975, -0.9186718463897705, -0.7801291942596436, -0.6415866017341614, -0.5030440092086792, -0.36450135707855225, -0.2259587049484253, -0.08741611242294312, 0.05112648010253906, 0.18966913223266602, 0.3282117545604706, 0.46675437688827515, 0.6052969694137573, 0.7438396215438843, 0.8823822736740112, 1.0209248065948486, 1.1594674587249756, 1.2980103492736816, 1.4365530014038086, 1.5750956535339355, 1.713638186454773, 1.8521808385849, 1.9907234907150269, 2.1292660236358643, 2.267808675765991, 2.406351327896118, 2.544893980026245, 2.683436632156372, 2.821979284286499, 2.960521697998047, 3.099064350128174, 3.237607002258301, 3.3761496543884277, 3.5146923065185547, 3.6532349586486816, 3.7917776107788086, 3.9303202629089355, 4.0688629150390625, 4.2074055671691895, 4.345948219299316, 4.484490394592285, 4.62303352355957, 4.761576175689697, 4.900118827819824, 5.038661479949951, 5.177204132080078, 5.315746784210205, 5.454289436340332, 5.592831611633301, 5.731374263763428]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 1.0, 5.0, 8.0, 7.0, 10.0, 11.0, 19.0, 18.0, 23.0, 29.0, 37.0, 45.0, 55.0, 52.0, 73.0, 54.0, 63.0, 91.0, 78.0, 58.0, 59.0, 42.0, 35.0, 37.0, 21.0, 21.0, 18.0, 14.0, 9.0, 6.0, 6.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4924906492233276, -1.4316776990890503, -1.3708648681640625, -1.3100519180297852, -1.2492389678955078, -1.1884260177612305, -1.1276130676269531, -1.0668002367019653, -1.005987286567688, -0.9451743364334106, -0.8843614459037781, -0.8235485553741455, -0.7627356052398682, -0.7019226551055908, -0.6411097645759583, -0.5802968740463257, -0.5194839239120483, -0.4586710035800934, -0.3978580832481384, -0.33704516291618347, -0.2762322425842285, -0.21541932225227356, -0.1546064019203186, -0.09379348158836365, -0.03298056125640869, 0.027832359075546265, 0.08864527940750122, 0.14945819973945618, 0.21027112007141113, 0.2710840404033661, 0.33189696073532104, 0.392709881067276, 0.4535226821899414, 0.5143356323242188, 0.5751485228538513, 0.6359614133834839, 0.6967743635177612, 0.7575873136520386, 0.8184002041816711, 0.8792130947113037, 0.940026044845581, 1.0008389949798584, 1.0616519451141357, 1.1224647760391235, 1.1832777261734009, 1.2440906763076782, 1.304903507232666, 1.3657164573669434, 1.4265294075012207, 1.487342357635498, 1.5481553077697754, 1.6089681386947632, 1.6697810888290405, 1.7305940389633179, 1.7914068698883057, 1.852219820022583, 1.9130327701568604, 1.9738457202911377, 2.034658670425415, 2.0954716205596924, 2.1562843322753906, 2.217097282409668, 2.2779102325439453, 2.3387231826782227, 2.3995361328125]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 2.0, 7.0, 8.0, 14.0, 26.0, 29.0, 42.0, 57.0, 95.0, 206.0, 307.0, 537.0, 856.0, 1747.0, 3681.0, 7167.0, 15532.0, 36859.0, 94162.0, 244345.0, 355018.0, 173339.0, 65332.0, 26368.0, 11569.0, 5416.0, 2672.0, 1317.0, 759.0, 442.0, 247.0, 133.0, 86.0, 52.0, 42.0, 21.0, 18.0, 21.0, 7.0, 10.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.328125, -1.2882537841796875, -1.248382568359375, -1.2085113525390625, -1.16864013671875, -1.1287689208984375, -1.088897705078125, -1.0490264892578125, -1.0091552734375, -0.9692840576171875, -0.929412841796875, -0.8895416259765625, -0.84967041015625, -0.8097991943359375, -0.769927978515625, -0.7300567626953125, -0.690185546875, -0.6503143310546875, -0.610443115234375, -0.5705718994140625, -0.53070068359375, -0.4908294677734375, -0.450958251953125, -0.4110870361328125, -0.3712158203125, -0.3313446044921875, -0.291473388671875, -0.2516021728515625, -0.21173095703125, -0.1718597412109375, -0.131988525390625, -0.0921173095703125, -0.05224609375, -0.0123748779296875, 0.027496337890625, 0.0673675537109375, 0.10723876953125, 0.1471099853515625, 0.186981201171875, 0.2268524169921875, 0.2667236328125, 0.3065948486328125, 0.346466064453125, 0.3863372802734375, 0.42620849609375, 0.4660797119140625, 0.505950927734375, 0.5458221435546875, 0.585693359375, 0.6255645751953125, 0.665435791015625, 0.7053070068359375, 0.74517822265625, 0.7850494384765625, 0.824920654296875, 0.8647918701171875, 0.9046630859375, 0.9445343017578125, 0.984405517578125, 1.0242767333984375, 1.06414794921875, 1.1040191650390625, 1.143890380859375, 1.1837615966796875, 1.2236328125]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 3.0, 6.0, 11.0, 9.0, 12.0, 15.0, 26.0, 26.0, 21.0, 33.0, 45.0, 51.0, 72.0, 62.0, 79.0, 68.0, 80.0, 61.0, 56.0, 55.0, 44.0, 37.0, 27.0, 30.0, 15.0, 22.0, 17.0, 9.0, 6.0, 6.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.08203125, -2.956298828125, -2.83056640625, -2.704833984375, -2.5791015625, -2.453369140625, -2.32763671875, -2.201904296875, -2.076171875, -1.950439453125, -1.82470703125, -1.698974609375, -1.5732421875, -1.447509765625, -1.32177734375, -1.196044921875, -1.0703125, -0.944580078125, -0.81884765625, -0.693115234375, -0.5673828125, -0.441650390625, -0.31591796875, -0.190185546875, -0.064453125, 0.061279296875, 0.18701171875, 0.312744140625, 0.4384765625, 0.564208984375, 0.68994140625, 0.815673828125, 0.94140625, 1.067138671875, 1.19287109375, 1.318603515625, 1.4443359375, 1.570068359375, 1.69580078125, 1.821533203125, 1.947265625, 2.072998046875, 2.19873046875, 2.324462890625, 2.4501953125, 2.575927734375, 2.70166015625, 2.827392578125, 2.953125, 3.078857421875, 3.20458984375, 3.330322265625, 3.4560546875, 3.581787109375, 3.70751953125, 3.833251953125, 3.958984375, 4.084716796875, 4.21044921875, 4.336181640625, 4.4619140625, 4.587646484375, 4.71337890625, 4.839111328125, 4.96484375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 8.0, 3.0, 6.0, 9.0, 6.0, 13.0, 10.0, 13.0, 17.0, 17.0, 14.0, 26.0, 33.0, 20.0, 40.0, 39.0, 49.0, 76.0, 163.0, 578.0, 21767.0, 1019576.0, 5210.0, 373.0, 119.0, 69.0, 39.0, 34.0, 38.0, 28.0, 21.0, 23.0, 18.0, 23.0, 12.0, 10.0, 14.0, 10.0, 6.0, 6.0, 7.0, 4.0, 5.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.9296875, -10.5699462890625, -10.210205078125, -9.8504638671875, -9.49072265625, -9.1309814453125, -8.771240234375, -8.4114990234375, -8.0517578125, -7.6920166015625, -7.332275390625, -6.9725341796875, -6.61279296875, -6.2530517578125, -5.893310546875, -5.5335693359375, -5.173828125, -4.8140869140625, -4.454345703125, -4.0946044921875, -3.73486328125, -3.3751220703125, -3.015380859375, -2.6556396484375, -2.2958984375, -1.9361572265625, -1.576416015625, -1.2166748046875, -0.85693359375, -0.4971923828125, -0.137451171875, 0.2222900390625, 0.58203125, 0.9417724609375, 1.301513671875, 1.6612548828125, 2.02099609375, 2.3807373046875, 2.740478515625, 3.1002197265625, 3.4599609375, 3.8197021484375, 4.179443359375, 4.5391845703125, 4.89892578125, 5.2586669921875, 5.618408203125, 5.9781494140625, 6.337890625, 6.6976318359375, 7.057373046875, 7.4171142578125, 7.77685546875, 8.1365966796875, 8.496337890625, 8.8560791015625, 9.2158203125, 9.5755615234375, 9.935302734375, 10.2950439453125, 10.65478515625, 11.0145263671875, 11.374267578125, 11.7340087890625, 12.09375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 1.0, 5.0, 2.0, 11.0, 9.0, 10.0, 14.0, 8.0, 18.0, 17.0, 20.0, 24.0, 21.0, 27.0, 22.0, 42.0, 51.0, 30.0, 32.0, 52.0, 40.0, 42.0, 56.0, 45.0, 37.0, 42.0, 38.0, 38.0, 29.0, 34.0, 16.0, 29.0, 27.0, 19.0, 12.0, 15.0, 20.0, 11.0, 5.0, 5.0, 6.0, 9.0, 6.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.7890625, -2.698822021484375, -2.60858154296875, -2.518341064453125, -2.4281005859375, -2.337860107421875, -2.24761962890625, -2.157379150390625, -2.067138671875, -1.976898193359375, -1.88665771484375, -1.796417236328125, -1.7061767578125, -1.615936279296875, -1.52569580078125, -1.435455322265625, -1.34521484375, -1.254974365234375, -1.16473388671875, -1.074493408203125, -0.9842529296875, -0.894012451171875, -0.80377197265625, -0.713531494140625, -0.623291015625, -0.533050537109375, -0.44281005859375, -0.352569580078125, -0.2623291015625, -0.172088623046875, -0.08184814453125, 0.008392333984375, 0.0986328125, 0.188873291015625, 0.27911376953125, 0.369354248046875, 0.4595947265625, 0.549835205078125, 0.64007568359375, 0.730316162109375, 0.820556640625, 0.910797119140625, 1.00103759765625, 1.091278076171875, 1.1815185546875, 1.271759033203125, 1.36199951171875, 1.452239990234375, 1.54248046875, 1.632720947265625, 1.72296142578125, 1.813201904296875, 1.9034423828125, 1.993682861328125, 2.08392333984375, 2.174163818359375, 2.264404296875, 2.354644775390625, 2.44488525390625, 2.535125732421875, 2.6253662109375, 2.715606689453125, 2.80584716796875, 2.896087646484375, 2.986328125]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 4.0, 4.0, 7.0, 11.0, 15.0, 12.0, 40.0, 64.0, 135.0, 314.0, 1108.0, 6712.0, 189888.0, 821837.0, 25069.0, 2336.0, 588.0, 212.0, 90.0, 50.0, 20.0, 12.0, 11.0, 6.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.30078125, -2.246307373046875, -2.19183349609375, -2.137359619140625, -2.0828857421875, -2.028411865234375, -1.97393798828125, -1.919464111328125, -1.864990234375, -1.810516357421875, -1.75604248046875, -1.701568603515625, -1.6470947265625, -1.592620849609375, -1.53814697265625, -1.483673095703125, -1.42919921875, -1.374725341796875, -1.32025146484375, -1.265777587890625, -1.2113037109375, -1.156829833984375, -1.10235595703125, -1.047882080078125, -0.993408203125, -0.938934326171875, -0.88446044921875, -0.829986572265625, -0.7755126953125, -0.721038818359375, -0.66656494140625, -0.612091064453125, -0.5576171875, -0.503143310546875, -0.44866943359375, -0.394195556640625, -0.3397216796875, -0.285247802734375, -0.23077392578125, -0.176300048828125, -0.121826171875, -0.067352294921875, -0.01287841796875, 0.041595458984375, 0.0960693359375, 0.150543212890625, 0.20501708984375, 0.259490966796875, 0.31396484375, 0.368438720703125, 0.42291259765625, 0.477386474609375, 0.5318603515625, 0.586334228515625, 0.64080810546875, 0.695281982421875, 0.749755859375, 0.804229736328125, 0.85870361328125, 0.913177490234375, 0.9676513671875, 1.022125244140625, 1.07659912109375, 1.131072998046875, 1.185546875]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 4.0, 6.0, 5.0, 14.0, 15.0, 20.0, 39.0, 47.0, 89.0, 111.0, 128.0, 118.0, 119.0, 83.0, 63.0, 45.0, 30.0, 27.0, 18.0, 13.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013446807861328125, -0.00012985989451408386, -0.00012525171041488647, -0.00012064352631568909, -0.0001160353422164917, -0.00011142715811729431, -0.00010681897401809692, -0.00010221078991889954, -9.760260581970215e-05, -9.299442172050476e-05, -8.838623762130737e-05, -8.377805352210999e-05, -7.91698694229126e-05, -7.456168532371521e-05, -6.995350122451782e-05, -6.534531712532043e-05, -6.073713302612305e-05, -5.612894892692566e-05, -5.152076482772827e-05, -4.6912580728530884e-05, -4.2304396629333496e-05, -3.769621253013611e-05, -3.308802843093872e-05, -2.8479844331741333e-05, -2.3871660232543945e-05, -1.9263476133346558e-05, -1.465529203414917e-05, -1.0047107934951782e-05, -5.4389238357543945e-06, -8.307397365570068e-07, 3.777444362640381e-06, 8.385628461837769e-06, 1.2993812561035156e-05, 1.7601996660232544e-05, 2.221018075942993e-05, 2.681836485862732e-05, 3.142654895782471e-05, 3.6034733057022095e-05, 4.064291715621948e-05, 4.525110125541687e-05, 4.985928535461426e-05, 5.4467469453811646e-05, 5.907565355300903e-05, 6.368383765220642e-05, 6.829202175140381e-05, 7.29002058506012e-05, 7.750838994979858e-05, 8.211657404899597e-05, 8.672475814819336e-05, 9.133294224739075e-05, 9.594112634658813e-05, 0.00010054931044578552, 0.00010515749454498291, 0.0001097656786441803, 0.00011437386274337769, 0.00011898204684257507, 0.00012359023094177246, 0.00012819841504096985, 0.00013280659914016724, 0.00013741478323936462, 0.000142022967338562, 0.0001466311514377594, 0.0001512393355369568, 0.00015584751963615417, 0.00016045570373535156]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 6.0, 1.0, 8.0, 6.0, 20.0, 20.0, 49.0, 87.0, 186.0, 526.0, 2252.0, 22916.0, 752570.0, 259230.0, 8694.0, 1317.0, 361.0, 153.0, 64.0, 36.0, 21.0, 19.0, 10.0, 4.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.107421875, -2.05450439453125, -2.0015869140625, -1.94866943359375, -1.895751953125, -1.84283447265625, -1.7899169921875, -1.73699951171875, -1.68408203125, -1.63116455078125, -1.5782470703125, -1.52532958984375, -1.472412109375, -1.41949462890625, -1.3665771484375, -1.31365966796875, -1.2607421875, -1.20782470703125, -1.1549072265625, -1.10198974609375, -1.049072265625, -0.99615478515625, -0.9432373046875, -0.89031982421875, -0.83740234375, -0.78448486328125, -0.7315673828125, -0.67864990234375, -0.625732421875, -0.57281494140625, -0.5198974609375, -0.46697998046875, -0.4140625, -0.36114501953125, -0.3082275390625, -0.25531005859375, -0.202392578125, -0.14947509765625, -0.0965576171875, -0.04364013671875, 0.00927734375, 0.06219482421875, 0.1151123046875, 0.16802978515625, 0.220947265625, 0.27386474609375, 0.3267822265625, 0.37969970703125, 0.4326171875, 0.48553466796875, 0.5384521484375, 0.59136962890625, 0.644287109375, 0.69720458984375, 0.7501220703125, 0.80303955078125, 0.85595703125, 0.90887451171875, 0.9617919921875, 1.01470947265625, 1.067626953125, 1.12054443359375, 1.1734619140625, 1.22637939453125, 1.279296875]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 7.0, 16.0, 20.0, 55.0, 113.0, 160.0, 234.0, 164.0, 96.0, 58.0, 43.0, 20.0, 6.0, 5.0, 5.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.39208984375, -0.37094879150390625, -0.3498077392578125, -0.32866668701171875, -0.307525634765625, -0.28638458251953125, -0.2652435302734375, -0.24410247802734375, -0.22296142578125, -0.20182037353515625, -0.1806793212890625, -0.15953826904296875, -0.138397216796875, -0.11725616455078125, -0.0961151123046875, -0.07497406005859375, -0.0538330078125, -0.03269195556640625, -0.0115509033203125, 0.00959014892578125, 0.030731201171875, 0.05187225341796875, 0.0730133056640625, 0.09415435791015625, 0.11529541015625, 0.13643646240234375, 0.1575775146484375, 0.17871856689453125, 0.199859619140625, 0.22100067138671875, 0.2421417236328125, 0.26328277587890625, 0.284423828125, 0.30556488037109375, 0.3267059326171875, 0.34784698486328125, 0.368988037109375, 0.39012908935546875, 0.4112701416015625, 0.43241119384765625, 0.45355224609375, 0.47469329833984375, 0.4958343505859375, 0.5169754028320312, 0.538116455078125, 0.5592575073242188, 0.5803985595703125, 0.6015396118164062, 0.6226806640625, 0.6438217163085938, 0.6649627685546875, 0.6861038208007812, 0.707244873046875, 0.7283859252929688, 0.7495269775390625, 0.7706680297851562, 0.79180908203125, 0.8129501342773438, 0.8340911865234375, 0.8552322387695312, 0.876373291015625, 0.8975143432617188, 0.9186553955078125, 0.9397964477539062, 0.9609375]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 3.0, 5.0, 3.0, 6.0, 9.0, 23.0, 37.0, 66.0, 112.0, 174.0, 163.0, 144.0, 96.0, 74.0, 32.0, 22.0, 18.0, 5.0, 4.0, 5.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3319878578186035, -4.098165035247803, -3.8643417358398438, -3.630518913269043, -3.396695613861084, -3.162872791290283, -2.9290497303009033, -2.6952266693115234, -2.4614036083221436, -2.2275805473327637, -1.9937574863433838, -1.7599345445632935, -1.5261114835739136, -1.2922884225845337, -1.0584654808044434, -0.8246424198150635, -0.5908193588256836, -0.3569963276386261, -0.1231732964515686, 0.1106497049331665, 0.3444727659225464, 0.5782958269119263, 0.8121187686920166, 1.0459418296813965, 1.2797648906707764, 1.5135879516601562, 1.7474110126495361, 1.9812339544296265, 2.215056896209717, 2.448880195617676, 2.6827030181884766, 2.9165260791778564, 3.1503496170043945, 3.3841726779937744, 3.6179957389831543, 3.851818561553955, 4.085641860961914, 4.319464683532715, 4.553287506103516, 4.787110805511475, 5.020934104919434, 5.254756927490234, 5.488580226898193, 5.722403049468994, 5.956226348876953, 6.190049171447754, 6.423871994018555, 6.657695293426514, 6.8915181159973145, 7.125340938568115, 7.359164237976074, 7.592987060546875, 7.826810359954834, 8.060633659362793, 8.294456481933594, 8.528279304504395, 8.762102127075195, 8.995924949645996, 9.229747772216797, 9.463571548461914, 9.697394371032715, 9.931217193603516, 10.165040016174316, 10.398862838745117, 10.632686614990234]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 0.0, 2.0, 8.0, 3.0, 7.0, 6.0, 9.0, 12.0, 18.0, 10.0, 22.0, 26.0, 23.0, 18.0, 27.0, 30.0, 36.0, 37.0, 32.0, 33.0, 40.0, 41.0, 46.0, 49.0, 34.0, 57.0, 33.0, 29.0, 33.0, 36.0, 47.0, 23.0, 36.0, 30.0, 23.0, 15.0, 11.0, 15.0, 12.0, 10.0, 7.0, 6.0, 3.0, 3.0, 2.0, 5.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.5542969703674316, -3.4319028854370117, -3.3095085620880127, -3.1871142387390137, -3.0647201538085938, -2.942326068878174, -2.819931745529175, -2.697537422180176, -2.575143337249756, -2.452749252319336, -2.330354928970337, -2.207960605621338, -2.085566520690918, -1.9631723165512085, -1.840778112411499, -1.7183839082717896, -1.59598970413208, -1.4735954999923706, -1.3512012958526611, -1.2288070917129517, -1.1064128875732422, -0.9840186834335327, -0.8616244792938232, -0.7392302751541138, -0.6168360710144043, -0.4944418668746948, -0.37204766273498535, -0.24965345859527588, -0.1272592544555664, -0.004865050315856934, 0.11752915382385254, 0.239923357963562, 0.3623175621032715, 0.48471176624298096, 0.6071059703826904, 0.7295001745223999, 0.8518943786621094, 0.9742885828018188, 1.0966827869415283, 1.2190769910812378, 1.3414711952209473, 1.4638653993606567, 1.5862596035003662, 1.7086538076400757, 1.8310480117797852, 1.9534422159194946, 2.075836420059204, 2.198230743408203, 2.320624828338623, 2.443018913269043, 2.565413236618042, 2.687807559967041, 2.810201644897461, 2.932595729827881, 3.05499005317688, 3.177384376525879, 3.299778461456299, 3.4221725463867188, 3.5445668697357178, 3.666961193084717, 3.7893552780151367, 3.9117493629455566, 4.034143447875977, 4.156538009643555, 4.278932094573975]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 5.0, 4.0, 4.0, 8.0, 1.0, 10.0, 9.0, 11.0, 13.0, 17.0, 21.0, 32.0, 38.0, 51.0, 67.0, 142.0, 206.0, 505.0, 1281.0, 5088.0, 30316.0, 326068.0, 2514240.0, 1191479.0, 106701.0, 13140.0, 2950.0, 903.0, 398.0, 176.0, 110.0, 69.0, 47.0, 46.0, 34.0, 18.0, 20.0, 10.0, 10.0, 7.0, 9.0, 6.0, 6.0, 0.0, 3.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-4.17578125, -4.04833984375, -3.9208984375, -3.79345703125, -3.666015625, -3.53857421875, -3.4111328125, -3.28369140625, -3.15625, -3.02880859375, -2.9013671875, -2.77392578125, -2.646484375, -2.51904296875, -2.3916015625, -2.26416015625, -2.13671875, -2.00927734375, -1.8818359375, -1.75439453125, -1.626953125, -1.49951171875, -1.3720703125, -1.24462890625, -1.1171875, -0.98974609375, -0.8623046875, -0.73486328125, -0.607421875, -0.47998046875, -0.3525390625, -0.22509765625, -0.09765625, 0.02978515625, 0.1572265625, 0.28466796875, 0.412109375, 0.53955078125, 0.6669921875, 0.79443359375, 0.921875, 1.04931640625, 1.1767578125, 1.30419921875, 1.431640625, 1.55908203125, 1.6865234375, 1.81396484375, 1.94140625, 2.06884765625, 2.1962890625, 2.32373046875, 2.451171875, 2.57861328125, 2.7060546875, 2.83349609375, 2.9609375, 3.08837890625, 3.2158203125, 3.34326171875, 3.470703125, 3.59814453125, 3.7255859375, 3.85302734375, 3.98046875]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 1.0, 4.0, 8.0, 10.0, 13.0, 13.0, 10.0, 18.0, 27.0, 26.0, 40.0, 36.0, 50.0, 46.0, 57.0, 76.0, 65.0, 60.0, 60.0, 43.0, 68.0, 43.0, 47.0, 35.0, 42.0, 28.0, 23.0, 15.0, 14.0, 11.0, 6.0, 5.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.091796875, -2.0145263671875, -1.937255859375, -1.8599853515625, -1.78271484375, -1.7054443359375, -1.628173828125, -1.5509033203125, -1.4736328125, -1.3963623046875, -1.319091796875, -1.2418212890625, -1.16455078125, -1.0872802734375, -1.010009765625, -0.9327392578125, -0.85546875, -0.7781982421875, -0.700927734375, -0.6236572265625, -0.54638671875, -0.4691162109375, -0.391845703125, -0.3145751953125, -0.2373046875, -0.1600341796875, -0.082763671875, -0.0054931640625, 0.07177734375, 0.1490478515625, 0.226318359375, 0.3035888671875, 0.380859375, 0.4581298828125, 0.535400390625, 0.6126708984375, 0.68994140625, 0.7672119140625, 0.844482421875, 0.9217529296875, 0.9990234375, 1.0762939453125, 1.153564453125, 1.2308349609375, 1.30810546875, 1.3853759765625, 1.462646484375, 1.5399169921875, 1.6171875, 1.6944580078125, 1.771728515625, 1.8489990234375, 1.92626953125, 2.0035400390625, 2.080810546875, 2.1580810546875, 2.2353515625, 2.3126220703125, 2.389892578125, 2.4671630859375, 2.54443359375, 2.6217041015625, 2.698974609375, 2.7762451171875, 2.853515625]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 4.0, 11.0, 19.0, 31.0, 25.0, 69.0, 125.0, 217.0, 510.0, 2469.0, 59742.0, 4022426.0, 104338.0, 3125.0, 579.0, 265.0, 128.0, 63.0, 42.0, 25.0, 20.0, 14.0, 9.0, 6.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-10.34375, -10.06829833984375, -9.7928466796875, -9.51739501953125, -9.241943359375, -8.96649169921875, -8.6910400390625, -8.41558837890625, -8.14013671875, -7.86468505859375, -7.5892333984375, -7.31378173828125, -7.038330078125, -6.76287841796875, -6.4874267578125, -6.21197509765625, -5.9365234375, -5.66107177734375, -5.3856201171875, -5.11016845703125, -4.834716796875, -4.55926513671875, -4.2838134765625, -4.00836181640625, -3.73291015625, -3.45745849609375, -3.1820068359375, -2.90655517578125, -2.631103515625, -2.35565185546875, -2.0802001953125, -1.80474853515625, -1.529296875, -1.25384521484375, -0.9783935546875, -0.70294189453125, -0.427490234375, -0.15203857421875, 0.1234130859375, 0.39886474609375, 0.67431640625, 0.94976806640625, 1.2252197265625, 1.50067138671875, 1.776123046875, 2.05157470703125, 2.3270263671875, 2.60247802734375, 2.8779296875, 3.15338134765625, 3.4288330078125, 3.70428466796875, 3.979736328125, 4.25518798828125, 4.5306396484375, 4.80609130859375, 5.08154296875, 5.35699462890625, 5.6324462890625, 5.90789794921875, 6.183349609375, 6.45880126953125, 6.7342529296875, 7.00970458984375, 7.28515625]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 7.0, 8.0, 9.0, 15.0, 18.0, 16.0, 37.0, 64.0, 89.0, 121.0, 175.0, 249.0, 404.0, 517.0, 594.0, 537.0, 362.0, 283.0, 188.0, 109.0, 89.0, 70.0, 47.0, 24.0, 17.0, 9.0, 2.0, 4.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.95703125, -0.9234466552734375, -0.889862060546875, -0.8562774658203125, -0.82269287109375, -0.7891082763671875, -0.755523681640625, -0.7219390869140625, -0.6883544921875, -0.6547698974609375, -0.621185302734375, -0.5876007080078125, -0.55401611328125, -0.5204315185546875, -0.486846923828125, -0.4532623291015625, -0.419677734375, -0.3860931396484375, -0.352508544921875, -0.3189239501953125, -0.28533935546875, -0.2517547607421875, -0.218170166015625, -0.1845855712890625, -0.1510009765625, -0.1174163818359375, -0.083831787109375, -0.0502471923828125, -0.01666259765625, 0.0169219970703125, 0.050506591796875, 0.0840911865234375, 0.11767578125, 0.1512603759765625, 0.184844970703125, 0.2184295654296875, 0.25201416015625, 0.2855987548828125, 0.319183349609375, 0.3527679443359375, 0.3863525390625, 0.4199371337890625, 0.453521728515625, 0.4871063232421875, 0.52069091796875, 0.5542755126953125, 0.587860107421875, 0.6214447021484375, 0.655029296875, 0.6886138916015625, 0.722198486328125, 0.7557830810546875, 0.78936767578125, 0.8229522705078125, 0.856536865234375, 0.8901214599609375, 0.9237060546875, 0.9572906494140625, 0.990875244140625, 1.0244598388671875, 1.05804443359375, 1.0916290283203125, 1.125213623046875, 1.1587982177734375, 1.1923828125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 5.0, 6.0, 16.0, 8.0, 20.0, 28.0, 43.0, 47.0, 88.0, 113.0, 121.0, 118.0, 95.0, 93.0, 57.0, 47.0, 33.0, 21.0, 11.0, 11.0, 8.0, 5.0, 1.0, 6.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.443881988525391, -4.306818962097168, -4.169755935668945, -4.032692909240723, -3.8956298828125, -3.7585668563842773, -3.6215038299560547, -3.484440803527832, -3.3473777770996094, -3.2103147506713867, -3.073251724243164, -2.9361886978149414, -2.7991256713867188, -2.662062644958496, -2.5249996185302734, -2.387936592102051, -2.250873565673828, -2.1138105392456055, -1.9767475128173828, -1.8396844863891602, -1.7026214599609375, -1.5655584335327148, -1.4284954071044922, -1.2914323806762695, -1.1543693542480469, -1.0173063278198242, -0.8802433013916016, -0.7431802749633789, -0.6061172485351562, -0.4690542221069336, -0.33199119567871094, -0.19492816925048828, -0.05786561965942383, 0.07919740676879883, 0.21626043319702148, 0.35332345962524414, 0.4903864860534668, 0.6274495124816895, 0.7645125389099121, 0.9015755653381348, 1.0386385917663574, 1.17570161819458, 1.3127646446228027, 1.4498276710510254, 1.586890697479248, 1.7239537239074707, 1.8610167503356934, 1.998079776763916, 2.1351428031921387, 2.2722058296203613, 2.409268856048584, 2.5463318824768066, 2.6833949089050293, 2.820457935333252, 2.9575209617614746, 3.0945839881896973, 3.23164701461792, 3.3687100410461426, 3.5057730674743652, 3.642836093902588, 3.7798991203308105, 3.916962146759033, 4.054025173187256, 4.1910881996154785, 4.328151226043701]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 5.0, 11.0, 7.0, 17.0, 13.0, 13.0, 15.0, 22.0, 25.0, 30.0, 29.0, 46.0, 46.0, 51.0, 46.0, 52.0, 50.0, 56.0, 67.0, 43.0, 44.0, 40.0, 52.0, 28.0, 34.0, 31.0, 27.0, 24.0, 16.0, 19.0, 15.0, 10.0, 3.0, 3.0, 5.0, 1.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.1229019165039062, -2.0435311794281006, -1.9641602039337158, -1.8847893476486206, -1.8054184913635254, -1.7260477542877197, -1.6466768980026245, -1.5673060417175293, -1.487935185432434, -1.4085643291473389, -1.3291934728622437, -1.2498226165771484, -1.1704518795013428, -1.091080904006958, -1.0117101669311523, -0.9323393106460571, -0.8529684543609619, -0.7735975980758667, -0.6942267417907715, -0.614855945110321, -0.5354850888252258, -0.4561142325401306, -0.3767434060573578, -0.29737257957458496, -0.21800172328948975, -0.13863088190555573, -0.059260040521621704, 0.020110800862312317, 0.09948164224624634, 0.17885249853134155, 0.2582233250141144, 0.3375941514968872, 0.4169652462005615, 0.49633610248565674, 0.575706958770752, 0.6550777554512024, 0.7344486117362976, 0.8138194680213928, 0.8931902647018433, 0.9725611209869385, 1.0519319772720337, 1.131302833557129, 1.2106736898422241, 1.2900445461273193, 1.369415283203125, 1.4487862586975098, 1.5281569957733154, 1.6075278520584106, 1.6868987083435059, 1.766269564628601, 1.8456404209136963, 1.9250112771987915, 2.0043821334838867, 2.0837528705596924, 2.163123846054077, 2.242494583129883, 2.3218655586242676, 2.4012362957000732, 2.480607271194458, 2.5599780082702637, 2.6393489837646484, 2.718719720840454, 2.798090696334839, 2.8774614334106445, 2.95683217048645]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 7.0, 14.0, 18.0, 26.0, 48.0, 71.0, 103.0, 207.0, 524.0, 1421.0, 5946.0, 52789.0, 497404.0, 438913.0, 43586.0, 5328.0, 1211.0, 459.0, 213.0, 108.0, 69.0, 37.0, 14.0, 13.0, 14.0, 7.0, 4.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.99560546875, -0.9634475708007812, -0.9312896728515625, -0.8991317749023438, -0.866973876953125, -0.8348159790039062, -0.8026580810546875, -0.7705001831054688, -0.73834228515625, -0.7061843872070312, -0.6740264892578125, -0.6418685913085938, -0.609710693359375, -0.5775527954101562, -0.5453948974609375, -0.5132369995117188, -0.4810791015625, -0.44892120361328125, -0.4167633056640625, -0.38460540771484375, -0.352447509765625, -0.32028961181640625, -0.2881317138671875, -0.25597381591796875, -0.22381591796875, -0.19165802001953125, -0.1595001220703125, -0.12734222412109375, -0.095184326171875, -0.06302642822265625, -0.0308685302734375, 0.00128936767578125, 0.033447265625, 0.06560516357421875, 0.0977630615234375, 0.12992095947265625, 0.162078857421875, 0.19423675537109375, 0.2263946533203125, 0.25855255126953125, 0.29071044921875, 0.32286834716796875, 0.3550262451171875, 0.38718414306640625, 0.419342041015625, 0.45149993896484375, 0.4836578369140625, 0.5158157348632812, 0.5479736328125, 0.5801315307617188, 0.6122894287109375, 0.6444473266601562, 0.676605224609375, 0.7087631225585938, 0.7409210205078125, 0.7730789184570312, 0.80523681640625, 0.8373947143554688, 0.8695526123046875, 0.9017105102539062, 0.933868408203125, 0.9660263061523438, 0.9981842041015625, 1.0303421020507812, 1.0625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 8.0, 5.0, 7.0, 23.0, 26.0, 30.0, 30.0, 47.0, 60.0, 71.0, 92.0, 87.0, 97.0, 70.0, 72.0, 63.0, 53.0, 41.0, 39.0, 33.0, 19.0, 9.0, 4.0, 9.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.126953125, -2.05157470703125, -1.9761962890625, -1.90081787109375, -1.825439453125, -1.75006103515625, -1.6746826171875, -1.59930419921875, -1.52392578125, -1.44854736328125, -1.3731689453125, -1.29779052734375, -1.222412109375, -1.14703369140625, -1.0716552734375, -0.99627685546875, -0.9208984375, -0.84552001953125, -0.7701416015625, -0.69476318359375, -0.619384765625, -0.54400634765625, -0.4686279296875, -0.39324951171875, -0.31787109375, -0.24249267578125, -0.1671142578125, -0.09173583984375, -0.016357421875, 0.05902099609375, 0.1343994140625, 0.20977783203125, 0.28515625, 0.36053466796875, 0.4359130859375, 0.51129150390625, 0.586669921875, 0.66204833984375, 0.7374267578125, 0.81280517578125, 0.88818359375, 0.96356201171875, 1.0389404296875, 1.11431884765625, 1.189697265625, 1.26507568359375, 1.3404541015625, 1.41583251953125, 1.4912109375, 1.56658935546875, 1.6419677734375, 1.71734619140625, 1.792724609375, 1.86810302734375, 1.9434814453125, 2.01885986328125, 2.09423828125, 2.16961669921875, 2.2449951171875, 2.32037353515625, 2.395751953125, 2.47113037109375, 2.5465087890625, 2.62188720703125, 2.697265625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 0.0, 3.0, 3.0, 6.0, 11.0, 16.0, 22.0, 36.0, 35.0, 54.0, 89.0, 136.0, 193.0, 331.0, 595.0, 1086.0, 2052.0, 4106.0, 8215.0, 16555.0, 33947.0, 69115.0, 129129.0, 197742.0, 219849.0, 167539.0, 98142.0, 50293.0, 24854.0, 11937.0, 5966.0, 2986.0, 1525.0, 796.0, 426.0, 274.0, 144.0, 120.0, 69.0, 45.0, 32.0, 24.0, 17.0, 9.0, 11.0, 10.0, 2.0, 4.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2215576171875, -0.21447181701660156, -0.20738601684570312, -0.2003002166748047, -0.19321441650390625, -0.1861286163330078, -0.17904281616210938, -0.17195701599121094, -0.1648712158203125, -0.15778541564941406, -0.15069961547851562, -0.1436138153076172, -0.13652801513671875, -0.1294422149658203, -0.12235641479492188, -0.11527061462402344, -0.108184814453125, -0.10109901428222656, -0.09401321411132812, -0.08692741394042969, -0.07984161376953125, -0.07275581359863281, -0.06567001342773438, -0.05858421325683594, -0.0514984130859375, -0.04441261291503906, -0.037326812744140625, -0.030241012573242188, -0.02315521240234375, -0.016069412231445312, -0.008983612060546875, -0.0018978118896484375, 0.00518798828125, 0.012273788452148438, 0.019359588623046875, 0.026445388793945312, 0.03353118896484375, 0.04061698913574219, 0.047702789306640625, 0.05478858947753906, 0.0618743896484375, 0.06896018981933594, 0.07604598999023438, 0.08313179016113281, 0.09021759033203125, 0.09730339050292969, 0.10438919067382812, 0.11147499084472656, 0.118560791015625, 0.12564659118652344, 0.13273239135742188, 0.1398181915283203, 0.14690399169921875, 0.1539897918701172, 0.16107559204101562, 0.16816139221191406, 0.1752471923828125, 0.18233299255371094, 0.18941879272460938, 0.1965045928955078, 0.20359039306640625, 0.2106761932373047, 0.21776199340820312, 0.22484779357910156, 0.23193359375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 7.0, 7.0, 13.0, 5.0, 15.0, 13.0, 12.0, 12.0, 16.0, 25.0, 29.0, 36.0, 33.0, 29.0, 40.0, 55.0, 37.0, 42.0, 49.0, 39.0, 45.0, 43.0, 36.0, 46.0, 37.0, 38.0, 42.0, 23.0, 25.0, 26.0, 21.0, 19.0, 17.0, 12.0, 13.0, 10.0, 7.0, 9.0, 4.0, 2.0, 4.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.41796875, -2.34393310546875, -2.2698974609375, -2.19586181640625, -2.121826171875, -2.04779052734375, -1.9737548828125, -1.89971923828125, -1.82568359375, -1.75164794921875, -1.6776123046875, -1.60357666015625, -1.529541015625, -1.45550537109375, -1.3814697265625, -1.30743408203125, -1.2333984375, -1.15936279296875, -1.0853271484375, -1.01129150390625, -0.937255859375, -0.86322021484375, -0.7891845703125, -0.71514892578125, -0.64111328125, -0.56707763671875, -0.4930419921875, -0.41900634765625, -0.344970703125, -0.27093505859375, -0.1968994140625, -0.12286376953125, -0.048828125, 0.02520751953125, 0.0992431640625, 0.17327880859375, 0.247314453125, 0.32135009765625, 0.3953857421875, 0.46942138671875, 0.54345703125, 0.61749267578125, 0.6915283203125, 0.76556396484375, 0.839599609375, 0.91363525390625, 0.9876708984375, 1.06170654296875, 1.1357421875, 1.20977783203125, 1.2838134765625, 1.35784912109375, 1.431884765625, 1.50592041015625, 1.5799560546875, 1.65399169921875, 1.72802734375, 1.80206298828125, 1.8760986328125, 1.95013427734375, 2.024169921875, 2.09820556640625, 2.1722412109375, 2.24627685546875, 2.3203125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 5.0, 7.0, 14.0, 8.0, 8.0, 20.0, 37.0, 78.0, 109.0, 199.0, 361.0, 693.0, 1575.0, 4139.0, 14933.0, 79205.0, 443709.0, 412334.0, 70636.0, 13660.0, 3870.0, 1393.0, 721.0, 380.0, 178.0, 106.0, 68.0, 55.0, 23.0, 11.0, 9.0, 4.0, 6.0, 1.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.11553955078125, -0.11241436004638672, -0.10928916931152344, -0.10616397857666016, -0.10303878784179688, -0.0999135971069336, -0.09678840637207031, -0.09366321563720703, -0.09053802490234375, -0.08741283416748047, -0.08428764343261719, -0.0811624526977539, -0.07803726196289062, -0.07491207122802734, -0.07178688049316406, -0.06866168975830078, -0.0655364990234375, -0.06241130828857422, -0.05928611755371094, -0.056160926818847656, -0.053035736083984375, -0.049910545349121094, -0.04678535461425781, -0.04366016387939453, -0.04053497314453125, -0.03740978240966797, -0.03428459167480469, -0.031159400939941406, -0.028034210205078125, -0.024909019470214844, -0.021783828735351562, -0.01865863800048828, -0.015533447265625, -0.012408256530761719, -0.009283065795898438, -0.006157875061035156, -0.003032684326171875, 9.250640869140625e-05, 0.0032176971435546875, 0.006342887878417969, 0.00946807861328125, 0.012593269348144531, 0.015718460083007812, 0.018843650817871094, 0.021968841552734375, 0.025094032287597656, 0.028219223022460938, 0.03134441375732422, 0.0344696044921875, 0.03759479522705078, 0.04071998596191406, 0.043845176696777344, 0.046970367431640625, 0.050095558166503906, 0.05322074890136719, 0.05634593963623047, 0.05947113037109375, 0.06259632110595703, 0.06572151184082031, 0.0688467025756836, 0.07197189331054688, 0.07509708404541016, 0.07822227478027344, 0.08134746551513672, 0.08447265625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 10.0, 6.0, 9.0, 12.0, 12.0, 28.0, 30.0, 60.0, 69.0, 72.0, 87.0, 101.0, 89.0, 98.0, 78.0, 66.0, 43.0, 42.0, 23.0, 18.0, 18.0, 9.0, 4.0, 5.0, 5.0, 0.0, 5.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.4849853515625e-05, -6.323214620351791e-05, -6.161443889141083e-05, -5.999673157930374e-05, -5.8379024267196655e-05, -5.676131695508957e-05, -5.514360964298248e-05, -5.35259023308754e-05, -5.190819501876831e-05, -5.0290487706661224e-05, -4.867278039455414e-05, -4.705507308244705e-05, -4.5437365770339966e-05, -4.381965845823288e-05, -4.2201951146125793e-05, -4.058424383401871e-05, -3.896653652191162e-05, -3.7348829209804535e-05, -3.573112189769745e-05, -3.411341458559036e-05, -3.2495707273483276e-05, -3.087799996137619e-05, -2.9260292649269104e-05, -2.7642585337162018e-05, -2.602487802505493e-05, -2.4407170712947845e-05, -2.278946340084076e-05, -2.1171756088733673e-05, -1.9554048776626587e-05, -1.79363414645195e-05, -1.6318634152412415e-05, -1.4700926840305328e-05, -1.3083219528198242e-05, -1.1465512216091156e-05, -9.84780490398407e-06, -8.230097591876984e-06, -6.6123902797698975e-06, -4.994682967662811e-06, -3.376975655555725e-06, -1.759268343448639e-06, -1.4156103134155273e-07, 1.4761462807655334e-06, 3.0938535928726196e-06, 4.711560904979706e-06, 6.329268217086792e-06, 7.946975529193878e-06, 9.564682841300964e-06, 1.118239015340805e-05, 1.2800097465515137e-05, 1.4417804777622223e-05, 1.603551208972931e-05, 1.7653219401836395e-05, 1.927092671394348e-05, 2.0888634026050568e-05, 2.2506341338157654e-05, 2.412404865026474e-05, 2.5741755962371826e-05, 2.7359463274478912e-05, 2.8977170586586e-05, 3.0594877898693085e-05, 3.221258521080017e-05, 3.383029252290726e-05, 3.544799983501434e-05, 3.706570714712143e-05, 3.8683414459228516e-05]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 5.0, 2.0, 3.0, 2.0, 6.0, 4.0, 7.0, 15.0, 11.0, 11.0, 34.0, 41.0, 70.0, 109.0, 268.0, 611.0, 2009.0, 9102.0, 63773.0, 591315.0, 339637.0, 33709.0, 5653.0, 1300.0, 414.0, 185.0, 89.0, 59.0, 34.0, 23.0, 16.0, 9.0, 10.0, 5.0, 6.0, 3.0, 6.0, 1.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1446533203125, -0.13980674743652344, -0.13496017456054688, -0.1301136016845703, -0.12526702880859375, -0.12042045593261719, -0.11557388305664062, -0.11072731018066406, -0.1058807373046875, -0.10103416442871094, -0.09618759155273438, -0.09134101867675781, -0.08649444580078125, -0.08164787292480469, -0.07680130004882812, -0.07195472717285156, -0.067108154296875, -0.06226158142089844, -0.057415008544921875, -0.05256843566894531, -0.04772186279296875, -0.04287528991699219, -0.038028717041015625, -0.03318214416503906, -0.0283355712890625, -0.023488998413085938, -0.018642425537109375, -0.013795852661132812, -0.00894927978515625, -0.0041027069091796875, 0.000743865966796875, 0.0055904388427734375, 0.01043701171875, 0.015283584594726562, 0.020130157470703125, 0.024976730346679688, 0.02982330322265625, 0.03466987609863281, 0.039516448974609375, 0.04436302185058594, 0.0492095947265625, 0.05405616760253906, 0.058902740478515625, 0.06374931335449219, 0.06859588623046875, 0.07344245910644531, 0.07828903198242188, 0.08313560485839844, 0.087982177734375, 0.09282875061035156, 0.09767532348632812, 0.10252189636230469, 0.10736846923828125, 0.11221504211425781, 0.11706161499023438, 0.12190818786621094, 0.1267547607421875, 0.13160133361816406, 0.13644790649414062, 0.1412944793701172, 0.14614105224609375, 0.1509876251220703, 0.15583419799804688, 0.16068077087402344, 0.16552734375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 5.0, 5.0, 14.0, 6.0, 13.0, 16.0, 22.0, 24.0, 45.0, 44.0, 74.0, 91.0, 102.0, 108.0, 101.0, 60.0, 53.0, 56.0, 33.0, 29.0, 16.0, 17.0, 13.0, 13.0, 7.0, 4.0, 6.0, 7.0, 3.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0298309326171875, -0.028982877731323242, -0.028134822845458984, -0.027286767959594727, -0.02643871307373047, -0.02559065818786621, -0.024742603302001953, -0.023894548416137695, -0.023046493530273438, -0.02219843864440918, -0.021350383758544922, -0.020502328872680664, -0.019654273986816406, -0.01880621910095215, -0.01795816421508789, -0.017110109329223633, -0.016262054443359375, -0.015413999557495117, -0.01456594467163086, -0.013717889785766602, -0.012869834899902344, -0.012021780014038086, -0.011173725128173828, -0.01032567024230957, -0.009477615356445312, -0.008629560470581055, -0.007781505584716797, -0.006933450698852539, -0.006085395812988281, -0.0052373409271240234, -0.004389286041259766, -0.003541231155395508, -0.00269317626953125, -0.0018451213836669922, -0.0009970664978027344, -0.00014901161193847656, 0.0006990432739257812, 0.001547098159790039, 0.002395153045654297, 0.0032432079315185547, 0.0040912628173828125, 0.00493931770324707, 0.005787372589111328, 0.006635427474975586, 0.007483482360839844, 0.008331537246704102, 0.00917959213256836, 0.010027647018432617, 0.010875701904296875, 0.011723756790161133, 0.01257181167602539, 0.013419866561889648, 0.014267921447753906, 0.015115976333618164, 0.015964031219482422, 0.01681208610534668, 0.017660140991210938, 0.018508195877075195, 0.019356250762939453, 0.02020430564880371, 0.02105236053466797, 0.021900415420532227, 0.022748470306396484, 0.023596525192260742, 0.024444580078125]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 6.0, 6.0, 11.0, 16.0, 14.0, 40.0, 58.0, 105.0, 154.0, 158.0, 134.0, 113.0, 77.0, 37.0, 28.0, 19.0, 8.0, 5.0, 6.0, 3.0, 2.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.755671739578247, -3.656165361404419, -3.55665922164917, -3.457152843475342, -3.3576464653015137, -3.2581400871276855, -3.1586339473724365, -3.0591275691986084, -2.9596211910247803, -2.860114812850952, -2.760608673095703, -2.661102294921875, -2.561595916748047, -2.4620895385742188, -2.3625833988189697, -2.2630770206451416, -2.1635708808898926, -2.0640645027160645, -1.9645582437515259, -1.8650519847869873, -1.7655456066131592, -1.6660393476486206, -1.566533088684082, -1.467026710510254, -1.3675203323364258, -1.2680140733718872, -1.168507695198059, -1.0690014362335205, -0.9694950580596924, -0.8699887990951538, -0.7704824805259705, -0.6709761619567871, -0.571469783782959, -0.47196346521377563, -0.3724571466445923, -0.2729508578777313, -0.17344453930854797, -0.07393822073936462, 0.025568068027496338, 0.1250743865966797, 0.22458070516586304, 0.3240870237350464, 0.42359334230422974, 0.5230996608734131, 0.6226059198379517, 0.7221122980117798, 0.8216185569763184, 0.9211248755455017, 1.020631194114685, 1.1201374530792236, 1.2196438312530518, 1.3191500902175903, 1.4186564683914185, 1.518162727355957, 1.6176691055297852, 1.7171753644943237, 1.8166816234588623, 1.9161878824234009, 2.0156941413879395, 2.1152005195617676, 2.2147068977355957, 2.314213275909424, 2.413719415664673, 2.513225793838501, 2.612732172012329]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 4.0, 8.0, 18.0, 14.0, 14.0, 19.0, 17.0, 37.0, 30.0, 51.0, 50.0, 64.0, 65.0, 58.0, 59.0, 85.0, 60.0, 52.0, 57.0, 45.0, 40.0, 32.0, 34.0, 21.0, 24.0, 12.0, 10.0, 9.0, 4.0, 1.0, 2.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3821330070495605, -1.3261218070983887, -1.2701106071472168, -1.2140992879867554, -1.1580880880355835, -1.1020768880844116, -1.0460656881332397, -0.9900544285774231, -0.9340431690216064, -0.8780319690704346, -0.8220207095146179, -0.766009509563446, -0.7099982500076294, -0.6539870500564575, -0.5979758501052856, -0.541964590549469, -0.4859533905982971, -0.42994216084480286, -0.3739309310913086, -0.3179197311401367, -0.26190847158432007, -0.2058972716331482, -0.14988604187965393, -0.09387481212615967, -0.037863582372665405, 0.01814764365553856, 0.07415886968374252, 0.1301700919866562, 0.18618132174015045, 0.24219253659248352, 0.2982037663459778, 0.35421499609947205, 0.4102262258529663, 0.46623745560646057, 0.5222486853599548, 0.5782598853111267, 0.6342711448669434, 0.6902823448181152, 0.7462935447692871, 0.8023048043251038, 0.8583160638809204, 0.9143272638320923, 0.9703385233879089, 1.0263497829437256, 1.0823609828948975, 1.1383721828460693, 1.1943833827972412, 1.250394582748413, 1.306405782699585, 1.3624169826507568, 1.4184281826019287, 1.4744395017623901, 1.530450701713562, 1.5864619016647339, 1.6424731016159058, 1.6984844207763672, 1.754495620727539, 1.810506820678711, 1.8665180206298828, 1.9225293397903442, 1.9785405397415161, 2.0345516204833984, 2.0905630588531494, 2.1465742588043213, 2.202585458755493]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 4.0, 17.0, 21.0, 18.0, 27.0, 61.0, 88.0, 147.0, 221.0, 410.0, 711.0, 1430.0, 2939.0, 6466.0, 14955.0, 35969.0, 89276.0, 208636.0, 316902.0, 212870.0, 91581.0, 37035.0, 15554.0, 6734.0, 3114.0, 1563.0, 809.0, 436.0, 204.0, 123.0, 84.0, 41.0, 34.0, 19.0, 17.0, 4.0, 8.0, 7.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.4453125, -1.4046173095703125, -1.363922119140625, -1.3232269287109375, -1.28253173828125, -1.2418365478515625, -1.201141357421875, -1.1604461669921875, -1.1197509765625, -1.0790557861328125, -1.038360595703125, -0.9976654052734375, -0.95697021484375, -0.9162750244140625, -0.875579833984375, -0.8348846435546875, -0.794189453125, -0.7534942626953125, -0.712799072265625, -0.6721038818359375, -0.63140869140625, -0.5907135009765625, -0.550018310546875, -0.5093231201171875, -0.4686279296875, -0.4279327392578125, -0.387237548828125, -0.3465423583984375, -0.30584716796875, -0.2651519775390625, -0.224456787109375, -0.1837615966796875, -0.14306640625, -0.1023712158203125, -0.061676025390625, -0.0209808349609375, 0.01971435546875, 0.0604095458984375, 0.101104736328125, 0.1417999267578125, 0.1824951171875, 0.2231903076171875, 0.263885498046875, 0.3045806884765625, 0.34527587890625, 0.3859710693359375, 0.426666259765625, 0.4673614501953125, 0.508056640625, 0.5487518310546875, 0.589447021484375, 0.6301422119140625, 0.67083740234375, 0.7115325927734375, 0.752227783203125, 0.7929229736328125, 0.8336181640625, 0.8743133544921875, 0.915008544921875, 0.9557037353515625, 0.99639892578125, 1.0370941162109375, 1.077789306640625, 1.1184844970703125, 1.1591796875]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 3.0, 5.0, 4.0, 15.0, 12.0, 14.0, 23.0, 27.0, 23.0, 33.0, 32.0, 41.0, 50.0, 62.0, 61.0, 45.0, 50.0, 70.0, 52.0, 54.0, 54.0, 45.0, 38.0, 36.0, 28.0, 22.0, 23.0, 21.0, 14.0, 6.0, 11.0, 5.0, 8.0, 3.0, 1.0, 6.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.662109375, -2.56298828125, -2.4638671875, -2.36474609375, -2.265625, -2.16650390625, -2.0673828125, -1.96826171875, -1.869140625, -1.77001953125, -1.6708984375, -1.57177734375, -1.47265625, -1.37353515625, -1.2744140625, -1.17529296875, -1.076171875, -0.97705078125, -0.8779296875, -0.77880859375, -0.6796875, -0.58056640625, -0.4814453125, -0.38232421875, -0.283203125, -0.18408203125, -0.0849609375, 0.01416015625, 0.11328125, 0.21240234375, 0.3115234375, 0.41064453125, 0.509765625, 0.60888671875, 0.7080078125, 0.80712890625, 0.90625, 1.00537109375, 1.1044921875, 1.20361328125, 1.302734375, 1.40185546875, 1.5009765625, 1.60009765625, 1.69921875, 1.79833984375, 1.8974609375, 1.99658203125, 2.095703125, 2.19482421875, 2.2939453125, 2.39306640625, 2.4921875, 2.59130859375, 2.6904296875, 2.78955078125, 2.888671875, 2.98779296875, 3.0869140625, 3.18603515625, 3.28515625, 3.38427734375, 3.4833984375, 3.58251953125, 3.681640625]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 3.0, 6.0, 4.0, 13.0, 9.0, 9.0, 17.0, 11.0, 21.0, 14.0, 29.0, 34.0, 35.0, 35.0, 46.0, 86.0, 140.0, 294.0, 971.0, 54834.0, 982585.0, 8103.0, 567.0, 222.0, 134.0, 62.0, 48.0, 25.0, 28.0, 31.0, 29.0, 12.0, 17.0, 16.0, 12.0, 13.0, 6.0, 10.0, 6.0, 3.0, 3.0, 5.0, 1.0, 1.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.28125, -8.9942626953125, -8.707275390625, -8.4202880859375, -8.13330078125, -7.8463134765625, -7.559326171875, -7.2723388671875, -6.9853515625, -6.6983642578125, -6.411376953125, -6.1243896484375, -5.83740234375, -5.5504150390625, -5.263427734375, -4.9764404296875, -4.689453125, -4.4024658203125, -4.115478515625, -3.8284912109375, -3.54150390625, -3.2545166015625, -2.967529296875, -2.6805419921875, -2.3935546875, -2.1065673828125, -1.819580078125, -1.5325927734375, -1.24560546875, -0.9586181640625, -0.671630859375, -0.3846435546875, -0.09765625, 0.1893310546875, 0.476318359375, 0.7633056640625, 1.05029296875, 1.3372802734375, 1.624267578125, 1.9112548828125, 2.1982421875, 2.4852294921875, 2.772216796875, 3.0592041015625, 3.34619140625, 3.6331787109375, 3.920166015625, 4.2071533203125, 4.494140625, 4.7811279296875, 5.068115234375, 5.3551025390625, 5.64208984375, 5.9290771484375, 6.216064453125, 6.5030517578125, 6.7900390625, 7.0770263671875, 7.364013671875, 7.6510009765625, 7.93798828125, 8.2249755859375, 8.511962890625, 8.7989501953125, 9.0859375]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 4.0, 7.0, 7.0, 5.0, 13.0, 16.0, 10.0, 11.0, 24.0, 16.0, 22.0, 22.0, 17.0, 34.0, 50.0, 36.0, 35.0, 57.0, 45.0, 45.0, 38.0, 39.0, 31.0, 41.0, 45.0, 34.0, 34.0, 32.0, 29.0, 31.0, 26.0, 23.0, 14.0, 19.0, 15.0, 14.0, 10.0, 12.0, 8.0, 3.0, 5.0, 9.0, 3.0, 2.0, 6.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-2.763671875, -2.68017578125, -2.5966796875, -2.51318359375, -2.4296875, -2.34619140625, -2.2626953125, -2.17919921875, -2.095703125, -2.01220703125, -1.9287109375, -1.84521484375, -1.76171875, -1.67822265625, -1.5947265625, -1.51123046875, -1.427734375, -1.34423828125, -1.2607421875, -1.17724609375, -1.09375, -1.01025390625, -0.9267578125, -0.84326171875, -0.759765625, -0.67626953125, -0.5927734375, -0.50927734375, -0.42578125, -0.34228515625, -0.2587890625, -0.17529296875, -0.091796875, -0.00830078125, 0.0751953125, 0.15869140625, 0.2421875, 0.32568359375, 0.4091796875, 0.49267578125, 0.576171875, 0.65966796875, 0.7431640625, 0.82666015625, 0.91015625, 0.99365234375, 1.0771484375, 1.16064453125, 1.244140625, 1.32763671875, 1.4111328125, 1.49462890625, 1.578125, 1.66162109375, 1.7451171875, 1.82861328125, 1.912109375, 1.99560546875, 2.0791015625, 2.16259765625, 2.24609375, 2.32958984375, 2.4130859375, 2.49658203125, 2.580078125]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 5.0, 1.0, 4.0, 2.0, 3.0, 8.0, 5.0, 11.0, 20.0, 28.0, 41.0, 65.0, 117.0, 332.0, 781.0, 2913.0, 21239.0, 495733.0, 501213.0, 21538.0, 2978.0, 807.0, 346.0, 180.0, 83.0, 41.0, 23.0, 10.0, 7.0, 10.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5185546875, -1.4679412841796875, -1.417327880859375, -1.3667144775390625, -1.31610107421875, -1.2654876708984375, -1.214874267578125, -1.1642608642578125, -1.1136474609375, -1.0630340576171875, -1.012420654296875, -0.9618072509765625, -0.91119384765625, -0.8605804443359375, -0.809967041015625, -0.7593536376953125, -0.708740234375, -0.6581268310546875, -0.607513427734375, -0.5569000244140625, -0.50628662109375, -0.4556732177734375, -0.405059814453125, -0.3544464111328125, -0.3038330078125, -0.2532196044921875, -0.202606201171875, -0.1519927978515625, -0.10137939453125, -0.0507659912109375, -0.000152587890625, 0.0504608154296875, 0.10107421875, 0.1516876220703125, 0.202301025390625, 0.2529144287109375, 0.30352783203125, 0.3541412353515625, 0.404754638671875, 0.4553680419921875, 0.5059814453125, 0.5565948486328125, 0.607208251953125, 0.6578216552734375, 0.70843505859375, 0.7590484619140625, 0.809661865234375, 0.8602752685546875, 0.910888671875, 0.9615020751953125, 1.012115478515625, 1.0627288818359375, 1.11334228515625, 1.1639556884765625, 1.214569091796875, 1.2651824951171875, 1.3157958984375, 1.3664093017578125, 1.417022705078125, 1.4676361083984375, 1.51824951171875, 1.5688629150390625, 1.619476318359375, 1.6700897216796875, 1.720703125]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 6.0, 2.0, 3.0, 5.0, 11.0, 11.0, 17.0, 20.0, 30.0, 33.0, 66.0, 79.0, 85.0, 88.0, 112.0, 106.0, 86.0, 60.0, 50.0, 37.0, 31.0, 22.0, 17.0, 9.0, 8.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00017440319061279297, -0.00016973353922367096, -0.00016506388783454895, -0.00016039423644542694, -0.00015572458505630493, -0.00015105493366718292, -0.0001463852822780609, -0.0001417156308889389, -0.0001370459794998169, -0.00013237632811069489, -0.00012770667672157288, -0.00012303702533245087, -0.00011836737394332886, -0.00011369772255420685, -0.00010902807116508484, -0.00010435841977596283, -9.968876838684082e-05, -9.501911699771881e-05, -9.03494656085968e-05, -8.567981421947479e-05, -8.101016283035278e-05, -7.634051144123077e-05, -7.167086005210876e-05, -6.700120866298676e-05, -6.233155727386475e-05, -5.766190588474274e-05, -5.299225449562073e-05, -4.832260310649872e-05, -4.365295171737671e-05, -3.89833003282547e-05, -3.431364893913269e-05, -2.964399755001068e-05, -2.4974346160888672e-05, -2.0304694771766663e-05, -1.5635043382644653e-05, -1.0965391993522644e-05, -6.295740604400635e-06, -1.6260892152786255e-06, 3.043562173843384e-06, 7.713213562965393e-06, 1.2382864952087402e-05, 1.705251634120941e-05, 2.172216773033142e-05, 2.639181911945343e-05, 3.106147050857544e-05, 3.573112189769745e-05, 4.040077328681946e-05, 4.507042467594147e-05, 4.9740076065063477e-05, 5.4409727454185486e-05, 5.9079378843307495e-05, 6.37490302324295e-05, 6.841868162155151e-05, 7.308833301067352e-05, 7.775798439979553e-05, 8.242763578891754e-05, 8.709728717803955e-05, 9.176693856716156e-05, 9.643658995628357e-05, 0.00010110624134540558, 0.00010577589273452759, 0.0001104455441236496, 0.0001151151955127716, 0.00011978484690189362, 0.00012445449829101562]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 7.0, 7.0, 10.0, 11.0, 33.0, 31.0, 71.0, 111.0, 248.0, 828.0, 3602.0, 40604.0, 751949.0, 237242.0, 11258.0, 1648.0, 471.0, 203.0, 89.0, 64.0, 30.0, 17.0, 9.0, 7.0, 4.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.32421875, -1.26849365234375, -1.2127685546875, -1.15704345703125, -1.101318359375, -1.04559326171875, -0.9898681640625, -0.93414306640625, -0.87841796875, -0.82269287109375, -0.7669677734375, -0.71124267578125, -0.655517578125, -0.59979248046875, -0.5440673828125, -0.48834228515625, -0.4326171875, -0.37689208984375, -0.3211669921875, -0.26544189453125, -0.209716796875, -0.15399169921875, -0.0982666015625, -0.04254150390625, 0.01318359375, 0.06890869140625, 0.1246337890625, 0.18035888671875, 0.236083984375, 0.29180908203125, 0.3475341796875, 0.40325927734375, 0.458984375, 0.51470947265625, 0.5704345703125, 0.62615966796875, 0.681884765625, 0.73760986328125, 0.7933349609375, 0.84906005859375, 0.90478515625, 0.96051025390625, 1.0162353515625, 1.07196044921875, 1.127685546875, 1.18341064453125, 1.2391357421875, 1.29486083984375, 1.3505859375, 1.40631103515625, 1.4620361328125, 1.51776123046875, 1.573486328125, 1.62921142578125, 1.6849365234375, 1.74066162109375, 1.79638671875, 1.85211181640625, 1.9078369140625, 1.96356201171875, 2.019287109375, 2.07501220703125, 2.1307373046875, 2.18646240234375, 2.2421875]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 8.0, 6.0, 5.0, 12.0, 18.0, 22.0, 35.0, 43.0, 55.0, 68.0, 75.0, 106.0, 103.0, 90.0, 74.0, 64.0, 65.0, 43.0, 27.0, 24.0, 14.0, 11.0, 9.0, 7.0, 6.0, 4.0, 3.0, 7.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5126953125, -0.4986724853515625, -0.484649658203125, -0.4706268310546875, -0.45660400390625, -0.4425811767578125, -0.428558349609375, -0.4145355224609375, -0.4005126953125, -0.3864898681640625, -0.372467041015625, -0.3584442138671875, -0.34442138671875, -0.3303985595703125, -0.316375732421875, -0.3023529052734375, -0.288330078125, -0.2743072509765625, -0.260284423828125, -0.2462615966796875, -0.23223876953125, -0.2182159423828125, -0.204193115234375, -0.1901702880859375, -0.1761474609375, -0.1621246337890625, -0.148101806640625, -0.1340789794921875, -0.12005615234375, -0.1060333251953125, -0.092010498046875, -0.0779876708984375, -0.06396484375, -0.0499420166015625, -0.035919189453125, -0.0218963623046875, -0.00787353515625, 0.0061492919921875, 0.020172119140625, 0.0341949462890625, 0.0482177734375, 0.0622406005859375, 0.076263427734375, 0.0902862548828125, 0.10430908203125, 0.1183319091796875, 0.132354736328125, 0.1463775634765625, 0.160400390625, 0.1744232177734375, 0.188446044921875, 0.2024688720703125, 0.21649169921875, 0.2305145263671875, 0.244537353515625, 0.2585601806640625, 0.2725830078125, 0.2866058349609375, 0.300628662109375, 0.3146514892578125, 0.32867431640625, 0.3426971435546875, 0.356719970703125, 0.3707427978515625, 0.384765625]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 17.0, 38.0, 117.0, 230.0, 326.0, 170.0, 70.0, 23.0, 6.0, 8.0, 5.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-23.3571834564209, -22.910215377807617, -22.463247299194336, -22.016277313232422, -21.56930923461914, -21.12234115600586, -20.675373077392578, -20.228404998779297, -19.781435012817383, -19.3344669342041, -18.88749885559082, -18.440528869628906, -17.993560791015625, -17.546592712402344, -17.099624633789062, -16.65265655517578, -16.2056884765625, -15.758720397949219, -15.311751365661621, -14.86478328704834, -14.417814254760742, -13.970846176147461, -13.52387809753418, -13.076909065246582, -12.629940032958984, -12.182971954345703, -11.736002922058105, -11.289034843444824, -10.842065811157227, -10.395097732543945, -9.948129653930664, -9.501160621643066, -9.054192543029785, -8.607224464416504, -8.160255432128906, -7.713287353515625, -7.266318321228027, -6.819350242614746, -6.372381687164307, -5.925413131713867, -5.478444576263428, -5.031476020812988, -4.584507465362549, -4.137538909912109, -3.690570592880249, -3.2436020374298096, -2.796633720397949, -2.3496651649475098, -1.9026966094970703, -1.4557280540466309, -1.008759617805481, -0.561791181564331, -0.1148226261138916, 0.33214592933654785, 0.7791142463684082, 1.2260828018188477, 1.673051357269287, 2.1200199127197266, 2.566988468170166, 3.0139567852020264, 3.460925340652466, 3.9078938961029053, 4.354862213134766, 4.801830768585205, 5.2487993240356445]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 3.0, 1.0, 5.0, 4.0, 5.0, 12.0, 12.0, 15.0, 10.0, 18.0, 24.0, 29.0, 24.0, 20.0, 30.0, 24.0, 36.0, 30.0, 40.0, 53.0, 44.0, 40.0, 28.0, 39.0, 39.0, 46.0, 41.0, 27.0, 49.0, 28.0, 31.0, 43.0, 26.0, 28.0, 17.0, 14.0, 15.0, 8.0, 12.0, 8.0, 5.0, 8.0, 1.0, 4.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.125938415527344, -3.9832170009613037, -3.8404955863952637, -3.6977741718292236, -3.5550527572631836, -3.4123313426971436, -3.2696099281311035, -3.1268885135650635, -2.9841670989990234, -2.8414456844329834, -2.6987242698669434, -2.5560028553009033, -2.4132814407348633, -2.2705600261688232, -2.127838611602783, -1.9851171970367432, -1.8423957824707031, -1.699674367904663, -1.556952953338623, -1.414231538772583, -1.271510124206543, -1.128788709640503, -0.9860672950744629, -0.8433458805084229, -0.7006244659423828, -0.5579030513763428, -0.41518163681030273, -0.2724602222442627, -0.12973880767822266, 0.012982606887817383, 0.15570402145385742, 0.29842543601989746, 0.4411473274230957, 0.5838687419891357, 0.7265901565551758, 0.8693115711212158, 1.0120329856872559, 1.154754400253296, 1.297475814819336, 1.440197229385376, 1.582918643951416, 1.725640058517456, 1.868361473083496, 2.011082887649536, 2.153804302215576, 2.296525716781616, 2.4392471313476562, 2.5819685459136963, 2.7246899604797363, 2.8674113750457764, 3.0101327896118164, 3.1528542041778564, 3.2955756187438965, 3.4382970333099365, 3.5810184478759766, 3.7237398624420166, 3.8664612770080566, 4.009182929992676, 4.151904106140137, 4.294625282287598, 4.437346935272217, 4.580068588256836, 4.722789764404297, 4.865510940551758, 5.008232593536377]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 6.0, 2.0, 4.0, 3.0, 11.0, 10.0, 24.0, 29.0, 28.0, 47.0, 66.0, 85.0, 148.0, 265.0, 395.0, 905.0, 2906.0, 16331.0, 200090.0, 2565872.0, 1321199.0, 74314.0, 8218.0, 1831.0, 620.0, 298.0, 182.0, 123.0, 76.0, 63.0, 34.0, 26.0, 22.0, 15.0, 13.0, 6.0, 4.0, 5.0, 1.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.671875, -4.52508544921875, -4.3782958984375, -4.23150634765625, -4.084716796875, -3.93792724609375, -3.7911376953125, -3.64434814453125, -3.49755859375, -3.35076904296875, -3.2039794921875, -3.05718994140625, -2.910400390625, -2.76361083984375, -2.6168212890625, -2.47003173828125, -2.3232421875, -2.17645263671875, -2.0296630859375, -1.88287353515625, -1.736083984375, -1.58929443359375, -1.4425048828125, -1.29571533203125, -1.14892578125, -1.00213623046875, -0.8553466796875, -0.70855712890625, -0.561767578125, -0.41497802734375, -0.2681884765625, -0.12139892578125, 0.025390625, 0.17218017578125, 0.3189697265625, 0.46575927734375, 0.612548828125, 0.75933837890625, 0.9061279296875, 1.05291748046875, 1.19970703125, 1.34649658203125, 1.4932861328125, 1.64007568359375, 1.786865234375, 1.93365478515625, 2.0804443359375, 2.22723388671875, 2.3740234375, 2.52081298828125, 2.6676025390625, 2.81439208984375, 2.961181640625, 3.10797119140625, 3.2547607421875, 3.40155029296875, 3.54833984375, 3.69512939453125, 3.8419189453125, 3.98870849609375, 4.135498046875, 4.28228759765625, 4.4290771484375, 4.57586669921875, 4.72265625]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 11.0, 8.0, 15.0, 14.0, 22.0, 16.0, 32.0, 34.0, 50.0, 36.0, 39.0, 53.0, 44.0, 53.0, 61.0, 59.0, 63.0, 48.0, 47.0, 40.0, 45.0, 28.0, 40.0, 35.0, 29.0, 24.0, 14.0, 14.0, 9.0, 3.0, 5.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.12109375, -2.045166015625, -1.96923828125, -1.893310546875, -1.8173828125, -1.741455078125, -1.66552734375, -1.589599609375, -1.513671875, -1.437744140625, -1.36181640625, -1.285888671875, -1.2099609375, -1.134033203125, -1.05810546875, -0.982177734375, -0.90625, -0.830322265625, -0.75439453125, -0.678466796875, -0.6025390625, -0.526611328125, -0.45068359375, -0.374755859375, -0.298828125, -0.222900390625, -0.14697265625, -0.071044921875, 0.0048828125, 0.080810546875, 0.15673828125, 0.232666015625, 0.30859375, 0.384521484375, 0.46044921875, 0.536376953125, 0.6123046875, 0.688232421875, 0.76416015625, 0.840087890625, 0.916015625, 0.991943359375, 1.06787109375, 1.143798828125, 1.2197265625, 1.295654296875, 1.37158203125, 1.447509765625, 1.5234375, 1.599365234375, 1.67529296875, 1.751220703125, 1.8271484375, 1.903076171875, 1.97900390625, 2.054931640625, 2.130859375, 2.206787109375, 2.28271484375, 2.358642578125, 2.4345703125, 2.510498046875, 2.58642578125, 2.662353515625, 2.73828125]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 3.0, 3.0, 6.0, 5.0, 5.0, 11.0, 17.0, 20.0, 16.0, 25.0, 41.0, 77.0, 151.0, 286.0, 1200.0, 38421.0, 4136008.0, 16419.0, 918.0, 268.0, 119.0, 86.0, 49.0, 45.0, 18.0, 16.0, 8.0, 8.0, 7.0, 5.0, 6.0, 4.0, 5.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.1015625, -9.7042236328125, -9.306884765625, -8.9095458984375, -8.51220703125, -8.1148681640625, -7.717529296875, -7.3201904296875, -6.9228515625, -6.5255126953125, -6.128173828125, -5.7308349609375, -5.33349609375, -4.9361572265625, -4.538818359375, -4.1414794921875, -3.744140625, -3.3468017578125, -2.949462890625, -2.5521240234375, -2.15478515625, -1.7574462890625, -1.360107421875, -0.9627685546875, -0.5654296875, -0.1680908203125, 0.229248046875, 0.6265869140625, 1.02392578125, 1.4212646484375, 1.818603515625, 2.2159423828125, 2.61328125, 3.0106201171875, 3.407958984375, 3.8052978515625, 4.20263671875, 4.5999755859375, 4.997314453125, 5.3946533203125, 5.7919921875, 6.1893310546875, 6.586669921875, 6.9840087890625, 7.38134765625, 7.7786865234375, 8.176025390625, 8.5733642578125, 8.970703125, 9.3680419921875, 9.765380859375, 10.1627197265625, 10.56005859375, 10.9573974609375, 11.354736328125, 11.7520751953125, 12.1494140625, 12.5467529296875, 12.944091796875, 13.3414306640625, 13.73876953125, 14.1361083984375, 14.533447265625, 14.9307861328125, 15.328125]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 6.0, 3.0, 1.0, 8.0, 13.0, 8.0, 21.0, 24.0, 39.0, 57.0, 83.0, 149.0, 235.0, 349.0, 470.0, 607.0, 597.0, 507.0, 319.0, 230.0, 119.0, 96.0, 57.0, 35.0, 22.0, 14.0, 9.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.17578125, -1.1400604248046875, -1.104339599609375, -1.0686187744140625, -1.03289794921875, -0.9971771240234375, -0.961456298828125, -0.9257354736328125, -0.8900146484375, -0.8542938232421875, -0.818572998046875, -0.7828521728515625, -0.74713134765625, -0.7114105224609375, -0.675689697265625, -0.6399688720703125, -0.604248046875, -0.5685272216796875, -0.532806396484375, -0.4970855712890625, -0.46136474609375, -0.4256439208984375, -0.389923095703125, -0.3542022705078125, -0.3184814453125, -0.2827606201171875, -0.247039794921875, -0.2113189697265625, -0.17559814453125, -0.1398773193359375, -0.104156494140625, -0.0684356689453125, -0.03271484375, 0.0030059814453125, 0.038726806640625, 0.0744476318359375, 0.11016845703125, 0.1458892822265625, 0.181610107421875, 0.2173309326171875, 0.2530517578125, 0.2887725830078125, 0.324493408203125, 0.3602142333984375, 0.39593505859375, 0.4316558837890625, 0.467376708984375, 0.5030975341796875, 0.538818359375, 0.5745391845703125, 0.610260009765625, 0.6459808349609375, 0.68170166015625, 0.7174224853515625, 0.753143310546875, 0.7888641357421875, 0.8245849609375, 0.8603057861328125, 0.896026611328125, 0.9317474365234375, 0.96746826171875, 1.0031890869140625, 1.038909912109375, 1.0746307373046875, 1.1103515625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 6.0, 10.0, 9.0, 15.0, 14.0, 37.0, 39.0, 72.0, 90.0, 112.0, 111.0, 108.0, 106.0, 63.0, 61.0, 42.0, 34.0, 23.0, 19.0, 15.0, 6.0, 3.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-5.2290778160095215, -5.0955610275268555, -4.9620442390441895, -4.828527927398682, -4.695011138916016, -4.56149435043335, -4.427977561950684, -4.294461250305176, -4.16094446182251, -4.027427673339844, -3.893911123275757, -3.760394334793091, -3.626877784729004, -3.493360996246338, -3.359844207763672, -3.226327657699585, -3.092810869216919, -2.959294080734253, -2.825777530670166, -2.6922607421875, -2.558744192123413, -2.425227403640747, -2.29171085357666, -2.158194065093994, -2.024677276611328, -1.8911606073379517, -1.7576439380645752, -1.6241271495819092, -1.4906105995178223, -1.3570938110351562, -1.2235771417617798, -1.0900604724884033, -0.9565441608428955, -0.823027491569519, -0.6895108222961426, -0.5559940934181213, -0.4224774241447449, -0.2889607548713684, -0.15544402599334717, -0.021927356719970703, 0.11158931255340576, 0.24510599672794342, 0.3786226809024811, 0.5121393799781799, 0.6456560492515564, 0.7791727185249329, 0.9126894474029541, 1.0462061166763306, 1.179722785949707, 1.3132394552230835, 1.44675612449646, 1.580272912979126, 1.713789463043213, 1.847306251525879, 1.9808229207992554, 2.114339590072632, 2.2478561401367188, 2.3813729286193848, 2.5148894786834717, 2.6484062671661377, 2.7819228172302246, 2.9154396057128906, 3.0489563941955566, 3.1824729442596436, 3.3159897327423096]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 6.0, 1.0, 4.0, 5.0, 10.0, 4.0, 10.0, 17.0, 21.0, 23.0, 29.0, 26.0, 31.0, 33.0, 41.0, 36.0, 50.0, 39.0, 40.0, 52.0, 43.0, 49.0, 44.0, 56.0, 40.0, 50.0, 37.0, 37.0, 31.0, 28.0, 20.0, 15.0, 16.0, 13.0, 13.0, 6.0, 11.0, 5.0, 7.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.4433648586273193, -2.3669867515563965, -2.2906088829040527, -2.21423077583313, -2.137852907180786, -2.0614748001098633, -1.98509681224823, -1.9087188243865967, -1.8323408365249634, -1.75596284866333, -1.6795848608016968, -1.6032068729400635, -1.5268287658691406, -1.4504508972167969, -1.374072790145874, -1.2976948022842407, -1.2213168144226074, -1.1449388265609741, -1.0685608386993408, -0.9921827912330627, -0.9158048033714294, -0.8394268155097961, -0.7630487680435181, -0.6866707801818848, -0.6102927923202515, -0.5339148044586182, -0.4575367867946625, -0.3811587691307068, -0.3047807812690735, -0.22840279340744019, -0.1520247757434845, -0.07564675807952881, 0.0007309913635253906, 0.07710899412631989, 0.15348699688911438, 0.22986499965190887, 0.30624300241470337, 0.38262099027633667, 0.45899900794029236, 0.535377025604248, 0.6117550134658813, 0.6881330013275146, 0.764510989189148, 0.840889036655426, 0.9172670245170593, 0.9936450123786926, 1.0700230598449707, 1.146401047706604, 1.2227790355682373, 1.2991570234298706, 1.375535011291504, 1.4519129991531372, 1.5282909870147705, 1.6046690940856934, 1.6810470819473267, 1.75742506980896, 1.8338030576705933, 1.9101810455322266, 1.9865590333938599, 2.062937021255493, 2.139315128326416, 2.2156929969787598, 2.2920711040496826, 2.3684492111206055, 2.444827079772949]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 9.0, 5.0, 7.0, 13.0, 15.0, 22.0, 29.0, 41.0, 67.0, 104.0, 214.0, 346.0, 712.0, 1842.0, 5448.0, 20140.0, 85015.0, 304037.0, 417804.0, 159603.0, 38304.0, 9709.0, 2872.0, 1043.0, 490.0, 257.0, 123.0, 85.0, 52.0, 44.0, 31.0, 14.0, 18.0, 15.0, 4.0, 7.0, 6.0, 7.0, 3.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59375, -0.5753250122070312, -0.5569000244140625, -0.5384750366210938, -0.520050048828125, -0.5016250610351562, -0.4832000732421875, -0.46477508544921875, -0.44635009765625, -0.42792510986328125, -0.4095001220703125, -0.39107513427734375, -0.372650146484375, -0.35422515869140625, -0.3358001708984375, -0.31737518310546875, -0.2989501953125, -0.28052520751953125, -0.2621002197265625, -0.24367523193359375, -0.225250244140625, -0.20682525634765625, -0.1884002685546875, -0.16997528076171875, -0.15155029296875, -0.13312530517578125, -0.1147003173828125, -0.09627532958984375, -0.077850341796875, -0.05942535400390625, -0.0410003662109375, -0.02257537841796875, -0.004150390625, 0.01427459716796875, 0.0326995849609375, 0.05112457275390625, 0.069549560546875, 0.08797454833984375, 0.1063995361328125, 0.12482452392578125, 0.14324951171875, 0.16167449951171875, 0.1800994873046875, 0.19852447509765625, 0.216949462890625, 0.23537445068359375, 0.2537994384765625, 0.27222442626953125, 0.2906494140625, 0.30907440185546875, 0.3274993896484375, 0.34592437744140625, 0.364349365234375, 0.38277435302734375, 0.4011993408203125, 0.41962432861328125, 0.43804931640625, 0.45647430419921875, 0.4748992919921875, 0.49332427978515625, 0.511749267578125, 0.5301742553710938, 0.5485992431640625, 0.5670242309570312, 0.58544921875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 3.0, 10.0, 6.0, 18.0, 19.0, 21.0, 43.0, 41.0, 49.0, 64.0, 60.0, 88.0, 72.0, 84.0, 76.0, 74.0, 64.0, 52.0, 34.0, 42.0, 20.0, 22.0, 16.0, 6.0, 6.0, 8.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.919921875, -1.84295654296875, -1.7659912109375, -1.68902587890625, -1.612060546875, -1.53509521484375, -1.4581298828125, -1.38116455078125, -1.30419921875, -1.22723388671875, -1.1502685546875, -1.07330322265625, -0.996337890625, -0.91937255859375, -0.8424072265625, -0.76544189453125, -0.6884765625, -0.61151123046875, -0.5345458984375, -0.45758056640625, -0.380615234375, -0.30364990234375, -0.2266845703125, -0.14971923828125, -0.07275390625, 0.00421142578125, 0.0811767578125, 0.15814208984375, 0.235107421875, 0.31207275390625, 0.3890380859375, 0.46600341796875, 0.54296875, 0.61993408203125, 0.6968994140625, 0.77386474609375, 0.850830078125, 0.92779541015625, 1.0047607421875, 1.08172607421875, 1.15869140625, 1.23565673828125, 1.3126220703125, 1.38958740234375, 1.466552734375, 1.54351806640625, 1.6204833984375, 1.69744873046875, 1.7744140625, 1.85137939453125, 1.9283447265625, 2.00531005859375, 2.082275390625, 2.15924072265625, 2.2362060546875, 2.31317138671875, 2.39013671875, 2.46710205078125, 2.5440673828125, 2.62103271484375, 2.697998046875, 2.77496337890625, 2.8519287109375, 2.92889404296875, 3.005859375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 8.0, 3.0, 5.0, 8.0, 11.0, 11.0, 25.0, 29.0, 44.0, 57.0, 98.0, 152.0, 238.0, 414.0, 736.0, 1312.0, 2641.0, 5164.0, 11070.0, 22706.0, 47012.0, 92092.0, 159764.0, 218275.0, 204142.0, 135777.0, 74823.0, 37383.0, 17523.0, 8487.0, 3903.0, 2049.0, 1107.0, 585.0, 317.0, 183.0, 140.0, 87.0, 51.0, 40.0, 19.0, 21.0, 10.0, 9.0, 8.0, 6.0, 4.0, 2.0, 3.0, 1.0, 3.0, 3.0, 2.0, 1.0], "bins": [-0.261474609375, -0.25374794006347656, -0.24602127075195312, -0.2382946014404297, -0.23056793212890625, -0.2228412628173828, -0.21511459350585938, -0.20738792419433594, -0.1996612548828125, -0.19193458557128906, -0.18420791625976562, -0.1764812469482422, -0.16875457763671875, -0.1610279083251953, -0.15330123901367188, -0.14557456970214844, -0.137847900390625, -0.13012123107910156, -0.12239456176757812, -0.11466789245605469, -0.10694122314453125, -0.09921455383300781, -0.09148788452148438, -0.08376121520996094, -0.0760345458984375, -0.06830787658691406, -0.060581207275390625, -0.05285453796386719, -0.04512786865234375, -0.03740119934082031, -0.029674530029296875, -0.021947860717773438, -0.01422119140625, -0.0064945220947265625, 0.001232147216796875, 0.008958816528320312, 0.01668548583984375, 0.024412155151367188, 0.032138824462890625, 0.03986549377441406, 0.0475921630859375, 0.05531883239746094, 0.06304550170898438, 0.07077217102050781, 0.07849884033203125, 0.08622550964355469, 0.09395217895507812, 0.10167884826660156, 0.109405517578125, 0.11713218688964844, 0.12485885620117188, 0.1325855255126953, 0.14031219482421875, 0.1480388641357422, 0.15576553344726562, 0.16349220275878906, 0.1712188720703125, 0.17894554138183594, 0.18667221069335938, 0.1943988800048828, 0.20212554931640625, 0.2098522186279297, 0.21757888793945312, 0.22530555725097656, 0.2330322265625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 7.0, 4.0, 4.0, 6.0, 9.0, 12.0, 16.0, 25.0, 23.0, 19.0, 36.0, 40.0, 41.0, 65.0, 59.0, 70.0, 68.0, 64.0, 59.0, 59.0, 55.0, 48.0, 49.0, 28.0, 32.0, 22.0, 15.0, 18.0, 16.0, 10.0, 9.0, 8.0, 8.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.85546875, -3.73992919921875, -3.6243896484375, -3.50885009765625, -3.393310546875, -3.27777099609375, -3.1622314453125, -3.04669189453125, -2.93115234375, -2.81561279296875, -2.7000732421875, -2.58453369140625, -2.468994140625, -2.35345458984375, -2.2379150390625, -2.12237548828125, -2.0068359375, -1.89129638671875, -1.7757568359375, -1.66021728515625, -1.544677734375, -1.42913818359375, -1.3135986328125, -1.19805908203125, -1.08251953125, -0.96697998046875, -0.8514404296875, -0.73590087890625, -0.620361328125, -0.50482177734375, -0.3892822265625, -0.27374267578125, -0.158203125, -0.04266357421875, 0.0728759765625, 0.18841552734375, 0.303955078125, 0.41949462890625, 0.5350341796875, 0.65057373046875, 0.76611328125, 0.88165283203125, 0.9971923828125, 1.11273193359375, 1.228271484375, 1.34381103515625, 1.4593505859375, 1.57489013671875, 1.6904296875, 1.80596923828125, 1.9215087890625, 2.03704833984375, 2.152587890625, 2.26812744140625, 2.3836669921875, 2.49920654296875, 2.61474609375, 2.73028564453125, 2.8458251953125, 2.96136474609375, 3.076904296875, 3.19244384765625, 3.3079833984375, 3.42352294921875, 3.5390625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 8.0, 6.0, 4.0, 10.0, 9.0, 20.0, 27.0, 28.0, 40.0, 58.0, 114.0, 142.0, 205.0, 376.0, 697.0, 1420.0, 3333.0, 9393.0, 30130.0, 121461.0, 426249.0, 337647.0, 83247.0, 21732.0, 7034.0, 2650.0, 1134.0, 548.0, 279.0, 184.0, 115.0, 66.0, 52.0, 44.0, 17.0, 18.0, 9.0, 8.0, 14.0, 11.0, 7.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.07501220703125, -0.07250118255615234, -0.06999015808105469, -0.06747913360595703, -0.06496810913085938, -0.06245708465576172, -0.05994606018066406, -0.057435035705566406, -0.05492401123046875, -0.052412986755371094, -0.04990196228027344, -0.04739093780517578, -0.044879913330078125, -0.04236888885498047, -0.03985786437988281, -0.037346839904785156, -0.0348358154296875, -0.032324790954589844, -0.029813766479492188, -0.02730274200439453, -0.024791717529296875, -0.02228069305419922, -0.019769668579101562, -0.017258644104003906, -0.01474761962890625, -0.012236595153808594, -0.009725570678710938, -0.007214546203613281, -0.004703521728515625, -0.0021924972534179688, 0.0003185272216796875, 0.0028295516967773438, 0.005340576171875, 0.007851600646972656, 0.010362625122070312, 0.012873649597167969, 0.015384674072265625, 0.01789569854736328, 0.020406723022460938, 0.022917747497558594, 0.02542877197265625, 0.027939796447753906, 0.030450820922851562, 0.03296184539794922, 0.035472869873046875, 0.03798389434814453, 0.04049491882324219, 0.043005943298339844, 0.0455169677734375, 0.048027992248535156, 0.05053901672363281, 0.05305004119873047, 0.055561065673828125, 0.05807209014892578, 0.06058311462402344, 0.0630941390991211, 0.06560516357421875, 0.0681161880493164, 0.07062721252441406, 0.07313823699951172, 0.07564926147460938, 0.07816028594970703, 0.08067131042480469, 0.08318233489990234, 0.085693359375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 1.0, 5.0, 4.0, 9.0, 5.0, 20.0, 12.0, 16.0, 23.0, 32.0, 29.0, 39.0, 73.0, 61.0, 85.0, 69.0, 78.0, 72.0, 79.0, 52.0, 45.0, 47.0, 26.0, 24.0, 21.0, 17.0, 16.0, 8.0, 7.0, 4.0, 6.0, 6.0, 4.0, 0.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.4749507904052734e-05, -3.351643681526184e-05, -3.228336572647095e-05, -3.1050294637680054e-05, -2.981722354888916e-05, -2.8584152460098267e-05, -2.7351081371307373e-05, -2.611801028251648e-05, -2.4884939193725586e-05, -2.3651868104934692e-05, -2.24187970161438e-05, -2.1185725927352905e-05, -1.9952654838562012e-05, -1.8719583749771118e-05, -1.7486512660980225e-05, -1.625344157218933e-05, -1.5020370483398438e-05, -1.3787299394607544e-05, -1.255422830581665e-05, -1.1321157217025757e-05, -1.0088086128234863e-05, -8.85501503944397e-06, -7.621943950653076e-06, -6.388872861862183e-06, -5.155801773071289e-06, -3.9227306842803955e-06, -2.689659595489502e-06, -1.4565885066986084e-06, -2.2351741790771484e-07, 1.0095536708831787e-06, 2.2426247596740723e-06, 3.475695848464966e-06, 4.708766937255859e-06, 5.941838026046753e-06, 7.1749091148376465e-06, 8.40798020362854e-06, 9.641051292419434e-06, 1.0874122381210327e-05, 1.210719347000122e-05, 1.3340264558792114e-05, 1.4573335647583008e-05, 1.58064067363739e-05, 1.7039477825164795e-05, 1.827254891395569e-05, 1.9505620002746582e-05, 2.0738691091537476e-05, 2.197176218032837e-05, 2.3204833269119263e-05, 2.4437904357910156e-05, 2.567097544670105e-05, 2.6904046535491943e-05, 2.8137117624282837e-05, 2.937018871307373e-05, 3.0603259801864624e-05, 3.183633089065552e-05, 3.306940197944641e-05, 3.4302473068237305e-05, 3.55355441570282e-05, 3.676861524581909e-05, 3.8001686334609985e-05, 3.923475742340088e-05, 4.046782851219177e-05, 4.1700899600982666e-05, 4.293397068977356e-05, 4.416704177856445e-05]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 6.0, 8.0, 14.0, 4.0, 15.0, 22.0, 25.0, 44.0, 73.0, 96.0, 195.0, 374.0, 889.0, 2485.0, 7910.0, 29641.0, 152144.0, 569774.0, 227463.0, 41749.0, 10252.0, 3164.0, 1120.0, 520.0, 232.0, 113.0, 68.0, 40.0, 29.0, 15.0, 20.0, 9.0, 10.0, 4.0, 5.0, 7.0, 5.0, 4.0, 2.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.113525390625, -0.1102457046508789, -0.10696601867675781, -0.10368633270263672, -0.10040664672851562, -0.09712696075439453, -0.09384727478027344, -0.09056758880615234, -0.08728790283203125, -0.08400821685791016, -0.08072853088378906, -0.07744884490966797, -0.07416915893554688, -0.07088947296142578, -0.06760978698730469, -0.0643301010131836, -0.0610504150390625, -0.057770729064941406, -0.05449104309082031, -0.05121135711669922, -0.047931671142578125, -0.04465198516845703, -0.04137229919433594, -0.038092613220214844, -0.03481292724609375, -0.031533241271972656, -0.028253555297851562, -0.02497386932373047, -0.021694183349609375, -0.01841449737548828, -0.015134811401367188, -0.011855125427246094, -0.008575439453125, -0.005295753479003906, -0.0020160675048828125, 0.0012636184692382812, 0.004543304443359375, 0.007822990417480469, 0.011102676391601562, 0.014382362365722656, 0.01766204833984375, 0.020941734313964844, 0.024221420288085938, 0.02750110626220703, 0.030780792236328125, 0.03406047821044922, 0.03734016418457031, 0.040619850158691406, 0.0438995361328125, 0.047179222106933594, 0.05045890808105469, 0.05373859405517578, 0.057018280029296875, 0.06029796600341797, 0.06357765197753906, 0.06685733795166016, 0.07013702392578125, 0.07341670989990234, 0.07669639587402344, 0.07997608184814453, 0.08325576782226562, 0.08653545379638672, 0.08981513977050781, 0.0930948257446289, 0.09637451171875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 4.0, 4.0, 2.0, 2.0, 6.0, 5.0, 5.0, 5.0, 6.0, 11.0, 7.0, 14.0, 17.0, 16.0, 43.0, 59.0, 56.0, 56.0, 78.0, 84.0, 91.0, 77.0, 77.0, 50.0, 45.0, 40.0, 30.0, 34.0, 16.0, 12.0, 12.0, 8.0, 7.0, 3.0, 13.0, 3.0, 0.0, 6.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0184478759765625, -0.017822980880737305, -0.01719808578491211, -0.016573190689086914, -0.01594829559326172, -0.015323400497436523, -0.014698505401611328, -0.014073610305786133, -0.013448715209960938, -0.012823820114135742, -0.012198925018310547, -0.011574029922485352, -0.010949134826660156, -0.010324239730834961, -0.009699344635009766, -0.00907444953918457, -0.008449554443359375, -0.00782465934753418, -0.007199764251708984, -0.006574869155883789, -0.005949974060058594, -0.0053250789642333984, -0.004700183868408203, -0.004075288772583008, -0.0034503936767578125, -0.002825498580932617, -0.002200603485107422, -0.0015757083892822266, -0.0009508132934570312, -0.00032591819763183594, 0.0002989768981933594, 0.0009238719940185547, 0.00154876708984375, 0.0021736621856689453, 0.0027985572814941406, 0.003423452377319336, 0.004048347473144531, 0.0046732425689697266, 0.005298137664794922, 0.005923032760620117, 0.0065479278564453125, 0.007172822952270508, 0.007797718048095703, 0.008422613143920898, 0.009047508239746094, 0.009672403335571289, 0.010297298431396484, 0.01092219352722168, 0.011547088623046875, 0.01217198371887207, 0.012796878814697266, 0.013421773910522461, 0.014046669006347656, 0.014671564102172852, 0.015296459197998047, 0.015921354293823242, 0.016546249389648438, 0.017171144485473633, 0.017796039581298828, 0.018420934677124023, 0.01904582977294922, 0.019670724868774414, 0.02029561996459961, 0.020920515060424805, 0.02154541015625]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 15.0, 22.0, 72.0, 216.0, 349.0, 211.0, 80.0, 28.0, 13.0, 2.0, 2.0, 3.0, 2.0, 0.0, 3.0], "bins": [-12.600336074829102, -12.36499309539795, -12.129650115966797, -11.894307136535645, -11.658964157104492, -11.42362117767334, -11.188278198242188, -10.952935218811035, -10.717592239379883, -10.48224925994873, -10.246906280517578, -10.011563301086426, -9.776220321655273, -9.540877342224121, -9.305534362792969, -9.070191383361816, -8.834848403930664, -8.599505424499512, -8.36416244506836, -8.128819465637207, -7.893476486206055, -7.658133506774902, -7.42279052734375, -7.187447547912598, -6.952103614807129, -6.716760635375977, -6.481417655944824, -6.246074676513672, -6.0107316970825195, -5.775388717651367, -5.540045738220215, -5.3047027587890625, -5.06935977935791, -4.834016799926758, -4.5986738204956055, -4.363330841064453, -4.127987861633301, -3.8926448822021484, -3.657301664352417, -3.4219586849212646, -3.186615467071533, -2.951272487640381, -2.7159295082092285, -2.480586528778076, -2.245243549346924, -2.0099005699157715, -1.77455735206604, -1.5392143726348877, -1.3038713932037354, -1.068528413772583, -0.8331853747367859, -0.5978423357009888, -0.3624993562698364, -0.12715637683868408, 0.10818672180175781, 0.34352970123291016, 0.5788726806640625, 0.8142156600952148, 1.0495586395263672, 1.284901738166809, 1.5202447175979614, 1.7555876970291138, 1.9909307956695557, 2.226273775100708, 2.4616167545318604]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 8.0, 12.0, 9.0, 20.0, 25.0, 47.0, 48.0, 74.0, 66.0, 82.0, 91.0, 79.0, 93.0, 89.0, 73.0, 56.0, 36.0, 35.0, 17.0, 15.0, 15.0, 8.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7142726182937622, -1.6294703483581543, -1.5446680784225464, -1.4598658084869385, -1.3750636577606201, -1.2902613878250122, -1.2054591178894043, -1.120656967163086, -1.0358545780181885, -0.9510523080825806, -0.8662500977516174, -0.7814478278160095, -0.6966456174850464, -0.6118433475494385, -0.5270410776138306, -0.44223886728286743, -0.3574366569519043, -0.2726344168186188, -0.18783216178417206, -0.10302990674972534, -0.01822766661643982, 0.0665745735168457, 0.1513768434524536, 0.23617905378341675, 0.32098132371902466, 0.4057835638523102, 0.4905858039855957, 0.5753880739212036, 0.6601903438568115, 0.7449925541877747, 0.8297948241233826, 0.9145970344543457, 0.9993991851806641, 1.084201455116272, 1.1690037250518799, 1.2538058757781982, 1.3386081457138062, 1.423410415649414, 1.508212685585022, 1.5930149555206299, 1.6778171062469482, 1.7626193761825562, 1.847421646118164, 1.9322237968444824, 2.01702618598938, 2.1018283367156982, 2.1866307258605957, 2.271432876586914, 2.3562350273132324, 2.441037178039551, 2.5258395671844482, 2.6106417179107666, 2.695444107055664, 2.7802462577819824, 2.865048408508301, 2.9498507976531982, 3.0346531867980957, 3.119455337524414, 3.2042577266693115, 3.28905987739563, 3.3738622665405273, 3.4586644172668457, 3.543466567993164, 3.6282689571380615, 3.71307110786438]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 4.0, 2.0, 6.0, 5.0, 8.0, 4.0, 6.0, 5.0, 14.0, 11.0, 30.0, 25.0, 35.0, 40.0, 53.0, 94.0, 378.0, 3842.0, 112494.0, 842063.0, 85596.0, 3142.0, 359.0, 94.0, 64.0, 44.0, 36.0, 21.0, 26.0, 10.0, 9.0, 10.0, 7.0, 5.0, 3.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.01953125, -4.8599853515625, -4.700439453125, -4.5408935546875, -4.38134765625, -4.2218017578125, -4.062255859375, -3.9027099609375, -3.7431640625, -3.5836181640625, -3.424072265625, -3.2645263671875, -3.10498046875, -2.9454345703125, -2.785888671875, -2.6263427734375, -2.466796875, -2.3072509765625, -2.147705078125, -1.9881591796875, -1.82861328125, -1.6690673828125, -1.509521484375, -1.3499755859375, -1.1904296875, -1.0308837890625, -0.871337890625, -0.7117919921875, -0.55224609375, -0.3927001953125, -0.233154296875, -0.0736083984375, 0.0859375, 0.2454833984375, 0.405029296875, 0.5645751953125, 0.72412109375, 0.8836669921875, 1.043212890625, 1.2027587890625, 1.3623046875, 1.5218505859375, 1.681396484375, 1.8409423828125, 2.00048828125, 2.1600341796875, 2.319580078125, 2.4791259765625, 2.638671875, 2.7982177734375, 2.957763671875, 3.1173095703125, 3.27685546875, 3.4364013671875, 3.595947265625, 3.7554931640625, 3.9150390625, 4.0745849609375, 4.234130859375, 4.3936767578125, 4.55322265625, 4.7127685546875, 4.872314453125, 5.0318603515625, 5.19140625]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 10.0, 24.0, 29.0, 94.0, 100.0, 163.0, 175.0, 145.0, 132.0, 70.0, 28.0, 27.0, 8.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.25390625, -2.94427490234375, -2.6346435546875, -2.32501220703125, -2.015380859375, -1.70574951171875, -1.3961181640625, -1.08648681640625, -0.77685546875, -0.46722412109375, -0.1575927734375, 0.15203857421875, 0.461669921875, 0.77130126953125, 1.0809326171875, 1.39056396484375, 1.7001953125, 2.00982666015625, 2.3194580078125, 2.62908935546875, 2.938720703125, 3.24835205078125, 3.5579833984375, 3.86761474609375, 4.17724609375, 4.48687744140625, 4.7965087890625, 5.10614013671875, 5.415771484375, 5.72540283203125, 6.0350341796875, 6.34466552734375, 6.654296875, 6.96392822265625, 7.2735595703125, 7.58319091796875, 7.892822265625, 8.20245361328125, 8.5120849609375, 8.82171630859375, 9.13134765625, 9.44097900390625, 9.7506103515625, 10.06024169921875, 10.369873046875, 10.67950439453125, 10.9891357421875, 11.29876708984375, 11.6083984375, 11.91802978515625, 12.2276611328125, 12.53729248046875, 12.846923828125, 13.15655517578125, 13.4661865234375, 13.77581787109375, 14.08544921875, 14.39508056640625, 14.7047119140625, 15.01434326171875, 15.323974609375, 15.63360595703125, 15.9432373046875, 16.25286865234375, 16.5625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 2.0, 1.0, 4.0, 2.0, 11.0, 16.0, 13.0, 20.0, 25.0, 39.0, 42.0, 44.0, 85.0, 93.0, 109.0, 155.0, 152.0, 276.0, 475.0, 1782.0, 38603.0, 780879.0, 217937.0, 5812.0, 709.0, 357.0, 225.0, 154.0, 128.0, 95.0, 73.0, 69.0, 46.0, 32.0, 22.0, 19.0, 9.0, 15.0, 10.0, 4.0, 5.0, 5.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.203125, -4.05682373046875, -3.9105224609375, -3.76422119140625, -3.617919921875, -3.47161865234375, -3.3253173828125, -3.17901611328125, -3.03271484375, -2.88641357421875, -2.7401123046875, -2.59381103515625, -2.447509765625, -2.30120849609375, -2.1549072265625, -2.00860595703125, -1.8623046875, -1.71600341796875, -1.5697021484375, -1.42340087890625, -1.277099609375, -1.13079833984375, -0.9844970703125, -0.83819580078125, -0.69189453125, -0.54559326171875, -0.3992919921875, -0.25299072265625, -0.106689453125, 0.03961181640625, 0.1859130859375, 0.33221435546875, 0.478515625, 0.62481689453125, 0.7711181640625, 0.91741943359375, 1.063720703125, 1.21002197265625, 1.3563232421875, 1.50262451171875, 1.64892578125, 1.79522705078125, 1.9415283203125, 2.08782958984375, 2.234130859375, 2.38043212890625, 2.5267333984375, 2.67303466796875, 2.8193359375, 2.96563720703125, 3.1119384765625, 3.25823974609375, 3.404541015625, 3.55084228515625, 3.6971435546875, 3.84344482421875, 3.98974609375, 4.13604736328125, 4.2823486328125, 4.42864990234375, 4.574951171875, 4.72125244140625, 4.8675537109375, 5.01385498046875, 5.16015625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 8.0, 2.0, 7.0, 5.0, 12.0, 9.0, 15.0, 22.0, 19.0, 27.0, 34.0, 25.0, 41.0, 43.0, 37.0, 38.0, 44.0, 51.0, 49.0, 42.0, 60.0, 40.0, 49.0, 44.0, 43.0, 34.0, 35.0, 28.0, 32.0, 12.0, 21.0, 24.0, 6.0, 9.0, 12.0, 6.0, 6.0, 3.0, 4.0, 9.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.634765625, -2.532318115234375, -2.42987060546875, -2.327423095703125, -2.2249755859375, -2.122528076171875, -2.02008056640625, -1.917633056640625, -1.815185546875, -1.712738037109375, -1.61029052734375, -1.507843017578125, -1.4053955078125, -1.302947998046875, -1.20050048828125, -1.098052978515625, -0.99560546875, -0.893157958984375, -0.79071044921875, -0.688262939453125, -0.5858154296875, -0.483367919921875, -0.38092041015625, -0.278472900390625, -0.176025390625, -0.073577880859375, 0.02886962890625, 0.131317138671875, 0.2337646484375, 0.336212158203125, 0.43865966796875, 0.541107177734375, 0.6435546875, 0.746002197265625, 0.84844970703125, 0.950897216796875, 1.0533447265625, 1.155792236328125, 1.25823974609375, 1.360687255859375, 1.463134765625, 1.565582275390625, 1.66802978515625, 1.770477294921875, 1.8729248046875, 1.975372314453125, 2.07781982421875, 2.180267333984375, 2.28271484375, 2.385162353515625, 2.48760986328125, 2.590057373046875, 2.6925048828125, 2.794952392578125, 2.89739990234375, 2.999847412109375, 3.102294921875, 3.204742431640625, 3.30718994140625, 3.409637451171875, 3.5120849609375, 3.614532470703125, 3.71697998046875, 3.819427490234375, 3.921875]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 5.0, 8.0, 17.0, 24.0, 39.0, 66.0, 136.0, 299.0, 794.0, 2453.0, 13037.0, 219223.0, 759638.0, 45386.0, 5205.0, 1372.0, 467.0, 184.0, 103.0, 25.0, 22.0, 18.0, 8.0, 5.0, 2.0, 4.0, 4.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.4765625, -1.420318603515625, -1.36407470703125, -1.307830810546875, -1.2515869140625, -1.195343017578125, -1.13909912109375, -1.082855224609375, -1.026611328125, -0.970367431640625, -0.91412353515625, -0.857879638671875, -0.8016357421875, -0.745391845703125, -0.68914794921875, -0.632904052734375, -0.57666015625, -0.520416259765625, -0.46417236328125, -0.407928466796875, -0.3516845703125, -0.295440673828125, -0.23919677734375, -0.182952880859375, -0.126708984375, -0.070465087890625, -0.01422119140625, 0.042022705078125, 0.0982666015625, 0.154510498046875, 0.21075439453125, 0.266998291015625, 0.3232421875, 0.379486083984375, 0.43572998046875, 0.491973876953125, 0.5482177734375, 0.604461669921875, 0.66070556640625, 0.716949462890625, 0.773193359375, 0.829437255859375, 0.88568115234375, 0.941925048828125, 0.9981689453125, 1.054412841796875, 1.11065673828125, 1.166900634765625, 1.22314453125, 1.279388427734375, 1.33563232421875, 1.391876220703125, 1.4481201171875, 1.504364013671875, 1.56060791015625, 1.616851806640625, 1.673095703125, 1.729339599609375, 1.78558349609375, 1.841827392578125, 1.8980712890625, 1.954315185546875, 2.01055908203125, 2.066802978515625, 2.123046875]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 2.0, 7.0, 18.0, 22.0, 28.0, 37.0, 74.0, 100.0, 116.0, 152.0, 129.0, 96.0, 85.0, 49.0, 29.0, 24.0, 11.0, 5.0, 5.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002601146697998047, -0.00025320425629615784, -0.000246293842792511, -0.00023938342928886414, -0.00023247301578521729, -0.00022556260228157043, -0.00021865218877792358, -0.00021174177527427673, -0.00020483136177062988, -0.00019792094826698303, -0.00019101053476333618, -0.00018410012125968933, -0.00017718970775604248, -0.00017027929425239563, -0.00016336888074874878, -0.00015645846724510193, -0.00014954805374145508, -0.00014263764023780823, -0.00013572722673416138, -0.00012881681323051453, -0.00012190639972686768, -0.00011499598622322083, -0.00010808557271957397, -0.00010117515921592712, -9.426474571228027e-05, -8.735433220863342e-05, -8.044391870498657e-05, -7.353350520133972e-05, -6.662309169769287e-05, -5.971267819404602e-05, -5.280226469039917e-05, -4.589185118675232e-05, -3.898143768310547e-05, -3.207102417945862e-05, -2.5160610675811768e-05, -1.8250197172164917e-05, -1.1339783668518066e-05, -4.429370164871216e-06, 2.4810433387756348e-06, 9.391456842422485e-06, 1.6301870346069336e-05, 2.3212283849716187e-05, 3.0122697353363037e-05, 3.703311085700989e-05, 4.394352436065674e-05, 5.085393786430359e-05, 5.776435136795044e-05, 6.467476487159729e-05, 7.158517837524414e-05, 7.849559187889099e-05, 8.540600538253784e-05, 9.231641888618469e-05, 9.922683238983154e-05, 0.0001061372458934784, 0.00011304765939712524, 0.0001199580729007721, 0.00012686848640441895, 0.0001337788999080658, 0.00014068931341171265, 0.0001475997269153595, 0.00015451014041900635, 0.0001614205539226532, 0.00016833096742630005, 0.0001752413809299469, 0.00018215179443359375]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 4.0, 3.0, 9.0, 8.0, 11.0, 20.0, 31.0, 34.0, 52.0, 100.0, 231.0, 582.0, 2171.0, 17840.0, 514320.0, 492619.0, 17284.0, 2143.0, 562.0, 231.0, 124.0, 66.0, 26.0, 29.0, 19.0, 14.0, 7.0, 8.0, 6.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.357421875, -2.2900543212890625, -2.222686767578125, -2.1553192138671875, -2.08795166015625, -2.0205841064453125, -1.953216552734375, -1.8858489990234375, -1.8184814453125, -1.7511138916015625, -1.683746337890625, -1.6163787841796875, -1.54901123046875, -1.4816436767578125, -1.414276123046875, -1.3469085693359375, -1.279541015625, -1.2121734619140625, -1.144805908203125, -1.0774383544921875, -1.01007080078125, -0.9427032470703125, -0.875335693359375, -0.8079681396484375, -0.7406005859375, -0.6732330322265625, -0.605865478515625, -0.5384979248046875, -0.47113037109375, -0.4037628173828125, -0.336395263671875, -0.2690277099609375, -0.20166015625, -0.1342926025390625, -0.066925048828125, 0.0004425048828125, 0.06781005859375, 0.1351776123046875, 0.202545166015625, 0.2699127197265625, 0.3372802734375, 0.4046478271484375, 0.472015380859375, 0.5393829345703125, 0.60675048828125, 0.6741180419921875, 0.741485595703125, 0.8088531494140625, 0.876220703125, 0.9435882568359375, 1.010955810546875, 1.0783233642578125, 1.14569091796875, 1.2130584716796875, 1.280426025390625, 1.3477935791015625, 1.4151611328125, 1.4825286865234375, 1.549896240234375, 1.6172637939453125, 1.68463134765625, 1.7519989013671875, 1.819366455078125, 1.8867340087890625, 1.9541015625]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 7.0, 6.0, 9.0, 6.0, 15.0, 18.0, 26.0, 36.0, 56.0, 69.0, 116.0, 126.0, 120.0, 104.0, 87.0, 61.0, 39.0, 21.0, 25.0, 18.0, 10.0, 7.0, 9.0, 6.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.472412109375, -0.4544334411621094, -0.43645477294921875, -0.4184761047363281, -0.4004974365234375, -0.3825187683105469, -0.36454010009765625, -0.3465614318847656, -0.328582763671875, -0.3106040954589844, -0.29262542724609375, -0.2746467590332031, -0.2566680908203125, -0.23868942260742188, -0.22071075439453125, -0.20273208618164062, -0.18475341796875, -0.16677474975585938, -0.14879608154296875, -0.13081741333007812, -0.1128387451171875, -0.09486007690429688, -0.07688140869140625, -0.058902740478515625, -0.040924072265625, -0.022945404052734375, -0.00496673583984375, 0.013011932373046875, 0.0309906005859375, 0.048969268798828125, 0.06694793701171875, 0.08492660522460938, 0.1029052734375, 0.12088394165039062, 0.13886260986328125, 0.15684127807617188, 0.1748199462890625, 0.19279861450195312, 0.21077728271484375, 0.22875595092773438, 0.246734619140625, 0.2647132873535156, 0.28269195556640625, 0.3006706237792969, 0.3186492919921875, 0.3366279602050781, 0.35460662841796875, 0.3725852966308594, 0.39056396484375, 0.4085426330566406, 0.42652130126953125, 0.4444999694824219, 0.4624786376953125, 0.4804573059082031, 0.49843597412109375, 0.5164146423339844, 0.534393310546875, 0.5523719787597656, 0.5703506469726562, 0.5883293151855469, 0.6063079833984375, 0.6242866516113281, 0.6422653198242188, 0.6602439880371094, 0.67822265625]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 2.0, 10.0, 7.0, 20.0, 26.0, 42.0, 51.0, 71.0, 105.0, 115.0, 125.0, 118.0, 91.0, 61.0, 46.0, 40.0, 28.0, 10.0, 8.0, 7.0, 5.0, 7.0, 0.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.005093097686768, -5.8308210372924805, -5.656548500061035, -5.482276439666748, -5.308004379272461, -5.133732318878174, -4.9594597816467285, -4.785187721252441, -4.610915660858154, -4.436643600463867, -4.262371063232422, -4.088099002838135, -3.9138269424438477, -3.7395546436309814, -3.5652823448181152, -3.391010284423828, -3.216737985610962, -3.0424656867980957, -2.8681936264038086, -2.6939213275909424, -2.5196492671966553, -2.345376968383789, -2.171104907989502, -1.9968326091766357, -1.822560429573059, -1.6482882499694824, -1.4740160703659058, -1.299743890762329, -1.125471591949463, -0.951199471950531, -0.7769272327423096, -0.6026550531387329, -0.42838287353515625, -0.2541106939315796, -0.07983848452568054, 0.0944337248802185, 0.26870590448379517, 0.4429780840873718, 0.6172503232955933, 0.7915225028991699, 0.9657946825027466, 1.1400668621063232, 1.3143390417099, 1.4886112213134766, 1.6628835201263428, 1.8371555805206299, 2.011427879333496, 2.185699939727783, 2.3599722385406494, 2.5342445373535156, 2.7085165977478027, 2.882788896560669, 3.057060956954956, 3.2313332557678223, 3.4056053161621094, 3.5798776149749756, 3.754149913787842, 3.928422212600708, 4.102694511413574, 4.276966571807861, 4.451238632202148, 4.6255106925964355, 4.799783229827881, 4.974055290222168, 5.148327350616455]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [8.0, 9.0, 5.0, 13.0, 24.0, 34.0, 41.0, 47.0, 61.0, 71.0, 82.0, 76.0, 90.0, 91.0, 81.0, 80.0, 66.0, 46.0, 41.0, 24.0, 11.0, 9.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.012876033782959, -3.6836705207824707, -3.3544647693634033, -3.025259017944336, -2.6960535049438477, -2.3668479919433594, -2.037642240524292, -1.7084364891052246, -1.3792309761047363, -1.0500253438949585, -0.7208197116851807, -0.39161407947540283, -0.062408447265625, 0.26679718494415283, 0.5960028171539307, 0.925208568572998, 1.2544140815734863, 1.5836197137832642, 1.912825345993042, 2.2420310974121094, 2.5712366104125977, 2.900442123413086, 3.2296478748321533, 3.5588536262512207, 3.888059139251709, 4.217264652252197, 4.546470642089844, 4.875676155090332, 5.20488166809082, 5.534087181091309, 5.863292694091797, 6.192498683929443, 6.521703720092773, 6.850909233093262, 7.18011474609375, 7.5093207359313965, 7.838526248931885, 8.167732238769531, 8.49693775177002, 8.826143264770508, 9.155348777770996, 9.484554290771484, 9.813759803771973, 10.142965316772461, 10.472171783447266, 10.801377296447754, 11.130582809448242, 11.45978832244873, 11.788993835449219, 12.118199348449707, 12.447404861450195, 12.776610374450684, 13.105815887451172, 13.435022354125977, 13.764227867126465, 14.093433380126953, 14.422638893127441, 14.75184440612793, 15.081049919128418, 15.410255432128906, 15.739461898803711, 16.068666458129883, 16.397872924804688, 16.72707748413086, 17.056283950805664]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 4.0, 10.0, 8.0, 20.0, 13.0, 22.0, 33.0, 45.0, 57.0, 85.0, 111.0, 197.0, 338.0, 969.0, 5015.0, 114857.0, 3382080.0, 670911.0, 16019.0, 1943.0, 631.0, 353.0, 195.0, 114.0, 74.0, 51.0, 30.0, 18.0, 15.0, 15.0, 12.0, 5.0, 9.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 6.0, 2.0, 0.0, 0.0, 3.0], "bins": [-7.5546875, -7.348876953125, -7.14306640625, -6.937255859375, -6.7314453125, -6.525634765625, -6.31982421875, -6.114013671875, -5.908203125, -5.702392578125, -5.49658203125, -5.290771484375, -5.0849609375, -4.879150390625, -4.67333984375, -4.467529296875, -4.26171875, -4.055908203125, -3.85009765625, -3.644287109375, -3.4384765625, -3.232666015625, -3.02685546875, -2.821044921875, -2.615234375, -2.409423828125, -2.20361328125, -1.997802734375, -1.7919921875, -1.586181640625, -1.38037109375, -1.174560546875, -0.96875, -0.762939453125, -0.55712890625, -0.351318359375, -0.1455078125, 0.060302734375, 0.26611328125, 0.471923828125, 0.677734375, 0.883544921875, 1.08935546875, 1.295166015625, 1.5009765625, 1.706787109375, 1.91259765625, 2.118408203125, 2.32421875, 2.530029296875, 2.73583984375, 2.941650390625, 3.1474609375, 3.353271484375, 3.55908203125, 3.764892578125, 3.970703125, 4.176513671875, 4.38232421875, 4.588134765625, 4.7939453125, 4.999755859375, 5.20556640625, 5.411376953125, 5.6171875]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 3.0, 7.0, 7.0, 4.0, 13.0, 8.0, 24.0, 21.0, 22.0, 31.0, 35.0, 37.0, 58.0, 43.0, 52.0, 50.0, 61.0, 60.0, 59.0, 44.0, 47.0, 48.0, 37.0, 49.0, 32.0, 33.0, 26.0, 19.0, 24.0, 14.0, 11.0, 9.0, 4.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.349609375, -2.27484130859375, -2.2000732421875, -2.12530517578125, -2.050537109375, -1.97576904296875, -1.9010009765625, -1.82623291015625, -1.75146484375, -1.67669677734375, -1.6019287109375, -1.52716064453125, -1.452392578125, -1.37762451171875, -1.3028564453125, -1.22808837890625, -1.1533203125, -1.07855224609375, -1.0037841796875, -0.92901611328125, -0.854248046875, -0.77947998046875, -0.7047119140625, -0.62994384765625, -0.55517578125, -0.48040771484375, -0.4056396484375, -0.33087158203125, -0.256103515625, -0.18133544921875, -0.1065673828125, -0.03179931640625, 0.04296875, 0.11773681640625, 0.1925048828125, 0.26727294921875, 0.342041015625, 0.41680908203125, 0.4915771484375, 0.56634521484375, 0.64111328125, 0.71588134765625, 0.7906494140625, 0.86541748046875, 0.940185546875, 1.01495361328125, 1.0897216796875, 1.16448974609375, 1.2392578125, 1.31402587890625, 1.3887939453125, 1.46356201171875, 1.538330078125, 1.61309814453125, 1.6878662109375, 1.76263427734375, 1.83740234375, 1.91217041015625, 1.9869384765625, 2.06170654296875, 2.136474609375, 2.21124267578125, 2.2860107421875, 2.36077880859375, 2.435546875]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 9.0, 7.0, 21.0, 38.0, 37.0, 67.0, 117.0, 202.0, 421.0, 1018.0, 4131.0, 104223.0, 3997500.0, 80603.0, 3971.0, 964.0, 426.0, 207.0, 121.0, 80.0, 49.0, 34.0, 15.0, 4.0, 8.0, 5.0, 0.0, 3.0, 4.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.203125, -6.958740234375, -6.71435546875, -6.469970703125, -6.2255859375, -5.981201171875, -5.73681640625, -5.492431640625, -5.248046875, -5.003662109375, -4.75927734375, -4.514892578125, -4.2705078125, -4.026123046875, -3.78173828125, -3.537353515625, -3.29296875, -3.048583984375, -2.80419921875, -2.559814453125, -2.3154296875, -2.071044921875, -1.82666015625, -1.582275390625, -1.337890625, -1.093505859375, -0.84912109375, -0.604736328125, -0.3603515625, -0.115966796875, 0.12841796875, 0.372802734375, 0.6171875, 0.861572265625, 1.10595703125, 1.350341796875, 1.5947265625, 1.839111328125, 2.08349609375, 2.327880859375, 2.572265625, 2.816650390625, 3.06103515625, 3.305419921875, 3.5498046875, 3.794189453125, 4.03857421875, 4.282958984375, 4.52734375, 4.771728515625, 5.01611328125, 5.260498046875, 5.5048828125, 5.749267578125, 5.99365234375, 6.238037109375, 6.482421875, 6.726806640625, 6.97119140625, 7.215576171875, 7.4599609375, 7.704345703125, 7.94873046875, 8.193115234375, 8.4375]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 4.0, 7.0, 6.0, 10.0, 12.0, 24.0, 24.0, 34.0, 37.0, 61.0, 100.0, 131.0, 165.0, 290.0, 369.0, 486.0, 536.0, 440.0, 417.0, 294.0, 192.0, 141.0, 84.0, 58.0, 41.0, 35.0, 24.0, 23.0, 12.0, 8.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0], "bins": [-1.0908203125, -1.0625, -1.0341796875, -1.005859375, -0.9775390625, -0.94921875, -0.9208984375, -0.892578125, -0.8642578125, -0.8359375, -0.8076171875, -0.779296875, -0.7509765625, -0.72265625, -0.6943359375, -0.666015625, -0.6376953125, -0.609375, -0.5810546875, -0.552734375, -0.5244140625, -0.49609375, -0.4677734375, -0.439453125, -0.4111328125, -0.3828125, -0.3544921875, -0.326171875, -0.2978515625, -0.26953125, -0.2412109375, -0.212890625, -0.1845703125, -0.15625, -0.1279296875, -0.099609375, -0.0712890625, -0.04296875, -0.0146484375, 0.013671875, 0.0419921875, 0.0703125, 0.0986328125, 0.126953125, 0.1552734375, 0.18359375, 0.2119140625, 0.240234375, 0.2685546875, 0.296875, 0.3251953125, 0.353515625, 0.3818359375, 0.41015625, 0.4384765625, 0.466796875, 0.4951171875, 0.5234375, 0.5517578125, 0.580078125, 0.6083984375, 0.63671875, 0.6650390625, 0.693359375, 0.7216796875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 1.0, 3.0, 3.0, 6.0, 5.0, 7.0, 8.0, 16.0, 16.0, 41.0, 59.0, 60.0, 80.0, 89.0, 100.0, 93.0, 102.0, 75.0, 57.0, 58.0, 37.0, 27.0, 21.0, 11.0, 7.0, 12.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.669475078582764, -4.544282913208008, -4.41909122467041, -4.293899059295654, -4.168706893920898, -4.043515205383301, -3.918323040008545, -3.793130874633789, -3.6679389476776123, -3.5427470207214355, -3.4175548553466797, -3.292362928390503, -3.167171001434326, -3.0419788360595703, -2.9167869091033936, -2.791594982147217, -2.666402816772461, -2.541210889816284, -2.4160187244415283, -2.2908267974853516, -2.1656346321105957, -2.040442705154419, -1.9152507781982422, -1.7900587320327759, -1.6648666858673096, -1.5396746397018433, -1.414482593536377, -1.2892906665802002, -1.1640986204147339, -1.0389065742492676, -0.913714587688446, -0.7885226011276245, -0.6633305549621582, -0.5381385087966919, -0.41294652223587036, -0.28775450587272644, -0.16256248950958252, -0.03737044334411621, 0.08782154321670532, 0.21301352977752686, 0.33820557594299316, 0.4633975923061371, 0.588589608669281, 0.7137815952301025, 0.8389736413955688, 0.9641656875610352, 1.089357614517212, 1.2145496606826782, 1.3397417068481445, 1.4649337530136108, 1.5901257991790771, 1.715317726135254, 1.8405097723007202, 1.9657018184661865, 2.0908937454223633, 2.216085910797119, 2.341277837753296, 2.4664697647094727, 2.5916619300842285, 2.7168538570404053, 2.842045783996582, 2.967237949371338, 3.0924298763275146, 3.2176218032836914, 3.3428139686584473]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 0.0, 6.0, 9.0, 6.0, 10.0, 18.0, 20.0, 18.0, 23.0, 26.0, 34.0, 34.0, 40.0, 30.0, 48.0, 51.0, 46.0, 43.0, 62.0, 63.0, 57.0, 46.0, 52.0, 42.0, 34.0, 36.0, 34.0, 23.0, 20.0, 18.0, 27.0, 12.0, 2.0, 8.0, 2.0, 2.0, 4.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.850348472595215, -2.765322685241699, -2.6802966594696045, -2.595270872116089, -2.510244846343994, -2.4252190589904785, -2.340193033218384, -2.255167245864868, -2.1701412200927734, -2.085115432739258, -2.000089406967163, -1.915063500404358, -1.8300375938415527, -1.7450116872787476, -1.6599857807159424, -1.5749599933624268, -1.4899340867996216, -1.4049081802368164, -1.3198822736740112, -1.234856367111206, -1.1498304605484009, -1.0648045539855957, -0.9797787070274353, -0.8947528004646301, -0.809726893901825, -0.7247009873390198, -0.6396750807762146, -0.5546492338180542, -0.46962329745292664, -0.38459739089012146, -0.29957151412963867, -0.2145456075668335, -0.12951970100402832, -0.04449380189180374, 0.04053209722042084, 0.12555798888206482, 0.21058389544487, 0.29560980200767517, 0.38063567876815796, 0.46566158533096313, 0.5506874918937683, 0.6357133984565735, 0.7207393050193787, 0.8057651519775391, 0.8907910585403442, 0.9758169651031494, 1.0608428716659546, 1.1458687782287598, 1.230894684791565, 1.3159205913543701, 1.4009464979171753, 1.4859724044799805, 1.5709983110427856, 1.6560242176055908, 1.7410500049591064, 1.8260760307312012, 1.9111018180847168, 1.996127724647522, 2.081153631210327, 2.1661794185638428, 2.2512054443359375, 2.336231231689453, 2.421257257461548, 2.5062830448150635, 2.591309070587158]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 13.0, 9.0, 5.0, 15.0, 17.0, 30.0, 31.0, 31.0, 54.0, 67.0, 129.0, 180.0, 323.0, 674.0, 1527.0, 4739.0, 16002.0, 58244.0, 193148.0, 386565.0, 265306.0, 86507.0, 23757.0, 6981.0, 2295.0, 873.0, 372.0, 200.0, 125.0, 88.0, 58.0, 41.0, 35.0, 21.0, 22.0, 15.0, 13.0, 9.0, 8.0, 8.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.484619140625, -0.4670982360839844, -0.44957733154296875, -0.4320564270019531, -0.4145355224609375, -0.3970146179199219, -0.37949371337890625, -0.3619728088378906, -0.344451904296875, -0.3269309997558594, -0.30941009521484375, -0.2918891906738281, -0.2743682861328125, -0.2568473815917969, -0.23932647705078125, -0.22180557250976562, -0.20428466796875, -0.18676376342773438, -0.16924285888671875, -0.15172195434570312, -0.1342010498046875, -0.11668014526367188, -0.09915924072265625, -0.08163833618164062, -0.064117431640625, -0.046596527099609375, -0.02907562255859375, -0.011554718017578125, 0.0059661865234375, 0.023487091064453125, 0.04100799560546875, 0.058528900146484375, 0.0760498046875, 0.09357070922851562, 0.11109161376953125, 0.12861251831054688, 0.1461334228515625, 0.16365432739257812, 0.18117523193359375, 0.19869613647460938, 0.216217041015625, 0.23373794555664062, 0.25125885009765625, 0.2687797546386719, 0.2863006591796875, 0.3038215637207031, 0.32134246826171875, 0.3388633728027344, 0.35638427734375, 0.3739051818847656, 0.39142608642578125, 0.4089469909667969, 0.4264678955078125, 0.4439888000488281, 0.46150970458984375, 0.4790306091308594, 0.496551513671875, 0.5140724182128906, 0.5315933227539062, 0.5491142272949219, 0.5666351318359375, 0.5841560363769531, 0.6016769409179688, 0.6191978454589844, 0.63671875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 8.0, 12.0, 24.0, 22.0, 30.0, 34.0, 43.0, 62.0, 65.0, 83.0, 80.0, 87.0, 82.0, 79.0, 79.0, 51.0, 41.0, 48.0, 29.0, 16.0, 11.0, 5.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.33984375, -3.2501220703125, -3.160400390625, -3.0706787109375, -2.98095703125, -2.8912353515625, -2.801513671875, -2.7117919921875, -2.6220703125, -2.5323486328125, -2.442626953125, -2.3529052734375, -2.26318359375, -2.1734619140625, -2.083740234375, -1.9940185546875, -1.904296875, -1.8145751953125, -1.724853515625, -1.6351318359375, -1.54541015625, -1.4556884765625, -1.365966796875, -1.2762451171875, -1.1865234375, -1.0968017578125, -1.007080078125, -0.9173583984375, -0.82763671875, -0.7379150390625, -0.648193359375, -0.5584716796875, -0.46875, -0.3790283203125, -0.289306640625, -0.1995849609375, -0.10986328125, -0.0201416015625, 0.069580078125, 0.1593017578125, 0.2490234375, 0.3387451171875, 0.428466796875, 0.5181884765625, 0.60791015625, 0.6976318359375, 0.787353515625, 0.8770751953125, 0.966796875, 1.0565185546875, 1.146240234375, 1.2359619140625, 1.32568359375, 1.4154052734375, 1.505126953125, 1.5948486328125, 1.6845703125, 1.7742919921875, 1.864013671875, 1.9537353515625, 2.04345703125, 2.1331787109375, 2.222900390625, 2.3126220703125, 2.40234375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 5.0, 4.0, 8.0, 18.0, 26.0, 42.0, 61.0, 100.0, 190.0, 290.0, 573.0, 1192.0, 2119.0, 4220.0, 8364.0, 16177.0, 30866.0, 57897.0, 102361.0, 160959.0, 202803.0, 182842.0, 123763.0, 72646.0, 39002.0, 20692.0, 10340.0, 5290.0, 2672.0, 1453.0, 703.0, 383.0, 197.0, 115.0, 57.0, 46.0, 30.0, 24.0, 9.0, 8.0, 5.0, 7.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26513671875, -0.2572669982910156, -0.24939727783203125, -0.24152755737304688, -0.2336578369140625, -0.22578811645507812, -0.21791839599609375, -0.21004867553710938, -0.202178955078125, -0.19430923461914062, -0.18643951416015625, -0.17856979370117188, -0.1707000732421875, -0.16283035278320312, -0.15496063232421875, -0.14709091186523438, -0.13922119140625, -0.13135147094726562, -0.12348175048828125, -0.11561203002929688, -0.1077423095703125, -0.09987258911132812, -0.09200286865234375, -0.08413314819335938, -0.076263427734375, -0.06839370727539062, -0.06052398681640625, -0.052654266357421875, -0.0447845458984375, -0.036914825439453125, -0.02904510498046875, -0.021175384521484375, -0.0133056640625, -0.005435943603515625, 0.00243377685546875, 0.010303497314453125, 0.0181732177734375, 0.026042938232421875, 0.03391265869140625, 0.041782379150390625, 0.049652099609375, 0.057521820068359375, 0.06539154052734375, 0.07326126098632812, 0.0811309814453125, 0.08900070190429688, 0.09687042236328125, 0.10474014282226562, 0.11260986328125, 0.12047958374023438, 0.12834930419921875, 0.13621902465820312, 0.1440887451171875, 0.15195846557617188, 0.15982818603515625, 0.16769790649414062, 0.175567626953125, 0.18343734741210938, 0.19130706787109375, 0.19917678833007812, 0.2070465087890625, 0.21491622924804688, 0.22278594970703125, 0.23065567016601562, 0.238525390625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 3.0, 2.0, 3.0, 6.0, 5.0, 8.0, 15.0, 12.0, 16.0, 12.0, 26.0, 18.0, 33.0, 22.0, 27.0, 31.0, 41.0, 44.0, 42.0, 53.0, 65.0, 48.0, 52.0, 49.0, 52.0, 33.0, 39.0, 42.0, 34.0, 29.0, 22.0, 18.0, 20.0, 16.0, 10.0, 14.0, 15.0, 10.0, 5.0, 6.0, 4.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.67578125, -3.569549560546875, -3.46331787109375, -3.357086181640625, -3.2508544921875, -3.144622802734375, -3.03839111328125, -2.932159423828125, -2.825927734375, -2.719696044921875, -2.61346435546875, -2.507232666015625, -2.4010009765625, -2.294769287109375, -2.18853759765625, -2.082305908203125, -1.97607421875, -1.869842529296875, -1.76361083984375, -1.657379150390625, -1.5511474609375, -1.444915771484375, -1.33868408203125, -1.232452392578125, -1.126220703125, -1.019989013671875, -0.91375732421875, -0.807525634765625, -0.7012939453125, -0.595062255859375, -0.48883056640625, -0.382598876953125, -0.2763671875, -0.170135498046875, -0.06390380859375, 0.042327880859375, 0.1485595703125, 0.254791259765625, 0.36102294921875, 0.467254638671875, 0.573486328125, 0.679718017578125, 0.78594970703125, 0.892181396484375, 0.9984130859375, 1.104644775390625, 1.21087646484375, 1.317108154296875, 1.42333984375, 1.529571533203125, 1.63580322265625, 1.742034912109375, 1.8482666015625, 1.954498291015625, 2.06072998046875, 2.166961669921875, 2.273193359375, 2.379425048828125, 2.48565673828125, 2.591888427734375, 2.6981201171875, 2.804351806640625, 2.91058349609375, 3.016815185546875, 3.123046875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 5.0, 5.0, 2.0, 17.0, 19.0, 17.0, 38.0, 71.0, 124.0, 163.0, 397.0, 641.0, 1338.0, 3221.0, 8989.0, 34595.0, 183290.0, 586044.0, 180449.0, 34184.0, 8977.0, 3147.0, 1370.0, 632.0, 334.0, 178.0, 108.0, 69.0, 45.0, 35.0, 18.0, 10.0, 9.0, 6.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11895751953125, -0.11492443084716797, -0.11089134216308594, -0.1068582534790039, -0.10282516479492188, -0.09879207611083984, -0.09475898742675781, -0.09072589874267578, -0.08669281005859375, -0.08265972137451172, -0.07862663269042969, -0.07459354400634766, -0.07056045532226562, -0.0665273666381836, -0.06249427795410156, -0.05846118927001953, -0.0544281005859375, -0.05039501190185547, -0.04636192321777344, -0.042328834533691406, -0.038295745849609375, -0.034262657165527344, -0.030229568481445312, -0.02619647979736328, -0.02216339111328125, -0.01813030242919922, -0.014097213745117188, -0.010064125061035156, -0.006031036376953125, -0.0019979476928710938, 0.0020351409912109375, 0.006068229675292969, 0.010101318359375, 0.014134407043457031, 0.018167495727539062, 0.022200584411621094, 0.026233673095703125, 0.030266761779785156, 0.03429985046386719, 0.03833293914794922, 0.04236602783203125, 0.04639911651611328, 0.05043220520019531, 0.054465293884277344, 0.058498382568359375, 0.0625314712524414, 0.06656455993652344, 0.07059764862060547, 0.0746307373046875, 0.07866382598876953, 0.08269691467285156, 0.0867300033569336, 0.09076309204101562, 0.09479618072509766, 0.09882926940917969, 0.10286235809326172, 0.10689544677734375, 0.11092853546142578, 0.11496162414550781, 0.11899471282958984, 0.12302780151367188, 0.1270608901977539, 0.13109397888183594, 0.13512706756591797, 0.13916015625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 7.0, 11.0, 27.0, 27.0, 56.0, 74.0, 100.0, 147.0, 166.0, 109.0, 94.0, 66.0, 39.0, 28.0, 19.0, 6.0, 15.0, 4.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0001207590103149414, -0.00011767912656068802, -0.00011459924280643463, -0.00011151935905218124, -0.00010843947529792786, -0.00010535959154367447, -0.00010227970778942108, -9.91998240351677e-05, -9.61199402809143e-05, -9.304005652666092e-05, -8.996017277240753e-05, -8.688028901815414e-05, -8.380040526390076e-05, -8.072052150964737e-05, -7.764063775539398e-05, -7.45607540011406e-05, -7.148087024688721e-05, -6.840098649263382e-05, -6.532110273838043e-05, -6.224121898412704e-05, -5.916133522987366e-05, -5.608145147562027e-05, -5.300156772136688e-05, -4.9921683967113495e-05, -4.684180021286011e-05, -4.376191645860672e-05, -4.068203270435333e-05, -3.7602148950099945e-05, -3.452226519584656e-05, -3.144238144159317e-05, -2.8362497687339783e-05, -2.5282613933086395e-05, -2.2202730178833008e-05, -1.912284642457962e-05, -1.6042962670326233e-05, -1.2963078916072845e-05, -9.883195161819458e-06, -6.8033114075660706e-06, -3.723427653312683e-06, -6.435438990592957e-07, 2.436339855194092e-06, 5.516223609447479e-06, 8.596107363700867e-06, 1.1675991117954254e-05, 1.4755874872207642e-05, 1.783575862646103e-05, 2.0915642380714417e-05, 2.3995526134967804e-05, 2.707540988922119e-05, 3.015529364347458e-05, 3.3235177397727966e-05, 3.6315061151981354e-05, 3.939494490623474e-05, 4.247482866048813e-05, 4.5554712414741516e-05, 4.8634596168994904e-05, 5.171447992324829e-05, 5.479436367750168e-05, 5.7874247431755066e-05, 6.095413118600845e-05, 6.403401494026184e-05, 6.711389869451523e-05, 7.019378244876862e-05, 7.3273666203022e-05, 7.635354995727539e-05]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 6.0, 8.0, 6.0, 15.0, 29.0, 52.0, 85.0, 130.0, 285.0, 493.0, 1275.0, 3352.0, 11626.0, 52013.0, 300529.0, 541060.0, 107772.0, 21049.0, 5454.0, 1775.0, 724.0, 340.0, 171.0, 112.0, 53.0, 39.0, 30.0, 21.0, 13.0, 9.0, 6.0, 1.0, 3.0, 4.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1270751953125, -0.12286949157714844, -0.11866378784179688, -0.11445808410644531, -0.11025238037109375, -0.10604667663574219, -0.10184097290039062, -0.09763526916503906, -0.0934295654296875, -0.08922386169433594, -0.08501815795898438, -0.08081245422363281, -0.07660675048828125, -0.07240104675292969, -0.06819534301757812, -0.06398963928222656, -0.059783935546875, -0.05557823181152344, -0.051372528076171875, -0.04716682434082031, -0.04296112060546875, -0.03875541687011719, -0.034549713134765625, -0.030344009399414062, -0.0261383056640625, -0.021932601928710938, -0.017726898193359375, -0.013521194458007812, -0.00931549072265625, -0.0051097869873046875, -0.000904083251953125, 0.0033016204833984375, 0.00750732421875, 0.011713027954101562, 0.015918731689453125, 0.020124435424804688, 0.02433013916015625, 0.028535842895507812, 0.032741546630859375, 0.03694725036621094, 0.0411529541015625, 0.04535865783691406, 0.049564361572265625, 0.05377006530761719, 0.05797576904296875, 0.06218147277832031, 0.06638717651367188, 0.07059288024902344, 0.074798583984375, 0.07900428771972656, 0.08320999145507812, 0.08741569519042969, 0.09162139892578125, 0.09582710266113281, 0.10003280639648438, 0.10423851013183594, 0.1084442138671875, 0.11264991760253906, 0.11685562133789062, 0.12106132507324219, 0.12526702880859375, 0.1294727325439453, 0.13367843627929688, 0.13788414001464844, 0.14208984375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 5.0, 11.0, 9.0, 16.0, 14.0, 14.0, 23.0, 20.0, 49.0, 43.0, 54.0, 68.0, 71.0, 77.0, 83.0, 88.0, 74.0, 59.0, 50.0, 40.0, 34.0, 26.0, 13.0, 18.0, 20.0, 8.0, 3.0, 2.0, 2.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.033355712890625, -0.03240847587585449, -0.031461238861083984, -0.030514001846313477, -0.02956676483154297, -0.02861952781677246, -0.027672290802001953, -0.026725053787231445, -0.025777816772460938, -0.02483057975769043, -0.023883342742919922, -0.022936105728149414, -0.021988868713378906, -0.0210416316986084, -0.02009439468383789, -0.019147157669067383, -0.018199920654296875, -0.017252683639526367, -0.01630544662475586, -0.015358209609985352, -0.014410972595214844, -0.013463735580444336, -0.012516498565673828, -0.01156926155090332, -0.010622024536132812, -0.009674787521362305, -0.008727550506591797, -0.007780313491821289, -0.006833076477050781, -0.0058858394622802734, -0.004938602447509766, -0.003991365432739258, -0.00304412841796875, -0.002096891403198242, -0.0011496543884277344, -0.00020241737365722656, 0.0007448196411132812, 0.001692056655883789, 0.002639293670654297, 0.0035865306854248047, 0.0045337677001953125, 0.00548100471496582, 0.006428241729736328, 0.007375478744506836, 0.008322715759277344, 0.009269952774047852, 0.01021718978881836, 0.011164426803588867, 0.012111663818359375, 0.013058900833129883, 0.01400613784790039, 0.014953374862670898, 0.015900611877441406, 0.016847848892211914, 0.017795085906982422, 0.01874232292175293, 0.019689559936523438, 0.020636796951293945, 0.021584033966064453, 0.02253127098083496, 0.02347850799560547, 0.024425745010375977, 0.025372982025146484, 0.026320219039916992, 0.0272674560546875]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 7.0, 11.0, 33.0, 122.0, 272.0, 285.0, 186.0, 64.0, 14.0, 10.0, 5.0, 3.0, 0.0, 1.0, 3.0], "bins": [-13.121729850769043, -12.879738807678223, -12.637748718261719, -12.395757675170898, -12.153766632080078, -11.911775588989258, -11.669785499572754, -11.427794456481934, -11.18580436706543, -10.94381332397461, -10.701823234558105, -10.459832191467285, -10.217841148376465, -9.975851058959961, -9.73386001586914, -9.49186897277832, -9.2498779296875, -9.00788688659668, -8.765896797180176, -8.523905754089355, -8.281914710998535, -8.039924621582031, -7.797933578491211, -7.555942535400391, -7.3139519691467285, -7.071961402893066, -6.829970359802246, -6.587979793548584, -6.345989227294922, -6.103998184204102, -5.8620076179504395, -5.620017051696777, -5.378025531768799, -5.136034965515137, -4.894043922424316, -4.652053356170654, -4.410062789916992, -4.168071746826172, -3.9260811805725098, -3.6840903759002686, -3.4420995712280273, -3.200108766555786, -2.958117961883545, -2.716127395629883, -2.4741365909576416, -2.2321457862854004, -1.9901551008224487, -1.748164415359497, -1.5061736106872559, -1.2641828060150146, -1.022192120552063, -0.7802013754844666, -0.5382106304168701, -0.2962198257446289, -0.054229140281677246, 0.18776154518127441, 0.4297523498535156, 0.6717430949211121, 0.9137338399887085, 1.1557245254516602, 1.3977153301239014, 1.6397061347961426, 1.8816968202590942, 2.123687505722046, 2.365678310394287]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 3.0, 11.0, 17.0, 20.0, 20.0, 27.0, 36.0, 47.0, 46.0, 45.0, 57.0, 68.0, 55.0, 77.0, 79.0, 67.0, 68.0, 48.0, 44.0, 46.0, 39.0, 21.0, 26.0, 12.0, 7.0, 4.0, 7.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.558716297149658, -2.4864108562469482, -2.4141054153442383, -2.3417999744415283, -2.2694945335388184, -2.1971893310546875, -2.1248836517333984, -2.0525784492492676, -1.9802730083465576, -1.9079675674438477, -1.8356621265411377, -1.7633566856384277, -1.6910513639450073, -1.6187459230422974, -1.5464404821395874, -1.474135160446167, -1.4018296003341675, -1.3295241594314575, -1.2572187185287476, -1.1849133968353271, -1.1126079559326172, -1.0403025150299072, -0.9679970741271973, -0.8956916928291321, -0.8233862519264221, -0.7510808110237122, -0.678775429725647, -0.606469988822937, -0.534164547920227, -0.46185916662216187, -0.3895537257194519, -0.3172483444213867, -0.24494290351867676, -0.17263749241828918, -0.10033206641674042, -0.02802664041519165, 0.04427877068519592, 0.1165841817855835, 0.18888962268829346, 0.26119500398635864, 0.3335004448890686, 0.4058058559894562, 0.47811126708984375, 0.5504167079925537, 0.6227221488952637, 0.6950275301933289, 0.7673329710960388, 0.839638352394104, 0.911943793296814, 0.9842492341995239, 1.0565546751022339, 1.1288599967956543, 1.2011654376983643, 1.2734708786010742, 1.3457763195037842, 1.4180817604064941, 1.490387201309204, 1.562692642211914, 1.634998083114624, 1.707303524017334, 1.7796088457107544, 1.8519142866134644, 1.9242197275161743, 1.9965250492095947, 2.0688304901123047]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 2.0, 3.0, 7.0, 14.0, 17.0, 16.0, 29.0, 51.0, 73.0, 216.0, 812.0, 8443.0, 399239.0, 624537.0, 13535.0, 1063.0, 255.0, 80.0, 46.0, 27.0, 35.0, 17.0, 12.0, 2.0, 6.0, 6.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.48828125, -5.29949951171875, -5.1107177734375, -4.92193603515625, -4.733154296875, -4.54437255859375, -4.3555908203125, -4.16680908203125, -3.97802734375, -3.78924560546875, -3.6004638671875, -3.41168212890625, -3.222900390625, -3.03411865234375, -2.8453369140625, -2.65655517578125, -2.4677734375, -2.27899169921875, -2.0902099609375, -1.90142822265625, -1.712646484375, -1.52386474609375, -1.3350830078125, -1.14630126953125, -0.95751953125, -0.76873779296875, -0.5799560546875, -0.39117431640625, -0.202392578125, -0.01361083984375, 0.1751708984375, 0.36395263671875, 0.552734375, 0.74151611328125, 0.9302978515625, 1.11907958984375, 1.307861328125, 1.49664306640625, 1.6854248046875, 1.87420654296875, 2.06298828125, 2.25177001953125, 2.4405517578125, 2.62933349609375, 2.818115234375, 3.00689697265625, 3.1956787109375, 3.38446044921875, 3.5732421875, 3.76202392578125, 3.9508056640625, 4.13958740234375, 4.328369140625, 4.51715087890625, 4.7059326171875, 4.89471435546875, 5.08349609375, 5.27227783203125, 5.4610595703125, 5.64984130859375, 5.838623046875, 6.02740478515625, 6.2161865234375, 6.40496826171875, 6.59375]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 8.0, 12.0, 23.0, 35.0, 75.0, 91.0, 133.0, 130.0, 171.0, 116.0, 89.0, 72.0, 34.0, 11.0, 6.0, 6.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.45703125, -3.16595458984375, -2.8748779296875, -2.58380126953125, -2.292724609375, -2.00164794921875, -1.7105712890625, -1.41949462890625, -1.12841796875, -0.83734130859375, -0.5462646484375, -0.25518798828125, 0.035888671875, 0.32696533203125, 0.6180419921875, 0.90911865234375, 1.2001953125, 1.49127197265625, 1.7823486328125, 2.07342529296875, 2.364501953125, 2.65557861328125, 2.9466552734375, 3.23773193359375, 3.52880859375, 3.81988525390625, 4.1109619140625, 4.40203857421875, 4.693115234375, 4.98419189453125, 5.2752685546875, 5.56634521484375, 5.857421875, 6.14849853515625, 6.4395751953125, 6.73065185546875, 7.021728515625, 7.31280517578125, 7.6038818359375, 7.89495849609375, 8.18603515625, 8.47711181640625, 8.7681884765625, 9.05926513671875, 9.350341796875, 9.64141845703125, 9.9324951171875, 10.22357177734375, 10.5146484375, 10.80572509765625, 11.0968017578125, 11.38787841796875, 11.678955078125, 11.97003173828125, 12.2611083984375, 12.55218505859375, 12.84326171875, 13.13433837890625, 13.4254150390625, 13.71649169921875, 14.007568359375, 14.29864501953125, 14.5897216796875, 14.88079833984375, 15.171875]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 4.0, 12.0, 6.0, 8.0, 15.0, 33.0, 33.0, 48.0, 59.0, 70.0, 87.0, 156.0, 211.0, 330.0, 663.0, 2139.0, 16609.0, 427171.0, 572939.0, 23281.0, 2779.0, 764.0, 356.0, 224.0, 162.0, 94.0, 64.0, 66.0, 50.0, 30.0, 27.0, 17.0, 11.0, 9.0, 9.0, 3.0, 4.0, 4.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-4.72265625, -4.583984375, -4.4453125, -4.306640625, -4.16796875, -4.029296875, -3.890625, -3.751953125, -3.61328125, -3.474609375, -3.3359375, -3.197265625, -3.05859375, -2.919921875, -2.78125, -2.642578125, -2.50390625, -2.365234375, -2.2265625, -2.087890625, -1.94921875, -1.810546875, -1.671875, -1.533203125, -1.39453125, -1.255859375, -1.1171875, -0.978515625, -0.83984375, -0.701171875, -0.5625, -0.423828125, -0.28515625, -0.146484375, -0.0078125, 0.130859375, 0.26953125, 0.408203125, 0.546875, 0.685546875, 0.82421875, 0.962890625, 1.1015625, 1.240234375, 1.37890625, 1.517578125, 1.65625, 1.794921875, 1.93359375, 2.072265625, 2.2109375, 2.349609375, 2.48828125, 2.626953125, 2.765625, 2.904296875, 3.04296875, 3.181640625, 3.3203125, 3.458984375, 3.59765625, 3.736328125, 3.875, 4.013671875, 4.15234375]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 3.0, 7.0, 10.0, 15.0, 20.0, 13.0, 12.0, 16.0, 24.0, 22.0, 34.0, 49.0, 35.0, 40.0, 41.0, 33.0, 47.0, 45.0, 49.0, 44.0, 55.0, 38.0, 41.0, 46.0, 31.0, 33.0, 25.0, 23.0, 24.0, 26.0, 18.0, 12.0, 13.0, 9.0, 5.0, 14.0, 11.0, 4.0, 6.0, 3.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.529296875, -3.409027099609375, -3.28875732421875, -3.168487548828125, -3.0482177734375, -2.927947998046875, -2.80767822265625, -2.687408447265625, -2.567138671875, -2.446868896484375, -2.32659912109375, -2.206329345703125, -2.0860595703125, -1.965789794921875, -1.84552001953125, -1.725250244140625, -1.60498046875, -1.484710693359375, -1.36444091796875, -1.244171142578125, -1.1239013671875, -1.003631591796875, -0.88336181640625, -0.763092041015625, -0.642822265625, -0.522552490234375, -0.40228271484375, -0.282012939453125, -0.1617431640625, -0.041473388671875, 0.07879638671875, 0.199066162109375, 0.3193359375, 0.439605712890625, 0.55987548828125, 0.680145263671875, 0.8004150390625, 0.920684814453125, 1.04095458984375, 1.161224365234375, 1.281494140625, 1.401763916015625, 1.52203369140625, 1.642303466796875, 1.7625732421875, 1.882843017578125, 2.00311279296875, 2.123382568359375, 2.24365234375, 2.363922119140625, 2.48419189453125, 2.604461669921875, 2.7247314453125, 2.845001220703125, 2.96527099609375, 3.085540771484375, 3.205810546875, 3.326080322265625, 3.44635009765625, 3.566619873046875, 3.6868896484375, 3.807159423828125, 3.92742919921875, 4.047698974609375, 4.16796875]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 7.0, 6.0, 14.0, 24.0, 47.0, 104.0, 279.0, 958.0, 4745.0, 89766.0, 924640.0, 24377.0, 2557.0, 626.0, 220.0, 88.0, 47.0, 19.0, 12.0, 4.0, 1.0, 7.0, 1.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.185546875, -2.095733642578125, -2.00592041015625, -1.916107177734375, -1.8262939453125, -1.736480712890625, -1.64666748046875, -1.556854248046875, -1.467041015625, -1.377227783203125, -1.28741455078125, -1.197601318359375, -1.1077880859375, -1.017974853515625, -0.92816162109375, -0.838348388671875, -0.74853515625, -0.658721923828125, -0.56890869140625, -0.479095458984375, -0.3892822265625, -0.299468994140625, -0.20965576171875, -0.119842529296875, -0.030029296875, 0.059783935546875, 0.14959716796875, 0.239410400390625, 0.3292236328125, 0.419036865234375, 0.50885009765625, 0.598663330078125, 0.6884765625, 0.778289794921875, 0.86810302734375, 0.957916259765625, 1.0477294921875, 1.137542724609375, 1.22735595703125, 1.317169189453125, 1.406982421875, 1.496795654296875, 1.58660888671875, 1.676422119140625, 1.7662353515625, 1.856048583984375, 1.94586181640625, 2.035675048828125, 2.12548828125, 2.215301513671875, 2.30511474609375, 2.394927978515625, 2.4847412109375, 2.574554443359375, 2.66436767578125, 2.754180908203125, 2.843994140625, 2.933807373046875, 3.02362060546875, 3.113433837890625, 3.2032470703125, 3.293060302734375, 3.38287353515625, 3.472686767578125, 3.5625]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 4.0, 7.0, 8.0, 22.0, 41.0, 38.0, 94.0, 160.0, 188.0, 171.0, 106.0, 71.0, 36.0, 24.0, 11.0, 13.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00037097930908203125, -0.0003620833158493042, -0.00035318732261657715, -0.0003442913293838501, -0.00033539533615112305, -0.000326499342918396, -0.00031760334968566895, -0.0003087073564529419, -0.00029981136322021484, -0.0002909153699874878, -0.00028201937675476074, -0.0002731233835220337, -0.00026422739028930664, -0.0002553313970565796, -0.00024643540382385254, -0.0002375394105911255, -0.00022864341735839844, -0.0002197474241256714, -0.00021085143089294434, -0.00020195543766021729, -0.00019305944442749023, -0.00018416345119476318, -0.00017526745796203613, -0.00016637146472930908, -0.00015747547149658203, -0.00014857947826385498, -0.00013968348503112793, -0.00013078749179840088, -0.00012189149856567383, -0.00011299550533294678, -0.00010409951210021973, -9.520351886749268e-05, -8.630752563476562e-05, -7.741153240203857e-05, -6.851553916931152e-05, -5.961954593658447e-05, -5.072355270385742e-05, -4.182755947113037e-05, -3.293156623840332e-05, -2.403557300567627e-05, -1.5139579772949219e-05, -6.243586540222168e-06, 2.652406692504883e-06, 1.1548399925231934e-05, 2.0444393157958984e-05, 2.9340386390686035e-05, 3.8236379623413086e-05, 4.713237285614014e-05, 5.602836608886719e-05, 6.492435932159424e-05, 7.382035255432129e-05, 8.271634578704834e-05, 9.161233901977539e-05, 0.00010050833225250244, 0.00010940432548522949, 0.00011830031871795654, 0.0001271963119506836, 0.00013609230518341064, 0.0001449882984161377, 0.00015388429164886475, 0.0001627802848815918, 0.00017167627811431885, 0.0001805722713470459, 0.00018946826457977295, 0.0001983642578125]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 9.0, 9.0, 21.0, 20.0, 63.0, 113.0, 322.0, 1547.0, 29447.0, 990938.0, 23975.0, 1533.0, 311.0, 113.0, 49.0, 32.0, 18.0, 6.0, 7.0, 4.0, 5.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.28515625, -5.16632080078125, -5.0474853515625, -4.92864990234375, -4.809814453125, -4.69097900390625, -4.5721435546875, -4.45330810546875, -4.33447265625, -4.21563720703125, -4.0968017578125, -3.97796630859375, -3.859130859375, -3.74029541015625, -3.6214599609375, -3.50262451171875, -3.3837890625, -3.26495361328125, -3.1461181640625, -3.02728271484375, -2.908447265625, -2.78961181640625, -2.6707763671875, -2.55194091796875, -2.43310546875, -2.31427001953125, -2.1954345703125, -2.07659912109375, -1.957763671875, -1.83892822265625, -1.7200927734375, -1.60125732421875, -1.482421875, -1.36358642578125, -1.2447509765625, -1.12591552734375, -1.007080078125, -0.88824462890625, -0.7694091796875, -0.65057373046875, -0.53173828125, -0.41290283203125, -0.2940673828125, -0.17523193359375, -0.056396484375, 0.06243896484375, 0.1812744140625, 0.30010986328125, 0.4189453125, 0.53778076171875, 0.6566162109375, 0.77545166015625, 0.894287109375, 1.01312255859375, 1.1319580078125, 1.25079345703125, 1.36962890625, 1.48846435546875, 1.6072998046875, 1.72613525390625, 1.844970703125, 1.96380615234375, 2.0826416015625, 2.20147705078125, 2.3203125]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 5.0, 6.0, 8.0, 7.0, 28.0, 41.0, 71.0, 115.0, 148.0, 221.0, 115.0, 113.0, 49.0, 34.0, 20.0, 7.0, 7.0, 7.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.642578125, -0.6137237548828125, -0.584869384765625, -0.5560150146484375, -0.52716064453125, -0.4983062744140625, -0.469451904296875, -0.4405975341796875, -0.4117431640625, -0.3828887939453125, -0.354034423828125, -0.3251800537109375, -0.29632568359375, -0.2674713134765625, -0.238616943359375, -0.2097625732421875, -0.180908203125, -0.1520538330078125, -0.123199462890625, -0.0943450927734375, -0.06549072265625, -0.0366363525390625, -0.007781982421875, 0.0210723876953125, 0.0499267578125, 0.0787811279296875, 0.107635498046875, 0.1364898681640625, 0.16534423828125, 0.1941986083984375, 0.223052978515625, 0.2519073486328125, 0.28076171875, 0.3096160888671875, 0.338470458984375, 0.3673248291015625, 0.39617919921875, 0.4250335693359375, 0.453887939453125, 0.4827423095703125, 0.5115966796875, 0.5404510498046875, 0.569305419921875, 0.5981597900390625, 0.62701416015625, 0.6558685302734375, 0.684722900390625, 0.7135772705078125, 0.742431640625, 0.7712860107421875, 0.800140380859375, 0.8289947509765625, 0.85784912109375, 0.8867034912109375, 0.915557861328125, 0.9444122314453125, 0.9732666015625, 1.0021209716796875, 1.030975341796875, 1.0598297119140625, 1.08868408203125, 1.1175384521484375, 1.146392822265625, 1.1752471923828125, 1.2041015625]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 15.0, 15.0, 42.0, 78.0, 122.0, 179.0, 205.0, 161.0, 91.0, 35.0, 29.0, 13.0, 6.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8226189613342285, -4.524514198303223, -4.226409912109375, -3.928305149078369, -3.6302008628845215, -3.3320960998535156, -3.033991575241089, -2.735887050628662, -2.4377825260162354, -2.1396780014038086, -1.8415734767913818, -1.5434688329696655, -1.2453643083572388, -0.947259783744812, -0.6491551399230957, -0.35105061531066895, -0.05294609069824219, 0.24515846371650696, 0.5432630181312561, 0.8413676023483276, 1.1394721269607544, 1.4375766515731812, 1.7356812953948975, 2.033785820007324, 2.331890344619751, 2.6299948692321777, 2.9280993938446045, 3.2262039184570312, 3.524308681488037, 3.8224129676818848, 4.120517730712891, 4.418622016906738, 4.716726303100586, 5.014831066131592, 5.3129353523254395, 5.611040115356445, 5.909144401550293, 6.207249164581299, 6.505353927612305, 6.803458213806152, 7.1015625, 7.399667263031006, 7.6977715492248535, 7.995876312255859, 8.293980598449707, 8.592084884643555, 8.890190124511719, 9.188294410705566, 9.486398696899414, 9.784502983093262, 10.082608222961426, 10.380712509155273, 10.678816795349121, 10.976921081542969, 11.275026321411133, 11.57313060760498, 11.871235847473145, 12.169340133666992, 12.467445373535156, 12.765549659729004, 13.063653945922852, 13.3617582321167, 13.659863471984863, 13.957967758178711, 14.256072044372559]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 3.0, 5.0, 8.0, 14.0, 13.0, 13.0, 15.0, 19.0, 26.0, 27.0, 29.0, 38.0, 36.0, 45.0, 35.0, 52.0, 45.0, 43.0, 60.0, 54.0, 51.0, 46.0, 42.0, 49.0, 39.0, 36.0, 30.0, 31.0, 28.0, 21.0, 10.0, 12.0, 7.0, 9.0, 5.0, 3.0, 5.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.0236945152282715, -5.784102439880371, -5.5445098876953125, -5.304917335510254, -5.0653252601623535, -4.825733184814453, -4.5861406326293945, -4.346548080444336, -4.1069560050964355, -3.867363691329956, -3.6277713775634766, -3.388179063796997, -3.1485867500305176, -2.908994436264038, -2.6694021224975586, -2.429809808731079, -2.1902174949645996, -1.9506251811981201, -1.7110328674316406, -1.4714405536651611, -1.2318482398986816, -0.9922559261322021, -0.7526636123657227, -0.5130712985992432, -0.27347898483276367, -0.03388667106628418, 0.2057056427001953, 0.4452979564666748, 0.6848902702331543, 0.9244825839996338, 1.1640748977661133, 1.4036672115325928, 1.643259048461914, 1.8828513622283936, 2.122443675994873, 2.3620359897613525, 2.601628303527832, 2.8412206172943115, 3.080812931060791, 3.3204052448272705, 3.55999755859375, 3.7995898723602295, 4.039182186126709, 4.278774261474609, 4.518366813659668, 4.757959365844727, 4.997551441192627, 5.237143516540527, 5.476736068725586, 5.7163286209106445, 5.955920696258545, 6.195512771606445, 6.435105323791504, 6.6746978759765625, 6.914289951324463, 7.153882026672363, 7.393474578857422, 7.6330671310424805, 7.872659206390381, 8.112251281738281, 8.35184383392334, 8.591436386108398, 8.83102798461914, 9.0706205368042, 9.310213088989258]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 11.0, 13.0, 12.0, 19.0, 29.0, 24.0, 53.0, 95.0, 171.0, 384.0, 1391.0, 12923.0, 1377667.0, 2772416.0, 25602.0, 2164.0, 670.0, 302.0, 126.0, 63.0, 44.0, 39.0, 16.0, 17.0, 7.0, 4.0, 6.0, 3.0, 5.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.7890625, -8.53125, -8.2734375, -8.015625, -7.7578125, -7.5, -7.2421875, -6.984375, -6.7265625, -6.46875, -6.2109375, -5.953125, -5.6953125, -5.4375, -5.1796875, -4.921875, -4.6640625, -4.40625, -4.1484375, -3.890625, -3.6328125, -3.375, -3.1171875, -2.859375, -2.6015625, -2.34375, -2.0859375, -1.828125, -1.5703125, -1.3125, -1.0546875, -0.796875, -0.5390625, -0.28125, -0.0234375, 0.234375, 0.4921875, 0.75, 1.0078125, 1.265625, 1.5234375, 1.78125, 2.0390625, 2.296875, 2.5546875, 2.8125, 3.0703125, 3.328125, 3.5859375, 3.84375, 4.1015625, 4.359375, 4.6171875, 4.875, 5.1328125, 5.390625, 5.6484375, 5.90625, 6.1640625, 6.421875, 6.6796875, 6.9375, 7.1953125, 7.453125, 7.7109375]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 7.0, 3.0, 4.0, 9.0, 9.0, 14.0, 9.0, 27.0, 24.0, 26.0, 37.0, 33.0, 39.0, 47.0, 49.0, 50.0, 65.0, 46.0, 77.0, 68.0, 59.0, 59.0, 43.0, 43.0, 41.0, 27.0, 21.0, 16.0, 20.0, 10.0, 12.0, 7.0, 5.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.779296875, -2.696685791015625, -2.61407470703125, -2.531463623046875, -2.4488525390625, -2.366241455078125, -2.28363037109375, -2.201019287109375, -2.118408203125, -2.035797119140625, -1.95318603515625, -1.870574951171875, -1.7879638671875, -1.705352783203125, -1.62274169921875, -1.540130615234375, -1.45751953125, -1.374908447265625, -1.29229736328125, -1.209686279296875, -1.1270751953125, -1.044464111328125, -0.96185302734375, -0.879241943359375, -0.796630859375, -0.714019775390625, -0.63140869140625, -0.548797607421875, -0.4661865234375, -0.383575439453125, -0.30096435546875, -0.218353271484375, -0.1357421875, -0.053131103515625, 0.02947998046875, 0.112091064453125, 0.1947021484375, 0.277313232421875, 0.35992431640625, 0.442535400390625, 0.525146484375, 0.607757568359375, 0.69036865234375, 0.772979736328125, 0.8555908203125, 0.938201904296875, 1.02081298828125, 1.103424072265625, 1.18603515625, 1.268646240234375, 1.35125732421875, 1.433868408203125, 1.5164794921875, 1.599090576171875, 1.68170166015625, 1.764312744140625, 1.846923828125, 1.929534912109375, 2.01214599609375, 2.094757080078125, 2.1773681640625, 2.259979248046875, 2.34259033203125, 2.425201416015625, 2.5078125]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 3.0, 2.0, 6.0, 4.0, 3.0, 9.0, 11.0, 14.0, 14.0, 18.0, 26.0, 49.0, 60.0, 74.0, 132.0, 135.0, 328.0, 565.0, 1081.0, 2499.0, 7162.0, 32419.0, 354073.0, 3282733.0, 461776.0, 38070.0, 7740.0, 2697.0, 1131.0, 574.0, 307.0, 204.0, 119.0, 83.0, 47.0, 38.0, 16.0, 13.0, 8.0, 7.0, 10.0, 11.0, 6.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.69921875, -3.592132568359375, -3.48504638671875, -3.377960205078125, -3.2708740234375, -3.163787841796875, -3.05670166015625, -2.949615478515625, -2.842529296875, -2.735443115234375, -2.62835693359375, -2.521270751953125, -2.4141845703125, -2.307098388671875, -2.20001220703125, -2.092926025390625, -1.98583984375, -1.878753662109375, -1.77166748046875, -1.664581298828125, -1.5574951171875, -1.450408935546875, -1.34332275390625, -1.236236572265625, -1.129150390625, -1.022064208984375, -0.91497802734375, -0.807891845703125, -0.7008056640625, -0.593719482421875, -0.48663330078125, -0.379547119140625, -0.2724609375, -0.165374755859375, -0.05828857421875, 0.048797607421875, 0.1558837890625, 0.262969970703125, 0.37005615234375, 0.477142333984375, 0.584228515625, 0.691314697265625, 0.79840087890625, 0.905487060546875, 1.0125732421875, 1.119659423828125, 1.22674560546875, 1.333831787109375, 1.44091796875, 1.548004150390625, 1.65509033203125, 1.762176513671875, 1.8692626953125, 1.976348876953125, 2.08343505859375, 2.190521240234375, 2.297607421875, 2.404693603515625, 2.51177978515625, 2.618865966796875, 2.7259521484375, 2.833038330078125, 2.94012451171875, 3.047210693359375, 3.154296875]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 1.0, 5.0, 7.0, 9.0, 7.0, 15.0, 22.0, 36.0, 50.0, 74.0, 102.0, 134.0, 180.0, 278.0, 360.0, 449.0, 491.0, 509.0, 380.0, 268.0, 192.0, 147.0, 106.0, 78.0, 45.0, 35.0, 21.0, 21.0, 13.0, 11.0, 8.0, 4.0, 4.0, 2.0, 5.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.81005859375, -0.7826156616210938, -0.7551727294921875, -0.7277297973632812, -0.700286865234375, -0.6728439331054688, -0.6454010009765625, -0.6179580688476562, -0.59051513671875, -0.5630722045898438, -0.5356292724609375, -0.5081863403320312, -0.480743408203125, -0.45330047607421875, -0.4258575439453125, -0.39841461181640625, -0.3709716796875, -0.34352874755859375, -0.3160858154296875, -0.28864288330078125, -0.261199951171875, -0.23375701904296875, -0.2063140869140625, -0.17887115478515625, -0.15142822265625, -0.12398529052734375, -0.0965423583984375, -0.06909942626953125, -0.041656494140625, -0.01421356201171875, 0.0132293701171875, 0.04067230224609375, 0.068115234375, 0.09555816650390625, 0.1230010986328125, 0.15044403076171875, 0.177886962890625, 0.20532989501953125, 0.2327728271484375, 0.26021575927734375, 0.28765869140625, 0.31510162353515625, 0.3425445556640625, 0.36998748779296875, 0.397430419921875, 0.42487335205078125, 0.4523162841796875, 0.47975921630859375, 0.5072021484375, 0.5346450805664062, 0.5620880126953125, 0.5895309448242188, 0.616973876953125, 0.6444168090820312, 0.6718597412109375, 0.6993026733398438, 0.72674560546875, 0.7541885375976562, 0.7816314697265625, 0.8090744018554688, 0.836517333984375, 0.8639602661132812, 0.8914031982421875, 0.9188461303710938, 0.9462890625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 8.0, 7.0, 21.0, 28.0, 44.0, 66.0, 111.0, 118.0, 129.0, 139.0, 92.0, 81.0, 61.0, 42.0, 20.0, 12.0, 10.0, 3.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.902558326721191, -5.737022876739502, -5.571487903594971, -5.405952453613281, -5.24041748046875, -5.0748820304870605, -4.909347057342529, -4.74381160736084, -4.578276634216309, -4.412741184234619, -4.247206211090088, -4.081670761108398, -3.916135787963867, -3.7506003379821777, -3.5850651264190674, -3.419529914855957, -3.2539944648742676, -3.0884592533111572, -2.922924041748047, -2.7573888301849365, -2.591853618621826, -2.4263181686401367, -2.2607829570770264, -2.095247745513916, -1.9297125339508057, -1.7641773223876953, -1.598642110824585, -1.433106780052185, -1.2675715684890747, -1.1020363569259644, -0.9365010857582092, -0.7709658145904541, -0.605431079864502, -0.4398958384990692, -0.2743605971336365, -0.10882535576820374, 0.056709885597229004, 0.22224509716033936, 0.3877803683280945, 0.5533156394958496, 0.71885085105896, 0.8843860626220703, 1.0499212741851807, 1.2154566049575806, 1.380991816520691, 1.5465270280838013, 1.7120623588562012, 1.8775975704193115, 2.043132781982422, 2.2086679935455322, 2.3742032051086426, 2.539738416671753, 2.7052736282348633, 2.8708090782165527, 3.036344289779663, 3.2018795013427734, 3.367414712905884, 3.532949924468994, 3.6984851360321045, 3.864020347595215, 4.029555797576904, 4.1950907707214355, 4.360626220703125, 4.526161193847656, 4.691696643829346]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 8.0, 7.0, 11.0, 10.0, 18.0, 9.0, 18.0, 19.0, 17.0, 20.0, 28.0, 30.0, 43.0, 25.0, 52.0, 41.0, 38.0, 43.0, 51.0, 47.0, 47.0, 54.0, 49.0, 44.0, 42.0, 36.0, 22.0, 37.0, 28.0, 27.0, 18.0, 12.0, 17.0, 13.0, 5.0, 8.0, 1.0, 6.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.434231758117676, -2.35748553276062, -2.2807395458221436, -2.203993320465088, -2.1272473335266113, -2.0505011081695557, -1.973755121231079, -1.8970088958740234, -1.8202629089355469, -1.7435168027877808, -1.6667706966400146, -1.5900245904922485, -1.5132784843444824, -1.4365323781967163, -1.3597862720489502, -1.2830400466918945, -1.2062939405441284, -1.1295478343963623, -1.0528017282485962, -0.9760556221008301, -0.899309515953064, -0.8225634098052979, -0.745817244052887, -0.6690711379051208, -0.5923250317573547, -0.5155789256095886, -0.4388328194618225, -0.362086683511734, -0.2853405773639679, -0.20859447121620178, -0.13184833526611328, -0.05510222911834717, 0.021643877029418945, 0.09838999062776566, 0.17513610422611237, 0.2518822252750397, 0.3286283314228058, 0.4053744375705719, 0.4821205735206604, 0.5588666796684265, 0.6356127858161926, 0.7123588919639587, 0.7891049981117249, 0.8658511638641357, 0.9425972700119019, 1.019343376159668, 1.096089482307434, 1.1728355884552002, 1.2495816946029663, 1.3263278007507324, 1.4030739068984985, 1.4798200130462646, 1.5565661191940308, 1.6333122253417969, 1.7100584506988525, 1.786804437637329, 1.8635506629943848, 1.9402967691421509, 2.017042875289917, 2.0937891006469727, 2.170535087585449, 2.247281312942505, 2.3240272998809814, 2.400773525238037, 2.4775195121765137]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 1.0, 2.0, 2.0, 7.0, 10.0, 11.0, 16.0, 11.0, 28.0, 34.0, 59.0, 52.0, 104.0, 166.0, 271.0, 585.0, 1269.0, 3030.0, 8375.0, 24699.0, 73319.0, 196340.0, 334731.0, 248851.0, 102312.0, 35070.0, 11734.0, 4162.0, 1650.0, 705.0, 370.0, 184.0, 102.0, 80.0, 54.0, 41.0, 26.0, 23.0, 19.0, 15.0, 7.0, 8.0, 9.0, 3.0, 1.0, 1.0, 4.0, 0.0, 1.0, 3.0, 1.0, 1.0], "bins": [-0.448974609375, -0.4360198974609375, -0.423065185546875, -0.4101104736328125, -0.39715576171875, -0.3842010498046875, -0.371246337890625, -0.3582916259765625, -0.3453369140625, -0.3323822021484375, -0.319427490234375, -0.3064727783203125, -0.29351806640625, -0.2805633544921875, -0.267608642578125, -0.2546539306640625, -0.24169921875, -0.2287445068359375, -0.215789794921875, -0.2028350830078125, -0.18988037109375, -0.1769256591796875, -0.163970947265625, -0.1510162353515625, -0.1380615234375, -0.1251068115234375, -0.112152099609375, -0.0991973876953125, -0.08624267578125, -0.0732879638671875, -0.060333251953125, -0.0473785400390625, -0.034423828125, -0.0214691162109375, -0.008514404296875, 0.0044403076171875, 0.01739501953125, 0.0303497314453125, 0.043304443359375, 0.0562591552734375, 0.0692138671875, 0.0821685791015625, 0.095123291015625, 0.1080780029296875, 0.12103271484375, 0.1339874267578125, 0.146942138671875, 0.1598968505859375, 0.1728515625, 0.1858062744140625, 0.198760986328125, 0.2117156982421875, 0.22467041015625, 0.2376251220703125, 0.250579833984375, 0.2635345458984375, 0.2764892578125, 0.2894439697265625, 0.302398681640625, 0.3153533935546875, 0.32830810546875, 0.3412628173828125, 0.354217529296875, 0.3671722412109375, 0.380126953125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 8.0, 11.0, 23.0, 34.0, 36.0, 49.0, 58.0, 77.0, 72.0, 90.0, 74.0, 112.0, 89.0, 69.0, 54.0, 43.0, 45.0, 25.0, 13.0, 8.0, 3.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.50390625, -3.412506103515625, -3.32110595703125, -3.229705810546875, -3.1383056640625, -3.046905517578125, -2.95550537109375, -2.864105224609375, -2.772705078125, -2.681304931640625, -2.58990478515625, -2.498504638671875, -2.4071044921875, -2.315704345703125, -2.22430419921875, -2.132904052734375, -2.04150390625, -1.950103759765625, -1.85870361328125, -1.767303466796875, -1.6759033203125, -1.584503173828125, -1.49310302734375, -1.401702880859375, -1.310302734375, -1.218902587890625, -1.12750244140625, -1.036102294921875, -0.9447021484375, -0.853302001953125, -0.76190185546875, -0.670501708984375, -0.5791015625, -0.487701416015625, -0.39630126953125, -0.304901123046875, -0.2135009765625, -0.122100830078125, -0.03070068359375, 0.060699462890625, 0.152099609375, 0.243499755859375, 0.33489990234375, 0.426300048828125, 0.5177001953125, 0.609100341796875, 0.70050048828125, 0.791900634765625, 0.88330078125, 0.974700927734375, 1.06610107421875, 1.157501220703125, 1.2489013671875, 1.340301513671875, 1.43170166015625, 1.523101806640625, 1.614501953125, 1.705902099609375, 1.79730224609375, 1.888702392578125, 1.9801025390625, 2.071502685546875, 2.16290283203125, 2.254302978515625, 2.345703125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 3.0, 1.0, 5.0, 9.0, 11.0, 17.0, 19.0, 38.0, 57.0, 91.0, 186.0, 262.0, 462.0, 747.0, 1292.0, 2233.0, 3896.0, 6940.0, 11720.0, 20580.0, 35000.0, 58773.0, 95152.0, 140208.0, 174152.0, 167440.0, 125782.0, 82469.0, 50239.0, 29896.0, 17283.0, 9902.0, 5730.0, 3284.0, 1895.0, 1106.0, 606.0, 413.0, 227.0, 154.0, 101.0, 69.0, 36.0, 24.0, 13.0, 16.0, 9.0, 6.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1925048828125, -0.1864604949951172, -0.18041610717773438, -0.17437171936035156, -0.16832733154296875, -0.16228294372558594, -0.15623855590820312, -0.1501941680908203, -0.1441497802734375, -0.1381053924560547, -0.13206100463867188, -0.12601661682128906, -0.11997222900390625, -0.11392784118652344, -0.10788345336914062, -0.10183906555175781, -0.095794677734375, -0.08975028991699219, -0.08370590209960938, -0.07766151428222656, -0.07161712646484375, -0.06557273864746094, -0.059528350830078125, -0.05348396301269531, -0.0474395751953125, -0.04139518737792969, -0.035350799560546875, -0.029306411743164062, -0.02326202392578125, -0.017217636108398438, -0.011173248291015625, -0.0051288604736328125, 0.00091552734375, 0.0069599151611328125, 0.013004302978515625, 0.019048690795898438, 0.02509307861328125, 0.031137466430664062, 0.037181854248046875, 0.04322624206542969, 0.0492706298828125, 0.05531501770019531, 0.061359405517578125, 0.06740379333496094, 0.07344818115234375, 0.07949256896972656, 0.08553695678710938, 0.09158134460449219, 0.097625732421875, 0.10367012023925781, 0.10971450805664062, 0.11575889587402344, 0.12180328369140625, 0.12784767150878906, 0.13389205932617188, 0.1399364471435547, 0.1459808349609375, 0.1520252227783203, 0.15806961059570312, 0.16411399841308594, 0.17015838623046875, 0.17620277404785156, 0.18224716186523438, 0.1882915496826172, 0.1943359375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 4.0, 3.0, 9.0, 7.0, 15.0, 20.0, 20.0, 19.0, 40.0, 33.0, 33.0, 60.0, 46.0, 57.0, 51.0, 57.0, 59.0, 57.0, 52.0, 47.0, 40.0, 50.0, 37.0, 34.0, 28.0, 27.0, 22.0, 12.0, 19.0, 6.0, 17.0, 5.0, 5.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5703125, -3.4571533203125, -3.343994140625, -3.2308349609375, -3.11767578125, -3.0045166015625, -2.891357421875, -2.7781982421875, -2.6650390625, -2.5518798828125, -2.438720703125, -2.3255615234375, -2.21240234375, -2.0992431640625, -1.986083984375, -1.8729248046875, -1.759765625, -1.6466064453125, -1.533447265625, -1.4202880859375, -1.30712890625, -1.1939697265625, -1.080810546875, -0.9676513671875, -0.8544921875, -0.7413330078125, -0.628173828125, -0.5150146484375, -0.40185546875, -0.2886962890625, -0.175537109375, -0.0623779296875, 0.05078125, 0.1639404296875, 0.277099609375, 0.3902587890625, 0.50341796875, 0.6165771484375, 0.729736328125, 0.8428955078125, 0.9560546875, 1.0692138671875, 1.182373046875, 1.2955322265625, 1.40869140625, 1.5218505859375, 1.635009765625, 1.7481689453125, 1.861328125, 1.9744873046875, 2.087646484375, 2.2008056640625, 2.31396484375, 2.4271240234375, 2.540283203125, 2.6534423828125, 2.7666015625, 2.8797607421875, 2.992919921875, 3.1060791015625, 3.21923828125, 3.3323974609375, 3.445556640625, 3.5587158203125, 3.671875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 10.0, 18.0, 28.0, 58.0, 98.0, 207.0, 361.0, 736.0, 1608.0, 4144.0, 14087.0, 76188.0, 543410.0, 345977.0, 46160.0, 9756.0, 3201.0, 1291.0, 605.0, 298.0, 144.0, 76.0, 36.0, 34.0, 13.0, 6.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12139892578125, -0.11810588836669922, -0.11481285095214844, -0.11151981353759766, -0.10822677612304688, -0.1049337387084961, -0.10164070129394531, -0.09834766387939453, -0.09505462646484375, -0.09176158905029297, -0.08846855163574219, -0.0851755142211914, -0.08188247680664062, -0.07858943939208984, -0.07529640197753906, -0.07200336456298828, -0.0687103271484375, -0.06541728973388672, -0.06212425231933594, -0.058831214904785156, -0.055538177490234375, -0.052245140075683594, -0.04895210266113281, -0.04565906524658203, -0.04236602783203125, -0.03907299041748047, -0.03577995300292969, -0.032486915588378906, -0.029193878173828125, -0.025900840759277344, -0.022607803344726562, -0.01931476593017578, -0.016021728515625, -0.012728691101074219, -0.009435653686523438, -0.006142616271972656, -0.002849578857421875, 0.00044345855712890625, 0.0037364959716796875, 0.007029533386230469, 0.01032257080078125, 0.013615608215332031, 0.016908645629882812, 0.020201683044433594, 0.023494720458984375, 0.026787757873535156, 0.030080795288085938, 0.03337383270263672, 0.0366668701171875, 0.03995990753173828, 0.04325294494628906, 0.046545982360839844, 0.049839019775390625, 0.053132057189941406, 0.05642509460449219, 0.05971813201904297, 0.06301116943359375, 0.06630420684814453, 0.06959724426269531, 0.0728902816772461, 0.07618331909179688, 0.07947635650634766, 0.08276939392089844, 0.08606243133544922, 0.08935546875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 9.0, 9.0, 14.0, 17.0, 35.0, 42.0, 49.0, 94.0, 153.0, 160.0, 110.0, 116.0, 72.0, 43.0, 30.0, 17.0, 8.0, 11.0, 5.0, 8.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.276369094848633e-05, -6.077531725168228e-05, -5.8786943554878235e-05, -5.679856985807419e-05, -5.481019616127014e-05, -5.2821822464466095e-05, -5.083344876766205e-05, -4.8845075070858e-05, -4.6856701374053955e-05, -4.486832767724991e-05, -4.287995398044586e-05, -4.0891580283641815e-05, -3.890320658683777e-05, -3.691483289003372e-05, -3.4926459193229675e-05, -3.293808549642563e-05, -3.094971179962158e-05, -2.8961338102817535e-05, -2.697296440601349e-05, -2.4984590709209442e-05, -2.2996217012405396e-05, -2.100784331560135e-05, -1.9019469618797302e-05, -1.7031095921993256e-05, -1.5042722225189209e-05, -1.3054348528385162e-05, -1.1065974831581116e-05, -9.077601134777069e-06, -7.0892274379730225e-06, -5.100853741168976e-06, -3.112480044364929e-06, -1.1241063475608826e-06, 8.642673492431641e-07, 2.8526410460472107e-06, 4.841014742851257e-06, 6.829388439655304e-06, 8.81776213645935e-06, 1.0806135833263397e-05, 1.2794509530067444e-05, 1.478288322687149e-05, 1.6771256923675537e-05, 1.8759630620479584e-05, 2.074800431728363e-05, 2.2736378014087677e-05, 2.4724751710891724e-05, 2.671312540769577e-05, 2.8701499104499817e-05, 3.0689872801303864e-05, 3.267824649810791e-05, 3.466662019491196e-05, 3.6654993891716003e-05, 3.864336758852005e-05, 4.06317412853241e-05, 4.262011498212814e-05, 4.460848867893219e-05, 4.6596862375736237e-05, 4.858523607254028e-05, 5.057360976934433e-05, 5.2561983466148376e-05, 5.455035716295242e-05, 5.653873085975647e-05, 5.8527104556560516e-05, 6.051547825336456e-05, 6.250385195016861e-05, 6.449222564697266e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 1.0, 6.0, 3.0, 6.0, 3.0, 8.0, 7.0, 15.0, 18.0, 19.0, 40.0, 38.0, 77.0, 108.0, 184.0, 311.0, 696.0, 1481.0, 3676.0, 11263.0, 39403.0, 172276.0, 532571.0, 216455.0, 49051.0, 13056.0, 4397.0, 1683.0, 765.0, 378.0, 200.0, 117.0, 73.0, 43.0, 37.0, 25.0, 18.0, 11.0, 7.0, 10.0, 5.0, 8.0, 2.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.088623046875, -0.0859832763671875, -0.083343505859375, -0.0807037353515625, -0.07806396484375, -0.0754241943359375, -0.072784423828125, -0.0701446533203125, -0.0675048828125, -0.0648651123046875, -0.062225341796875, -0.0595855712890625, -0.05694580078125, -0.0543060302734375, -0.051666259765625, -0.0490264892578125, -0.04638671875, -0.0437469482421875, -0.041107177734375, -0.0384674072265625, -0.03582763671875, -0.0331878662109375, -0.030548095703125, -0.0279083251953125, -0.0252685546875, -0.0226287841796875, -0.019989013671875, -0.0173492431640625, -0.01470947265625, -0.0120697021484375, -0.009429931640625, -0.0067901611328125, -0.004150390625, -0.0015106201171875, 0.001129150390625, 0.0037689208984375, 0.00640869140625, 0.0090484619140625, 0.011688232421875, 0.0143280029296875, 0.0169677734375, 0.0196075439453125, 0.022247314453125, 0.0248870849609375, 0.02752685546875, 0.0301666259765625, 0.032806396484375, 0.0354461669921875, 0.0380859375, 0.0407257080078125, 0.043365478515625, 0.0460052490234375, 0.04864501953125, 0.0512847900390625, 0.053924560546875, 0.0565643310546875, 0.0592041015625, 0.0618438720703125, 0.064483642578125, 0.0671234130859375, 0.06976318359375, 0.0724029541015625, 0.075042724609375, 0.0776824951171875, 0.080322265625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 4.0, 4.0, 8.0, 6.0, 3.0, 14.0, 14.0, 19.0, 27.0, 32.0, 41.0, 49.0, 50.0, 63.0, 100.0, 98.0, 89.0, 80.0, 65.0, 62.0, 42.0, 30.0, 28.0, 17.0, 17.0, 13.0, 5.0, 6.0, 4.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0203399658203125, -0.019622802734375, -0.0189056396484375, -0.0181884765625, -0.0174713134765625, -0.016754150390625, -0.0160369873046875, -0.01531982421875, -0.0146026611328125, -0.013885498046875, -0.0131683349609375, -0.012451171875, -0.0117340087890625, -0.011016845703125, -0.0102996826171875, -0.00958251953125, -0.0088653564453125, -0.008148193359375, -0.0074310302734375, -0.0067138671875, -0.0059967041015625, -0.005279541015625, -0.0045623779296875, -0.00384521484375, -0.0031280517578125, -0.002410888671875, -0.0016937255859375, -0.0009765625, -0.0002593994140625, 0.000457763671875, 0.0011749267578125, 0.00189208984375, 0.0026092529296875, 0.003326416015625, 0.0040435791015625, 0.0047607421875, 0.0054779052734375, 0.006195068359375, 0.0069122314453125, 0.00762939453125, 0.0083465576171875, 0.009063720703125, 0.0097808837890625, 0.010498046875, 0.0112152099609375, 0.011932373046875, 0.0126495361328125, 0.01336669921875, 0.0140838623046875, 0.014801025390625, 0.0155181884765625, 0.0162353515625, 0.0169525146484375, 0.017669677734375, 0.0183868408203125, 0.01910400390625, 0.0198211669921875, 0.020538330078125, 0.0212554931640625, 0.02197265625, 0.0226898193359375, 0.023406982421875, 0.0241241455078125, 0.02484130859375, 0.0255584716796875]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 13.0, 52.0, 213.0, 396.0, 251.0, 62.0, 18.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.11353874206543, -14.814570426940918, -14.51560115814209, -14.216632843017578, -13.91766357421875, -13.618695259094238, -13.319726943969727, -13.020757675170898, -12.721789360046387, -12.422821044921875, -12.123851776123047, -11.824883460998535, -11.525915145874023, -11.226945877075195, -10.927977561950684, -10.629009246826172, -10.330039978027344, -10.031071662902832, -9.732102394104004, -9.433134078979492, -9.134164810180664, -8.835196495056152, -8.53622817993164, -8.237258911132812, -7.938290596008301, -7.639321804046631, -7.340353012084961, -7.041384696960449, -6.742415904998779, -6.443447113037109, -6.144478797912598, -5.845510005950928, -5.546541213989258, -5.247572422027588, -4.948603630065918, -4.649635314941406, -4.350666522979736, -4.051697731018066, -3.7527291774749756, -3.4537606239318848, -3.154791831970215, -2.855823040008545, -2.556854486465454, -2.2578859329223633, -1.9589171409606934, -1.659948468208313, -1.3609797954559326, -1.0620112419128418, -0.7630424499511719, -0.4640737771987915, -0.16510510444641113, 0.13386356830596924, 0.4328322410583496, 0.73180091381073, 1.0307695865631104, 1.3297381401062012, 1.628706932067871, 1.9276756048202515, 2.226644277572632, 2.5256128311157227, 2.8245816230773926, 3.1235504150390625, 3.4225189685821533, 3.721487522125244, 4.020456314086914]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 4.0, 6.0, 11.0, 8.0, 16.0, 23.0, 12.0, 26.0, 38.0, 30.0, 42.0, 56.0, 62.0, 55.0, 63.0, 72.0, 66.0, 70.0, 60.0, 54.0, 51.0, 40.0, 33.0, 36.0, 20.0, 17.0, 14.0, 8.0, 8.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.947766900062561, -1.8817667961120605, -1.8157665729522705, -1.74976646900177, -1.6837663650512695, -1.617766261100769, -1.5517661571502686, -1.4857659339904785, -1.419765830039978, -1.3537657260894775, -1.2877655029296875, -1.221765398979187, -1.1557652950286865, -1.089765191078186, -1.0237650871276855, -0.9577648639678955, -0.891764760017395, -0.8257646560668945, -0.7597644925117493, -0.693764328956604, -0.6277642250061035, -0.561764121055603, -0.49576395750045776, -0.4297638237476349, -0.363763689994812, -0.29776355624198914, -0.23176342248916626, -0.16576328873634338, -0.09976315498352051, -0.03376302123069763, 0.032237112522125244, 0.09823724627494812, 0.16423749923706055, 0.23023763298988342, 0.2962377667427063, 0.3622379004955292, 0.42823803424835205, 0.4942381680011749, 0.5602383017539978, 0.6262384653091431, 0.6922385692596436, 0.758238673210144, 0.8242388367652893, 0.8902390003204346, 0.9562391042709351, 1.0222392082214355, 1.0882394313812256, 1.154239535331726, 1.2202396392822266, 1.286239743232727, 1.3522398471832275, 1.4182400703430176, 1.484240174293518, 1.5502402782440186, 1.6162405014038086, 1.682240605354309, 1.7482407093048096, 1.81424081325531, 1.8802409172058105, 1.9462411403656006, 2.0122413635253906, 2.0782413482666016, 2.1442415714263916, 2.2102415561676025, 2.2762417793273926]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 9.0, 4.0, 12.0, 10.0, 14.0, 20.0, 26.0, 45.0, 53.0, 111.0, 228.0, 553.0, 1468.0, 4478.0, 14568.0, 56854.0, 284416.0, 528824.0, 117884.0, 27340.0, 7569.0, 2400.0, 845.0, 381.0, 173.0, 100.0, 36.0, 32.0, 29.0, 14.0, 14.0, 8.0, 11.0, 4.0, 6.0, 4.0, 5.0, 3.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.009765625, -1.94329833984375, -1.8768310546875, -1.81036376953125, -1.743896484375, -1.67742919921875, -1.6109619140625, -1.54449462890625, -1.47802734375, -1.41156005859375, -1.3450927734375, -1.27862548828125, -1.212158203125, -1.14569091796875, -1.0792236328125, -1.01275634765625, -0.9462890625, -0.87982177734375, -0.8133544921875, -0.74688720703125, -0.680419921875, -0.61395263671875, -0.5474853515625, -0.48101806640625, -0.41455078125, -0.34808349609375, -0.2816162109375, -0.21514892578125, -0.148681640625, -0.08221435546875, -0.0157470703125, 0.05072021484375, 0.1171875, 0.18365478515625, 0.2501220703125, 0.31658935546875, 0.383056640625, 0.44952392578125, 0.5159912109375, 0.58245849609375, 0.64892578125, 0.71539306640625, 0.7818603515625, 0.84832763671875, 0.914794921875, 0.98126220703125, 1.0477294921875, 1.11419677734375, 1.1806640625, 1.24713134765625, 1.3135986328125, 1.38006591796875, 1.446533203125, 1.51300048828125, 1.5794677734375, 1.64593505859375, 1.71240234375, 1.77886962890625, 1.8453369140625, 1.91180419921875, 1.978271484375, 2.04473876953125, 2.1112060546875, 2.17767333984375, 2.244140625]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 1.0, 4.0, 5.0, 13.0, 14.0, 17.0, 12.0, 20.0, 24.0, 30.0, 33.0, 41.0, 54.0, 46.0, 47.0, 63.0, 64.0, 56.0, 69.0, 55.0, 52.0, 45.0, 29.0, 52.0, 30.0, 36.0, 23.0, 17.0, 22.0, 10.0, 7.0, 8.0, 4.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.33984375, -4.220245361328125, -4.10064697265625, -3.981048583984375, -3.8614501953125, -3.741851806640625, -3.62225341796875, -3.502655029296875, -3.383056640625, -3.263458251953125, -3.14385986328125, -3.024261474609375, -2.9046630859375, -2.785064697265625, -2.66546630859375, -2.545867919921875, -2.42626953125, -2.306671142578125, -2.18707275390625, -2.067474365234375, -1.9478759765625, -1.828277587890625, -1.70867919921875, -1.589080810546875, -1.469482421875, -1.349884033203125, -1.23028564453125, -1.110687255859375, -0.9910888671875, -0.871490478515625, -0.75189208984375, -0.632293701171875, -0.5126953125, -0.393096923828125, -0.27349853515625, -0.153900146484375, -0.0343017578125, 0.085296630859375, 0.20489501953125, 0.324493408203125, 0.444091796875, 0.563690185546875, 0.68328857421875, 0.802886962890625, 0.9224853515625, 1.042083740234375, 1.16168212890625, 1.281280517578125, 1.40087890625, 1.520477294921875, 1.64007568359375, 1.759674072265625, 1.8792724609375, 1.998870849609375, 2.11846923828125, 2.238067626953125, 2.357666015625, 2.477264404296875, 2.59686279296875, 2.716461181640625, 2.8360595703125, 2.955657958984375, 3.07525634765625, 3.194854736328125, 3.314453125]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 6.0, 8.0, 14.0, 15.0, 13.0, 16.0, 34.0, 46.0, 63.0, 90.0, 138.0, 210.0, 293.0, 609.0, 2241.0, 21958.0, 515015.0, 483094.0, 20812.0, 2229.0, 634.0, 336.0, 205.0, 140.0, 114.0, 53.0, 53.0, 29.0, 17.0, 25.0, 10.0, 11.0, 4.0, 2.0, 3.0, 8.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.203125, -4.0794677734375, -3.955810546875, -3.8321533203125, -3.70849609375, -3.5848388671875, -3.461181640625, -3.3375244140625, -3.2138671875, -3.0902099609375, -2.966552734375, -2.8428955078125, -2.71923828125, -2.5955810546875, -2.471923828125, -2.3482666015625, -2.224609375, -2.1009521484375, -1.977294921875, -1.8536376953125, -1.72998046875, -1.6063232421875, -1.482666015625, -1.3590087890625, -1.2353515625, -1.1116943359375, -0.988037109375, -0.8643798828125, -0.74072265625, -0.6170654296875, -0.493408203125, -0.3697509765625, -0.24609375, -0.1224365234375, 0.001220703125, 0.1248779296875, 0.24853515625, 0.3721923828125, 0.495849609375, 0.6195068359375, 0.7431640625, 0.8668212890625, 0.990478515625, 1.1141357421875, 1.23779296875, 1.3614501953125, 1.485107421875, 1.6087646484375, 1.732421875, 1.8560791015625, 1.979736328125, 2.1033935546875, 2.22705078125, 2.3507080078125, 2.474365234375, 2.5980224609375, 2.7216796875, 2.8453369140625, 2.968994140625, 3.0926513671875, 3.21630859375, 3.3399658203125, 3.463623046875, 3.5872802734375, 3.7109375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 2.0, 7.0, 8.0, 5.0, 9.0, 11.0, 15.0, 18.0, 17.0, 21.0, 32.0, 33.0, 34.0, 29.0, 48.0, 27.0, 55.0, 51.0, 55.0, 46.0, 44.0, 44.0, 39.0, 35.0, 41.0, 43.0, 31.0, 39.0, 22.0, 30.0, 13.0, 26.0, 9.0, 11.0, 8.0, 14.0, 3.0, 6.0, 6.0, 5.0, 4.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.10546875, -3.9813232421875, -3.857177734375, -3.7330322265625, -3.60888671875, -3.4847412109375, -3.360595703125, -3.2364501953125, -3.1123046875, -2.9881591796875, -2.864013671875, -2.7398681640625, -2.61572265625, -2.4915771484375, -2.367431640625, -2.2432861328125, -2.119140625, -1.9949951171875, -1.870849609375, -1.7467041015625, -1.62255859375, -1.4984130859375, -1.374267578125, -1.2501220703125, -1.1259765625, -1.0018310546875, -0.877685546875, -0.7535400390625, -0.62939453125, -0.5052490234375, -0.381103515625, -0.2569580078125, -0.1328125, -0.0086669921875, 0.115478515625, 0.2396240234375, 0.36376953125, 0.4879150390625, 0.612060546875, 0.7362060546875, 0.8603515625, 0.9844970703125, 1.108642578125, 1.2327880859375, 1.35693359375, 1.4810791015625, 1.605224609375, 1.7293701171875, 1.853515625, 1.9776611328125, 2.101806640625, 2.2259521484375, 2.35009765625, 2.4742431640625, 2.598388671875, 2.7225341796875, 2.8466796875, 2.9708251953125, 3.094970703125, 3.2191162109375, 3.34326171875, 3.4674072265625, 3.591552734375, 3.7156982421875, 3.83984375]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 1.0, 3.0, 3.0, 2.0, 11.0, 11.0, 5.0, 25.0, 27.0, 36.0, 57.0, 102.0, 210.0, 374.0, 922.0, 2576.0, 12232.0, 394740.0, 615705.0, 16590.0, 2947.0, 1072.0, 456.0, 202.0, 108.0, 58.0, 31.0, 13.0, 11.0, 7.0, 5.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.029296875, -1.9679107666015625, -1.906524658203125, -1.8451385498046875, -1.78375244140625, -1.7223663330078125, -1.660980224609375, -1.5995941162109375, -1.5382080078125, -1.4768218994140625, -1.415435791015625, -1.3540496826171875, -1.29266357421875, -1.2312774658203125, -1.169891357421875, -1.1085052490234375, -1.047119140625, -0.9857330322265625, -0.924346923828125, -0.8629608154296875, -0.80157470703125, -0.7401885986328125, -0.678802490234375, -0.6174163818359375, -0.5560302734375, -0.4946441650390625, -0.433258056640625, -0.3718719482421875, -0.31048583984375, -0.2490997314453125, -0.187713623046875, -0.1263275146484375, -0.06494140625, -0.0035552978515625, 0.057830810546875, 0.1192169189453125, 0.18060302734375, 0.2419891357421875, 0.303375244140625, 0.3647613525390625, 0.4261474609375, 0.4875335693359375, 0.548919677734375, 0.6103057861328125, 0.67169189453125, 0.7330780029296875, 0.794464111328125, 0.8558502197265625, 0.917236328125, 0.9786224365234375, 1.040008544921875, 1.1013946533203125, 1.16278076171875, 1.2241668701171875, 1.285552978515625, 1.3469390869140625, 1.4083251953125, 1.4697113037109375, 1.531097412109375, 1.5924835205078125, 1.65386962890625, 1.7152557373046875, 1.776641845703125, 1.8380279541015625, 1.8994140625]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 10.0, 4.0, 9.0, 10.0, 12.0, 15.0, 36.0, 47.0, 67.0, 79.0, 110.0, 160.0, 125.0, 93.0, 68.0, 43.0, 36.0, 21.0, 15.0, 11.0, 15.0, 3.0, 4.0, 2.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00018906593322753906, -0.0001828894019126892, -0.00017671287059783936, -0.0001705363392829895, -0.00016435980796813965, -0.0001581832766532898, -0.00015200674533843994, -0.0001458302140235901, -0.00013965368270874023, -0.00013347715139389038, -0.00012730062007904053, -0.00012112408876419067, -0.00011494755744934082, -0.00010877102613449097, -0.00010259449481964111, -9.641796350479126e-05, -9.02414321899414e-05, -8.406490087509155e-05, -7.78883695602417e-05, -7.171183824539185e-05, -6.553530693054199e-05, -5.935877561569214e-05, -5.3182244300842285e-05, -4.700571298599243e-05, -4.082918167114258e-05, -3.4652650356292725e-05, -2.847611904144287e-05, -2.2299587726593018e-05, -1.6123056411743164e-05, -9.94652509689331e-06, -3.769993782043457e-06, 2.4065375328063965e-06, 8.58306884765625e-06, 1.4759600162506104e-05, 2.0936131477355957e-05, 2.711266279220581e-05, 3.3289194107055664e-05, 3.946572542190552e-05, 4.564225673675537e-05, 5.1818788051605225e-05, 5.799531936645508e-05, 6.417185068130493e-05, 7.034838199615479e-05, 7.652491331100464e-05, 8.270144462585449e-05, 8.887797594070435e-05, 9.50545072555542e-05, 0.00010123103857040405, 0.0001074075698852539, 0.00011358410120010376, 0.00011976063251495361, 0.00012593716382980347, 0.00013211369514465332, 0.00013829022645950317, 0.00014446675777435303, 0.00015064328908920288, 0.00015681982040405273, 0.0001629963517189026, 0.00016917288303375244, 0.0001753494143486023, 0.00018152594566345215, 0.000187702476978302, 0.00019387900829315186, 0.0002000555396080017, 0.00020623207092285156]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 5.0, 9.0, 16.0, 19.0, 18.0, 44.0, 76.0, 151.0, 314.0, 1005.0, 3377.0, 26536.0, 882205.0, 125752.0, 6447.0, 1561.0, 550.0, 216.0, 102.0, 55.0, 26.0, 14.0, 13.0, 11.0, 8.0, 10.0, 1.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.583984375, -2.509521484375, -2.43505859375, -2.360595703125, -2.2861328125, -2.211669921875, -2.13720703125, -2.062744140625, -1.98828125, -1.913818359375, -1.83935546875, -1.764892578125, -1.6904296875, -1.615966796875, -1.54150390625, -1.467041015625, -1.392578125, -1.318115234375, -1.24365234375, -1.169189453125, -1.0947265625, -1.020263671875, -0.94580078125, -0.871337890625, -0.796875, -0.722412109375, -0.64794921875, -0.573486328125, -0.4990234375, -0.424560546875, -0.35009765625, -0.275634765625, -0.201171875, -0.126708984375, -0.05224609375, 0.022216796875, 0.0966796875, 0.171142578125, 0.24560546875, 0.320068359375, 0.39453125, 0.468994140625, 0.54345703125, 0.617919921875, 0.6923828125, 0.766845703125, 0.84130859375, 0.915771484375, 0.990234375, 1.064697265625, 1.13916015625, 1.213623046875, 1.2880859375, 1.362548828125, 1.43701171875, 1.511474609375, 1.5859375, 1.660400390625, 1.73486328125, 1.809326171875, 1.8837890625, 1.958251953125, 2.03271484375, 2.107177734375, 2.181640625]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 9.0, 4.0, 8.0, 11.0, 12.0, 20.0, 33.0, 28.0, 59.0, 84.0, 110.0, 141.0, 154.0, 97.0, 64.0, 52.0, 34.0, 23.0, 18.0, 13.0, 10.0, 7.0, 6.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.64599609375, -0.62847900390625, -0.6109619140625, -0.59344482421875, -0.575927734375, -0.55841064453125, -0.5408935546875, -0.52337646484375, -0.505859375, -0.48834228515625, -0.4708251953125, -0.45330810546875, -0.435791015625, -0.41827392578125, -0.4007568359375, -0.38323974609375, -0.36572265625, -0.34820556640625, -0.3306884765625, -0.31317138671875, -0.295654296875, -0.27813720703125, -0.2606201171875, -0.24310302734375, -0.2255859375, -0.20806884765625, -0.1905517578125, -0.17303466796875, -0.155517578125, -0.13800048828125, -0.1204833984375, -0.10296630859375, -0.08544921875, -0.06793212890625, -0.0504150390625, -0.03289794921875, -0.015380859375, 0.00213623046875, 0.0196533203125, 0.03717041015625, 0.0546875, 0.07220458984375, 0.0897216796875, 0.10723876953125, 0.124755859375, 0.14227294921875, 0.1597900390625, 0.17730712890625, 0.19482421875, 0.21234130859375, 0.2298583984375, 0.24737548828125, 0.264892578125, 0.28240966796875, 0.2999267578125, 0.31744384765625, 0.3349609375, 0.35247802734375, 0.3699951171875, 0.38751220703125, 0.405029296875, 0.42254638671875, 0.4400634765625, 0.45758056640625, 0.47509765625]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 5.0, 5.0, 8.0, 13.0, 29.0, 62.0, 106.0, 130.0, 157.0, 188.0, 129.0, 69.0, 46.0, 19.0, 16.0, 9.0, 6.0, 4.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.693497657775879, -10.44906234741211, -10.20462703704834, -9.96019172668457, -9.7157564163208, -9.471321105957031, -9.226886749267578, -8.982451438903809, -8.738016128540039, -8.49358081817627, -8.2491455078125, -8.00471019744873, -7.760275363922119, -7.51584005355835, -7.27140474319458, -7.0269694328308105, -6.782534122467041, -6.5380988121032715, -6.293663501739502, -6.049228668212891, -5.804793357849121, -5.560358047485352, -5.315922737121582, -5.0714874267578125, -4.827052116394043, -4.582616806030273, -4.338181495666504, -4.093746185302734, -3.849311351776123, -3.6048760414123535, -3.360440731048584, -3.1160054206848145, -2.8715710639953613, -2.627135753631592, -2.3827006816864014, -2.138265371322632, -1.8938301801681519, -1.6493949890136719, -1.4049596786499023, -1.1605244874954224, -0.9160892963409424, -0.6716541051864624, -0.42721885442733765, -0.1827836036682129, 0.06165158748626709, 0.30608677864074707, 0.5505220890045166, 0.7949572801589966, 1.0393924713134766, 1.2838276624679565, 1.5282628536224365, 1.772698163986206, 2.0171332359313965, 2.261568546295166, 2.5060038566589355, 2.750439167022705, 2.9948742389678955, 3.239309549331665, 3.4837446212768555, 3.728179931640625, 3.9726152420043945, 4.217050552368164, 4.461485862731934, 4.705920696258545, 4.9503560066223145]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 5.0, 10.0, 11.0, 7.0, 12.0, 15.0, 15.0, 24.0, 13.0, 23.0, 42.0, 30.0, 32.0, 27.0, 36.0, 49.0, 52.0, 31.0, 37.0, 38.0, 42.0, 46.0, 48.0, 59.0, 36.0, 33.0, 36.0, 26.0, 35.0, 13.0, 23.0, 15.0, 13.0, 15.0, 17.0, 9.0, 7.0, 8.0, 3.0, 2.0, 5.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.585938930511475, -6.369170188903809, -6.152400970458984, -5.935632228851318, -5.718863010406494, -5.502094268798828, -5.285325050354004, -5.068556308746338, -4.851787567138672, -4.635018825531006, -4.418249607086182, -4.201480865478516, -3.9847116470336914, -3.7679429054260254, -3.5511739253997803, -3.334404945373535, -3.117635726928711, -2.900866746902466, -2.6840977668762207, -2.4673290252685547, -2.2505598068237305, -2.0337910652160645, -1.8170220851898193, -1.6002531051635742, -1.383484125137329, -1.166715145111084, -0.9499462246894836, -0.7331773042678833, -0.5164083242416382, -0.29963934421539307, -0.0828704833984375, 0.13389849662780762, 0.35066795349121094, 0.567436933517456, 0.7842058539390564, 1.0009747743606567, 1.2177437543869019, 1.434512734413147, 1.6512815952301025, 1.8680505752563477, 2.0848195552825928, 2.301588535308838, 2.518357515335083, 2.735126495361328, 2.951895236968994, 3.1686644554138184, 3.3854331970214844, 3.6022021770477295, 3.8189711570739746, 4.035739898681641, 4.252509117126465, 4.469277858734131, 4.686047077178955, 4.902815818786621, 5.119585037231445, 5.336353778839111, 5.553122520446777, 5.769891262054443, 5.986660480499268, 6.203429222106934, 6.420198440551758, 6.636967182159424, 6.85373592376709, 7.070505142211914, 7.287274360656738]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 5.0, 1.0, 4.0, 3.0, 7.0, 3.0, 11.0, 22.0, 26.0, 47.0, 78.0, 175.0, 503.0, 2517.0, 42982.0, 3356278.0, 778979.0, 10563.0, 1303.0, 390.0, 161.0, 90.0, 51.0, 32.0, 18.0, 13.0, 8.0, 5.0, 7.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.234375, -8.99005126953125, -8.7457275390625, -8.50140380859375, -8.257080078125, -8.01275634765625, -7.7684326171875, -7.52410888671875, -7.27978515625, -7.03546142578125, -6.7911376953125, -6.54681396484375, -6.302490234375, -6.05816650390625, -5.8138427734375, -5.56951904296875, -5.3251953125, -5.08087158203125, -4.8365478515625, -4.59222412109375, -4.347900390625, -4.10357666015625, -3.8592529296875, -3.61492919921875, -3.37060546875, -3.12628173828125, -2.8819580078125, -2.63763427734375, -2.393310546875, -2.14898681640625, -1.9046630859375, -1.66033935546875, -1.416015625, -1.17169189453125, -0.9273681640625, -0.68304443359375, -0.438720703125, -0.19439697265625, 0.0499267578125, 0.29425048828125, 0.53857421875, 0.78289794921875, 1.0272216796875, 1.27154541015625, 1.515869140625, 1.76019287109375, 2.0045166015625, 2.24884033203125, 2.4931640625, 2.73748779296875, 2.9818115234375, 3.22613525390625, 3.470458984375, 3.71478271484375, 3.9591064453125, 4.20343017578125, 4.44775390625, 4.69207763671875, 4.9364013671875, 5.18072509765625, 5.425048828125, 5.66937255859375, 5.9136962890625, 6.15802001953125, 6.40234375]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 8.0, 1.0, 4.0, 9.0, 9.0, 17.0, 22.0, 36.0, 33.0, 37.0, 51.0, 47.0, 41.0, 68.0, 55.0, 64.0, 67.0, 69.0, 69.0, 59.0, 45.0, 46.0, 34.0, 36.0, 26.0, 11.0, 15.0, 9.0, 6.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.38671875, -2.30035400390625, -2.2139892578125, -2.12762451171875, -2.041259765625, -1.95489501953125, -1.8685302734375, -1.78216552734375, -1.69580078125, -1.60943603515625, -1.5230712890625, -1.43670654296875, -1.350341796875, -1.26397705078125, -1.1776123046875, -1.09124755859375, -1.0048828125, -0.91851806640625, -0.8321533203125, -0.74578857421875, -0.659423828125, -0.57305908203125, -0.4866943359375, -0.40032958984375, -0.31396484375, -0.22760009765625, -0.1412353515625, -0.05487060546875, 0.031494140625, 0.11785888671875, 0.2042236328125, 0.29058837890625, 0.376953125, 0.46331787109375, 0.5496826171875, 0.63604736328125, 0.722412109375, 0.80877685546875, 0.8951416015625, 0.98150634765625, 1.06787109375, 1.15423583984375, 1.2406005859375, 1.32696533203125, 1.413330078125, 1.49969482421875, 1.5860595703125, 1.67242431640625, 1.7587890625, 1.84515380859375, 1.9315185546875, 2.01788330078125, 2.104248046875, 2.19061279296875, 2.2769775390625, 2.36334228515625, 2.44970703125, 2.53607177734375, 2.6224365234375, 2.70880126953125, 2.795166015625, 2.88153076171875, 2.9678955078125, 3.05426025390625, 3.140625]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 2.0, 4.0, 5.0, 7.0, 8.0, 18.0, 19.0, 36.0, 55.0, 74.0, 148.0, 287.0, 624.0, 1537.0, 5668.0, 46928.0, 2489336.0, 1607546.0, 34492.0, 4861.0, 1412.0, 531.0, 288.0, 143.0, 79.0, 68.0, 34.0, 22.0, 13.0, 17.0, 7.0, 5.0, 6.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6171875, -3.45953369140625, -3.3018798828125, -3.14422607421875, -2.986572265625, -2.82891845703125, -2.6712646484375, -2.51361083984375, -2.35595703125, -2.19830322265625, -2.0406494140625, -1.88299560546875, -1.725341796875, -1.56768798828125, -1.4100341796875, -1.25238037109375, -1.0947265625, -0.93707275390625, -0.7794189453125, -0.62176513671875, -0.464111328125, -0.30645751953125, -0.1488037109375, 0.00885009765625, 0.16650390625, 0.32415771484375, 0.4818115234375, 0.63946533203125, 0.797119140625, 0.95477294921875, 1.1124267578125, 1.27008056640625, 1.427734375, 1.58538818359375, 1.7430419921875, 1.90069580078125, 2.058349609375, 2.21600341796875, 2.3736572265625, 2.53131103515625, 2.68896484375, 2.84661865234375, 3.0042724609375, 3.16192626953125, 3.319580078125, 3.47723388671875, 3.6348876953125, 3.79254150390625, 3.9501953125, 4.10784912109375, 4.2655029296875, 4.42315673828125, 4.580810546875, 4.73846435546875, 4.8961181640625, 5.05377197265625, 5.21142578125, 5.36907958984375, 5.5267333984375, 5.68438720703125, 5.842041015625, 5.99969482421875, 6.1573486328125, 6.31500244140625, 6.47265625]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 10.0, 13.0, 16.0, 12.0, 25.0, 50.0, 49.0, 82.0, 158.0, 178.0, 315.0, 477.0, 656.0, 628.0, 485.0, 304.0, 206.0, 165.0, 63.0, 59.0, 43.0, 28.0, 20.0, 8.0, 9.0, 5.0, 3.0, 5.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.275390625, -1.2418060302734375, -1.208221435546875, -1.1746368408203125, -1.14105224609375, -1.1074676513671875, -1.073883056640625, -1.0402984619140625, -1.0067138671875, -0.9731292724609375, -0.939544677734375, -0.9059600830078125, -0.87237548828125, -0.8387908935546875, -0.805206298828125, -0.7716217041015625, -0.738037109375, -0.7044525146484375, -0.670867919921875, -0.6372833251953125, -0.60369873046875, -0.5701141357421875, -0.536529541015625, -0.5029449462890625, -0.4693603515625, -0.4357757568359375, -0.402191162109375, -0.3686065673828125, -0.33502197265625, -0.3014373779296875, -0.267852783203125, -0.2342681884765625, -0.20068359375, -0.1670989990234375, -0.133514404296875, -0.0999298095703125, -0.06634521484375, -0.0327606201171875, 0.000823974609375, 0.0344085693359375, 0.0679931640625, 0.1015777587890625, 0.135162353515625, 0.1687469482421875, 0.20233154296875, 0.2359161376953125, 0.269500732421875, 0.3030853271484375, 0.336669921875, 0.3702545166015625, 0.403839111328125, 0.4374237060546875, 0.47100830078125, 0.5045928955078125, 0.538177490234375, 0.5717620849609375, 0.6053466796875, 0.6389312744140625, 0.672515869140625, 0.7061004638671875, 0.73968505859375, 0.7732696533203125, 0.806854248046875, 0.8404388427734375, 0.8740234375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 7.0, 12.0, 18.0, 24.0, 43.0, 59.0, 79.0, 115.0, 125.0, 111.0, 113.0, 108.0, 55.0, 39.0, 29.0, 22.0, 14.0, 8.0, 8.0, 2.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.257492542266846, -4.1158342361450195, -3.9741759300231934, -3.832517623901367, -3.690859317779541, -3.549201011657715, -3.4075429439544678, -3.2658846378326416, -3.1242263317108154, -2.9825680255889893, -2.840909719467163, -2.699251413345337, -2.55759334564209, -2.4159350395202637, -2.2742767333984375, -2.1326184272766113, -1.9909601211547852, -1.849301815032959, -1.7076435089111328, -1.5659853219985962, -1.42432701587677, -1.2826687097549438, -1.1410105228424072, -0.999352216720581, -0.8576939105987549, -0.7160356044769287, -0.5743773579597473, -0.43271908164024353, -0.29106080532073975, -0.14940249919891357, -0.007744252681732178, 0.13391399383544922, 0.2755727767944336, 0.4172310531139374, 0.5588893294334412, 0.7005475759506226, 0.8422058820724487, 0.9838641881942749, 1.1255223751068115, 1.2671806812286377, 1.4088389873504639, 1.55049729347229, 1.6921555995941162, 1.8338137865066528, 1.975472092628479, 2.1171302795410156, 2.258788585662842, 2.400446891784668, 2.542105197906494, 2.6837635040283203, 2.8254218101501465, 2.9670801162719727, 3.108738422393799, 3.250396728515625, 3.392054796218872, 3.5337131023406982, 3.6753714084625244, 3.8170297145843506, 3.9586880207061768, 4.100346088409424, 4.24200439453125, 4.383662700653076, 4.525321006774902, 4.6669793128967285, 4.808637619018555]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 4.0, 4.0, 9.0, 8.0, 9.0, 9.0, 11.0, 22.0, 17.0, 18.0, 23.0, 27.0, 31.0, 38.0, 31.0, 35.0, 66.0, 52.0, 51.0, 50.0, 48.0, 54.0, 35.0, 52.0, 47.0, 45.0, 34.0, 39.0, 27.0, 28.0, 21.0, 8.0, 10.0, 11.0, 8.0, 3.0, 8.0, 6.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.4210946559906006, -2.3459179401397705, -2.2707412242889404, -2.1955645084381104, -2.1203877925872803, -2.04521107673645, -1.9700344800949097, -1.8948577642440796, -1.8196810483932495, -1.7445043325424194, -1.6693276166915894, -1.5941509008407593, -1.5189743041992188, -1.4437975883483887, -1.3686208724975586, -1.2934441566467285, -1.2182674407958984, -1.1430907249450684, -1.0679140090942383, -0.992737352848053, -0.9175606369972229, -0.8423839211463928, -0.7672072649002075, -0.6920305490493774, -0.6168538331985474, -0.5416771173477173, -0.4665004312992096, -0.3913237452507019, -0.3161470293998718, -0.24097031354904175, -0.16579362750053406, -0.09061694145202637, -0.015440225601196289, 0.059736475348472595, 0.13491317629814148, 0.21008987724781036, 0.28526657819747925, 0.3604432940483093, 0.435619980096817, 0.5107966661453247, 0.5859733819961548, 0.6611500978469849, 0.7363268136978149, 0.8115034699440002, 0.8866801857948303, 0.9618569016456604, 1.0370335578918457, 1.1122102737426758, 1.1873869895935059, 1.262563705444336, 1.337740421295166, 1.412917137145996, 1.4880938529968262, 1.5632705688476562, 1.6384471654891968, 1.7136238813400269, 1.788800597190857, 1.863977313041687, 1.939154028892517, 2.0143306255340576, 2.0895073413848877, 2.1646840572357178, 2.239860773086548, 2.315037488937378, 2.390214204788208]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 12.0, 11.0, 17.0, 24.0, 52.0, 80.0, 138.0, 215.0, 449.0, 1135.0, 4213.0, 20002.0, 108517.0, 408125.0, 385244.0, 96786.0, 17576.0, 3897.0, 1098.0, 443.0, 217.0, 116.0, 75.0, 46.0, 32.0, 15.0, 7.0, 6.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.66650390625, -0.6456527709960938, -0.6248016357421875, -0.6039505004882812, -0.583099365234375, -0.5622482299804688, -0.5413970947265625, -0.5205459594726562, -0.49969482421875, -0.47884368896484375, -0.4579925537109375, -0.43714141845703125, -0.416290283203125, -0.39543914794921875, -0.3745880126953125, -0.35373687744140625, -0.3328857421875, -0.31203460693359375, -0.2911834716796875, -0.27033233642578125, -0.249481201171875, -0.22863006591796875, -0.2077789306640625, -0.18692779541015625, -0.16607666015625, -0.14522552490234375, -0.1243743896484375, -0.10352325439453125, -0.082672119140625, -0.06182098388671875, -0.0409698486328125, -0.02011871337890625, 0.000732421875, 0.02158355712890625, 0.0424346923828125, 0.06328582763671875, 0.084136962890625, 0.10498809814453125, 0.1258392333984375, 0.14669036865234375, 0.16754150390625, 0.18839263916015625, 0.2092437744140625, 0.23009490966796875, 0.250946044921875, 0.27179718017578125, 0.2926483154296875, 0.31349945068359375, 0.3343505859375, 0.35520172119140625, 0.3760528564453125, 0.39690399169921875, 0.417755126953125, 0.43860626220703125, 0.4594573974609375, 0.48030853271484375, 0.50115966796875, 0.5220108032226562, 0.5428619384765625, 0.5637130737304688, 0.584564208984375, 0.6054153442382812, 0.6262664794921875, 0.6471176147460938, 0.66796875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 7.0, 13.0, 12.0, 18.0, 16.0, 23.0, 41.0, 49.0, 45.0, 72.0, 84.0, 86.0, 69.0, 86.0, 82.0, 72.0, 68.0, 49.0, 36.0, 26.0, 22.0, 13.0, 7.0, 6.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.12890625, -2.045013427734375, -1.96112060546875, -1.877227783203125, -1.7933349609375, -1.709442138671875, -1.62554931640625, -1.541656494140625, -1.457763671875, -1.373870849609375, -1.28997802734375, -1.206085205078125, -1.1221923828125, -1.038299560546875, -0.95440673828125, -0.870513916015625, -0.78662109375, -0.702728271484375, -0.61883544921875, -0.534942626953125, -0.4510498046875, -0.367156982421875, -0.28326416015625, -0.199371337890625, -0.115478515625, -0.031585693359375, 0.05230712890625, 0.136199951171875, 0.2200927734375, 0.303985595703125, 0.38787841796875, 0.471771240234375, 0.5556640625, 0.639556884765625, 0.72344970703125, 0.807342529296875, 0.8912353515625, 0.975128173828125, 1.05902099609375, 1.142913818359375, 1.226806640625, 1.310699462890625, 1.39459228515625, 1.478485107421875, 1.5623779296875, 1.646270751953125, 1.73016357421875, 1.814056396484375, 1.89794921875, 1.981842041015625, 2.06573486328125, 2.149627685546875, 2.2335205078125, 2.317413330078125, 2.40130615234375, 2.485198974609375, 2.569091796875, 2.652984619140625, 2.73687744140625, 2.820770263671875, 2.9046630859375, 2.988555908203125, 3.07244873046875, 3.156341552734375, 3.240234375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 8.0, 5.0, 14.0, 20.0, 35.0, 69.0, 90.0, 132.0, 246.0, 422.0, 730.0, 1255.0, 2244.0, 4311.0, 7661.0, 13609.0, 24297.0, 42005.0, 69195.0, 106321.0, 145224.0, 166091.0, 154292.0, 117191.0, 79059.0, 48542.0, 28550.0, 16406.0, 8961.0, 5105.0, 2824.0, 1541.0, 814.0, 534.0, 285.0, 172.0, 108.0, 61.0, 41.0, 27.0, 19.0, 10.0, 13.0, 6.0, 7.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.179931640625, -0.17386245727539062, -0.16779327392578125, -0.16172409057617188, -0.1556549072265625, -0.14958572387695312, -0.14351654052734375, -0.13744735717773438, -0.131378173828125, -0.12530899047851562, -0.11923980712890625, -0.11317062377929688, -0.1071014404296875, -0.10103225708007812, -0.09496307373046875, -0.08889389038085938, -0.08282470703125, -0.07675552368164062, -0.07068634033203125, -0.06461715698242188, -0.0585479736328125, -0.052478790283203125, -0.04640960693359375, -0.040340423583984375, -0.034271240234375, -0.028202056884765625, -0.02213287353515625, -0.016063690185546875, -0.0099945068359375, -0.003925323486328125, 0.00214385986328125, 0.008213043212890625, 0.0142822265625, 0.020351409912109375, 0.02642059326171875, 0.032489776611328125, 0.0385589599609375, 0.044628143310546875, 0.05069732666015625, 0.056766510009765625, 0.062835693359375, 0.06890487670898438, 0.07497406005859375, 0.08104324340820312, 0.0871124267578125, 0.09318161010742188, 0.09925079345703125, 0.10531997680664062, 0.11138916015625, 0.11745834350585938, 0.12352752685546875, 0.12959671020507812, 0.1356658935546875, 0.14173507690429688, 0.14780426025390625, 0.15387344360351562, 0.159942626953125, 0.16601181030273438, 0.17208099365234375, 0.17815017700195312, 0.1842193603515625, 0.19028854370117188, 0.19635772705078125, 0.20242691040039062, 0.20849609375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 2.0, 6.0, 6.0, 9.0, 8.0, 14.0, 13.0, 12.0, 16.0, 16.0, 23.0, 20.0, 26.0, 25.0, 29.0, 36.0, 45.0, 31.0, 40.0, 51.0, 43.0, 43.0, 43.0, 35.0, 40.0, 32.0, 49.0, 39.0, 29.0, 28.0, 26.0, 28.0, 17.0, 17.0, 22.0, 20.0, 14.0, 13.0, 7.0, 9.0, 5.0, 4.0, 0.0, 3.0, 2.0, 1.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0], "bins": [-3.09375, -3.002777099609375, -2.91180419921875, -2.820831298828125, -2.7298583984375, -2.638885498046875, -2.54791259765625, -2.456939697265625, -2.365966796875, -2.274993896484375, -2.18402099609375, -2.093048095703125, -2.0020751953125, -1.911102294921875, -1.82012939453125, -1.729156494140625, -1.63818359375, -1.547210693359375, -1.45623779296875, -1.365264892578125, -1.2742919921875, -1.183319091796875, -1.09234619140625, -1.001373291015625, -0.910400390625, -0.819427490234375, -0.72845458984375, -0.637481689453125, -0.5465087890625, -0.455535888671875, -0.36456298828125, -0.273590087890625, -0.1826171875, -0.091644287109375, -0.00067138671875, 0.090301513671875, 0.1812744140625, 0.272247314453125, 0.36322021484375, 0.454193115234375, 0.545166015625, 0.636138916015625, 0.72711181640625, 0.818084716796875, 0.9090576171875, 1.000030517578125, 1.09100341796875, 1.181976318359375, 1.27294921875, 1.363922119140625, 1.45489501953125, 1.545867919921875, 1.6368408203125, 1.727813720703125, 1.81878662109375, 1.909759521484375, 2.000732421875, 2.091705322265625, 2.18267822265625, 2.273651123046875, 2.3646240234375, 2.455596923828125, 2.54656982421875, 2.637542724609375, 2.728515625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 5.0, 8.0, 11.0, 13.0, 24.0, 39.0, 70.0, 128.0, 193.0, 399.0, 1019.0, 3138.0, 15881.0, 192261.0, 747952.0, 75371.0, 8637.0, 2040.0, 691.0, 309.0, 156.0, 90.0, 39.0, 29.0, 16.0, 14.0, 7.0, 6.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.18359375, -0.17839813232421875, -0.1732025146484375, -0.16800689697265625, -0.162811279296875, -0.15761566162109375, -0.1524200439453125, -0.14722442626953125, -0.14202880859375, -0.13683319091796875, -0.1316375732421875, -0.12644195556640625, -0.121246337890625, -0.11605072021484375, -0.1108551025390625, -0.10565948486328125, -0.1004638671875, -0.09526824951171875, -0.0900726318359375, -0.08487701416015625, -0.079681396484375, -0.07448577880859375, -0.0692901611328125, -0.06409454345703125, -0.05889892578125, -0.05370330810546875, -0.0485076904296875, -0.04331207275390625, -0.038116455078125, -0.03292083740234375, -0.0277252197265625, -0.02252960205078125, -0.017333984375, -0.01213836669921875, -0.0069427490234375, -0.00174713134765625, 0.003448486328125, 0.00864410400390625, 0.0138397216796875, 0.01903533935546875, 0.02423095703125, 0.02942657470703125, 0.0346221923828125, 0.03981781005859375, 0.045013427734375, 0.05020904541015625, 0.0554046630859375, 0.06060028076171875, 0.0657958984375, 0.07099151611328125, 0.0761871337890625, 0.08138275146484375, 0.086578369140625, 0.09177398681640625, 0.0969696044921875, 0.10216522216796875, 0.10736083984375, 0.11255645751953125, 0.1177520751953125, 0.12294769287109375, 0.128143310546875, 0.13333892822265625, 0.1385345458984375, 0.14373016357421875, 0.14892578125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 0.0, 1.0, 2.0, 3.0, 1.0, 10.0, 2.0, 5.0, 4.0, 12.0, 21.0, 14.0, 19.0, 36.0, 46.0, 56.0, 57.0, 95.0, 76.0, 76.0, 87.0, 81.0, 64.0, 57.0, 30.0, 36.0, 34.0, 19.0, 15.0, 14.0, 8.0, 6.0, 3.0, 4.0, 6.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.4405460357666016e-05, -4.319101572036743e-05, -4.197657108306885e-05, -4.0762126445770264e-05, -3.954768180847168e-05, -3.8333237171173096e-05, -3.711879253387451e-05, -3.590434789657593e-05, -3.4689903259277344e-05, -3.347545862197876e-05, -3.2261013984680176e-05, -3.104656934738159e-05, -2.9832124710083008e-05, -2.8617680072784424e-05, -2.740323543548584e-05, -2.6188790798187256e-05, -2.4974346160888672e-05, -2.3759901523590088e-05, -2.2545456886291504e-05, -2.133101224899292e-05, -2.0116567611694336e-05, -1.8902122974395752e-05, -1.7687678337097168e-05, -1.6473233699798584e-05, -1.52587890625e-05, -1.4044344425201416e-05, -1.2829899787902832e-05, -1.1615455150604248e-05, -1.0401010513305664e-05, -9.18656587600708e-06, -7.972121238708496e-06, -6.757676601409912e-06, -5.543231964111328e-06, -4.328787326812744e-06, -3.11434268951416e-06, -1.8998980522155762e-06, -6.854534149169922e-07, 5.289912223815918e-07, 1.7434358596801758e-06, 2.9578804969787598e-06, 4.172325134277344e-06, 5.386769771575928e-06, 6.601214408874512e-06, 7.815659046173096e-06, 9.03010368347168e-06, 1.0244548320770264e-05, 1.1458992958068848e-05, 1.2673437595367432e-05, 1.3887882232666016e-05, 1.51023268699646e-05, 1.6316771507263184e-05, 1.7531216144561768e-05, 1.874566078186035e-05, 1.9960105419158936e-05, 2.117455005645752e-05, 2.2388994693756104e-05, 2.3603439331054688e-05, 2.481788396835327e-05, 2.6032328605651855e-05, 2.724677324295044e-05, 2.8461217880249023e-05, 2.9675662517547607e-05, 3.089010715484619e-05, 3.2104551792144775e-05, 3.331899642944336e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 5.0, 3.0, 7.0, 12.0, 19.0, 21.0, 43.0, 56.0, 104.0, 190.0, 368.0, 839.0, 2227.0, 7610.0, 32956.0, 201838.0, 598470.0, 165256.0, 28233.0, 6656.0, 2041.0, 768.0, 371.0, 172.0, 97.0, 62.0, 37.0, 32.0, 15.0, 13.0, 19.0, 3.0, 3.0, 2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10150146484375, -0.09793376922607422, -0.09436607360839844, -0.09079837799072266, -0.08723068237304688, -0.0836629867553711, -0.08009529113769531, -0.07652759552001953, -0.07295989990234375, -0.06939220428466797, -0.06582450866699219, -0.062256813049316406, -0.058689117431640625, -0.055121421813964844, -0.05155372619628906, -0.04798603057861328, -0.0444183349609375, -0.04085063934326172, -0.03728294372558594, -0.033715248107910156, -0.030147552490234375, -0.026579856872558594, -0.023012161254882812, -0.01944446563720703, -0.01587677001953125, -0.012309074401855469, -0.008741378784179688, -0.005173683166503906, -0.001605987548828125, 0.0019617080688476562, 0.0055294036865234375, 0.009097099304199219, 0.012664794921875, 0.01623249053955078, 0.019800186157226562, 0.023367881774902344, 0.026935577392578125, 0.030503273010253906, 0.03407096862792969, 0.03763866424560547, 0.04120635986328125, 0.04477405548095703, 0.04834175109863281, 0.051909446716308594, 0.055477142333984375, 0.059044837951660156, 0.06261253356933594, 0.06618022918701172, 0.0697479248046875, 0.07331562042236328, 0.07688331604003906, 0.08045101165771484, 0.08401870727539062, 0.0875864028930664, 0.09115409851074219, 0.09472179412841797, 0.09828948974609375, 0.10185718536376953, 0.10542488098144531, 0.1089925765991211, 0.11256027221679688, 0.11612796783447266, 0.11969566345214844, 0.12326335906982422, 0.1268310546875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 7.0, 7.0, 15.0, 14.0, 22.0, 20.0, 21.0, 29.0, 36.0, 61.0, 84.0, 109.0, 110.0, 105.0, 79.0, 68.0, 52.0, 30.0, 29.0, 22.0, 14.0, 18.0, 10.0, 6.0, 11.0, 9.0, 6.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.03570556640625, -0.034679412841796875, -0.03365325927734375, -0.032627105712890625, -0.0316009521484375, -0.030574798583984375, -0.02954864501953125, -0.028522491455078125, -0.027496337890625, -0.026470184326171875, -0.02544403076171875, -0.024417877197265625, -0.0233917236328125, -0.022365570068359375, -0.02133941650390625, -0.020313262939453125, -0.019287109375, -0.018260955810546875, -0.01723480224609375, -0.016208648681640625, -0.0151824951171875, -0.014156341552734375, -0.01313018798828125, -0.012104034423828125, -0.011077880859375, -0.010051727294921875, -0.00902557373046875, -0.007999420166015625, -0.0069732666015625, -0.005947113037109375, -0.00492095947265625, -0.003894805908203125, -0.00286865234375, -0.001842498779296875, -0.00081634521484375, 0.000209808349609375, 0.0012359619140625, 0.002262115478515625, 0.00328826904296875, 0.004314422607421875, 0.005340576171875, 0.006366729736328125, 0.00739288330078125, 0.008419036865234375, 0.0094451904296875, 0.010471343994140625, 0.01149749755859375, 0.012523651123046875, 0.0135498046875, 0.014575958251953125, 0.01560211181640625, 0.016628265380859375, 0.0176544189453125, 0.018680572509765625, 0.01970672607421875, 0.020732879638671875, 0.021759033203125, 0.022785186767578125, 0.02381134033203125, 0.024837493896484375, 0.0258636474609375, 0.026889801025390625, 0.02791595458984375, 0.028942108154296875, 0.02996826171875]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 9.0, 10.0, 34.0, 105.0, 245.0, 303.0, 181.0, 75.0, 30.0, 10.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.61667537689209, -9.409029006958008, -9.20138168334961, -8.993735313415527, -8.786088943481445, -8.578441619873047, -8.370795249938965, -8.163148880004883, -7.955501556396484, -7.747854709625244, -7.540208339691162, -7.332561492919922, -7.124914646148682, -6.917267799377441, -6.709621429443359, -6.501974582672119, -6.294328212738037, -6.086681365966797, -5.879034996032715, -5.671388149261475, -5.463741302490234, -5.256094932556152, -5.048448085784912, -4.840801239013672, -4.63315486907959, -4.42550802230835, -4.217861652374268, -4.010214805603027, -3.802567958831787, -3.594921350479126, -3.387274742126465, -3.1796278953552246, -2.971980571746826, -2.764333963394165, -2.556687116622925, -2.3490405082702637, -2.1413936614990234, -1.9337470531463623, -1.7261004447937012, -1.5184537172317505, -1.3108069896697998, -1.1031602621078491, -0.8955135941505432, -0.6878669261932373, -0.4802201986312866, -0.27257347106933594, -0.0649268627166748, 0.14271986484527588, 0.35036659240722656, 0.5580133199691772, 0.7656599879264832, 0.9733066558837891, 1.1809533834457397, 1.3886001110076904, 1.5962467193603516, 1.8038934469223022, 2.011540174484253, 2.219186782836914, 2.4268336296081543, 2.6344802379608154, 2.8421268463134766, 3.049773693084717, 3.257420301437378, 3.465066909790039, 3.6727137565612793]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 3.0, 9.0, 4.0, 10.0, 13.0, 15.0, 18.0, 23.0, 34.0, 30.0, 46.0, 49.0, 47.0, 78.0, 71.0, 69.0, 73.0, 57.0, 58.0, 68.0, 50.0, 46.0, 42.0, 30.0, 11.0, 15.0, 12.0, 5.0, 10.0, 1.0, 9.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.057645797729492, -1.9905017614364624, -1.9233578443527222, -1.8562138080596924, -1.7890697717666626, -1.7219257354736328, -1.6547818183898926, -1.5876377820968628, -1.520493745803833, -1.4533497095108032, -1.386205792427063, -1.3190617561340332, -1.2519177198410034, -1.1847736835479736, -1.1176297664642334, -1.0504857301712036, -0.9833418130874634, -0.9161978363990784, -0.8490538001060486, -0.7819098234176636, -0.7147657871246338, -0.6476218104362488, -0.5804778337478638, -0.513333797454834, -0.446189820766449, -0.3790458142757416, -0.3119018077850342, -0.24475783109664917, -0.17761382460594177, -0.11046981811523438, -0.043325841426849365, 0.023818165063858032, 0.09096217155456543, 0.15810617804527283, 0.22525016963481903, 0.29239416122436523, 0.35953816771507263, 0.42668217420578003, 0.49382615089416504, 0.5609701871871948, 0.6281141638755798, 0.6952581405639648, 0.7624021768569946, 0.8295461535453796, 0.8966901302337646, 0.9638341665267944, 1.0309782028198242, 1.0981221199035645, 1.1652661561965942, 1.232410192489624, 1.2995541095733643, 1.366698145866394, 1.4338421821594238, 1.500986099243164, 1.5681301355361938, 1.6352741718292236, 1.7024180889129639, 1.7695621252059937, 1.8367060422897339, 1.9038500785827637, 1.9709941148757935, 2.0381381511688232, 2.1052820682525635, 2.1724259853363037, 2.239570140838623]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 2.0, 5.0, 8.0, 11.0, 8.0, 17.0, 28.0, 59.0, 103.0, 200.0, 450.0, 1307.0, 4054.0, 14871.0, 66205.0, 395905.0, 462219.0, 78939.0, 17000.0, 4740.0, 1459.0, 498.0, 221.0, 85.0, 52.0, 29.0, 29.0, 15.0, 13.0, 2.0, 4.0, 7.0, 3.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.421875, -2.348602294921875, -2.27532958984375, -2.202056884765625, -2.1287841796875, -2.055511474609375, -1.98223876953125, -1.908966064453125, -1.835693359375, -1.762420654296875, -1.68914794921875, -1.615875244140625, -1.5426025390625, -1.469329833984375, -1.39605712890625, -1.322784423828125, -1.24951171875, -1.176239013671875, -1.10296630859375, -1.029693603515625, -0.9564208984375, -0.883148193359375, -0.80987548828125, -0.736602783203125, -0.663330078125, -0.590057373046875, -0.51678466796875, -0.443511962890625, -0.3702392578125, -0.296966552734375, -0.22369384765625, -0.150421142578125, -0.0771484375, -0.003875732421875, 0.06939697265625, 0.142669677734375, 0.2159423828125, 0.289215087890625, 0.36248779296875, 0.435760498046875, 0.509033203125, 0.582305908203125, 0.65557861328125, 0.728851318359375, 0.8021240234375, 0.875396728515625, 0.94866943359375, 1.021942138671875, 1.09521484375, 1.168487548828125, 1.24176025390625, 1.315032958984375, 1.3883056640625, 1.461578369140625, 1.53485107421875, 1.608123779296875, 1.681396484375, 1.754669189453125, 1.82794189453125, 1.901214599609375, 1.9744873046875, 2.047760009765625, 2.12103271484375, 2.194305419921875, 2.267578125]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 3.0, 6.0, 5.0, 9.0, 12.0, 14.0, 20.0, 19.0, 26.0, 33.0, 42.0, 50.0, 46.0, 47.0, 77.0, 65.0, 68.0, 61.0, 63.0, 57.0, 50.0, 39.0, 48.0, 34.0, 35.0, 25.0, 11.0, 12.0, 8.0, 9.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.58203125, -4.459869384765625, -4.33770751953125, -4.215545654296875, -4.0933837890625, -3.971221923828125, -3.84906005859375, -3.726898193359375, -3.604736328125, -3.482574462890625, -3.36041259765625, -3.238250732421875, -3.1160888671875, -2.993927001953125, -2.87176513671875, -2.749603271484375, -2.62744140625, -2.505279541015625, -2.38311767578125, -2.260955810546875, -2.1387939453125, -2.016632080078125, -1.89447021484375, -1.772308349609375, -1.650146484375, -1.527984619140625, -1.40582275390625, -1.283660888671875, -1.1614990234375, -1.039337158203125, -0.91717529296875, -0.795013427734375, -0.6728515625, -0.550689697265625, -0.42852783203125, -0.306365966796875, -0.1842041015625, -0.062042236328125, 0.06011962890625, 0.182281494140625, 0.304443359375, 0.426605224609375, 0.54876708984375, 0.670928955078125, 0.7930908203125, 0.915252685546875, 1.03741455078125, 1.159576416015625, 1.28173828125, 1.403900146484375, 1.52606201171875, 1.648223876953125, 1.7703857421875, 1.892547607421875, 2.01470947265625, 2.136871337890625, 2.259033203125, 2.381195068359375, 2.50335693359375, 2.625518798828125, 2.7476806640625, 2.869842529296875, 2.99200439453125, 3.114166259765625, 3.236328125]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 2.0, 5.0, 9.0, 4.0, 12.0, 14.0, 13.0, 14.0, 14.0, 23.0, 44.0, 63.0, 93.0, 123.0, 164.0, 326.0, 807.0, 3038.0, 26922.0, 565489.0, 426447.0, 20696.0, 2674.0, 709.0, 299.0, 171.0, 107.0, 87.0, 50.0, 40.0, 23.0, 19.0, 17.0, 14.0, 3.0, 7.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.43359375, -4.3135986328125, -4.193603515625, -4.0736083984375, -3.95361328125, -3.8336181640625, -3.713623046875, -3.5936279296875, -3.4736328125, -3.3536376953125, -3.233642578125, -3.1136474609375, -2.99365234375, -2.8736572265625, -2.753662109375, -2.6336669921875, -2.513671875, -2.3936767578125, -2.273681640625, -2.1536865234375, -2.03369140625, -1.9136962890625, -1.793701171875, -1.6737060546875, -1.5537109375, -1.4337158203125, -1.313720703125, -1.1937255859375, -1.07373046875, -0.9537353515625, -0.833740234375, -0.7137451171875, -0.59375, -0.4737548828125, -0.353759765625, -0.2337646484375, -0.11376953125, 0.0062255859375, 0.126220703125, 0.2462158203125, 0.3662109375, 0.4862060546875, 0.606201171875, 0.7261962890625, 0.84619140625, 0.9661865234375, 1.086181640625, 1.2061767578125, 1.326171875, 1.4461669921875, 1.566162109375, 1.6861572265625, 1.80615234375, 1.9261474609375, 2.046142578125, 2.1661376953125, 2.2861328125, 2.4061279296875, 2.526123046875, 2.6461181640625, 2.76611328125, 2.8861083984375, 3.006103515625, 3.1260986328125, 3.24609375]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 4.0, 8.0, 6.0, 9.0, 20.0, 18.0, 17.0, 18.0, 25.0, 31.0, 31.0, 23.0, 37.0, 37.0, 35.0, 32.0, 51.0, 58.0, 49.0, 54.0, 59.0, 58.0, 40.0, 43.0, 36.0, 30.0, 29.0, 20.0, 27.0, 15.0, 15.0, 18.0, 10.0, 8.0, 13.0, 7.0, 6.0, 1.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0], "bins": [-4.6171875, -4.494049072265625, -4.37091064453125, -4.247772216796875, -4.1246337890625, -4.001495361328125, -3.87835693359375, -3.755218505859375, -3.632080078125, -3.508941650390625, -3.38580322265625, -3.262664794921875, -3.1395263671875, -3.016387939453125, -2.89324951171875, -2.770111083984375, -2.64697265625, -2.523834228515625, -2.40069580078125, -2.277557373046875, -2.1544189453125, -2.031280517578125, -1.90814208984375, -1.785003662109375, -1.661865234375, -1.538726806640625, -1.41558837890625, -1.292449951171875, -1.1693115234375, -1.046173095703125, -0.92303466796875, -0.799896240234375, -0.6767578125, -0.553619384765625, -0.43048095703125, -0.307342529296875, -0.1842041015625, -0.061065673828125, 0.06207275390625, 0.185211181640625, 0.308349609375, 0.431488037109375, 0.55462646484375, 0.677764892578125, 0.8009033203125, 0.924041748046875, 1.04718017578125, 1.170318603515625, 1.29345703125, 1.416595458984375, 1.53973388671875, 1.662872314453125, 1.7860107421875, 1.909149169921875, 2.03228759765625, 2.155426025390625, 2.278564453125, 2.401702880859375, 2.52484130859375, 2.647979736328125, 2.7711181640625, 2.894256591796875, 3.01739501953125, 3.140533447265625, 3.263671875]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 8.0, 3.0, 3.0, 15.0, 14.0, 33.0, 57.0, 146.0, 404.0, 1375.0, 7805.0, 635822.0, 394465.0, 6455.0, 1271.0, 403.0, 138.0, 61.0, 29.0, 15.0, 8.0, 8.0, 4.0, 2.0, 5.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.271484375, -3.17791748046875, -3.0843505859375, -2.99078369140625, -2.897216796875, -2.80364990234375, -2.7100830078125, -2.61651611328125, -2.52294921875, -2.42938232421875, -2.3358154296875, -2.24224853515625, -2.148681640625, -2.05511474609375, -1.9615478515625, -1.86798095703125, -1.7744140625, -1.68084716796875, -1.5872802734375, -1.49371337890625, -1.400146484375, -1.30657958984375, -1.2130126953125, -1.11944580078125, -1.02587890625, -0.93231201171875, -0.8387451171875, -0.74517822265625, -0.651611328125, -0.55804443359375, -0.4644775390625, -0.37091064453125, -0.27734375, -0.18377685546875, -0.0902099609375, 0.00335693359375, 0.096923828125, 0.19049072265625, 0.2840576171875, 0.37762451171875, 0.47119140625, 0.56475830078125, 0.6583251953125, 0.75189208984375, 0.845458984375, 0.93902587890625, 1.0325927734375, 1.12615966796875, 1.2197265625, 1.31329345703125, 1.4068603515625, 1.50042724609375, 1.593994140625, 1.68756103515625, 1.7811279296875, 1.87469482421875, 1.96826171875, 2.06182861328125, 2.1553955078125, 2.24896240234375, 2.342529296875, 2.43609619140625, 2.5296630859375, 2.62322998046875, 2.716796875]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 10.0, 18.0, 20.0, 56.0, 71.0, 167.0, 280.0, 149.0, 93.0, 54.0, 42.0, 16.0, 11.0, 3.0, 2.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003230571746826172, -0.0003124848008155823, -0.00030191242694854736, -0.00029134005308151245, -0.00028076767921447754, -0.0002701953053474426, -0.0002596229314804077, -0.0002490505576133728, -0.0002384781837463379, -0.00022790580987930298, -0.00021733343601226807, -0.00020676106214523315, -0.00019618868827819824, -0.00018561631441116333, -0.00017504394054412842, -0.0001644715666770935, -0.0001538991928100586, -0.00014332681894302368, -0.00013275444507598877, -0.00012218207120895386, -0.00011160969734191895, -0.00010103732347488403, -9.046494960784912e-05, -7.989257574081421e-05, -6.93202018737793e-05, -5.8747828006744385e-05, -4.817545413970947e-05, -3.760308027267456e-05, -2.703070640563965e-05, -1.6458332538604736e-05, -5.885958671569824e-06, 4.686415195465088e-06, 1.52587890625e-05, 2.5831162929534912e-05, 3.6403536796569824e-05, 4.6975910663604736e-05, 5.754828453063965e-05, 6.812065839767456e-05, 7.869303226470947e-05, 8.926540613174438e-05, 9.98377799987793e-05, 0.00011041015386581421, 0.00012098252773284912, 0.00013155490159988403, 0.00014212727546691895, 0.00015269964933395386, 0.00016327202320098877, 0.00017384439706802368, 0.0001844167709350586, 0.0001949891448020935, 0.00020556151866912842, 0.00021613389253616333, 0.00022670626640319824, 0.00023727864027023315, 0.00024785101413726807, 0.000258423388004303, 0.0002689957618713379, 0.0002795681357383728, 0.0002901405096054077, 0.0003007128834724426, 0.00031128525733947754, 0.00032185763120651245, 0.00033243000507354736, 0.0003430023789405823, 0.0003535747528076172]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 4.0, 3.0, 2.0, 7.0, 10.0, 15.0, 23.0, 46.0, 84.0, 166.0, 392.0, 1205.0, 5199.0, 100486.0, 909863.0, 26641.0, 3013.0, 737.0, 291.0, 153.0, 81.0, 40.0, 26.0, 23.0, 15.0, 9.0, 3.0, 5.0, 4.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9443359375, -1.8644256591796875, -1.784515380859375, -1.7046051025390625, -1.62469482421875, -1.5447845458984375, -1.464874267578125, -1.3849639892578125, -1.3050537109375, -1.2251434326171875, -1.145233154296875, -1.0653228759765625, -0.98541259765625, -0.9055023193359375, -0.825592041015625, -0.7456817626953125, -0.665771484375, -0.5858612060546875, -0.505950927734375, -0.4260406494140625, -0.34613037109375, -0.2662200927734375, -0.186309814453125, -0.1063995361328125, -0.0264892578125, 0.0534210205078125, 0.133331298828125, 0.2132415771484375, 0.29315185546875, 0.3730621337890625, 0.452972412109375, 0.5328826904296875, 0.61279296875, 0.6927032470703125, 0.772613525390625, 0.8525238037109375, 0.93243408203125, 1.0123443603515625, 1.092254638671875, 1.1721649169921875, 1.2520751953125, 1.3319854736328125, 1.411895751953125, 1.4918060302734375, 1.57171630859375, 1.6516265869140625, 1.731536865234375, 1.8114471435546875, 1.891357421875, 1.9712677001953125, 2.051177978515625, 2.1310882568359375, 2.21099853515625, 2.2909088134765625, 2.370819091796875, 2.4507293701171875, 2.5306396484375, 2.6105499267578125, 2.690460205078125, 2.7703704833984375, 2.85028076171875, 2.9301910400390625, 3.010101318359375, 3.0900115966796875, 3.169921875]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 3.0, 1.0, 5.0, 6.0, 7.0, 8.0, 14.0, 13.0, 28.0, 28.0, 41.0, 65.0, 102.0, 207.0, 182.0, 86.0, 58.0, 48.0, 33.0, 18.0, 18.0, 12.0, 10.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.76171875, -0.7416152954101562, -0.7215118408203125, -0.7014083862304688, -0.681304931640625, -0.6612014770507812, -0.6410980224609375, -0.6209945678710938, -0.60089111328125, -0.5807876586914062, -0.5606842041015625, -0.5405807495117188, -0.520477294921875, -0.5003738403320312, -0.4802703857421875, -0.46016693115234375, -0.4400634765625, -0.41996002197265625, -0.3998565673828125, -0.37975311279296875, -0.359649658203125, -0.33954620361328125, -0.3194427490234375, -0.29933929443359375, -0.27923583984375, -0.25913238525390625, -0.2390289306640625, -0.21892547607421875, -0.198822021484375, -0.17871856689453125, -0.1586151123046875, -0.13851165771484375, -0.118408203125, -0.09830474853515625, -0.0782012939453125, -0.05809783935546875, -0.037994384765625, -0.01789093017578125, 0.0022125244140625, 0.02231597900390625, 0.04241943359375, 0.06252288818359375, 0.0826263427734375, 0.10272979736328125, 0.122833251953125, 0.14293670654296875, 0.1630401611328125, 0.18314361572265625, 0.2032470703125, 0.22335052490234375, 0.2434539794921875, 0.26355743408203125, 0.283660888671875, 0.30376434326171875, 0.3238677978515625, 0.34397125244140625, 0.36407470703125, 0.38417816162109375, 0.4042816162109375, 0.42438507080078125, 0.444488525390625, 0.46459197998046875, 0.4846954345703125, 0.5047988891601562, 0.52490234375]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 13.0, 11.0, 24.0, 57.0, 128.0, 188.0, 216.0, 176.0, 109.0, 36.0, 23.0, 9.0, 10.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.872335910797119, -4.554630279541016, -4.236924171447754, -3.9192185401916504, -3.6015124320983887, -3.283806800842285, -2.9661009311676025, -2.64839506149292, -2.3306891918182373, -2.0129833221435547, -1.695277452468872, -1.377571702003479, -1.0598658323287964, -0.7421599626541138, -0.4244542121887207, -0.10674834251403809, 0.21095752716064453, 0.5286633968353271, 0.846369206905365, 1.1640750169754028, 1.4817808866500854, 1.799486756324768, 2.117192506790161, 2.4348983764648438, 2.7526042461395264, 3.070310115814209, 3.3880159854888916, 3.705721855163574, 4.023427486419678, 4.3411335945129395, 4.658839225769043, 4.976545333862305, 5.294251441955566, 5.61195707321167, 5.929663181304932, 6.247368812561035, 6.565074920654297, 6.8827805519104, 7.200486183166504, 7.518192291259766, 7.835898399353027, 8.153604507446289, 8.471309661865234, 8.789015769958496, 9.106721878051758, 9.42442798614502, 9.742133140563965, 10.059839248657227, 10.377544403076172, 10.695250511169434, 11.012955665588379, 11.33066177368164, 11.648367881774902, 11.966073989868164, 12.28377914428711, 12.601485252380371, 12.919191360473633, 13.236897468566895, 13.55460262298584, 13.872308731079102, 14.190014839172363, 14.507720947265625, 14.82542610168457, 15.143132209777832, 15.460838317871094]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 4.0, 7.0, 2.0, 7.0, 4.0, 6.0, 8.0, 9.0, 10.0, 14.0, 9.0, 22.0, 14.0, 25.0, 22.0, 23.0, 22.0, 22.0, 17.0, 24.0, 40.0, 28.0, 19.0, 31.0, 44.0, 34.0, 38.0, 42.0, 27.0, 28.0, 42.0, 24.0, 28.0, 42.0, 34.0, 29.0, 32.0, 32.0, 17.0, 23.0, 14.0, 16.0, 18.0, 14.0, 9.0, 9.0, 8.0, 6.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.496866226196289, -4.350981712341309, -4.20509672164917, -4.0592122077941895, -3.91332745552063, -3.7674427032470703, -3.62155818939209, -3.4756734371185303, -3.3297886848449707, -3.183903932571411, -3.0380194187164307, -2.892134666442871, -2.7462499141693115, -2.600365161895752, -2.4544806480407715, -2.308595895767212, -2.1627113819122314, -2.016826629638672, -1.8709419965744019, -1.7250573635101318, -1.5791726112365723, -1.4332879781723022, -1.2874033451080322, -1.1415185928344727, -0.9956339597702026, -0.8497492671012878, -0.703864574432373, -0.557979941368103, -0.41209524869918823, -0.26621055603027344, -0.12032592296600342, 0.025558829307556152, 0.17144346237182617, 0.31732815504074097, 0.4632128179073334, 0.6090974807739258, 0.7549821734428406, 0.9008668661117554, 1.0467514991760254, 1.192636251449585, 1.338520884513855, 1.484405517578125, 1.6302902698516846, 1.7761749029159546, 1.9220595359802246, 2.067944288253784, 2.2138290405273438, 2.359713554382324, 2.505598306655884, 2.6514830589294434, 2.797367572784424, 2.9432523250579834, 3.089137077331543, 3.2350215911865234, 3.380906343460083, 3.5267910957336426, 3.672675609588623, 3.8185603618621826, 3.964444875717163, 4.110329627990723, 4.256214141845703, 4.402099132537842, 4.547983646392822, 4.693868637084961, 4.839753150939941]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 7.0, 3.0, 8.0, 16.0, 19.0, 27.0, 59.0, 111.0, 258.0, 701.0, 2645.0, 54604.0, 3888712.0, 241818.0, 4208.0, 642.0, 220.0, 89.0, 53.0, 21.0, 23.0, 16.0, 10.0, 7.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.6484375, -7.3717041015625, -7.094970703125, -6.8182373046875, -6.54150390625, -6.2647705078125, -5.988037109375, -5.7113037109375, -5.4345703125, -5.1578369140625, -4.881103515625, -4.6043701171875, -4.32763671875, -4.0509033203125, -3.774169921875, -3.4974365234375, -3.220703125, -2.9439697265625, -2.667236328125, -2.3905029296875, -2.11376953125, -1.8370361328125, -1.560302734375, -1.2835693359375, -1.0068359375, -0.7301025390625, -0.453369140625, -0.1766357421875, 0.10009765625, 0.3768310546875, 0.653564453125, 0.9302978515625, 1.20703125, 1.4837646484375, 1.760498046875, 2.0372314453125, 2.31396484375, 2.5906982421875, 2.867431640625, 3.1441650390625, 3.4208984375, 3.6976318359375, 3.974365234375, 4.2510986328125, 4.52783203125, 4.8045654296875, 5.081298828125, 5.3580322265625, 5.634765625, 5.9114990234375, 6.188232421875, 6.4649658203125, 6.74169921875, 7.0184326171875, 7.295166015625, 7.5718994140625, 7.8486328125, 8.1253662109375, 8.402099609375, 8.6788330078125, 8.95556640625, 9.2322998046875, 9.509033203125, 9.7857666015625, 10.0625]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 2.0, 0.0, 4.0, 5.0, 10.0, 11.0, 16.0, 20.0, 16.0, 20.0, 22.0, 31.0, 41.0, 46.0, 43.0, 56.0, 44.0, 48.0, 58.0, 73.0, 51.0, 55.0, 60.0, 36.0, 43.0, 34.0, 28.0, 28.0, 25.0, 17.0, 18.0, 7.0, 7.0, 10.0, 6.0, 3.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.01953125, -1.951568603515625, -1.88360595703125, -1.815643310546875, -1.7476806640625, -1.679718017578125, -1.61175537109375, -1.543792724609375, -1.475830078125, -1.407867431640625, -1.33990478515625, -1.271942138671875, -1.2039794921875, -1.136016845703125, -1.06805419921875, -1.000091552734375, -0.93212890625, -0.864166259765625, -0.79620361328125, -0.728240966796875, -0.6602783203125, -0.592315673828125, -0.52435302734375, -0.456390380859375, -0.388427734375, -0.320465087890625, -0.25250244140625, -0.184539794921875, -0.1165771484375, -0.048614501953125, 0.01934814453125, 0.087310791015625, 0.1552734375, 0.223236083984375, 0.29119873046875, 0.359161376953125, 0.4271240234375, 0.495086669921875, 0.56304931640625, 0.631011962890625, 0.698974609375, 0.766937255859375, 0.83489990234375, 0.902862548828125, 0.9708251953125, 1.038787841796875, 1.10675048828125, 1.174713134765625, 1.24267578125, 1.310638427734375, 1.37860107421875, 1.446563720703125, 1.5145263671875, 1.582489013671875, 1.65045166015625, 1.718414306640625, 1.786376953125, 1.854339599609375, 1.92230224609375, 1.990264892578125, 2.0582275390625, 2.126190185546875, 2.19415283203125, 2.262115478515625, 2.330078125]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 6.0, 1.0, 2.0, 3.0, 5.0, 9.0, 10.0, 11.0, 18.0, 20.0, 30.0, 53.0, 75.0, 145.0, 279.0, 614.0, 1696.0, 6577.0, 60058.0, 3408273.0, 691211.0, 19806.0, 3469.0, 1018.0, 429.0, 195.0, 106.0, 54.0, 39.0, 19.0, 19.0, 15.0, 7.0, 8.0, 1.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4765625, -5.3043212890625, -5.132080078125, -4.9598388671875, -4.78759765625, -4.6153564453125, -4.443115234375, -4.2708740234375, -4.0986328125, -3.9263916015625, -3.754150390625, -3.5819091796875, -3.40966796875, -3.2374267578125, -3.065185546875, -2.8929443359375, -2.720703125, -2.5484619140625, -2.376220703125, -2.2039794921875, -2.03173828125, -1.8594970703125, -1.687255859375, -1.5150146484375, -1.3427734375, -1.1705322265625, -0.998291015625, -0.8260498046875, -0.65380859375, -0.4815673828125, -0.309326171875, -0.1370849609375, 0.03515625, 0.2073974609375, 0.379638671875, 0.5518798828125, 0.72412109375, 0.8963623046875, 1.068603515625, 1.2408447265625, 1.4130859375, 1.5853271484375, 1.757568359375, 1.9298095703125, 2.10205078125, 2.2742919921875, 2.446533203125, 2.6187744140625, 2.791015625, 2.9632568359375, 3.135498046875, 3.3077392578125, 3.47998046875, 3.6522216796875, 3.824462890625, 3.9967041015625, 4.1689453125, 4.3411865234375, 4.513427734375, 4.6856689453125, 4.85791015625, 5.0301513671875, 5.202392578125, 5.3746337890625, 5.546875]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 3.0, 2.0, 4.0, 6.0, 8.0, 24.0, 23.0, 58.0, 70.0, 110.0, 176.0, 257.0, 475.0, 675.0, 710.0, 520.0, 359.0, 217.0, 134.0, 88.0, 48.0, 36.0, 25.0, 12.0, 15.0, 5.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9892578125, -0.9541778564453125, -0.919097900390625, -0.8840179443359375, -0.84893798828125, -0.8138580322265625, -0.778778076171875, -0.7436981201171875, -0.7086181640625, -0.6735382080078125, -0.638458251953125, -0.6033782958984375, -0.56829833984375, -0.5332183837890625, -0.498138427734375, -0.4630584716796875, -0.427978515625, -0.3928985595703125, -0.357818603515625, -0.3227386474609375, -0.28765869140625, -0.2525787353515625, -0.217498779296875, -0.1824188232421875, -0.1473388671875, -0.1122589111328125, -0.077178955078125, -0.0420989990234375, -0.00701904296875, 0.0280609130859375, 0.063140869140625, 0.0982208251953125, 0.13330078125, 0.1683807373046875, 0.203460693359375, 0.2385406494140625, 0.27362060546875, 0.3087005615234375, 0.343780517578125, 0.3788604736328125, 0.4139404296875, 0.4490203857421875, 0.484100341796875, 0.5191802978515625, 0.55426025390625, 0.5893402099609375, 0.624420166015625, 0.6595001220703125, 0.694580078125, 0.7296600341796875, 0.764739990234375, 0.7998199462890625, 0.83489990234375, 0.8699798583984375, 0.905059814453125, 0.9401397705078125, 0.9752197265625, 1.0102996826171875, 1.045379638671875, 1.0804595947265625, 1.11553955078125, 1.1506195068359375, 1.185699462890625, 1.2207794189453125, 1.255859375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 7.0, 12.0, 12.0, 38.0, 63.0, 116.0, 147.0, 152.0, 171.0, 119.0, 95.0, 35.0, 19.0, 13.0, 6.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.59725284576416, -7.3842339515686035, -7.171214580535889, -6.958195686340332, -6.745176792144775, -6.532157897949219, -6.319138526916504, -6.106119632720947, -5.893100738525391, -5.680081844329834, -5.467062473297119, -5.2540435791015625, -5.041024684906006, -4.828005790710449, -4.614986419677734, -4.401967525482178, -4.188948154449463, -3.975929021835327, -3.7629101276397705, -3.5498909950256348, -3.336872100830078, -3.1238529682159424, -2.9108338356018066, -2.69781494140625, -2.4847958087921143, -2.2717766761779785, -2.058757781982422, -1.8457386493682861, -1.63271963596344, -1.4197006225585938, -1.206681489944458, -0.9936624765396118, -0.7806439399719238, -0.5676249265670776, -0.35460585355758667, -0.1415867805480957, 0.07143223285675049, 0.2844512462615967, 0.4974703788757324, 0.7104893922805786, 0.9235084056854248, 1.136527419090271, 1.3495464324951172, 1.562565565109253, 1.7755845785140991, 1.9886035919189453, 2.201622724533081, 2.414641857147217, 2.6276607513427734, 2.840679883956909, 3.053698778152466, 3.2667179107666016, 3.479736804962158, 3.692755937576294, 3.9057750701904297, 4.118793964385986, 4.331812858581543, 4.5448317527771, 4.7578511238098145, 4.970870018005371, 5.183888912200928, 5.396907806396484, 5.609927177429199, 5.822946071624756, 6.035965442657471]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 6.0, 6.0, 7.0, 9.0, 10.0, 12.0, 19.0, 15.0, 17.0, 17.0, 22.0, 26.0, 22.0, 42.0, 36.0, 45.0, 44.0, 48.0, 47.0, 44.0, 33.0, 46.0, 55.0, 59.0, 43.0, 42.0, 26.0, 31.0, 43.0, 22.0, 20.0, 20.0, 17.0, 14.0, 14.0, 11.0, 2.0, 6.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.1844964027404785, -2.1115779876708984, -2.0386595726013184, -1.9657411575317383, -1.8928228616714478, -1.8199044466018677, -1.7469860315322876, -1.674067735671997, -1.601149320602417, -1.528230905532837, -1.4553124904632568, -1.3823940753936768, -1.3094757795333862, -1.2365573644638062, -1.163638949394226, -1.0907206535339355, -1.017802119255066, -0.9448837041854858, -0.8719653487205505, -0.7990469336509705, -0.7261285781860352, -0.6532101631164551, -0.580291748046875, -0.5073733925819397, -0.4344549775123596, -0.36153659224510193, -0.28861820697784424, -0.21569979190826416, -0.14278140664100647, -0.06986302137374878, 0.003055393695831299, 0.0759737491607666, 0.14889216423034668, 0.22181054949760437, 0.29472893476486206, 0.36764734983444214, 0.44056573510169983, 0.5134841203689575, 0.5864025354385376, 0.6593208909034729, 0.732239305973053, 0.8051577210426331, 0.8780760765075684, 0.9509944915771484, 1.0239129066467285, 1.0968313217163086, 1.1697497367858887, 1.2426680326461792, 1.3155864477157593, 1.3885048627853394, 1.4614232778549194, 1.53434157371521, 1.60725998878479, 1.6801784038543701, 1.7530968189239502, 1.8260152339935303, 1.8989336490631104, 1.9718520641326904, 2.0447704792022705, 2.1176888942718506, 2.1906073093414307, 2.2635254859924316, 2.3364439010620117, 2.409362316131592, 2.482280731201172]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 5.0, 2.0, 5.0, 4.0, 4.0, 5.0, 17.0, 8.0, 17.0, 19.0, 29.0, 19.0, 45.0, 52.0, 66.0, 77.0, 149.0, 299.0, 618.0, 1695.0, 6270.0, 32495.0, 188357.0, 523129.0, 240724.0, 42842.0, 7954.0, 2017.0, 705.0, 349.0, 184.0, 97.0, 74.0, 49.0, 42.0, 30.0, 27.0, 18.0, 23.0, 10.0, 5.0, 10.0, 8.0, 1.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.7978515625, -0.7760391235351562, -0.7542266845703125, -0.7324142456054688, -0.710601806640625, -0.6887893676757812, -0.6669769287109375, -0.6451644897460938, -0.62335205078125, -0.6015396118164062, -0.5797271728515625, -0.5579147338867188, -0.536102294921875, -0.5142898559570312, -0.4924774169921875, -0.47066497802734375, -0.4488525390625, -0.42704010009765625, -0.4052276611328125, -0.38341522216796875, -0.361602783203125, -0.33979034423828125, -0.3179779052734375, -0.29616546630859375, -0.27435302734375, -0.25254058837890625, -0.2307281494140625, -0.20891571044921875, -0.187103271484375, -0.16529083251953125, -0.1434783935546875, -0.12166595458984375, -0.099853515625, -0.07804107666015625, -0.0562286376953125, -0.03441619873046875, -0.012603759765625, 0.00920867919921875, 0.0310211181640625, 0.05283355712890625, 0.07464599609375, 0.09645843505859375, 0.1182708740234375, 0.14008331298828125, 0.161895751953125, 0.18370819091796875, 0.2055206298828125, 0.22733306884765625, 0.2491455078125, 0.27095794677734375, 0.2927703857421875, 0.31458282470703125, 0.336395263671875, 0.35820770263671875, 0.3800201416015625, 0.40183258056640625, 0.42364501953125, 0.44545745849609375, 0.4672698974609375, 0.48908233642578125, 0.510894775390625, 0.5327072143554688, 0.5545196533203125, 0.5763320922851562, 0.59814453125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 7.0, 5.0, 11.0, 11.0, 18.0, 20.0, 34.0, 26.0, 39.0, 25.0, 60.0, 69.0, 63.0, 67.0, 65.0, 66.0, 72.0, 63.0, 66.0, 47.0, 49.0, 27.0, 22.0, 27.0, 18.0, 7.0, 9.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5947265625, -1.5268096923828125, -1.458892822265625, -1.3909759521484375, -1.32305908203125, -1.2551422119140625, -1.187225341796875, -1.1193084716796875, -1.0513916015625, -0.9834747314453125, -0.915557861328125, -0.8476409912109375, -0.77972412109375, -0.7118072509765625, -0.643890380859375, -0.5759735107421875, -0.508056640625, -0.4401397705078125, -0.372222900390625, -0.3043060302734375, -0.23638916015625, -0.1684722900390625, -0.100555419921875, -0.0326385498046875, 0.0352783203125, 0.1031951904296875, 0.171112060546875, 0.2390289306640625, 0.30694580078125, 0.3748626708984375, 0.442779541015625, 0.5106964111328125, 0.57861328125, 0.6465301513671875, 0.714447021484375, 0.7823638916015625, 0.85028076171875, 0.9181976318359375, 0.986114501953125, 1.0540313720703125, 1.1219482421875, 1.1898651123046875, 1.257781982421875, 1.3256988525390625, 1.39361572265625, 1.4615325927734375, 1.529449462890625, 1.5973663330078125, 1.665283203125, 1.7332000732421875, 1.801116943359375, 1.8690338134765625, 1.93695068359375, 2.0048675537109375, 2.072784423828125, 2.1407012939453125, 2.2086181640625, 2.2765350341796875, 2.344451904296875, 2.4123687744140625, 2.48028564453125, 2.5482025146484375, 2.616119384765625, 2.6840362548828125, 2.751953125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 3.0, 2.0, 9.0, 11.0, 12.0, 14.0, 26.0, 31.0, 48.0, 91.0, 161.0, 314.0, 565.0, 1134.0, 2336.0, 5127.0, 11168.0, 24393.0, 51781.0, 105090.0, 182666.0, 235330.0, 197296.0, 117918.0, 60015.0, 28227.0, 13111.0, 6053.0, 2758.0, 1358.0, 676.0, 335.0, 189.0, 104.0, 60.0, 48.0, 28.0, 21.0, 18.0, 10.0, 4.0, 3.0, 5.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.247314453125, -0.2394866943359375, -0.231658935546875, -0.2238311767578125, -0.21600341796875, -0.2081756591796875, -0.200347900390625, -0.1925201416015625, -0.1846923828125, -0.1768646240234375, -0.169036865234375, -0.1612091064453125, -0.15338134765625, -0.1455535888671875, -0.137725830078125, -0.1298980712890625, -0.1220703125, -0.1142425537109375, -0.106414794921875, -0.0985870361328125, -0.09075927734375, -0.0829315185546875, -0.075103759765625, -0.0672760009765625, -0.0594482421875, -0.0516204833984375, -0.043792724609375, -0.0359649658203125, -0.02813720703125, -0.0203094482421875, -0.012481689453125, -0.0046539306640625, 0.003173828125, 0.0110015869140625, 0.018829345703125, 0.0266571044921875, 0.03448486328125, 0.0423126220703125, 0.050140380859375, 0.0579681396484375, 0.0657958984375, 0.0736236572265625, 0.081451416015625, 0.0892791748046875, 0.09710693359375, 0.1049346923828125, 0.112762451171875, 0.1205902099609375, 0.12841796875, 0.1362457275390625, 0.144073486328125, 0.1519012451171875, 0.15972900390625, 0.1675567626953125, 0.175384521484375, 0.1832122802734375, 0.1910400390625, 0.1988677978515625, 0.206695556640625, 0.2145233154296875, 0.22235107421875, 0.2301788330078125, 0.238006591796875, 0.2458343505859375, 0.253662109375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 7.0, 9.0, 7.0, 4.0, 8.0, 7.0, 11.0, 17.0, 16.0, 25.0, 23.0, 30.0, 31.0, 37.0, 48.0, 48.0, 55.0, 45.0, 55.0, 49.0, 53.0, 54.0, 34.0, 50.0, 41.0, 39.0, 27.0, 32.0, 19.0, 21.0, 15.0, 16.0, 17.0, 11.0, 9.0, 6.0, 6.0, 7.0, 5.0, 4.0, 8.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.423828125, -2.331695556640625, -2.23956298828125, -2.147430419921875, -2.0552978515625, -1.963165283203125, -1.87103271484375, -1.778900146484375, -1.686767578125, -1.594635009765625, -1.50250244140625, -1.410369873046875, -1.3182373046875, -1.226104736328125, -1.13397216796875, -1.041839599609375, -0.94970703125, -0.857574462890625, -0.76544189453125, -0.673309326171875, -0.5811767578125, -0.489044189453125, -0.39691162109375, -0.304779052734375, -0.212646484375, -0.120513916015625, -0.02838134765625, 0.063751220703125, 0.1558837890625, 0.248016357421875, 0.34014892578125, 0.432281494140625, 0.5244140625, 0.616546630859375, 0.70867919921875, 0.800811767578125, 0.8929443359375, 0.985076904296875, 1.07720947265625, 1.169342041015625, 1.261474609375, 1.353607177734375, 1.44573974609375, 1.537872314453125, 1.6300048828125, 1.722137451171875, 1.81427001953125, 1.906402587890625, 1.99853515625, 2.090667724609375, 2.18280029296875, 2.274932861328125, 2.3670654296875, 2.459197998046875, 2.55133056640625, 2.643463134765625, 2.735595703125, 2.827728271484375, 2.91986083984375, 3.011993408203125, 3.1041259765625, 3.196258544921875, 3.28839111328125, 3.380523681640625, 3.47265625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 3.0, 6.0, 8.0, 9.0, 14.0, 21.0, 29.0, 60.0, 80.0, 138.0, 258.0, 478.0, 1022.0, 2388.0, 6116.0, 20297.0, 99339.0, 472576.0, 355560.0, 66514.0, 15114.0, 4743.0, 1851.0, 893.0, 414.0, 252.0, 143.0, 71.0, 51.0, 31.0, 29.0, 15.0, 10.0, 4.0, 8.0, 4.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.087158203125, -0.08403205871582031, -0.08090591430664062, -0.07777976989746094, -0.07465362548828125, -0.07152748107910156, -0.06840133666992188, -0.06527519226074219, -0.0621490478515625, -0.05902290344238281, -0.055896759033203125, -0.05277061462402344, -0.04964447021484375, -0.04651832580566406, -0.043392181396484375, -0.04026603698730469, -0.037139892578125, -0.03401374816894531, -0.030887603759765625, -0.027761459350585938, -0.02463531494140625, -0.021509170532226562, -0.018383026123046875, -0.015256881713867188, -0.0121307373046875, -0.009004592895507812, -0.005878448486328125, -0.0027523040771484375, 0.00037384033203125, 0.0034999847412109375, 0.006626129150390625, 0.009752273559570312, 0.01287841796875, 0.016004562377929688, 0.019130706787109375, 0.022256851196289062, 0.02538299560546875, 0.028509140014648438, 0.031635284423828125, 0.03476142883300781, 0.0378875732421875, 0.04101371765136719, 0.044139862060546875, 0.04726600646972656, 0.05039215087890625, 0.05351829528808594, 0.056644439697265625, 0.05977058410644531, 0.062896728515625, 0.06602287292480469, 0.06914901733398438, 0.07227516174316406, 0.07540130615234375, 0.07852745056152344, 0.08165359497070312, 0.08477973937988281, 0.0879058837890625, 0.09103202819824219, 0.09415817260742188, 0.09728431701660156, 0.10041046142578125, 0.10353660583496094, 0.10666275024414062, 0.10978889465332031, 0.1129150390625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 4.0, 3.0, 7.0, 22.0, 34.0, 41.0, 61.0, 51.0, 106.0, 106.0, 122.0, 129.0, 89.0, 68.0, 46.0, 44.0, 25.0, 11.0, 8.0, 14.0, 3.0, 6.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.61015510559082e-05, -6.422773003578186e-05, -6.235390901565552e-05, -6.0480087995529175e-05, -5.860626697540283e-05, -5.673244595527649e-05, -5.4858624935150146e-05, -5.2984803915023804e-05, -5.111098289489746e-05, -4.923716187477112e-05, -4.7363340854644775e-05, -4.548951983451843e-05, -4.361569881439209e-05, -4.174187779426575e-05, -3.9868056774139404e-05, -3.799423575401306e-05, -3.612041473388672e-05, -3.4246593713760376e-05, -3.237277269363403e-05, -3.049895167350769e-05, -2.8625130653381348e-05, -2.6751309633255005e-05, -2.4877488613128662e-05, -2.300366759300232e-05, -2.1129846572875977e-05, -1.9256025552749634e-05, -1.738220453262329e-05, -1.5508383512496948e-05, -1.3634562492370605e-05, -1.1760741472244263e-05, -9.88692045211792e-06, -8.013099431991577e-06, -6.139278411865234e-06, -4.265457391738892e-06, -2.391636371612549e-06, -5.178153514862061e-07, 1.3560056686401367e-06, 3.2298266887664795e-06, 5.103647708892822e-06, 6.977468729019165e-06, 8.851289749145508e-06, 1.072511076927185e-05, 1.2598931789398193e-05, 1.4472752809524536e-05, 1.634657382965088e-05, 1.822039484977722e-05, 2.0094215869903564e-05, 2.1968036890029907e-05, 2.384185791015625e-05, 2.5715678930282593e-05, 2.7589499950408936e-05, 2.946332097053528e-05, 3.133714199066162e-05, 3.3210963010787964e-05, 3.508478403091431e-05, 3.695860505104065e-05, 3.883242607116699e-05, 4.0706247091293335e-05, 4.258006811141968e-05, 4.445388913154602e-05, 4.632771015167236e-05, 4.8201531171798706e-05, 5.007535219192505e-05, 5.194917321205139e-05, 5.3822994232177734e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 6.0, 8.0, 7.0, 14.0, 12.0, 14.0, 36.0, 43.0, 70.0, 115.0, 189.0, 348.0, 661.0, 1298.0, 2875.0, 6995.0, 19104.0, 61791.0, 235982.0, 471297.0, 175271.0, 46766.0, 15293.0, 5560.0, 2341.0, 1140.0, 563.0, 311.0, 135.0, 92.0, 66.0, 44.0, 31.0, 23.0, 17.0, 11.0, 7.0, 8.0, 3.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09100341796875, -0.088104248046875, -0.085205078125, -0.082305908203125, -0.07940673828125, -0.076507568359375, -0.0736083984375, -0.070709228515625, -0.06781005859375, -0.064910888671875, -0.06201171875, -0.059112548828125, -0.05621337890625, -0.053314208984375, -0.0504150390625, -0.047515869140625, -0.04461669921875, -0.041717529296875, -0.038818359375, -0.035919189453125, -0.03302001953125, -0.030120849609375, -0.0272216796875, -0.024322509765625, -0.02142333984375, -0.018524169921875, -0.015625, -0.012725830078125, -0.00982666015625, -0.006927490234375, -0.0040283203125, -0.001129150390625, 0.00177001953125, 0.004669189453125, 0.007568359375, 0.010467529296875, 0.01336669921875, 0.016265869140625, 0.0191650390625, 0.022064208984375, 0.02496337890625, 0.027862548828125, 0.03076171875, 0.033660888671875, 0.03656005859375, 0.039459228515625, 0.0423583984375, 0.045257568359375, 0.04815673828125, 0.051055908203125, 0.053955078125, 0.056854248046875, 0.05975341796875, 0.062652587890625, 0.0655517578125, 0.068450927734375, 0.07135009765625, 0.074249267578125, 0.0771484375, 0.080047607421875, 0.08294677734375, 0.085845947265625, 0.0887451171875, 0.091644287109375, 0.09454345703125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 7.0, 5.0, 0.0, 1.0, 11.0, 9.0, 9.0, 16.0, 23.0, 36.0, 40.0, 45.0, 67.0, 94.0, 87.0, 78.0, 94.0, 80.0, 72.0, 53.0, 50.0, 32.0, 21.0, 22.0, 8.0, 13.0, 8.0, 4.0, 2.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.024688720703125, -0.023790359497070312, -0.022891998291015625, -0.021993637084960938, -0.02109527587890625, -0.020196914672851562, -0.019298553466796875, -0.018400192260742188, -0.0175018310546875, -0.016603469848632812, -0.015705108642578125, -0.014806747436523438, -0.01390838623046875, -0.013010025024414062, -0.012111663818359375, -0.011213302612304688, -0.01031494140625, -0.009416580200195312, -0.008518218994140625, -0.0076198577880859375, -0.00672149658203125, -0.0058231353759765625, -0.004924774169921875, -0.0040264129638671875, -0.0031280517578125, -0.0022296905517578125, -0.001331329345703125, -0.0004329681396484375, 0.00046539306640625, 0.0013637542724609375, 0.002262115478515625, 0.0031604766845703125, 0.004058837890625, 0.0049571990966796875, 0.005855560302734375, 0.0067539215087890625, 0.00765228271484375, 0.008550643920898438, 0.009449005126953125, 0.010347366333007812, 0.0112457275390625, 0.012144088745117188, 0.013042449951171875, 0.013940811157226562, 0.01483917236328125, 0.015737533569335938, 0.016635894775390625, 0.017534255981445312, 0.0184326171875, 0.019330978393554688, 0.020229339599609375, 0.021127700805664062, 0.02202606201171875, 0.022924423217773438, 0.023822784423828125, 0.024721145629882812, 0.0256195068359375, 0.026517868041992188, 0.027416229248046875, 0.028314590454101562, 0.02921295166015625, 0.030111312866210938, 0.031009674072265625, 0.03190803527832031, 0.032806396484375]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 4.0, 11.0, 28.0, 50.0, 96.0, 138.0, 168.0, 169.0, 149.0, 96.0, 43.0, 26.0, 12.0, 4.0, 4.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-4.926216125488281, -4.799779891967773, -4.673343658447266, -4.546907424926758, -4.42047119140625, -4.294034957885742, -4.167598724365234, -4.041162967681885, -3.914726734161377, -3.788290500640869, -3.6618542671203613, -3.5354180335998535, -3.408982038497925, -3.282545804977417, -3.156109571456909, -3.0296733379364014, -2.9032371044158936, -2.7768008708953857, -2.650364637374878, -2.523928642272949, -2.3974924087524414, -2.2710561752319336, -2.144619941711426, -2.018183708190918, -1.8917475938796997, -1.765311360359192, -1.6388752460479736, -1.5124390125274658, -1.386002779006958, -1.2595666646957397, -1.133130431175232, -1.0066943168640137, -0.8802578449249268, -0.7538216710090637, -0.6273854970932007, -0.5009492635726929, -0.37451308965682983, -0.2480769157409668, -0.12164068222045898, 0.004795491695404053, 0.1312316656112671, 0.2576678395271301, 0.38410404324531555, 0.510540246963501, 0.636976420879364, 0.763412594795227, 0.8898488283157349, 1.0162849426269531, 1.142721176147461, 1.2691574096679688, 1.395593523979187, 1.5220297574996948, 1.648465871810913, 1.774902105331421, 1.9013383388519287, 2.0277745723724365, 2.1542105674743652, 2.280646800994873, 2.407083034515381, 2.5335192680358887, 2.6599552631378174, 2.786391496658325, 2.912827730178833, 3.039263963699341, 3.1657001972198486]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 5.0, 6.0, 9.0, 12.0, 18.0, 22.0, 25.0, 34.0, 23.0, 47.0, 44.0, 60.0, 68.0, 84.0, 51.0, 61.0, 88.0, 65.0, 58.0, 43.0, 54.0, 33.0, 25.0, 27.0, 17.0, 13.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6342898607254028, -1.5679179430007935, -1.5015461444854736, -1.4351742267608643, -1.3688024282455444, -1.302430510520935, -1.2360587120056152, -1.1696867942810059, -1.1033148765563965, -1.036942958831787, -0.9705711603164673, -0.9041992425918579, -0.8378274440765381, -0.7714555263519287, -0.7050836682319641, -0.6387118101119995, -0.5723400115966797, -0.5059681534767151, -0.4395962953567505, -0.3732244074344635, -0.3068525493144989, -0.2404806911945343, -0.17410880327224731, -0.10773694515228271, -0.041365087032318115, 0.02500677853822708, 0.09137864410877228, 0.15775051712989807, 0.22412237524986267, 0.29049423336982727, 0.35686612129211426, 0.42323797941207886, 0.489609956741333, 0.5559818148612976, 0.6223536729812622, 0.6887255907058716, 0.7550973892211914, 0.8214693069458008, 0.8878411650657654, 0.95421302318573, 1.0205848217010498, 1.0869567394256592, 1.153328537940979, 1.2197004556655884, 1.2860722541809082, 1.3524441719055176, 1.418816089630127, 1.4851878881454468, 1.5515598058700562, 1.6179317235946655, 1.6843035221099854, 1.7506754398345947, 1.8170472383499146, 1.883419156074524, 1.9497909545898438, 2.016162872314453, 2.0825347900390625, 2.148906707763672, 2.2152786254882812, 2.2816503047943115, 2.348022222518921, 2.4143941402435303, 2.4807660579681396, 2.54713773727417, 2.6135096549987793]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 3.0, 3.0, 4.0, 9.0, 8.0, 13.0, 9.0, 16.0, 17.0, 20.0, 37.0, 66.0, 138.0, 289.0, 754.0, 2467.0, 11251.0, 75725.0, 753319.0, 177218.0, 21055.0, 4221.0, 1104.0, 380.0, 174.0, 85.0, 52.0, 33.0, 19.0, 14.0, 13.0, 9.0, 4.0, 6.0, 2.0, 4.0, 4.0, 3.0, 5.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.626953125, -2.53204345703125, -2.4371337890625, -2.34222412109375, -2.247314453125, -2.15240478515625, -2.0574951171875, -1.96258544921875, -1.86767578125, -1.77276611328125, -1.6778564453125, -1.58294677734375, -1.488037109375, -1.39312744140625, -1.2982177734375, -1.20330810546875, -1.1083984375, -1.01348876953125, -0.9185791015625, -0.82366943359375, -0.728759765625, -0.63385009765625, -0.5389404296875, -0.44403076171875, -0.34912109375, -0.25421142578125, -0.1593017578125, -0.06439208984375, 0.030517578125, 0.12542724609375, 0.2203369140625, 0.31524658203125, 0.41015625, 0.50506591796875, 0.5999755859375, 0.69488525390625, 0.789794921875, 0.88470458984375, 0.9796142578125, 1.07452392578125, 1.16943359375, 1.26434326171875, 1.3592529296875, 1.45416259765625, 1.549072265625, 1.64398193359375, 1.7388916015625, 1.83380126953125, 1.9287109375, 2.02362060546875, 2.1185302734375, 2.21343994140625, 2.308349609375, 2.40325927734375, 2.4981689453125, 2.59307861328125, 2.68798828125, 2.78289794921875, 2.8778076171875, 2.97271728515625, 3.067626953125, 3.16253662109375, 3.2574462890625, 3.35235595703125, 3.447265625]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 5.0, 6.0, 6.0, 7.0, 12.0, 21.0, 9.0, 19.0, 11.0, 19.0, 24.0, 35.0, 37.0, 39.0, 61.0, 62.0, 58.0, 55.0, 50.0, 53.0, 52.0, 47.0, 66.0, 42.0, 31.0, 42.0, 31.0, 16.0, 27.0, 12.0, 9.0, 10.0, 10.0, 12.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.208984375, -3.10614013671875, -3.0032958984375, -2.90045166015625, -2.797607421875, -2.69476318359375, -2.5919189453125, -2.48907470703125, -2.38623046875, -2.28338623046875, -2.1805419921875, -2.07769775390625, -1.974853515625, -1.87200927734375, -1.7691650390625, -1.66632080078125, -1.5634765625, -1.46063232421875, -1.3577880859375, -1.25494384765625, -1.152099609375, -1.04925537109375, -0.9464111328125, -0.84356689453125, -0.74072265625, -0.63787841796875, -0.5350341796875, -0.43218994140625, -0.329345703125, -0.22650146484375, -0.1236572265625, -0.02081298828125, 0.08203125, 0.18487548828125, 0.2877197265625, 0.39056396484375, 0.493408203125, 0.59625244140625, 0.6990966796875, 0.80194091796875, 0.90478515625, 1.00762939453125, 1.1104736328125, 1.21331787109375, 1.316162109375, 1.41900634765625, 1.5218505859375, 1.62469482421875, 1.7275390625, 1.83038330078125, 1.9332275390625, 2.03607177734375, 2.138916015625, 2.24176025390625, 2.3446044921875, 2.44744873046875, 2.55029296875, 2.65313720703125, 2.7559814453125, 2.85882568359375, 2.961669921875, 3.06451416015625, 3.1673583984375, 3.27020263671875, 3.373046875]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 3.0, 6.0, 12.0, 7.0, 11.0, 7.0, 7.0, 16.0, 21.0, 17.0, 26.0, 40.0, 53.0, 79.0, 117.0, 157.0, 275.0, 528.0, 1571.0, 14271.0, 746907.0, 273691.0, 8304.0, 1215.0, 460.0, 237.0, 154.0, 106.0, 70.0, 42.0, 29.0, 25.0, 27.0, 19.0, 13.0, 8.0, 8.0, 6.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-5.80859375, -5.64678955078125, -5.4849853515625, -5.32318115234375, -5.161376953125, -4.99957275390625, -4.8377685546875, -4.67596435546875, -4.51416015625, -4.35235595703125, -4.1905517578125, -4.02874755859375, -3.866943359375, -3.70513916015625, -3.5433349609375, -3.38153076171875, -3.2197265625, -3.05792236328125, -2.8961181640625, -2.73431396484375, -2.572509765625, -2.41070556640625, -2.2489013671875, -2.08709716796875, -1.92529296875, -1.76348876953125, -1.6016845703125, -1.43988037109375, -1.278076171875, -1.11627197265625, -0.9544677734375, -0.79266357421875, -0.630859375, -0.46905517578125, -0.3072509765625, -0.14544677734375, 0.016357421875, 0.17816162109375, 0.3399658203125, 0.50177001953125, 0.66357421875, 0.82537841796875, 0.9871826171875, 1.14898681640625, 1.310791015625, 1.47259521484375, 1.6343994140625, 1.79620361328125, 1.9580078125, 2.11981201171875, 2.2816162109375, 2.44342041015625, 2.605224609375, 2.76702880859375, 2.9288330078125, 3.09063720703125, 3.25244140625, 3.41424560546875, 3.5760498046875, 3.73785400390625, 3.899658203125, 4.06146240234375, 4.2232666015625, 4.38507080078125, 4.546875]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 8.0, 8.0, 6.0, 9.0, 13.0, 12.0, 13.0, 16.0, 10.0, 17.0, 21.0, 29.0, 39.0, 22.0, 33.0, 39.0, 32.0, 42.0, 34.0, 42.0, 51.0, 50.0, 45.0, 45.0, 48.0, 38.0, 30.0, 37.0, 34.0, 34.0, 30.0, 25.0, 9.0, 14.0, 20.0, 9.0, 9.0, 7.0, 3.0, 3.0, 4.0, 7.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.193359375, -3.09051513671875, -2.9876708984375, -2.88482666015625, -2.781982421875, -2.67913818359375, -2.5762939453125, -2.47344970703125, -2.37060546875, -2.26776123046875, -2.1649169921875, -2.06207275390625, -1.959228515625, -1.85638427734375, -1.7535400390625, -1.65069580078125, -1.5478515625, -1.44500732421875, -1.3421630859375, -1.23931884765625, -1.136474609375, -1.03363037109375, -0.9307861328125, -0.82794189453125, -0.72509765625, -0.62225341796875, -0.5194091796875, -0.41656494140625, -0.313720703125, -0.21087646484375, -0.1080322265625, -0.00518798828125, 0.09765625, 0.20050048828125, 0.3033447265625, 0.40618896484375, 0.509033203125, 0.61187744140625, 0.7147216796875, 0.81756591796875, 0.92041015625, 1.02325439453125, 1.1260986328125, 1.22894287109375, 1.331787109375, 1.43463134765625, 1.5374755859375, 1.64031982421875, 1.7431640625, 1.84600830078125, 1.9488525390625, 2.05169677734375, 2.154541015625, 2.25738525390625, 2.3602294921875, 2.46307373046875, 2.56591796875, 2.66876220703125, 2.7716064453125, 2.87445068359375, 2.977294921875, 3.08013916015625, 3.1829833984375, 3.28582763671875, 3.388671875]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 4.0, 3.0, 2.0, 9.0, 8.0, 14.0, 31.0, 94.0, 153.0, 376.0, 939.0, 5135.0, 229030.0, 802089.0, 8544.0, 1331.0, 444.0, 190.0, 77.0, 44.0, 19.0, 7.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.60546875, -3.5198211669921875, -3.434173583984375, -3.3485260009765625, -3.26287841796875, -3.1772308349609375, -3.091583251953125, -3.0059356689453125, -2.9202880859375, -2.8346405029296875, -2.748992919921875, -2.6633453369140625, -2.57769775390625, -2.4920501708984375, -2.406402587890625, -2.3207550048828125, -2.235107421875, -2.1494598388671875, -2.063812255859375, -1.9781646728515625, -1.89251708984375, -1.8068695068359375, -1.721221923828125, -1.6355743408203125, -1.5499267578125, -1.4642791748046875, -1.378631591796875, -1.2929840087890625, -1.20733642578125, -1.1216888427734375, -1.036041259765625, -0.9503936767578125, -0.86474609375, -0.7790985107421875, -0.693450927734375, -0.6078033447265625, -0.52215576171875, -0.4365081787109375, -0.350860595703125, -0.2652130126953125, -0.1795654296875, -0.0939178466796875, -0.008270263671875, 0.0773773193359375, 0.16302490234375, 0.2486724853515625, 0.334320068359375, 0.4199676513671875, 0.505615234375, 0.5912628173828125, 0.676910400390625, 0.7625579833984375, 0.84820556640625, 0.9338531494140625, 1.019500732421875, 1.1051483154296875, 1.1907958984375, 1.2764434814453125, 1.362091064453125, 1.4477386474609375, 1.53338623046875, 1.6190338134765625, 1.704681396484375, 1.7903289794921875, 1.8759765625]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 4.0, 3.0, 4.0, 6.0, 11.0, 6.0, 6.0, 9.0, 21.0, 30.0, 32.0, 43.0, 71.0, 108.0, 336.0, 78.0, 62.0, 39.0, 29.0, 21.0, 19.0, 18.0, 14.0, 10.0, 12.0, 2.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00018215179443359375, -0.00017573684453964233, -0.00016932189464569092, -0.0001629069447517395, -0.00015649199485778809, -0.00015007704496383667, -0.00014366209506988525, -0.00013724714517593384, -0.00013083219528198242, -0.000124417245388031, -0.00011800229549407959, -0.00011158734560012817, -0.00010517239570617676, -9.875744581222534e-05, -9.234249591827393e-05, -8.592754602432251e-05, -7.95125961303711e-05, -7.309764623641968e-05, -6.668269634246826e-05, -6.0267746448516846e-05, -5.385279655456543e-05, -4.7437846660614014e-05, -4.10228967666626e-05, -3.460794687271118e-05, -2.8192996978759766e-05, -2.177804708480835e-05, -1.5363097190856934e-05, -8.948147296905518e-06, -2.5331974029541016e-06, 3.8817524909973145e-06, 1.029670238494873e-05, 1.6711652278900146e-05, 2.3126602172851562e-05, 2.954155206680298e-05, 3.5956501960754395e-05, 4.237145185470581e-05, 4.8786401748657227e-05, 5.520135164260864e-05, 6.161630153656006e-05, 6.803125143051147e-05, 7.444620132446289e-05, 8.08611512184143e-05, 8.727610111236572e-05, 9.369105100631714e-05, 0.00010010600090026855, 0.00010652095079421997, 0.00011293590068817139, 0.0001193508505821228, 0.00012576580047607422, 0.00013218075037002563, 0.00013859570026397705, 0.00014501065015792847, 0.00015142560005187988, 0.0001578405499458313, 0.00016425549983978271, 0.00017067044973373413, 0.00017708539962768555, 0.00018350034952163696, 0.00018991529941558838, 0.0001963302493095398, 0.0002027451992034912, 0.00020916014909744263, 0.00021557509899139404, 0.00022199004888534546, 0.00022840499877929688]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 8.0, 8.0, 14.0, 21.0, 32.0, 48.0, 59.0, 115.0, 174.0, 306.0, 590.0, 1442.0, 7977.0, 229998.0, 789379.0, 14984.0, 1829.0, 686.0, 342.0, 193.0, 122.0, 75.0, 49.0, 38.0, 20.0, 14.0, 7.0, 6.0, 2.0, 2.0, 6.0, 3.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9052734375, -1.8262786865234375, -1.747283935546875, -1.6682891845703125, -1.58929443359375, -1.5102996826171875, -1.431304931640625, -1.3523101806640625, -1.2733154296875, -1.1943206787109375, -1.115325927734375, -1.0363311767578125, -0.95733642578125, -0.8783416748046875, -0.799346923828125, -0.7203521728515625, -0.641357421875, -0.5623626708984375, -0.483367919921875, -0.4043731689453125, -0.32537841796875, -0.2463836669921875, -0.167388916015625, -0.0883941650390625, -0.0093994140625, 0.0695953369140625, 0.148590087890625, 0.2275848388671875, 0.30657958984375, 0.3855743408203125, 0.464569091796875, 0.5435638427734375, 0.62255859375, 0.7015533447265625, 0.780548095703125, 0.8595428466796875, 0.93853759765625, 1.0175323486328125, 1.096527099609375, 1.1755218505859375, 1.2545166015625, 1.3335113525390625, 1.412506103515625, 1.4915008544921875, 1.57049560546875, 1.6494903564453125, 1.728485107421875, 1.8074798583984375, 1.886474609375, 1.9654693603515625, 2.044464111328125, 2.1234588623046875, 2.20245361328125, 2.2814483642578125, 2.360443115234375, 2.4394378662109375, 2.5184326171875, 2.5974273681640625, 2.676422119140625, 2.7554168701171875, 2.83441162109375, 2.9134063720703125, 2.992401123046875, 3.0713958740234375, 3.150390625]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 6.0, 11.0, 11.0, 11.0, 26.0, 32.0, 40.0, 48.0, 60.0, 177.0, 262.0, 94.0, 54.0, 42.0, 31.0, 29.0, 19.0, 18.0, 10.0, 4.0, 5.0, 3.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.72216796875, -0.7050247192382812, -0.6878814697265625, -0.6707382202148438, -0.653594970703125, -0.6364517211914062, -0.6193084716796875, -0.6021652221679688, -0.58502197265625, -0.5678787231445312, -0.5507354736328125, -0.5335922241210938, -0.516448974609375, -0.49930572509765625, -0.4821624755859375, -0.46501922607421875, -0.4478759765625, -0.43073272705078125, -0.4135894775390625, -0.39644622802734375, -0.379302978515625, -0.36215972900390625, -0.3450164794921875, -0.32787322998046875, -0.31072998046875, -0.29358673095703125, -0.2764434814453125, -0.25930023193359375, -0.242156982421875, -0.22501373291015625, -0.2078704833984375, -0.19072723388671875, -0.173583984375, -0.15644073486328125, -0.1392974853515625, -0.12215423583984375, -0.105010986328125, -0.08786773681640625, -0.0707244873046875, -0.05358123779296875, -0.03643798828125, -0.01929473876953125, -0.0021514892578125, 0.01499176025390625, 0.032135009765625, 0.04927825927734375, 0.0664215087890625, 0.08356475830078125, 0.1007080078125, 0.11785125732421875, 0.1349945068359375, 0.15213775634765625, 0.169281005859375, 0.18642425537109375, 0.2035675048828125, 0.22071075439453125, 0.23785400390625, 0.25499725341796875, 0.2721405029296875, 0.28928375244140625, 0.306427001953125, 0.32357025146484375, 0.3407135009765625, 0.35785675048828125, 0.375]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 13.0, 23.0, 52.0, 97.0, 152.0, 205.0, 217.0, 122.0, 65.0, 36.0, 9.0, 7.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-14.607107162475586, -14.273211479187012, -13.939315795898438, -13.605419158935547, -13.271523475646973, -12.937627792358398, -12.603732109069824, -12.26983642578125, -11.935940742492676, -11.602045059204102, -11.268149375915527, -10.934253692626953, -10.600357055664062, -10.266461372375488, -9.932565689086914, -9.59867000579834, -9.264774322509766, -8.930878639221191, -8.596982955932617, -8.263086318969727, -7.9291911125183105, -7.595294952392578, -7.261399269104004, -6.92750358581543, -6.593606948852539, -6.259711265563965, -5.925815105438232, -5.591919422149658, -5.258023738861084, -4.924127578735352, -4.590231895446777, -4.256336212158203, -3.922440528869629, -3.5885446071624756, -3.2546489238739014, -2.920753002166748, -2.586857318878174, -2.2529613971710205, -1.9190654754638672, -1.585169792175293, -1.2512738704681396, -0.9173780679702759, -0.5834822058677673, -0.2495863437652588, 0.08430945873260498, 0.41820526123046875, 0.7521011829376221, 1.0859968662261963, 1.4198927879333496, 1.7537885904312134, 2.087684392929077, 2.4215803146362305, 2.7554759979248047, 3.089371919631958, 3.4232678413391113, 3.7571635246276855, 4.091059684753418, 4.424955368041992, 4.758851528167725, 5.092747211456299, 5.426642894744873, 5.7605390548706055, 6.09443473815918, 6.428330421447754, 6.762226104736328]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 3.0, 2.0, 5.0, 9.0, 8.0, 10.0, 12.0, 20.0, 21.0, 22.0, 24.0, 26.0, 33.0, 45.0, 49.0, 41.0, 47.0, 49.0, 41.0, 38.0, 56.0, 66.0, 51.0, 42.0, 32.0, 33.0, 35.0, 34.0, 30.0, 19.0, 16.0, 21.0, 11.0, 16.0, 7.0, 4.0, 10.0, 3.0, 4.0, 3.0, 0.0, 6.0, 0.0, 1.0, 3.0, 1.0, 1.0], "bins": [-6.703184127807617, -6.517426490783691, -6.331668853759766, -6.145910739898682, -5.960153102874756, -5.77439546585083, -5.588637828826904, -5.40287971496582, -5.2171220779418945, -5.031364440917969, -4.845606803894043, -4.659848690032959, -4.474091053009033, -4.288333415985107, -4.102575778961182, -3.9168179035186768, -3.731060266494751, -3.545302629470825, -3.3595447540283203, -3.1737871170043945, -2.9880292415618896, -2.802271604537964, -2.616513729095459, -2.430756092071533, -2.2449984550476074, -2.0592408180236816, -1.8734829425811768, -1.687725305557251, -1.501967430114746, -1.3162097930908203, -1.130452036857605, -0.9446942806243896, -0.7589364051818848, -0.5731786489486694, -0.3874209225177765, -0.20166319608688354, -0.015905439853668213, 0.16985231637954712, 0.3556100130081177, 0.541367769241333, 0.7271255254745483, 0.9128832817077637, 1.098641037940979, 1.2843987941741943, 1.4701564311981201, 1.655914306640625, 1.8416719436645508, 2.0274295806884766, 2.2131874561309814, 2.3989450931549072, 2.584702968597412, 2.770460605621338, 2.9562184810638428, 3.1419761180877686, 3.3277339935302734, 3.513491630554199, 3.699249267578125, 3.885006904602051, 4.070764541625977, 4.2565226554870605, 4.442280292510986, 4.628037929534912, 4.813795566558838, 4.999553680419922, 5.185311317443848]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 4.0, 2.0, 4.0, 3.0, 8.0, 9.0, 16.0, 12.0, 15.0, 25.0, 29.0, 24.0, 44.0, 97.0, 127.0, 259.0, 693.0, 2734.0, 40990.0, 3653101.0, 487390.0, 7044.0, 892.0, 300.0, 130.0, 79.0, 50.0, 50.0, 38.0, 36.0, 18.0, 17.0, 16.0, 10.0, 6.0, 9.0, 2.0, 5.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.82421875, -5.56817626953125, -5.3121337890625, -5.05609130859375, -4.800048828125, -4.54400634765625, -4.2879638671875, -4.03192138671875, -3.77587890625, -3.51983642578125, -3.2637939453125, -3.00775146484375, -2.751708984375, -2.49566650390625, -2.2396240234375, -1.98358154296875, -1.7275390625, -1.47149658203125, -1.2154541015625, -0.95941162109375, -0.703369140625, -0.44732666015625, -0.1912841796875, 0.06475830078125, 0.32080078125, 0.57684326171875, 0.8328857421875, 1.08892822265625, 1.344970703125, 1.60101318359375, 1.8570556640625, 2.11309814453125, 2.369140625, 2.62518310546875, 2.8812255859375, 3.13726806640625, 3.393310546875, 3.64935302734375, 3.9053955078125, 4.16143798828125, 4.41748046875, 4.67352294921875, 4.9295654296875, 5.18560791015625, 5.441650390625, 5.69769287109375, 5.9537353515625, 6.20977783203125, 6.4658203125, 6.72186279296875, 6.9779052734375, 7.23394775390625, 7.489990234375, 7.74603271484375, 8.0020751953125, 8.25811767578125, 8.51416015625, 8.77020263671875, 9.0262451171875, 9.28228759765625, 9.538330078125, 9.79437255859375, 10.0504150390625, 10.30645751953125, 10.5625]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 1.0, 2.0, 8.0, 11.0, 11.0, 10.0, 15.0, 14.0, 20.0, 29.0, 31.0, 28.0, 47.0, 47.0, 55.0, 65.0, 80.0, 57.0, 65.0, 66.0, 41.0, 48.0, 53.0, 48.0, 37.0, 33.0, 18.0, 15.0, 15.0, 11.0, 7.0, 5.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.73828125, -1.667144775390625, -1.59600830078125, -1.524871826171875, -1.4537353515625, -1.382598876953125, -1.31146240234375, -1.240325927734375, -1.169189453125, -1.098052978515625, -1.02691650390625, -0.955780029296875, -0.8846435546875, -0.813507080078125, -0.74237060546875, -0.671234130859375, -0.60009765625, -0.528961181640625, -0.45782470703125, -0.386688232421875, -0.3155517578125, -0.244415283203125, -0.17327880859375, -0.102142333984375, -0.031005859375, 0.040130615234375, 0.11126708984375, 0.182403564453125, 0.2535400390625, 0.324676513671875, 0.39581298828125, 0.466949462890625, 0.5380859375, 0.609222412109375, 0.68035888671875, 0.751495361328125, 0.8226318359375, 0.893768310546875, 0.96490478515625, 1.036041259765625, 1.107177734375, 1.178314208984375, 1.24945068359375, 1.320587158203125, 1.3917236328125, 1.462860107421875, 1.53399658203125, 1.605133056640625, 1.67626953125, 1.747406005859375, 1.81854248046875, 1.889678955078125, 1.9608154296875, 2.031951904296875, 2.10308837890625, 2.174224853515625, 2.245361328125, 2.316497802734375, 2.38763427734375, 2.458770751953125, 2.5299072265625, 2.601043701171875, 2.67218017578125, 2.743316650390625, 2.814453125]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 8.0, 6.0, 7.0, 19.0, 24.0, 47.0, 78.0, 249.0, 705.0, 2633.0, 31259.0, 4003724.0, 149208.0, 4606.0, 1029.0, 365.0, 152.0, 67.0, 33.0, 24.0, 14.0, 8.0, 8.0, 3.0, 6.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.8359375, -9.543701171875, -9.25146484375, -8.959228515625, -8.6669921875, -8.374755859375, -8.08251953125, -7.790283203125, -7.498046875, -7.205810546875, -6.91357421875, -6.621337890625, -6.3291015625, -6.036865234375, -5.74462890625, -5.452392578125, -5.16015625, -4.867919921875, -4.57568359375, -4.283447265625, -3.9912109375, -3.698974609375, -3.40673828125, -3.114501953125, -2.822265625, -2.530029296875, -2.23779296875, -1.945556640625, -1.6533203125, -1.361083984375, -1.06884765625, -0.776611328125, -0.484375, -0.192138671875, 0.10009765625, 0.392333984375, 0.6845703125, 0.976806640625, 1.26904296875, 1.561279296875, 1.853515625, 2.145751953125, 2.43798828125, 2.730224609375, 3.0224609375, 3.314697265625, 3.60693359375, 3.899169921875, 4.19140625, 4.483642578125, 4.77587890625, 5.068115234375, 5.3603515625, 5.652587890625, 5.94482421875, 6.237060546875, 6.529296875, 6.821533203125, 7.11376953125, 7.406005859375, 7.6982421875, 7.990478515625, 8.28271484375, 8.574951171875, 8.8671875]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 8.0, 11.0, 8.0, 9.0, 13.0, 22.0, 47.0, 58.0, 83.0, 161.0, 252.0, 441.0, 698.0, 789.0, 576.0, 348.0, 220.0, 130.0, 69.0, 47.0, 33.0, 16.0, 19.0, 8.0, 2.0, 3.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.447265625, -1.408447265625, -1.36962890625, -1.330810546875, -1.2919921875, -1.253173828125, -1.21435546875, -1.175537109375, -1.13671875, -1.097900390625, -1.05908203125, -1.020263671875, -0.9814453125, -0.942626953125, -0.90380859375, -0.864990234375, -0.826171875, -0.787353515625, -0.74853515625, -0.709716796875, -0.6708984375, -0.632080078125, -0.59326171875, -0.554443359375, -0.515625, -0.476806640625, -0.43798828125, -0.399169921875, -0.3603515625, -0.321533203125, -0.28271484375, -0.243896484375, -0.205078125, -0.166259765625, -0.12744140625, -0.088623046875, -0.0498046875, -0.010986328125, 0.02783203125, 0.066650390625, 0.10546875, 0.144287109375, 0.18310546875, 0.221923828125, 0.2607421875, 0.299560546875, 0.33837890625, 0.377197265625, 0.416015625, 0.454833984375, 0.49365234375, 0.532470703125, 0.5712890625, 0.610107421875, 0.64892578125, 0.687744140625, 0.7265625, 0.765380859375, 0.80419921875, 0.843017578125, 0.8818359375, 0.920654296875, 0.95947265625, 0.998291015625, 1.037109375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 12.0, 14.0, 41.0, 63.0, 131.0, 156.0, 163.0, 166.0, 118.0, 62.0, 45.0, 19.0, 15.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.07180643081665, -6.849813461303711, -6.6278204917907715, -6.405827522277832, -6.183834075927734, -5.961841106414795, -5.7398481369018555, -5.517855167388916, -5.295862197875977, -5.073869228363037, -4.851876258850098, -4.6298828125, -4.4078898429870605, -4.185896873474121, -3.9639039039611816, -3.741910934448242, -3.5199174880981445, -3.297924518585205, -3.0759313106536865, -2.853938341140747, -2.6319451332092285, -2.409952163696289, -2.1879591941833496, -1.9659661054611206, -1.7439730167388916, -1.5219799280166626, -1.2999868392944336, -1.0779938697814941, -0.8560007810592651, -0.6340076923370361, -0.4120147228240967, -0.19002163410186768, 0.031970977783203125, 0.25396403670310974, 0.47595709562301636, 0.6979501247406006, 0.9199432134628296, 1.1419363021850586, 1.363929271697998, 1.585922360420227, 1.807915449142456, 2.0299084186553955, 2.251901626586914, 2.4738945960998535, 2.695887565612793, 2.9178807735443115, 3.139873743057251, 3.3618669509887695, 3.583859920501709, 3.8058528900146484, 4.027845859527588, 4.249838829040527, 4.471832275390625, 4.6938252449035645, 4.915818214416504, 5.137811183929443, 5.359804153442383, 5.581797122955322, 5.803790092468262, 6.025783538818359, 6.247776508331299, 6.469769477844238, 6.691762447357178, 6.913755416870117, 7.135748863220215]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 8.0, 4.0, 4.0, 8.0, 17.0, 15.0, 11.0, 15.0, 11.0, 16.0, 27.0, 31.0, 28.0, 31.0, 34.0, 44.0, 47.0, 45.0, 44.0, 49.0, 32.0, 60.0, 34.0, 42.0, 52.0, 42.0, 35.0, 33.0, 33.0, 30.0, 26.0, 17.0, 18.0, 16.0, 16.0, 7.0, 8.0, 7.0, 4.0, 4.0, 3.0, 0.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0989229679107666, -2.02917742729187, -1.9594320058822632, -1.8896865844726562, -1.8199410438537598, -1.7501956224441528, -1.680450201034546, -1.6107046604156494, -1.5409592390060425, -1.4712138175964355, -1.401468276977539, -1.3317228555679321, -1.2619774341583252, -1.1922318935394287, -1.1224864721298218, -1.0527410507202148, -0.9829955101013184, -0.9132500290870667, -0.8435045480728149, -0.773759126663208, -0.7040136456489563, -0.6342681646347046, -0.5645227432250977, -0.49477726221084595, -0.42503178119659424, -0.35528630018234253, -0.2855408489704132, -0.2157953828573227, -0.14604991674423218, -0.07630443572998047, -0.0065589845180511475, 0.06318646669387817, 0.13293194770812988, 0.2026774138212204, 0.2724228799343109, 0.34216833114624023, 0.41191381216049194, 0.48165929317474365, 0.5514047145843506, 0.6211501955986023, 0.690895676612854, 0.7606411576271057, 0.8303866386413574, 0.9001320600509644, 0.9698775410652161, 1.0396230220794678, 1.1093684434890747, 1.1791138648986816, 1.2488594055175781, 1.318604826927185, 1.3883503675460815, 1.4580957889556885, 1.527841329574585, 1.597586750984192, 1.6673321723937988, 1.7370777130126953, 1.8068231344223022, 1.8765685558319092, 1.9463140964508057, 2.016059637069702, 2.0858049392700195, 2.155550479888916, 2.2252960205078125, 2.29504132270813, 2.3647868633270264]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 6.0, 7.0, 2.0, 9.0, 9.0, 13.0, 21.0, 24.0, 31.0, 54.0, 75.0, 109.0, 144.0, 194.0, 288.0, 497.0, 921.0, 1814.0, 4717.0, 14988.0, 56853.0, 198186.0, 400246.0, 258025.0, 79286.0, 20923.0, 6191.0, 2215.0, 1061.0, 558.0, 344.0, 241.0, 158.0, 117.0, 64.0, 54.0, 38.0, 31.0, 13.0, 9.0, 8.0, 7.0, 3.0, 5.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59326171875, -0.5738906860351562, -0.5545196533203125, -0.5351486206054688, -0.515777587890625, -0.49640655517578125, -0.4770355224609375, -0.45766448974609375, -0.43829345703125, -0.41892242431640625, -0.3995513916015625, -0.38018035888671875, -0.360809326171875, -0.34143829345703125, -0.3220672607421875, -0.30269622802734375, -0.2833251953125, -0.26395416259765625, -0.2445831298828125, -0.22521209716796875, -0.205841064453125, -0.18647003173828125, -0.1670989990234375, -0.14772796630859375, -0.12835693359375, -0.10898590087890625, -0.0896148681640625, -0.07024383544921875, -0.050872802734375, -0.03150177001953125, -0.0121307373046875, 0.00724029541015625, 0.026611328125, 0.04598236083984375, 0.0653533935546875, 0.08472442626953125, 0.104095458984375, 0.12346649169921875, 0.1428375244140625, 0.16220855712890625, 0.18157958984375, 0.20095062255859375, 0.2203216552734375, 0.23969268798828125, 0.259063720703125, 0.27843475341796875, 0.2978057861328125, 0.31717681884765625, 0.3365478515625, 0.35591888427734375, 0.3752899169921875, 0.39466094970703125, 0.414031982421875, 0.43340301513671875, 0.4527740478515625, 0.47214508056640625, 0.49151611328125, 0.5108871459960938, 0.5302581787109375, 0.5496292114257812, 0.569000244140625, 0.5883712768554688, 0.6077423095703125, 0.6271133422851562, 0.646484375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 3.0, 4.0, 7.0, 10.0, 17.0, 17.0, 13.0, 19.0, 20.0, 30.0, 35.0, 29.0, 39.0, 40.0, 50.0, 41.0, 49.0, 59.0, 47.0, 49.0, 49.0, 48.0, 41.0, 42.0, 32.0, 33.0, 35.0, 20.0, 24.0, 24.0, 16.0, 15.0, 11.0, 10.0, 4.0, 6.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.4716796875, -1.4199066162109375, -1.368133544921875, -1.3163604736328125, -1.26458740234375, -1.2128143310546875, -1.161041259765625, -1.1092681884765625, -1.0574951171875, -1.0057220458984375, -0.953948974609375, -0.9021759033203125, -0.85040283203125, -0.7986297607421875, -0.746856689453125, -0.6950836181640625, -0.643310546875, -0.5915374755859375, -0.539764404296875, -0.4879913330078125, -0.43621826171875, -0.3844451904296875, -0.332672119140625, -0.2808990478515625, -0.2291259765625, -0.1773529052734375, -0.125579833984375, -0.0738067626953125, -0.02203369140625, 0.0297393798828125, 0.081512451171875, 0.1332855224609375, 0.18505859375, 0.2368316650390625, 0.288604736328125, 0.3403778076171875, 0.39215087890625, 0.4439239501953125, 0.495697021484375, 0.5474700927734375, 0.5992431640625, 0.6510162353515625, 0.702789306640625, 0.7545623779296875, 0.80633544921875, 0.8581085205078125, 0.909881591796875, 0.9616546630859375, 1.013427734375, 1.0652008056640625, 1.116973876953125, 1.1687469482421875, 1.22052001953125, 1.2722930908203125, 1.324066162109375, 1.3758392333984375, 1.4276123046875, 1.4793853759765625, 1.531158447265625, 1.5829315185546875, 1.63470458984375, 1.6864776611328125, 1.738250732421875, 1.7900238037109375, 1.841796875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 6.0, 5.0, 13.0, 13.0, 17.0, 24.0, 25.0, 43.0, 85.0, 139.0, 240.0, 493.0, 1045.0, 2234.0, 4822.0, 10551.0, 23048.0, 49849.0, 100632.0, 177470.0, 234105.0, 201616.0, 123750.0, 63378.0, 29517.0, 13577.0, 6203.0, 2865.0, 1376.0, 668.0, 296.0, 191.0, 90.0, 60.0, 31.0, 25.0, 18.0, 10.0, 12.0, 4.0, 3.0, 2.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2607421875, -0.2516441345214844, -0.24254608154296875, -0.23344802856445312, -0.2243499755859375, -0.21525192260742188, -0.20615386962890625, -0.19705581665039062, -0.187957763671875, -0.17885971069335938, -0.16976165771484375, -0.16066360473632812, -0.1515655517578125, -0.14246749877929688, -0.13336944580078125, -0.12427139282226562, -0.11517333984375, -0.10607528686523438, -0.09697723388671875, -0.08787918090820312, -0.0787811279296875, -0.06968307495117188, -0.06058502197265625, -0.051486968994140625, -0.042388916015625, -0.033290863037109375, -0.02419281005859375, -0.015094757080078125, -0.0059967041015625, 0.003101348876953125, 0.01219940185546875, 0.021297454833984375, 0.0303955078125, 0.039493560791015625, 0.04859161376953125, 0.057689666748046875, 0.0667877197265625, 0.07588577270507812, 0.08498382568359375, 0.09408187866210938, 0.103179931640625, 0.11227798461914062, 0.12137603759765625, 0.13047409057617188, 0.1395721435546875, 0.14867019653320312, 0.15776824951171875, 0.16686630249023438, 0.17596435546875, 0.18506240844726562, 0.19416046142578125, 0.20325851440429688, 0.2123565673828125, 0.22145462036132812, 0.23055267333984375, 0.23965072631835938, 0.248748779296875, 0.2578468322753906, 0.26694488525390625, 0.2760429382324219, 0.2851409912109375, 0.2942390441894531, 0.30333709716796875, 0.3124351501464844, 0.321533203125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 8.0, 7.0, 10.0, 17.0, 12.0, 16.0, 22.0, 30.0, 35.0, 41.0, 41.0, 55.0, 49.0, 40.0, 40.0, 49.0, 45.0, 50.0, 46.0, 57.0, 56.0, 29.0, 41.0, 31.0, 23.0, 30.0, 27.0, 26.0, 16.0, 18.0, 4.0, 5.0, 8.0, 3.0, 7.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1171875, -3.01123046875, -2.9052734375, -2.79931640625, -2.693359375, -2.58740234375, -2.4814453125, -2.37548828125, -2.26953125, -2.16357421875, -2.0576171875, -1.95166015625, -1.845703125, -1.73974609375, -1.6337890625, -1.52783203125, -1.421875, -1.31591796875, -1.2099609375, -1.10400390625, -0.998046875, -0.89208984375, -0.7861328125, -0.68017578125, -0.57421875, -0.46826171875, -0.3623046875, -0.25634765625, -0.150390625, -0.04443359375, 0.0615234375, 0.16748046875, 0.2734375, 0.37939453125, 0.4853515625, 0.59130859375, 0.697265625, 0.80322265625, 0.9091796875, 1.01513671875, 1.12109375, 1.22705078125, 1.3330078125, 1.43896484375, 1.544921875, 1.65087890625, 1.7568359375, 1.86279296875, 1.96875, 2.07470703125, 2.1806640625, 2.28662109375, 2.392578125, 2.49853515625, 2.6044921875, 2.71044921875, 2.81640625, 2.92236328125, 3.0283203125, 3.13427734375, 3.240234375, 3.34619140625, 3.4521484375, 3.55810546875, 3.6640625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 11.0, 19.0, 33.0, 45.0, 99.0, 227.0, 513.0, 1587.0, 8905.0, 124291.0, 809591.0, 93347.0, 7515.0, 1479.0, 448.0, 230.0, 86.0, 49.0, 33.0, 24.0, 7.0, 9.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1942138671875, -0.1868724822998047, -0.17953109741210938, -0.17218971252441406, -0.16484832763671875, -0.15750694274902344, -0.15016555786132812, -0.1428241729736328, -0.1354827880859375, -0.1281414031982422, -0.12080001831054688, -0.11345863342285156, -0.10611724853515625, -0.09877586364746094, -0.09143447875976562, -0.08409309387207031, -0.076751708984375, -0.06941032409667969, -0.062068939208984375, -0.05472755432128906, -0.04738616943359375, -0.04004478454589844, -0.032703399658203125, -0.025362014770507812, -0.0180206298828125, -0.010679244995117188, -0.003337860107421875, 0.0040035247802734375, 0.01134490966796875, 0.018686294555664062, 0.026027679443359375, 0.03336906433105469, 0.04071044921875, 0.04805183410644531, 0.055393218994140625, 0.06273460388183594, 0.07007598876953125, 0.07741737365722656, 0.08475875854492188, 0.09210014343261719, 0.0994415283203125, 0.10678291320800781, 0.11412429809570312, 0.12146568298339844, 0.12880706787109375, 0.13614845275878906, 0.14348983764648438, 0.1508312225341797, 0.158172607421875, 0.1655139923095703, 0.17285537719726562, 0.18019676208496094, 0.18753814697265625, 0.19487953186035156, 0.20222091674804688, 0.2095623016357422, 0.2169036865234375, 0.2242450714111328, 0.23158645629882812, 0.23892784118652344, 0.24626922607421875, 0.25361061096191406, 0.2609519958496094, 0.2682933807373047, 0.275634765625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 6.0, 1.0, 4.0, 14.0, 10.0, 17.0, 26.0, 35.0, 30.0, 45.0, 67.0, 71.0, 83.0, 98.0, 97.0, 82.0, 69.0, 63.0, 43.0, 36.0, 37.0, 15.0, 19.0, 14.0, 6.0, 6.0, 6.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5703182220458984e-05, -3.421306610107422e-05, -3.272294998168945e-05, -3.123283386230469e-05, -2.9742717742919922e-05, -2.8252601623535156e-05, -2.676248550415039e-05, -2.5272369384765625e-05, -2.378225326538086e-05, -2.2292137145996094e-05, -2.0802021026611328e-05, -1.9311904907226562e-05, -1.7821788787841797e-05, -1.633167266845703e-05, -1.4841556549072266e-05, -1.33514404296875e-05, -1.1861324310302734e-05, -1.0371208190917969e-05, -8.881092071533203e-06, -7.3909759521484375e-06, -5.900859832763672e-06, -4.410743713378906e-06, -2.9206275939941406e-06, -1.430511474609375e-06, 5.960464477539063e-08, 1.5497207641601562e-06, 3.039836883544922e-06, 4.5299530029296875e-06, 6.020069122314453e-06, 7.510185241699219e-06, 9.000301361083984e-06, 1.049041748046875e-05, 1.1980533599853516e-05, 1.3470649719238281e-05, 1.4960765838623047e-05, 1.6450881958007812e-05, 1.7940998077392578e-05, 1.9431114196777344e-05, 2.092123031616211e-05, 2.2411346435546875e-05, 2.390146255493164e-05, 2.5391578674316406e-05, 2.6881694793701172e-05, 2.8371810913085938e-05, 2.9861927032470703e-05, 3.135204315185547e-05, 3.2842159271240234e-05, 3.4332275390625e-05, 3.5822391510009766e-05, 3.731250762939453e-05, 3.88026237487793e-05, 4.029273986816406e-05, 4.178285598754883e-05, 4.3272972106933594e-05, 4.476308822631836e-05, 4.6253204345703125e-05, 4.774332046508789e-05, 4.9233436584472656e-05, 5.072355270385742e-05, 5.221366882324219e-05, 5.370378494262695e-05, 5.519390106201172e-05, 5.6684017181396484e-05, 5.817413330078125e-05, 5.9664249420166016e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 5.0, 5.0, 4.0, 6.0, 8.0, 6.0, 10.0, 12.0, 30.0, 46.0, 69.0, 89.0, 178.0, 282.0, 638.0, 1740.0, 5530.0, 23917.0, 155030.0, 663783.0, 163447.0, 24762.0, 5722.0, 1770.0, 706.0, 321.0, 174.0, 96.0, 48.0, 35.0, 27.0, 16.0, 13.0, 7.0, 6.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.1671142578125, -0.1612529754638672, -0.15539169311523438, -0.14953041076660156, -0.14366912841796875, -0.13780784606933594, -0.13194656372070312, -0.1260852813720703, -0.1202239990234375, -0.11436271667480469, -0.10850143432617188, -0.10264015197753906, -0.09677886962890625, -0.09091758728027344, -0.08505630493164062, -0.07919502258300781, -0.073333740234375, -0.06747245788574219, -0.061611175537109375, -0.05574989318847656, -0.04988861083984375, -0.04402732849121094, -0.038166046142578125, -0.03230476379394531, -0.0264434814453125, -0.020582199096679688, -0.014720916748046875, -0.008859634399414062, -0.00299835205078125, 0.0028629302978515625, 0.008724212646484375, 0.014585494995117188, 0.02044677734375, 0.026308059692382812, 0.032169342041015625, 0.03803062438964844, 0.04389190673828125, 0.04975318908691406, 0.055614471435546875, 0.06147575378417969, 0.0673370361328125, 0.07319831848144531, 0.07905960083007812, 0.08492088317871094, 0.09078216552734375, 0.09664344787597656, 0.10250473022460938, 0.10836601257324219, 0.114227294921875, 0.12008857727050781, 0.12594985961914062, 0.13181114196777344, 0.13767242431640625, 0.14353370666503906, 0.14939498901367188, 0.1552562713623047, 0.1611175537109375, 0.1669788360595703, 0.17284011840820312, 0.17870140075683594, 0.18456268310546875, 0.19042396545410156, 0.19628524780273438, 0.2021465301513672, 0.2080078125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 7.0, 9.0, 6.0, 23.0, 22.0, 26.0, 36.0, 67.0, 97.0, 107.0, 133.0, 136.0, 112.0, 68.0, 45.0, 30.0, 26.0, 11.0, 7.0, 11.0, 7.0, 6.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07000732421875, -0.06804323196411133, -0.06607913970947266, -0.06411504745483398, -0.06215095520019531, -0.06018686294555664, -0.05822277069091797, -0.0562586784362793, -0.054294586181640625, -0.05233049392700195, -0.05036640167236328, -0.04840230941772461, -0.04643821716308594, -0.044474124908447266, -0.042510032653808594, -0.04054594039916992, -0.03858184814453125, -0.03661775588989258, -0.034653663635253906, -0.032689571380615234, -0.030725479125976562, -0.02876138687133789, -0.02679729461669922, -0.024833202362060547, -0.022869110107421875, -0.020905017852783203, -0.01894092559814453, -0.01697683334350586, -0.015012741088867188, -0.013048648834228516, -0.011084556579589844, -0.009120464324951172, -0.0071563720703125, -0.005192279815673828, -0.0032281875610351562, -0.0012640953063964844, 0.0006999969482421875, 0.0026640892028808594, 0.004628181457519531, 0.006592273712158203, 0.008556365966796875, 0.010520458221435547, 0.012484550476074219, 0.01444864273071289, 0.016412734985351562, 0.018376827239990234, 0.020340919494628906, 0.022305011749267578, 0.02426910400390625, 0.026233196258544922, 0.028197288513183594, 0.030161380767822266, 0.03212547302246094, 0.03408956527709961, 0.03605365753173828, 0.03801774978637695, 0.039981842041015625, 0.0419459342956543, 0.04391002655029297, 0.04587411880493164, 0.04783821105957031, 0.049802303314208984, 0.051766395568847656, 0.05373048782348633, 0.055694580078125]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 12.0, 19.0, 44.0, 85.0, 161.0, 164.0, 175.0, 160.0, 102.0, 45.0, 19.0, 12.0, 10.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4635112285614014, -3.307328701019287, -3.1511459350585938, -2.9949634075164795, -2.8387808799743652, -2.682598114013672, -2.5264155864715576, -2.3702330589294434, -2.21405029296875, -2.0578677654266357, -1.901685118675232, -1.7455024719238281, -1.5893199443817139, -1.43313729763031, -1.2769546508789062, -1.120772123336792, -0.9645895957946777, -0.8084070086479187, -0.6522244215011597, -0.49604177474975586, -0.3398591876029968, -0.1836766004562378, -0.027493953704833984, 0.12868857383728027, 0.2848712205886841, 0.4410538077354431, 0.5972363948822021, 0.753419041633606, 0.909601628780365, 1.065784215927124, 1.2219668626785278, 1.378149390220642, 1.5343317985534668, 1.6905144453048706, 1.8466969728469849, 2.0028796195983887, 2.159062147140503, 2.315244674682617, 2.4714274406433105, 2.627609968185425, 2.783792495727539, 2.9399750232696533, 3.0961577892303467, 3.252340316772461, 3.408522844314575, 3.5647053718566895, 3.720888137817383, 3.877070665359497, 4.0332536697387695, 4.189436435699463, 4.345618724822998, 4.501801490783691, 4.657984256744385, 4.81416654586792, 4.970349311828613, 5.126531600952148, 5.282714366912842, 5.438897132873535, 5.59507942199707, 5.751262187957764, 5.907444953918457, 6.063627243041992, 6.2198100090026855, 6.375992774963379, 6.532175064086914]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 6.0, 4.0, 12.0, 13.0, 17.0, 16.0, 10.0, 24.0, 34.0, 33.0, 34.0, 36.0, 41.0, 56.0, 54.0, 58.0, 43.0, 49.0, 57.0, 53.0, 58.0, 40.0, 51.0, 30.0, 34.0, 35.0, 21.0, 19.0, 24.0, 8.0, 9.0, 7.0, 4.0, 8.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6688393354415894, -1.6133403778076172, -1.5578415393829346, -1.5023425817489624, -1.4468437433242798, -1.3913447856903076, -1.335845947265625, -1.2803469896316528, -1.2248481512069702, -1.169349193572998, -1.1138503551483154, -1.0583513975143433, -1.0028525590896606, -0.9473536014556885, -0.8918547630310059, -0.8363558053970337, -0.7808569073677063, -0.7253580093383789, -0.6698591113090515, -0.6143602132797241, -0.5588613152503967, -0.5033624172210693, -0.44786348938941956, -0.39236459136009216, -0.33686569333076477, -0.2813667953014374, -0.22586789727210999, -0.1703689843416214, -0.114870086312294, -0.05937117338180542, -0.0038722753524780273, 0.051626622676849365, 0.10712552070617676, 0.16262441873550415, 0.21812331676483154, 0.27362221479415894, 0.32912111282348633, 0.3846200406551361, 0.4401189386844635, 0.4956178367137909, 0.5511167049407959, 0.6066156029701233, 0.6621145009994507, 0.7176133990287781, 0.7731122970581055, 0.8286112546920776, 0.8841100931167603, 0.9396090507507324, 0.9951079487800598, 1.0506068468093872, 1.1061058044433594, 1.161604642868042, 1.2171036005020142, 1.2726024389266968, 1.328101396560669, 1.3836002349853516, 1.4390991926193237, 1.494598150253296, 1.5500969886779785, 1.6055959463119507, 1.6610947847366333, 1.7165937423706055, 1.772092580795288, 1.8275915384292603, 1.8830903768539429]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 1.0, 4.0, 15.0, 9.0, 15.0, 30.0, 62.0, 88.0, 147.0, 287.0, 582.0, 1537.0, 5608.0, 26820.0, 209512.0, 702667.0, 82375.0, 13679.0, 3142.0, 1008.0, 438.0, 214.0, 120.0, 72.0, 36.0, 33.0, 11.0, 14.0, 8.0, 7.0, 4.0, 4.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.693359375, -2.586883544921875, -2.48040771484375, -2.373931884765625, -2.2674560546875, -2.160980224609375, -2.05450439453125, -1.948028564453125, -1.841552734375, -1.735076904296875, -1.62860107421875, -1.522125244140625, -1.4156494140625, -1.309173583984375, -1.20269775390625, -1.096221923828125, -0.98974609375, -0.883270263671875, -0.77679443359375, -0.670318603515625, -0.5638427734375, -0.457366943359375, -0.35089111328125, -0.244415283203125, -0.137939453125, -0.031463623046875, 0.07501220703125, 0.181488037109375, 0.2879638671875, 0.394439697265625, 0.50091552734375, 0.607391357421875, 0.7138671875, 0.820343017578125, 0.92681884765625, 1.033294677734375, 1.1397705078125, 1.246246337890625, 1.35272216796875, 1.459197998046875, 1.565673828125, 1.672149658203125, 1.77862548828125, 1.885101318359375, 1.9915771484375, 2.098052978515625, 2.20452880859375, 2.311004638671875, 2.41748046875, 2.523956298828125, 2.63043212890625, 2.736907958984375, 2.8433837890625, 2.949859619140625, 3.05633544921875, 3.162811279296875, 3.269287109375, 3.375762939453125, 3.48223876953125, 3.588714599609375, 3.6951904296875, 3.801666259765625, 3.90814208984375, 4.014617919921875, 4.12109375]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 6.0, 0.0, 6.0, 16.0, 19.0, 29.0, 33.0, 43.0, 49.0, 55.0, 84.0, 72.0, 88.0, 76.0, 83.0, 93.0, 67.0, 46.0, 51.0, 37.0, 16.0, 17.0, 11.0, 4.0, 2.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.162109375, -3.004058837890625, -2.84600830078125, -2.687957763671875, -2.5299072265625, -2.371856689453125, -2.21380615234375, -2.055755615234375, -1.897705078125, -1.739654541015625, -1.58160400390625, -1.423553466796875, -1.2655029296875, -1.107452392578125, -0.94940185546875, -0.791351318359375, -0.63330078125, -0.475250244140625, -0.31719970703125, -0.159149169921875, -0.0010986328125, 0.156951904296875, 0.31500244140625, 0.473052978515625, 0.631103515625, 0.789154052734375, 0.94720458984375, 1.105255126953125, 1.2633056640625, 1.421356201171875, 1.57940673828125, 1.737457275390625, 1.8955078125, 2.053558349609375, 2.21160888671875, 2.369659423828125, 2.5277099609375, 2.685760498046875, 2.84381103515625, 3.001861572265625, 3.159912109375, 3.317962646484375, 3.47601318359375, 3.634063720703125, 3.7921142578125, 3.950164794921875, 4.10821533203125, 4.266265869140625, 4.42431640625, 4.582366943359375, 4.74041748046875, 4.898468017578125, 5.0565185546875, 5.214569091796875, 5.37261962890625, 5.530670166015625, 5.688720703125, 5.846771240234375, 6.00482177734375, 6.162872314453125, 6.3209228515625, 6.478973388671875, 6.63702392578125, 6.795074462890625, 6.953125]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 5.0, 7.0, 2.0, 7.0, 7.0, 11.0, 7.0, 14.0, 20.0, 24.0, 25.0, 33.0, 60.0, 69.0, 91.0, 165.0, 308.0, 568.0, 2287.0, 25183.0, 857308.0, 153762.0, 6575.0, 1065.0, 329.0, 215.0, 112.0, 64.0, 46.0, 38.0, 31.0, 27.0, 16.0, 19.0, 10.0, 7.0, 6.0, 10.0, 7.0, 3.0, 1.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-6.55859375, -6.3642578125, -6.169921875, -5.9755859375, -5.78125, -5.5869140625, -5.392578125, -5.1982421875, -5.00390625, -4.8095703125, -4.615234375, -4.4208984375, -4.2265625, -4.0322265625, -3.837890625, -3.6435546875, -3.44921875, -3.2548828125, -3.060546875, -2.8662109375, -2.671875, -2.4775390625, -2.283203125, -2.0888671875, -1.89453125, -1.7001953125, -1.505859375, -1.3115234375, -1.1171875, -0.9228515625, -0.728515625, -0.5341796875, -0.33984375, -0.1455078125, 0.048828125, 0.2431640625, 0.4375, 0.6318359375, 0.826171875, 1.0205078125, 1.21484375, 1.4091796875, 1.603515625, 1.7978515625, 1.9921875, 2.1865234375, 2.380859375, 2.5751953125, 2.76953125, 2.9638671875, 3.158203125, 3.3525390625, 3.546875, 3.7412109375, 3.935546875, 4.1298828125, 4.32421875, 4.5185546875, 4.712890625, 4.9072265625, 5.1015625, 5.2958984375, 5.490234375, 5.6845703125, 5.87890625]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 5.0, 6.0, 10.0, 10.0, 11.0, 11.0, 9.0, 23.0, 20.0, 22.0, 29.0, 24.0, 23.0, 37.0, 34.0, 52.0, 42.0, 43.0, 49.0, 58.0, 45.0, 50.0, 51.0, 46.0, 43.0, 30.0, 28.0, 34.0, 26.0, 27.0, 14.0, 17.0, 11.0, 11.0, 10.0, 6.0, 4.0, 9.0, 5.0, 2.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.54296875, -3.433990478515625, -3.32501220703125, -3.216033935546875, -3.1070556640625, -2.998077392578125, -2.88909912109375, -2.780120849609375, -2.671142578125, -2.562164306640625, -2.45318603515625, -2.344207763671875, -2.2352294921875, -2.126251220703125, -2.01727294921875, -1.908294677734375, -1.79931640625, -1.690338134765625, -1.58135986328125, -1.472381591796875, -1.3634033203125, -1.254425048828125, -1.14544677734375, -1.036468505859375, -0.927490234375, -0.818511962890625, -0.70953369140625, -0.600555419921875, -0.4915771484375, -0.382598876953125, -0.27362060546875, -0.164642333984375, -0.0556640625, 0.053314208984375, 0.16229248046875, 0.271270751953125, 0.3802490234375, 0.489227294921875, 0.59820556640625, 0.707183837890625, 0.816162109375, 0.925140380859375, 1.03411865234375, 1.143096923828125, 1.2520751953125, 1.361053466796875, 1.47003173828125, 1.579010009765625, 1.68798828125, 1.796966552734375, 1.90594482421875, 2.014923095703125, 2.1239013671875, 2.232879638671875, 2.34185791015625, 2.450836181640625, 2.559814453125, 2.668792724609375, 2.77777099609375, 2.886749267578125, 2.9957275390625, 3.104705810546875, 3.21368408203125, 3.322662353515625, 3.431640625]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 11.0, 5.0, 4.0, 8.0, 13.0, 9.0, 14.0, 15.0, 20.0, 17.0, 42.0, 44.0, 69.0, 108.0, 277.0, 577.0, 1792.0, 7330.0, 61805.0, 798681.0, 159135.0, 14229.0, 2732.0, 847.0, 337.0, 165.0, 87.0, 43.0, 42.0, 28.0, 10.0, 19.0, 12.0, 5.0, 5.0, 5.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3212890625, -1.271759033203125, -1.22222900390625, -1.172698974609375, -1.1231689453125, -1.073638916015625, -1.02410888671875, -0.974578857421875, -0.925048828125, -0.875518798828125, -0.82598876953125, -0.776458740234375, -0.7269287109375, -0.677398681640625, -0.62786865234375, -0.578338623046875, -0.52880859375, -0.479278564453125, -0.42974853515625, -0.380218505859375, -0.3306884765625, -0.281158447265625, -0.23162841796875, -0.182098388671875, -0.132568359375, -0.083038330078125, -0.03350830078125, 0.016021728515625, 0.0655517578125, 0.115081787109375, 0.16461181640625, 0.214141845703125, 0.263671875, 0.313201904296875, 0.36273193359375, 0.412261962890625, 0.4617919921875, 0.511322021484375, 0.56085205078125, 0.610382080078125, 0.659912109375, 0.709442138671875, 0.75897216796875, 0.808502197265625, 0.8580322265625, 0.907562255859375, 0.95709228515625, 1.006622314453125, 1.05615234375, 1.105682373046875, 1.15521240234375, 1.204742431640625, 1.2542724609375, 1.303802490234375, 1.35333251953125, 1.402862548828125, 1.452392578125, 1.501922607421875, 1.55145263671875, 1.600982666015625, 1.6505126953125, 1.700042724609375, 1.74957275390625, 1.799102783203125, 1.8486328125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 7.0, 2.0, 3.0, 3.0, 3.0, 3.0, 14.0, 14.0, 42.0, 43.0, 56.0, 116.0, 198.0, 222.0, 87.0, 60.0, 51.0, 21.0, 19.0, 9.0, 5.0, 12.0, 5.0, 2.0, 1.0, 3.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00023627281188964844, -0.0002284012734889984, -0.0002205297350883484, -0.00021265819668769836, -0.00020478665828704834, -0.00019691511988639832, -0.0001890435814857483, -0.00018117204308509827, -0.00017330050468444824, -0.00016542896628379822, -0.0001575574278831482, -0.00014968588948249817, -0.00014181435108184814, -0.00013394281268119812, -0.0001260712742805481, -0.00011819973587989807, -0.00011032819747924805, -0.00010245665907859802, -9.4585120677948e-05, -8.671358227729797e-05, -7.884204387664795e-05, -7.097050547599792e-05, -6.30989670753479e-05, -5.5227428674697876e-05, -4.735589027404785e-05, -3.948435187339783e-05, -3.16128134727478e-05, -2.374127507209778e-05, -1.5869736671447754e-05, -7.99819827079773e-06, -1.2665987014770508e-07, 7.74487853050232e-06, 1.5616416931152344e-05, 2.3487955331802368e-05, 3.135949373245239e-05, 3.923103213310242e-05, 4.710257053375244e-05, 5.4974108934402466e-05, 6.284564733505249e-05, 7.071718573570251e-05, 7.858872413635254e-05, 8.646026253700256e-05, 9.433180093765259e-05, 0.00010220333933830261, 0.00011007487773895264, 0.00011794641613960266, 0.00012581795454025269, 0.0001336894929409027, 0.00014156103134155273, 0.00014943256974220276, 0.00015730410814285278, 0.0001651756465435028, 0.00017304718494415283, 0.00018091872334480286, 0.00018879026174545288, 0.0001966618001461029, 0.00020453333854675293, 0.00021240487694740295, 0.00022027641534805298, 0.000228147953748703, 0.00023601949214935303, 0.00024389103055000305, 0.0002517625689506531, 0.0002596341073513031, 0.0002675056457519531]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 6.0, 8.0, 13.0, 23.0, 48.0, 135.0, 350.0, 985.0, 6291.0, 838940.0, 197064.0, 3487.0, 771.0, 242.0, 95.0, 48.0, 19.0, 17.0, 7.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.203125, -4.082611083984375, -3.96209716796875, -3.841583251953125, -3.7210693359375, -3.600555419921875, -3.48004150390625, -3.359527587890625, -3.239013671875, -3.118499755859375, -2.99798583984375, -2.877471923828125, -2.7569580078125, -2.636444091796875, -2.51593017578125, -2.395416259765625, -2.27490234375, -2.154388427734375, -2.03387451171875, -1.913360595703125, -1.7928466796875, -1.672332763671875, -1.55181884765625, -1.431304931640625, -1.310791015625, -1.190277099609375, -1.06976318359375, -0.949249267578125, -0.8287353515625, -0.708221435546875, -0.58770751953125, -0.467193603515625, -0.3466796875, -0.226165771484375, -0.10565185546875, 0.014862060546875, 0.1353759765625, 0.255889892578125, 0.37640380859375, 0.496917724609375, 0.617431640625, 0.737945556640625, 0.85845947265625, 0.978973388671875, 1.0994873046875, 1.220001220703125, 1.34051513671875, 1.461029052734375, 1.58154296875, 1.702056884765625, 1.82257080078125, 1.943084716796875, 2.0635986328125, 2.184112548828125, 2.30462646484375, 2.425140380859375, 2.545654296875, 2.666168212890625, 2.78668212890625, 2.907196044921875, 3.0277099609375, 3.148223876953125, 3.26873779296875, 3.389251708984375, 3.509765625]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 3.0, 4.0, 12.0, 9.0, 25.0, 26.0, 81.0, 94.0, 275.0, 190.0, 111.0, 62.0, 44.0, 27.0, 17.0, 14.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.77099609375, -0.7412796020507812, -0.7115631103515625, -0.6818466186523438, -0.652130126953125, -0.6224136352539062, -0.5926971435546875, -0.5629806518554688, -0.53326416015625, -0.5035476684570312, -0.4738311767578125, -0.44411468505859375, -0.414398193359375, -0.38468170166015625, -0.3549652099609375, -0.32524871826171875, -0.2955322265625, -0.26581573486328125, -0.2360992431640625, -0.20638275146484375, -0.176666259765625, -0.14694976806640625, -0.1172332763671875, -0.08751678466796875, -0.05780029296875, -0.02808380126953125, 0.0016326904296875, 0.03134918212890625, 0.061065673828125, 0.09078216552734375, 0.1204986572265625, 0.15021514892578125, 0.179931640625, 0.20964813232421875, 0.2393646240234375, 0.26908111572265625, 0.298797607421875, 0.32851409912109375, 0.3582305908203125, 0.38794708251953125, 0.41766357421875, 0.44738006591796875, 0.4770965576171875, 0.5068130493164062, 0.536529541015625, 0.5662460327148438, 0.5959625244140625, 0.6256790161132812, 0.6553955078125, 0.6851119995117188, 0.7148284912109375, 0.7445449829101562, 0.774261474609375, 0.8039779663085938, 0.8336944580078125, 0.8634109497070312, 0.89312744140625, 0.9228439331054688, 0.9525604248046875, 0.9822769165039062, 1.011993408203125, 1.0417098999023438, 1.0714263916015625, 1.1011428833007812, 1.130859375]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 8.0, 36.0, 80.0, 134.0, 195.0, 209.0, 186.0, 84.0, 41.0, 23.0, 8.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.748982906341553, -6.381380558013916, -6.013778209686279, -5.646175861358643, -5.278573513031006, -4.910971164703369, -4.543368339538574, -4.1757659912109375, -3.80816388130188, -3.440561532974243, -3.0729591846466064, -2.7053565979003906, -2.337754249572754, -1.9701520204544067, -1.6025495529174805, -1.2349472045898438, -0.867344856262207, -0.4997424781322479, -0.13214010000228882, 0.23546230792999268, 0.6030646562576294, 0.9706670045852661, 1.3382694721221924, 1.705871820449829, 2.073474168777466, 2.4410765171051025, 2.8086788654327393, 3.176281452178955, 3.543883800506592, 3.9114861488342285, 4.279088497161865, 4.646690845489502, 5.0142927169799805, 5.381895065307617, 5.749497413635254, 6.117099761962891, 6.484702110290527, 6.852304458618164, 7.219906806945801, 7.5875091552734375, 7.955111503601074, 8.322713851928711, 8.690316200256348, 9.057918548583984, 9.425520896911621, 9.793123245239258, 10.160725593566895, 10.528327941894531, 10.895931243896484, 11.263533592224121, 11.631135940551758, 11.998738288879395, 12.366340637207031, 12.733942985534668, 13.101545333862305, 13.469147682189941, 13.836750030517578, 14.204352378845215, 14.571954727172852, 14.939557075500488, 15.307159423828125, 15.674761772155762, 16.0423641204834, 16.40996742248535, 16.777568817138672]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 2.0, 9.0, 7.0, 8.0, 7.0, 5.0, 10.0, 9.0, 27.0, 20.0, 19.0, 22.0, 32.0, 37.0, 32.0, 26.0, 36.0, 36.0, 32.0, 40.0, 47.0, 39.0, 51.0, 44.0, 41.0, 41.0, 38.0, 36.0, 32.0, 24.0, 30.0, 25.0, 31.0, 25.0, 21.0, 15.0, 6.0, 10.0, 9.0, 7.0, 4.0, 5.0, 10.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.386319160461426, -4.2209906578063965, -4.055662155151367, -3.890333890914917, -3.725005626678467, -3.5596771240234375, -3.394348621368408, -3.229020118713379, -3.0636918544769287, -2.8983633518218994, -2.733035087585449, -2.56770658493042, -2.4023780822753906, -2.2370498180389404, -2.071721315383911, -1.9063929319381714, -1.7410645484924316, -1.575736165046692, -1.4104077816009521, -1.2450792789459229, -1.079750895500183, -0.9144225120544434, -0.7490940690040588, -0.5837656259536743, -0.41843724250793457, -0.25310882925987244, -0.0877804160118103, 0.07754799723625183, 0.24287641048431396, 0.4082047939300537, 0.5735332369804382, 0.7388616800308228, 0.9041905403137207, 1.0695189237594604, 1.2348473072052002, 1.4001758098602295, 1.5655041933059692, 1.730832576751709, 1.8961610794067383, 2.0614895820617676, 2.2268178462982178, 2.392146348953247, 2.5574746131896973, 2.7228031158447266, 2.888131618499756, 3.053459882736206, 3.2187883853912354, 3.3841166496276855, 3.549445152282715, 3.714773654937744, 3.8801019191741943, 4.0454301834106445, 4.210758686065674, 4.376087188720703, 4.541415691375732, 4.706744194030762, 4.872072219848633, 5.037400722503662, 5.202729225158691, 5.3680572509765625, 5.533385753631592, 5.698714256286621, 5.86404275894165, 6.02937126159668, 6.194699764251709]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 3.0, 1.0, 6.0, 4.0, 6.0, 7.0, 23.0, 27.0, 38.0, 47.0, 66.0, 116.0, 180.0, 266.0, 568.0, 1227.0, 2896.0, 8321.0, 32656.0, 185561.0, 1486484.0, 2105224.0, 303450.0, 49072.0, 11621.0, 3551.0, 1345.0, 645.0, 343.0, 161.0, 118.0, 88.0, 56.0, 39.0, 22.0, 10.0, 10.0, 8.0, 5.0, 5.0, 3.0, 3.0, 5.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.865234375, -2.778717041015625, -2.69219970703125, -2.605682373046875, -2.5191650390625, -2.432647705078125, -2.34613037109375, -2.259613037109375, -2.173095703125, -2.086578369140625, -2.00006103515625, -1.913543701171875, -1.8270263671875, -1.740509033203125, -1.65399169921875, -1.567474365234375, -1.48095703125, -1.394439697265625, -1.30792236328125, -1.221405029296875, -1.1348876953125, -1.048370361328125, -0.96185302734375, -0.875335693359375, -0.788818359375, -0.702301025390625, -0.61578369140625, -0.529266357421875, -0.4427490234375, -0.356231689453125, -0.26971435546875, -0.183197021484375, -0.0966796875, -0.010162353515625, 0.07635498046875, 0.162872314453125, 0.2493896484375, 0.335906982421875, 0.42242431640625, 0.508941650390625, 0.595458984375, 0.681976318359375, 0.76849365234375, 0.855010986328125, 0.9415283203125, 1.028045654296875, 1.11456298828125, 1.201080322265625, 1.28759765625, 1.374114990234375, 1.46063232421875, 1.547149658203125, 1.6336669921875, 1.720184326171875, 1.80670166015625, 1.893218994140625, 1.979736328125, 2.066253662109375, 2.15277099609375, 2.239288330078125, 2.3258056640625, 2.412322998046875, 2.49884033203125, 2.585357666015625, 2.671875]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 4.0, 3.0, 9.0, 3.0, 8.0, 18.0, 16.0, 22.0, 31.0, 34.0, 38.0, 51.0, 44.0, 47.0, 49.0, 49.0, 58.0, 51.0, 61.0, 59.0, 45.0, 59.0, 38.0, 33.0, 49.0, 31.0, 18.0, 21.0, 13.0, 12.0, 11.0, 7.0, 5.0, 2.0, 3.0, 0.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.08984375, -2.02484130859375, -1.9598388671875, -1.89483642578125, -1.829833984375, -1.76483154296875, -1.6998291015625, -1.63482666015625, -1.56982421875, -1.50482177734375, -1.4398193359375, -1.37481689453125, -1.309814453125, -1.24481201171875, -1.1798095703125, -1.11480712890625, -1.0498046875, -0.98480224609375, -0.9197998046875, -0.85479736328125, -0.789794921875, -0.72479248046875, -0.6597900390625, -0.59478759765625, -0.52978515625, -0.46478271484375, -0.3997802734375, -0.33477783203125, -0.269775390625, -0.20477294921875, -0.1397705078125, -0.07476806640625, -0.009765625, 0.05523681640625, 0.1202392578125, 0.18524169921875, 0.250244140625, 0.31524658203125, 0.3802490234375, 0.44525146484375, 0.51025390625, 0.57525634765625, 0.6402587890625, 0.70526123046875, 0.770263671875, 0.83526611328125, 0.9002685546875, 0.96527099609375, 1.0302734375, 1.09527587890625, 1.1602783203125, 1.22528076171875, 1.290283203125, 1.35528564453125, 1.4202880859375, 1.48529052734375, 1.55029296875, 1.61529541015625, 1.6802978515625, 1.74530029296875, 1.810302734375, 1.87530517578125, 1.9403076171875, 2.00531005859375, 2.0703125]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 3.0, 4.0, 6.0, 6.0, 7.0, 11.0, 20.0, 26.0, 36.0, 70.0, 141.0, 290.0, 1018.0, 5987.0, 186730.0, 3947642.0, 47880.0, 3298.0, 644.0, 219.0, 97.0, 50.0, 31.0, 23.0, 16.0, 4.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-9.2109375, -8.94281005859375, -8.6746826171875, -8.40655517578125, -8.138427734375, -7.87030029296875, -7.6021728515625, -7.33404541015625, -7.06591796875, -6.79779052734375, -6.5296630859375, -6.26153564453125, -5.993408203125, -5.72528076171875, -5.4571533203125, -5.18902587890625, -4.9208984375, -4.65277099609375, -4.3846435546875, -4.11651611328125, -3.848388671875, -3.58026123046875, -3.3121337890625, -3.04400634765625, -2.77587890625, -2.50775146484375, -2.2396240234375, -1.97149658203125, -1.703369140625, -1.43524169921875, -1.1671142578125, -0.89898681640625, -0.630859375, -0.36273193359375, -0.0946044921875, 0.17352294921875, 0.441650390625, 0.70977783203125, 0.9779052734375, 1.24603271484375, 1.51416015625, 1.78228759765625, 2.0504150390625, 2.31854248046875, 2.586669921875, 2.85479736328125, 3.1229248046875, 3.39105224609375, 3.6591796875, 3.92730712890625, 4.1954345703125, 4.46356201171875, 4.731689453125, 4.99981689453125, 5.2679443359375, 5.53607177734375, 5.80419921875, 6.07232666015625, 6.3404541015625, 6.60858154296875, 6.876708984375, 7.14483642578125, 7.4129638671875, 7.68109130859375, 7.94921875]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 6.0, 7.0, 8.0, 7.0, 11.0, 22.0, 27.0, 45.0, 81.0, 123.0, 212.0, 289.0, 486.0, 722.0, 633.0, 510.0, 318.0, 198.0, 93.0, 79.0, 56.0, 41.0, 35.0, 15.0, 11.0, 5.0, 6.0, 9.0, 4.0, 3.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1630859375, -1.1267547607421875, -1.090423583984375, -1.0540924072265625, -1.01776123046875, -0.9814300537109375, -0.945098876953125, -0.9087677001953125, -0.8724365234375, -0.8361053466796875, -0.799774169921875, -0.7634429931640625, -0.72711181640625, -0.6907806396484375, -0.654449462890625, -0.6181182861328125, -0.581787109375, -0.5454559326171875, -0.509124755859375, -0.4727935791015625, -0.43646240234375, -0.4001312255859375, -0.363800048828125, -0.3274688720703125, -0.2911376953125, -0.2548065185546875, -0.218475341796875, -0.1821441650390625, -0.14581298828125, -0.1094818115234375, -0.073150634765625, -0.0368194580078125, -0.00048828125, 0.0358428955078125, 0.072174072265625, 0.1085052490234375, 0.14483642578125, 0.1811676025390625, 0.217498779296875, 0.2538299560546875, 0.2901611328125, 0.3264923095703125, 0.362823486328125, 0.3991546630859375, 0.43548583984375, 0.4718170166015625, 0.508148193359375, 0.5444793701171875, 0.580810546875, 0.6171417236328125, 0.653472900390625, 0.6898040771484375, 0.72613525390625, 0.7624664306640625, 0.798797607421875, 0.8351287841796875, 0.8714599609375, 0.9077911376953125, 0.944122314453125, 0.9804534912109375, 1.01678466796875, 1.0531158447265625, 1.089447021484375, 1.1257781982421875, 1.162109375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 8.0, 10.0, 19.0, 11.0, 21.0, 37.0, 38.0, 62.0, 64.0, 72.0, 94.0, 79.0, 91.0, 89.0, 65.0, 64.0, 50.0, 43.0, 36.0, 19.0, 16.0, 12.0, 2.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-5.423590183258057, -5.30781888961792, -5.192047595977783, -5.076275825500488, -4.960504531860352, -4.844733238220215, -4.728961944580078, -4.613190650939941, -4.497419357299805, -4.381648063659668, -4.265876770019531, -4.1501054763793945, -4.0343337059021, -3.918562412261963, -3.802791118621826, -3.6870198249816895, -3.5712482929229736, -3.455476999282837, -3.339705467224121, -3.2239341735839844, -3.1081628799438477, -2.992391586303711, -2.876620054244995, -2.7608487606048584, -2.6450772285461426, -2.529305934906006, -2.41353440284729, -2.2977631092071533, -2.1819918155670166, -2.066220283508301, -1.950448989868164, -1.8346776962280273, -1.7189065217971802, -1.603135108947754, -1.4873638153076172, -1.371592402458191, -1.2558209896087646, -1.140049695968628, -1.0242782831192017, -0.9085069298744202, -0.7927355766296387, -0.6769642233848572, -0.5611928701400757, -0.4454214572906494, -0.3296501040458679, -0.21387875080108643, -0.09810733795166016, 0.017664015293121338, 0.13343536853790283, 0.24920673668384552, 0.3649781048297882, 0.4807494878768921, 0.5965208411216736, 0.7122921943664551, 0.8280636072158813, 0.9438349604606628, 1.0596063137054443, 1.1753777265548706, 1.2911490201950073, 1.4069204330444336, 1.5226917266845703, 1.6384631395339966, 1.7542345523834229, 1.8700058460235596, 1.9857772588729858]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 6.0, 12.0, 7.0, 7.0, 15.0, 14.0, 19.0, 15.0, 17.0, 24.0, 19.0, 40.0, 31.0, 25.0, 56.0, 42.0, 44.0, 53.0, 35.0, 44.0, 37.0, 43.0, 38.0, 38.0, 38.0, 39.0, 35.0, 32.0, 30.0, 23.0, 23.0, 16.0, 17.0, 20.0, 12.0, 13.0, 5.0, 7.0, 2.0, 2.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.040525436401367, -1.977013349533081, -1.9135013818740845, -1.849989414215088, -1.7864773273468018, -1.7229652404785156, -1.659453272819519, -1.5959413051605225, -1.5324292182922363, -1.4689171314239502, -1.4054051637649536, -1.341893196105957, -1.278381109237671, -1.2148690223693848, -1.1513570547103882, -1.0878450870513916, -1.0243330001831055, -0.9608209729194641, -0.8973089456558228, -0.8337969183921814, -0.77028489112854, -0.7067728638648987, -0.6432608366012573, -0.579748809337616, -0.5162367820739746, -0.45272475481033325, -0.3892127275466919, -0.32570070028305054, -0.2621886730194092, -0.19867664575576782, -0.13516461849212646, -0.07165259122848511, -0.00814056396484375, 0.05537146329879761, 0.11888349056243896, 0.18239551782608032, 0.24590754508972168, 0.30941957235336304, 0.3729315996170044, 0.43644362688064575, 0.4999556541442871, 0.5634676814079285, 0.6269797086715698, 0.6904917359352112, 0.7540037631988525, 0.8175157904624939, 0.8810278177261353, 0.9445398449897766, 1.008051872253418, 1.071563959121704, 1.1350759267807007, 1.1985878944396973, 1.2620999813079834, 1.3256120681762695, 1.3891240358352661, 1.4526360034942627, 1.5161480903625488, 1.579660177230835, 1.6431721448898315, 1.7066841125488281, 1.7701961994171143, 1.8337082862854004, 1.897220253944397, 1.9607322216033936, 2.0242443084716797]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 0.0, 2.0, 7.0, 6.0, 5.0, 9.0, 14.0, 23.0, 33.0, 52.0, 68.0, 121.0, 143.0, 282.0, 594.0, 1190.0, 3126.0, 8625.0, 29007.0, 102518.0, 300760.0, 376551.0, 158284.0, 45782.0, 13447.0, 4431.0, 1794.0, 723.0, 371.0, 192.0, 147.0, 73.0, 59.0, 43.0, 21.0, 19.0, 14.0, 8.0, 4.0, 5.0, 0.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.455322265625, -0.4385719299316406, -0.42182159423828125, -0.4050712585449219, -0.3883209228515625, -0.3715705871582031, -0.35482025146484375, -0.3380699157714844, -0.321319580078125, -0.3045692443847656, -0.28781890869140625, -0.2710685729980469, -0.2543182373046875, -0.23756790161132812, -0.22081756591796875, -0.20406723022460938, -0.18731689453125, -0.17056655883789062, -0.15381622314453125, -0.13706588745117188, -0.1203155517578125, -0.10356521606445312, -0.08681488037109375, -0.07006454467773438, -0.053314208984375, -0.036563873291015625, -0.01981353759765625, -0.003063201904296875, 0.0136871337890625, 0.030437469482421875, 0.04718780517578125, 0.06393814086914062, 0.0806884765625, 0.09743881225585938, 0.11418914794921875, 0.13093948364257812, 0.1476898193359375, 0.16444015502929688, 0.18119049072265625, 0.19794082641601562, 0.214691162109375, 0.23144149780273438, 0.24819183349609375, 0.2649421691894531, 0.2816925048828125, 0.2984428405761719, 0.31519317626953125, 0.3319435119628906, 0.34869384765625, 0.3654441833496094, 0.38219451904296875, 0.3989448547363281, 0.4156951904296875, 0.4324455261230469, 0.44919586181640625, 0.4659461975097656, 0.482696533203125, 0.4994468688964844, 0.5161972045898438, 0.5329475402832031, 0.5496978759765625, 0.5664482116699219, 0.5831985473632812, 0.5999488830566406, 0.61669921875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 4.0, 3.0, 6.0, 10.0, 18.0, 16.0, 15.0, 22.0, 19.0, 32.0, 34.0, 47.0, 50.0, 41.0, 45.0, 66.0, 56.0, 48.0, 55.0, 52.0, 51.0, 47.0, 43.0, 37.0, 35.0, 26.0, 26.0, 17.0, 18.0, 20.0, 16.0, 8.0, 7.0, 2.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2578125, -1.2117919921875, -1.165771484375, -1.1197509765625, -1.07373046875, -1.0277099609375, -0.981689453125, -0.9356689453125, -0.8896484375, -0.8436279296875, -0.797607421875, -0.7515869140625, -0.70556640625, -0.6595458984375, -0.613525390625, -0.5675048828125, -0.521484375, -0.4754638671875, -0.429443359375, -0.3834228515625, -0.33740234375, -0.2913818359375, -0.245361328125, -0.1993408203125, -0.1533203125, -0.1072998046875, -0.061279296875, -0.0152587890625, 0.03076171875, 0.0767822265625, 0.122802734375, 0.1688232421875, 0.21484375, 0.2608642578125, 0.306884765625, 0.3529052734375, 0.39892578125, 0.4449462890625, 0.490966796875, 0.5369873046875, 0.5830078125, 0.6290283203125, 0.675048828125, 0.7210693359375, 0.76708984375, 0.8131103515625, 0.859130859375, 0.9051513671875, 0.951171875, 0.9971923828125, 1.043212890625, 1.0892333984375, 1.13525390625, 1.1812744140625, 1.227294921875, 1.2733154296875, 1.3193359375, 1.3653564453125, 1.411376953125, 1.4573974609375, 1.50341796875, 1.5494384765625, 1.595458984375, 1.6414794921875, 1.6875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 7.0, 7.0, 4.0, 10.0, 7.0, 17.0, 25.0, 55.0, 79.0, 143.0, 321.0, 621.0, 1369.0, 3162.0, 7242.0, 16803.0, 39330.0, 88686.0, 178670.0, 268726.0, 224052.0, 120951.0, 56029.0, 24308.0, 10087.0, 4269.0, 1859.0, 883.0, 409.0, 179.0, 95.0, 57.0, 32.0, 22.0, 18.0, 11.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.298828125, -0.2899627685546875, -0.281097412109375, -0.2722320556640625, -0.26336669921875, -0.2545013427734375, -0.245635986328125, -0.2367706298828125, -0.2279052734375, -0.2190399169921875, -0.210174560546875, -0.2013092041015625, -0.19244384765625, -0.1835784912109375, -0.174713134765625, -0.1658477783203125, -0.156982421875, -0.1481170654296875, -0.139251708984375, -0.1303863525390625, -0.12152099609375, -0.1126556396484375, -0.103790283203125, -0.0949249267578125, -0.0860595703125, -0.0771942138671875, -0.068328857421875, -0.0594635009765625, -0.05059814453125, -0.0417327880859375, -0.032867431640625, -0.0240020751953125, -0.01513671875, -0.0062713623046875, 0.002593994140625, 0.0114593505859375, 0.02032470703125, 0.0291900634765625, 0.038055419921875, 0.0469207763671875, 0.0557861328125, 0.0646514892578125, 0.073516845703125, 0.0823822021484375, 0.09124755859375, 0.1001129150390625, 0.108978271484375, 0.1178436279296875, 0.126708984375, 0.1355743408203125, 0.144439697265625, 0.1533050537109375, 0.16217041015625, 0.1710357666015625, 0.179901123046875, 0.1887664794921875, 0.1976318359375, 0.2064971923828125, 0.215362548828125, 0.2242279052734375, 0.23309326171875, 0.2419586181640625, 0.250823974609375, 0.2596893310546875, 0.2685546875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 6.0, 10.0, 6.0, 10.0, 10.0, 13.0, 9.0, 19.0, 21.0, 24.0, 45.0, 46.0, 50.0, 50.0, 52.0, 48.0, 50.0, 65.0, 57.0, 58.0, 46.0, 49.0, 38.0, 41.0, 44.0, 24.0, 18.0, 19.0, 16.0, 20.0, 6.0, 8.0, 7.0, 2.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.291015625, -3.200286865234375, -3.10955810546875, -3.018829345703125, -2.9281005859375, -2.837371826171875, -2.74664306640625, -2.655914306640625, -2.565185546875, -2.474456787109375, -2.38372802734375, -2.292999267578125, -2.2022705078125, -2.111541748046875, -2.02081298828125, -1.930084228515625, -1.83935546875, -1.748626708984375, -1.65789794921875, -1.567169189453125, -1.4764404296875, -1.385711669921875, -1.29498291015625, -1.204254150390625, -1.113525390625, -1.022796630859375, -0.93206787109375, -0.841339111328125, -0.7506103515625, -0.659881591796875, -0.56915283203125, -0.478424072265625, -0.3876953125, -0.296966552734375, -0.20623779296875, -0.115509033203125, -0.0247802734375, 0.065948486328125, 0.15667724609375, 0.247406005859375, 0.338134765625, 0.428863525390625, 0.51959228515625, 0.610321044921875, 0.7010498046875, 0.791778564453125, 0.88250732421875, 0.973236083984375, 1.06396484375, 1.154693603515625, 1.24542236328125, 1.336151123046875, 1.4268798828125, 1.517608642578125, 1.60833740234375, 1.699066162109375, 1.789794921875, 1.880523681640625, 1.97125244140625, 2.061981201171875, 2.1527099609375, 2.243438720703125, 2.33416748046875, 2.424896240234375, 2.515625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 5.0, 13.0, 17.0, 14.0, 35.0, 50.0, 69.0, 130.0, 279.0, 533.0, 1243.0, 3502.0, 13485.0, 83604.0, 588421.0, 307376.0, 38151.0, 7538.0, 2298.0, 903.0, 369.0, 207.0, 107.0, 96.0, 42.0, 16.0, 11.0, 11.0, 12.0, 5.0, 3.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.2020263671875, -0.19653701782226562, -0.19104766845703125, -0.18555831909179688, -0.1800689697265625, -0.17457962036132812, -0.16909027099609375, -0.16360092163085938, -0.158111572265625, -0.15262222290039062, -0.14713287353515625, -0.14164352416992188, -0.1361541748046875, -0.13066482543945312, -0.12517547607421875, -0.11968612670898438, -0.11419677734375, -0.10870742797851562, -0.10321807861328125, -0.09772872924804688, -0.0922393798828125, -0.08675003051757812, -0.08126068115234375, -0.07577133178710938, -0.070281982421875, -0.06479263305664062, -0.05930328369140625, -0.053813934326171875, -0.0483245849609375, -0.042835235595703125, -0.03734588623046875, -0.031856536865234375, -0.0263671875, -0.020877838134765625, -0.01538848876953125, -0.009899139404296875, -0.0044097900390625, 0.001079559326171875, 0.00656890869140625, 0.012058258056640625, 0.017547607421875, 0.023036956787109375, 0.02852630615234375, 0.034015655517578125, 0.0395050048828125, 0.044994354248046875, 0.05048370361328125, 0.055973052978515625, 0.06146240234375, 0.06695175170898438, 0.07244110107421875, 0.07793045043945312, 0.0834197998046875, 0.08890914916992188, 0.09439849853515625, 0.09988784790039062, 0.105377197265625, 0.11086654663085938, 0.11635589599609375, 0.12184524536132812, 0.1273345947265625, 0.13282394409179688, 0.13831329345703125, 0.14380264282226562, 0.1492919921875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 4.0, 4.0, 11.0, 9.0, 8.0, 16.0, 18.0, 24.0, 41.0, 35.0, 59.0, 52.0, 61.0, 61.0, 72.0, 88.0, 61.0, 79.0, 57.0, 49.0, 33.0, 22.0, 26.0, 31.0, 14.0, 20.0, 9.0, 7.0, 8.0, 2.0, 3.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.6253204345703125e-05, -4.474259912967682e-05, -4.323199391365051e-05, -4.1721388697624207e-05, -4.02107834815979e-05, -3.8700178265571594e-05, -3.718957304954529e-05, -3.567896783351898e-05, -3.4168362617492676e-05, -3.265775740146637e-05, -3.1147152185440063e-05, -2.9636546969413757e-05, -2.812594175338745e-05, -2.6615336537361145e-05, -2.510473132133484e-05, -2.3594126105308533e-05, -2.2083520889282227e-05, -2.057291567325592e-05, -1.9062310457229614e-05, -1.7551705241203308e-05, -1.6041100025177002e-05, -1.4530494809150696e-05, -1.301988959312439e-05, -1.1509284377098083e-05, -9.998679161071777e-06, -8.488073945045471e-06, -6.977468729019165e-06, -5.466863512992859e-06, -3.956258296966553e-06, -2.4456530809402466e-06, -9.350478649139404e-07, 5.755573511123657e-07, 2.086162567138672e-06, 3.596767783164978e-06, 5.107372999191284e-06, 6.61797821521759e-06, 8.128583431243896e-06, 9.639188647270203e-06, 1.1149793863296509e-05, 1.2660399079322815e-05, 1.4171004295349121e-05, 1.5681609511375427e-05, 1.7192214727401733e-05, 1.870281994342804e-05, 2.0213425159454346e-05, 2.1724030375480652e-05, 2.3234635591506958e-05, 2.4745240807533264e-05, 2.625584602355957e-05, 2.7766451239585876e-05, 2.9277056455612183e-05, 3.078766167163849e-05, 3.2298266887664795e-05, 3.38088721036911e-05, 3.531947731971741e-05, 3.683008253574371e-05, 3.834068775177002e-05, 3.9851292967796326e-05, 4.136189818382263e-05, 4.287250339984894e-05, 4.4383108615875244e-05, 4.589371383190155e-05, 4.7404319047927856e-05, 4.891492426395416e-05, 5.042552947998047e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 6.0, 10.0, 7.0, 14.0, 18.0, 26.0, 34.0, 58.0, 67.0, 131.0, 196.0, 319.0, 627.0, 1210.0, 2511.0, 5883.0, 15274.0, 45725.0, 174186.0, 514333.0, 206467.0, 52394.0, 16792.0, 6458.0, 2840.0, 1346.0, 666.0, 335.0, 209.0, 138.0, 68.0, 45.0, 43.0, 29.0, 31.0, 14.0, 7.0, 6.0, 7.0, 9.0, 5.0, 6.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.17236328125, -0.1676483154296875, -0.162933349609375, -0.1582183837890625, -0.15350341796875, -0.1487884521484375, -0.144073486328125, -0.1393585205078125, -0.1346435546875, -0.1299285888671875, -0.125213623046875, -0.1204986572265625, -0.11578369140625, -0.1110687255859375, -0.106353759765625, -0.1016387939453125, -0.096923828125, -0.0922088623046875, -0.087493896484375, -0.0827789306640625, -0.07806396484375, -0.0733489990234375, -0.068634033203125, -0.0639190673828125, -0.0592041015625, -0.0544891357421875, -0.049774169921875, -0.0450592041015625, -0.04034423828125, -0.0356292724609375, -0.030914306640625, -0.0261993408203125, -0.021484375, -0.0167694091796875, -0.012054443359375, -0.0073394775390625, -0.00262451171875, 0.0020904541015625, 0.006805419921875, 0.0115203857421875, 0.0162353515625, 0.0209503173828125, 0.025665283203125, 0.0303802490234375, 0.03509521484375, 0.0398101806640625, 0.044525146484375, 0.0492401123046875, 0.053955078125, 0.0586700439453125, 0.063385009765625, 0.0680999755859375, 0.07281494140625, 0.0775299072265625, 0.082244873046875, 0.0869598388671875, 0.0916748046875, 0.0963897705078125, 0.101104736328125, 0.1058197021484375, 0.11053466796875, 0.1152496337890625, 0.119964599609375, 0.1246795654296875, 0.12939453125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 1.0, 4.0, 9.0, 4.0, 8.0, 9.0, 10.0, 12.0, 26.0, 27.0, 29.0, 66.0, 102.0, 109.0, 127.0, 97.0, 105.0, 72.0, 50.0, 28.0, 24.0, 23.0, 18.0, 10.0, 8.0, 7.0, 6.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.036651611328125, -0.03532838821411133, -0.034005165100097656, -0.032681941986083984, -0.03135871887207031, -0.03003549575805664, -0.02871227264404297, -0.027389049530029297, -0.026065826416015625, -0.024742603302001953, -0.02341938018798828, -0.02209615707397461, -0.020772933959960938, -0.019449710845947266, -0.018126487731933594, -0.016803264617919922, -0.01548004150390625, -0.014156818389892578, -0.012833595275878906, -0.011510372161865234, -0.010187149047851562, -0.00886392593383789, -0.007540702819824219, -0.006217479705810547, -0.004894256591796875, -0.003571033477783203, -0.0022478103637695312, -0.0009245872497558594, 0.0003986358642578125, 0.0017218589782714844, 0.0030450820922851562, 0.004368305206298828, 0.0056915283203125, 0.007014751434326172, 0.008337974548339844, 0.009661197662353516, 0.010984420776367188, 0.01230764389038086, 0.013630867004394531, 0.014954090118408203, 0.016277313232421875, 0.017600536346435547, 0.01892375946044922, 0.02024698257446289, 0.021570205688476562, 0.022893428802490234, 0.024216651916503906, 0.025539875030517578, 0.02686309814453125, 0.028186321258544922, 0.029509544372558594, 0.030832767486572266, 0.03215599060058594, 0.03347921371459961, 0.03480243682861328, 0.03612565994262695, 0.037448883056640625, 0.0387721061706543, 0.04009532928466797, 0.04141855239868164, 0.04274177551269531, 0.044064998626708984, 0.045388221740722656, 0.04671144485473633, 0.04803466796875]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 11.0, 16.0, 21.0, 33.0, 48.0, 53.0, 68.0, 82.0, 99.0, 79.0, 119.0, 89.0, 82.0, 65.0, 55.0, 25.0, 22.0, 18.0, 8.0, 6.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.6389849185943604, -2.5651090145111084, -2.4912331104278564, -2.4173572063446045, -2.3434813022613525, -2.2696056365966797, -2.1957297325134277, -2.121853828430176, -2.047977924346924, -1.9741020202636719, -1.90022611618042, -1.826350212097168, -1.7524744272232056, -1.6785985231399536, -1.6047226190567017, -1.5308468341827393, -1.4569708108901978, -1.3830949068069458, -1.3092190027236938, -1.2353432178497314, -1.1614673137664795, -1.0875914096832275, -1.0137155055999756, -0.9398396611213684, -0.8659637570381165, -0.7920878529548645, -0.7182120084762573, -0.6443361043930054, -0.5704602003097534, -0.49658435583114624, -0.4227084517478943, -0.3488326072692871, -0.27495670318603516, -0.2010808289051056, -0.12720493972301483, -0.05332905054092407, 0.020546823740005493, 0.09442269802093506, 0.168298602104187, 0.2421744465827942, 0.31605035066604614, 0.3899262249469757, 0.4638020992279053, 0.5376780033111572, 0.6115539073944092, 0.6854297518730164, 0.7593056559562683, 0.8331815004348755, 0.9070574045181274, 0.9809333086013794, 1.0548092126846313, 1.1286849975585938, 1.2025609016418457, 1.2764368057250977, 1.3503127098083496, 1.4241886138916016, 1.4980645179748535, 1.5719404220581055, 1.6458163261413574, 1.7196922302246094, 1.7935680150985718, 1.8674439191818237, 1.9413198232650757, 2.015195608139038, 2.08907151222229]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 0.0, 1.0, 5.0, 1.0, 10.0, 8.0, 16.0, 8.0, 16.0, 19.0, 19.0, 19.0, 18.0, 32.0, 45.0, 37.0, 50.0, 46.0, 55.0, 51.0, 40.0, 56.0, 34.0, 50.0, 46.0, 45.0, 31.0, 44.0, 38.0, 30.0, 27.0, 20.0, 19.0, 17.0, 17.0, 9.0, 11.0, 3.0, 4.0, 2.0, 2.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.1370736360549927, -1.0966190099716187, -1.0561643838882446, -1.0157097578048706, -0.9752551317214966, -0.9348005056381226, -0.8943458199501038, -0.8538911938667297, -0.8134365677833557, -0.7729819416999817, -0.7325273156166077, -0.6920726895332336, -0.6516180038452148, -0.6111633777618408, -0.5707087516784668, -0.5302541255950928, -0.48979949951171875, -0.4493448734283447, -0.4088902473449707, -0.3684355914592743, -0.32798096537590027, -0.28752633929252625, -0.24707169830799103, -0.2066170573234558, -0.1661624312400818, -0.12570780515670776, -0.08525316417217255, -0.044798530638217926, -0.004343897104263306, 0.03611072897911072, 0.07656536996364594, 0.11702001094818115, 0.15747475624084473, 0.19792938232421875, 0.23838402330875397, 0.2788386642932892, 0.3192932903766632, 0.35974791646003723, 0.40020257234573364, 0.44065719842910767, 0.4811118245124817, 0.5215664505958557, 0.5620210766792297, 0.6024757027626038, 0.6429303884506226, 0.6833850145339966, 0.7238396406173706, 0.7642942667007446, 0.8047488927841187, 0.8452035188674927, 0.8856581449508667, 0.9261127710342407, 0.9665673971176147, 1.0070220232009888, 1.0474766492843628, 1.0879313945770264, 1.1283860206604004, 1.1688406467437744, 1.2092952728271484, 1.2497498989105225, 1.2902045249938965, 1.3306591510772705, 1.3711137771606445, 1.4115684032440186, 1.4520230293273926]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 4.0, 5.0, 13.0, 10.0, 14.0, 27.0, 44.0, 39.0, 52.0, 80.0, 139.0, 186.0, 291.0, 543.0, 978.0, 1823.0, 3865.0, 8047.0, 17563.0, 40214.0, 96479.0, 259826.0, 362289.0, 149591.0, 58670.0, 25368.0, 11291.0, 5376.0, 2560.0, 1270.0, 736.0, 424.0, 245.0, 144.0, 96.0, 73.0, 51.0, 32.0, 25.0, 16.0, 11.0, 11.0, 6.0, 6.0, 11.0, 5.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.49609375, -1.4449005126953125, -1.393707275390625, -1.3425140380859375, -1.29132080078125, -1.2401275634765625, -1.188934326171875, -1.1377410888671875, -1.0865478515625, -1.0353546142578125, -0.984161376953125, -0.9329681396484375, -0.88177490234375, -0.8305816650390625, -0.779388427734375, -0.7281951904296875, -0.677001953125, -0.6258087158203125, -0.574615478515625, -0.5234222412109375, -0.47222900390625, -0.4210357666015625, -0.369842529296875, -0.3186492919921875, -0.2674560546875, -0.2162628173828125, -0.165069580078125, -0.1138763427734375, -0.06268310546875, -0.0114898681640625, 0.039703369140625, 0.0908966064453125, 0.14208984375, 0.1932830810546875, 0.244476318359375, 0.2956695556640625, 0.34686279296875, 0.3980560302734375, 0.449249267578125, 0.5004425048828125, 0.5516357421875, 0.6028289794921875, 0.654022216796875, 0.7052154541015625, 0.75640869140625, 0.8076019287109375, 0.858795166015625, 0.9099884033203125, 0.961181640625, 1.0123748779296875, 1.063568115234375, 1.1147613525390625, 1.16595458984375, 1.2171478271484375, 1.268341064453125, 1.3195343017578125, 1.3707275390625, 1.4219207763671875, 1.473114013671875, 1.5243072509765625, 1.57550048828125, 1.6266937255859375, 1.677886962890625, 1.7290802001953125, 1.7802734375]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 5.0, 0.0, 1.0, 3.0, 3.0, 8.0, 17.0, 15.0, 14.0, 11.0, 19.0, 29.0, 26.0, 36.0, 38.0, 30.0, 52.0, 42.0, 46.0, 57.0, 41.0, 54.0, 55.0, 40.0, 48.0, 47.0, 39.0, 41.0, 36.0, 27.0, 19.0, 28.0, 25.0, 10.0, 9.0, 4.0, 9.0, 8.0, 5.0, 5.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3359375, -2.25286865234375, -2.1697998046875, -2.08673095703125, -2.003662109375, -1.92059326171875, -1.8375244140625, -1.75445556640625, -1.67138671875, -1.58831787109375, -1.5052490234375, -1.42218017578125, -1.339111328125, -1.25604248046875, -1.1729736328125, -1.08990478515625, -1.0068359375, -0.92376708984375, -0.8406982421875, -0.75762939453125, -0.674560546875, -0.59149169921875, -0.5084228515625, -0.42535400390625, -0.34228515625, -0.25921630859375, -0.1761474609375, -0.09307861328125, -0.010009765625, 0.07305908203125, 0.1561279296875, 0.23919677734375, 0.322265625, 0.40533447265625, 0.4884033203125, 0.57147216796875, 0.654541015625, 0.73760986328125, 0.8206787109375, 0.90374755859375, 0.98681640625, 1.06988525390625, 1.1529541015625, 1.23602294921875, 1.319091796875, 1.40216064453125, 1.4852294921875, 1.56829833984375, 1.6513671875, 1.73443603515625, 1.8175048828125, 1.90057373046875, 1.983642578125, 2.06671142578125, 2.1497802734375, 2.23284912109375, 2.31591796875, 2.39898681640625, 2.4820556640625, 2.56512451171875, 2.648193359375, 2.73126220703125, 2.8143310546875, 2.89739990234375, 2.98046875]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 8.0, 6.0, 7.0, 13.0, 14.0, 26.0, 19.0, 55.0, 72.0, 119.0, 202.0, 445.0, 1081.0, 3596.0, 21069.0, 207134.0, 710047.0, 90017.0, 10814.0, 2220.0, 772.0, 334.0, 173.0, 101.0, 73.0, 45.0, 23.0, 15.0, 11.0, 7.0, 8.0, 9.0, 4.0, 5.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.11328125, -3.9776611328125, -3.842041015625, -3.7064208984375, -3.57080078125, -3.4351806640625, -3.299560546875, -3.1639404296875, -3.0283203125, -2.8927001953125, -2.757080078125, -2.6214599609375, -2.48583984375, -2.3502197265625, -2.214599609375, -2.0789794921875, -1.943359375, -1.8077392578125, -1.672119140625, -1.5364990234375, -1.40087890625, -1.2652587890625, -1.129638671875, -0.9940185546875, -0.8583984375, -0.7227783203125, -0.587158203125, -0.4515380859375, -0.31591796875, -0.1802978515625, -0.044677734375, 0.0909423828125, 0.2265625, 0.3621826171875, 0.497802734375, 0.6334228515625, 0.76904296875, 0.9046630859375, 1.040283203125, 1.1759033203125, 1.3115234375, 1.4471435546875, 1.582763671875, 1.7183837890625, 1.85400390625, 1.9896240234375, 2.125244140625, 2.2608642578125, 2.396484375, 2.5321044921875, 2.667724609375, 2.8033447265625, 2.93896484375, 3.0745849609375, 3.210205078125, 3.3458251953125, 3.4814453125, 3.6170654296875, 3.752685546875, 3.8883056640625, 4.02392578125, 4.1595458984375, 4.295166015625, 4.4307861328125, 4.56640625]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 5.0, 7.0, 3.0, 8.0, 20.0, 14.0, 15.0, 28.0, 25.0, 43.0, 47.0, 48.0, 52.0, 62.0, 56.0, 71.0, 69.0, 68.0, 53.0, 48.0, 40.0, 48.0, 29.0, 30.0, 22.0, 19.0, 18.0, 15.0, 11.0, 13.0, 5.0, 6.0, 4.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.337890625, -3.222869873046875, -3.10784912109375, -2.992828369140625, -2.8778076171875, -2.762786865234375, -2.64776611328125, -2.532745361328125, -2.417724609375, -2.302703857421875, -2.18768310546875, -2.072662353515625, -1.9576416015625, -1.842620849609375, -1.72760009765625, -1.612579345703125, -1.49755859375, -1.382537841796875, -1.26751708984375, -1.152496337890625, -1.0374755859375, -0.922454833984375, -0.80743408203125, -0.692413330078125, -0.577392578125, -0.462371826171875, -0.34735107421875, -0.232330322265625, -0.1173095703125, -0.002288818359375, 0.11273193359375, 0.227752685546875, 0.3427734375, 0.457794189453125, 0.57281494140625, 0.687835693359375, 0.8028564453125, 0.917877197265625, 1.03289794921875, 1.147918701171875, 1.262939453125, 1.377960205078125, 1.49298095703125, 1.608001708984375, 1.7230224609375, 1.838043212890625, 1.95306396484375, 2.068084716796875, 2.18310546875, 2.298126220703125, 2.41314697265625, 2.528167724609375, 2.6431884765625, 2.758209228515625, 2.87322998046875, 2.988250732421875, 3.103271484375, 3.218292236328125, 3.33331298828125, 3.448333740234375, 3.5633544921875, 3.678375244140625, 3.79339599609375, 3.908416748046875, 4.0234375]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 4.0, 2.0, 5.0, 5.0, 11.0, 15.0, 29.0, 54.0, 104.0, 216.0, 544.0, 1404.0, 4249.0, 21788.0, 220218.0, 712976.0, 73006.0, 9796.0, 2548.0, 903.0, 365.0, 146.0, 69.0, 45.0, 19.0, 12.0, 8.0, 4.0, 6.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.521484375, -1.4743499755859375, -1.427215576171875, -1.3800811767578125, -1.33294677734375, -1.2858123779296875, -1.238677978515625, -1.1915435791015625, -1.1444091796875, -1.0972747802734375, -1.050140380859375, -1.0030059814453125, -0.95587158203125, -0.9087371826171875, -0.861602783203125, -0.8144683837890625, -0.767333984375, -0.7201995849609375, -0.673065185546875, -0.6259307861328125, -0.57879638671875, -0.5316619873046875, -0.484527587890625, -0.4373931884765625, -0.3902587890625, -0.3431243896484375, -0.295989990234375, -0.2488555908203125, -0.20172119140625, -0.1545867919921875, -0.107452392578125, -0.0603179931640625, -0.01318359375, 0.0339508056640625, 0.081085205078125, 0.1282196044921875, 0.17535400390625, 0.2224884033203125, 0.269622802734375, 0.3167572021484375, 0.3638916015625, 0.4110260009765625, 0.458160400390625, 0.5052947998046875, 0.55242919921875, 0.5995635986328125, 0.646697998046875, 0.6938323974609375, 0.740966796875, 0.7881011962890625, 0.835235595703125, 0.8823699951171875, 0.92950439453125, 0.9766387939453125, 1.023773193359375, 1.0709075927734375, 1.1180419921875, 1.1651763916015625, 1.212310791015625, 1.2594451904296875, 1.30657958984375, 1.3537139892578125, 1.400848388671875, 1.4479827880859375, 1.4951171875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 7.0, 8.0, 8.0, 15.0, 12.0, 21.0, 32.0, 44.0, 53.0, 74.0, 115.0, 140.0, 142.0, 98.0, 51.0, 54.0, 42.0, 27.0, 14.0, 14.0, 10.0, 2.0, 8.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0002415180206298828, -0.00023513101041316986, -0.0002287440001964569, -0.00022235698997974396, -0.000215969979763031, -0.00020958296954631805, -0.0002031959593296051, -0.00019680894911289215, -0.0001904219388961792, -0.00018403492867946625, -0.0001776479184627533, -0.00017126090824604034, -0.0001648738980293274, -0.00015848688781261444, -0.0001520998775959015, -0.00014571286737918854, -0.00013932585716247559, -0.00013293884694576263, -0.00012655183672904968, -0.00012016482651233673, -0.00011377781629562378, -0.00010739080607891083, -0.00010100379586219788, -9.461678564548492e-05, -8.822977542877197e-05, -8.184276521205902e-05, -7.545575499534607e-05, -6.906874477863312e-05, -6.268173456192017e-05, -5.6294724345207214e-05, -4.990771412849426e-05, -4.352070391178131e-05, -3.713369369506836e-05, -3.074668347835541e-05, -2.4359673261642456e-05, -1.7972663044929504e-05, -1.1585652828216553e-05, -5.198642611503601e-06, 1.1883676052093506e-06, 7.575377821922302e-06, 1.3962388038635254e-05, 2.0349398255348206e-05, 2.6736408472061157e-05, 3.312341868877411e-05, 3.951042890548706e-05, 4.589743912220001e-05, 5.2284449338912964e-05, 5.8671459555625916e-05, 6.505846977233887e-05, 7.144547998905182e-05, 7.783249020576477e-05, 8.421950042247772e-05, 9.060651063919067e-05, 9.699352085590363e-05, 0.00010338053107261658, 0.00010976754128932953, 0.00011615455150604248, 0.00012254156172275543, 0.00012892857193946838, 0.00013531558215618134, 0.0001417025923728943, 0.00014808960258960724, 0.0001544766128063202, 0.00016086362302303314, 0.0001672506332397461]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 9.0, 8.0, 4.0, 11.0, 15.0, 24.0, 34.0, 53.0, 125.0, 230.0, 534.0, 1162.0, 3042.0, 8827.0, 38550.0, 291922.0, 596845.0, 84103.0, 15326.0, 4516.0, 1751.0, 725.0, 339.0, 163.0, 94.0, 39.0, 23.0, 21.0, 15.0, 11.0, 6.0, 6.0, 4.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.265625, -1.2222900390625, -1.178955078125, -1.1356201171875, -1.09228515625, -1.0489501953125, -1.005615234375, -0.9622802734375, -0.9189453125, -0.8756103515625, -0.832275390625, -0.7889404296875, -0.74560546875, -0.7022705078125, -0.658935546875, -0.6156005859375, -0.572265625, -0.5289306640625, -0.485595703125, -0.4422607421875, -0.39892578125, -0.3555908203125, -0.312255859375, -0.2689208984375, -0.2255859375, -0.1822509765625, -0.138916015625, -0.0955810546875, -0.05224609375, -0.0089111328125, 0.034423828125, 0.0777587890625, 0.12109375, 0.1644287109375, 0.207763671875, 0.2510986328125, 0.29443359375, 0.3377685546875, 0.381103515625, 0.4244384765625, 0.4677734375, 0.5111083984375, 0.554443359375, 0.5977783203125, 0.64111328125, 0.6844482421875, 0.727783203125, 0.7711181640625, 0.814453125, 0.8577880859375, 0.901123046875, 0.9444580078125, 0.98779296875, 1.0311279296875, 1.074462890625, 1.1177978515625, 1.1611328125, 1.2044677734375, 1.247802734375, 1.2911376953125, 1.33447265625, 1.3778076171875, 1.421142578125, 1.4644775390625, 1.5078125]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 4.0, 4.0, 4.0, 9.0, 2.0, 4.0, 8.0, 12.0, 10.0, 13.0, 14.0, 17.0, 24.0, 42.0, 38.0, 55.0, 62.0, 70.0, 64.0, 85.0, 67.0, 79.0, 65.0, 55.0, 47.0, 24.0, 24.0, 22.0, 17.0, 13.0, 13.0, 9.0, 7.0, 6.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.469970703125, -0.4574317932128906, -0.44489288330078125, -0.4323539733886719, -0.4198150634765625, -0.4072761535644531, -0.39473724365234375, -0.3821983337402344, -0.369659423828125, -0.3571205139160156, -0.34458160400390625, -0.3320426940917969, -0.3195037841796875, -0.3069648742675781, -0.29442596435546875, -0.2818870544433594, -0.26934814453125, -0.2568092346191406, -0.24427032470703125, -0.23173141479492188, -0.2191925048828125, -0.20665359497070312, -0.19411468505859375, -0.18157577514648438, -0.169036865234375, -0.15649795532226562, -0.14395904541015625, -0.13142013549804688, -0.1188812255859375, -0.10634231567382812, -0.09380340576171875, -0.08126449584960938, -0.0687255859375, -0.056186676025390625, -0.04364776611328125, -0.031108856201171875, -0.0185699462890625, -0.006031036376953125, 0.00650787353515625, 0.019046783447265625, 0.031585693359375, 0.044124603271484375, 0.05666351318359375, 0.06920242309570312, 0.0817413330078125, 0.09428024291992188, 0.10681915283203125, 0.11935806274414062, 0.13189697265625, 0.14443588256835938, 0.15697479248046875, 0.16951370239257812, 0.1820526123046875, 0.19459152221679688, 0.20713043212890625, 0.21966934204101562, 0.232208251953125, 0.24474716186523438, 0.25728607177734375, 0.2698249816894531, 0.2823638916015625, 0.2949028015136719, 0.30744171142578125, 0.3199806213378906, 0.33251953125]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 16.0, 31.0, 91.0, 145.0, 213.0, 230.0, 155.0, 81.0, 26.0, 16.0, 4.0, 2.0, 0.0, 1.0, 1.0], "bins": [-20.0159912109375, -19.64496421813965, -19.273935317993164, -18.902908325195312, -18.53188133239746, -18.160852432250977, -17.789825439453125, -17.418798446655273, -17.047771453857422, -16.67674446105957, -16.305715560913086, -15.934688568115234, -15.563661575317383, -15.192633628845215, -14.821605682373047, -14.450578689575195, -14.079549789428711, -13.708521842956543, -13.337494850158691, -12.966466903686523, -12.595439910888672, -12.224411964416504, -11.853384017944336, -11.482357025146484, -11.111329078674316, -10.740301132202148, -10.369274139404297, -9.998246192932129, -9.627218246459961, -9.25619125366211, -8.885163307189941, -8.514135360717773, -8.143108367919922, -7.772080898284912, -7.401053428649902, -7.030025482177734, -6.658998012542725, -6.287970542907715, -5.916942596435547, -5.545915126800537, -5.174887657165527, -4.803860187530518, -4.432832717895508, -4.06180477142334, -3.69077730178833, -3.3197498321533203, -2.9487221240997314, -2.5776944160461426, -2.206666946411133, -1.8356393575668335, -1.4646117687225342, -1.0935841798782349, -0.7225565910339355, -0.35152900218963623, 0.019498586654663086, 0.39052629470825195, 0.7615537643432617, 1.132581353187561, 1.5036089420318604, 1.8746365308761597, 2.245664119720459, 2.6166915893554688, 2.9877192974090576, 3.3587470054626465, 3.7297744750976562]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 6.0, 6.0, 13.0, 17.0, 8.0, 24.0, 19.0, 26.0, 29.0, 28.0, 29.0, 34.0, 36.0, 43.0, 51.0, 50.0, 42.0, 61.0, 44.0, 41.0, 40.0, 49.0, 33.0, 33.0, 38.0, 41.0, 29.0, 12.0, 22.0, 30.0, 20.0, 12.0, 10.0, 8.0, 5.0, 1.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-5.846386909484863, -5.69079065322876, -5.5351948738098145, -5.379598617553711, -5.224002361297607, -5.068406105041504, -4.912810325622559, -4.757214069366455, -4.601617813110352, -4.446021556854248, -4.290425777435303, -4.134829521179199, -3.9792332649230957, -3.8236372470855713, -3.668041229248047, -3.5124449729919434, -3.356848955154419, -3.2012529373168945, -3.045656681060791, -2.8900606632232666, -2.734464406967163, -2.5788683891296387, -2.423272132873535, -2.2676761150360107, -2.1120800971984863, -1.9564839601516724, -1.8008878231048584, -1.645291805267334, -1.4896955490112305, -1.334099531173706, -1.178503394126892, -1.0229072570800781, -0.8673110008239746, -0.7117148637771606, -0.5561187267303467, -0.4005226492881775, -0.24492651224136353, -0.08933037519454956, 0.06626570224761963, 0.2218618392944336, 0.37745797634124756, 0.5330541133880615, 0.6886502504348755, 0.8442463278770447, 0.9998424649238586, 1.1554386615753174, 1.3110346794128418, 1.4666308164596558, 1.6222269535064697, 1.7778230905532837, 1.9334192276000977, 2.089015245437622, 2.2446115016937256, 2.40020751953125, 2.5558037757873535, 2.711399793624878, 2.8669958114624023, 3.0225918292999268, 3.1781880855560303, 3.3337841033935547, 3.489380359649658, 3.6449763774871826, 3.800572395324707, 3.9561686515808105, 4.111764907836914]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 2.0, 1.0, 2.0, 10.0, 13.0, 16.0, 17.0, 24.0, 29.0, 40.0, 74.0, 91.0, 152.0, 273.0, 576.0, 1469.0, 5580.0, 28837.0, 251990.0, 2618530.0, 1179338.0, 89945.0, 12849.0, 2643.0, 854.0, 381.0, 191.0, 103.0, 62.0, 42.0, 49.0, 24.0, 22.0, 15.0, 8.0, 10.0, 6.0, 8.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-3.791015625, -3.678802490234375, -3.56658935546875, -3.454376220703125, -3.3421630859375, -3.229949951171875, -3.11773681640625, -3.005523681640625, -2.893310546875, -2.781097412109375, -2.66888427734375, -2.556671142578125, -2.4444580078125, -2.332244873046875, -2.22003173828125, -2.107818603515625, -1.99560546875, -1.883392333984375, -1.77117919921875, -1.658966064453125, -1.5467529296875, -1.434539794921875, -1.32232666015625, -1.210113525390625, -1.097900390625, -0.985687255859375, -0.87347412109375, -0.761260986328125, -0.6490478515625, -0.536834716796875, -0.42462158203125, -0.312408447265625, -0.2001953125, -0.087982177734375, 0.02423095703125, 0.136444091796875, 0.2486572265625, 0.360870361328125, 0.47308349609375, 0.585296630859375, 0.697509765625, 0.809722900390625, 0.92193603515625, 1.034149169921875, 1.1463623046875, 1.258575439453125, 1.37078857421875, 1.483001708984375, 1.59521484375, 1.707427978515625, 1.81964111328125, 1.931854248046875, 2.0440673828125, 2.156280517578125, 2.26849365234375, 2.380706787109375, 2.492919921875, 2.605133056640625, 2.71734619140625, 2.829559326171875, 2.9417724609375, 3.053985595703125, 3.16619873046875, 3.278411865234375, 3.390625]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 5.0, 8.0, 11.0, 14.0, 13.0, 16.0, 30.0, 27.0, 39.0, 42.0, 42.0, 53.0, 63.0, 58.0, 46.0, 66.0, 67.0, 55.0, 52.0, 55.0, 41.0, 38.0, 30.0, 30.0, 26.0, 18.0, 15.0, 17.0, 9.0, 7.0, 5.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3916015625, -1.3347320556640625, -1.277862548828125, -1.2209930419921875, -1.16412353515625, -1.1072540283203125, -1.050384521484375, -0.9935150146484375, -0.9366455078125, -0.8797760009765625, -0.822906494140625, -0.7660369873046875, -0.70916748046875, -0.6522979736328125, -0.595428466796875, -0.5385589599609375, -0.481689453125, -0.4248199462890625, -0.367950439453125, -0.3110809326171875, -0.25421142578125, -0.1973419189453125, -0.140472412109375, -0.0836029052734375, -0.0267333984375, 0.0301361083984375, 0.087005615234375, 0.1438751220703125, 0.20074462890625, 0.2576141357421875, 0.314483642578125, 0.3713531494140625, 0.42822265625, 0.4850921630859375, 0.541961669921875, 0.5988311767578125, 0.65570068359375, 0.7125701904296875, 0.769439697265625, 0.8263092041015625, 0.8831787109375, 0.9400482177734375, 0.996917724609375, 1.0537872314453125, 1.11065673828125, 1.1675262451171875, 1.224395751953125, 1.2812652587890625, 1.338134765625, 1.3950042724609375, 1.451873779296875, 1.5087432861328125, 1.56561279296875, 1.6224822998046875, 1.679351806640625, 1.7362213134765625, 1.7930908203125, 1.8499603271484375, 1.906829833984375, 1.9636993408203125, 2.02056884765625, 2.0774383544921875, 2.134307861328125, 2.1911773681640625, 2.248046875]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 9.0, 7.0, 23.0, 55.0, 107.0, 417.0, 1608.0, 15174.0, 3969324.0, 202561.0, 3858.0, 787.0, 199.0, 72.0, 29.0, 19.0, 11.0, 5.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.8359375, -10.4945068359375, -10.153076171875, -9.8116455078125, -9.47021484375, -9.1287841796875, -8.787353515625, -8.4459228515625, -8.1044921875, -7.7630615234375, -7.421630859375, -7.0802001953125, -6.73876953125, -6.3973388671875, -6.055908203125, -5.7144775390625, -5.373046875, -5.0316162109375, -4.690185546875, -4.3487548828125, -4.00732421875, -3.6658935546875, -3.324462890625, -2.9830322265625, -2.6416015625, -2.3001708984375, -1.958740234375, -1.6173095703125, -1.27587890625, -0.9344482421875, -0.593017578125, -0.2515869140625, 0.08984375, 0.4312744140625, 0.772705078125, 1.1141357421875, 1.45556640625, 1.7969970703125, 2.138427734375, 2.4798583984375, 2.8212890625, 3.1627197265625, 3.504150390625, 3.8455810546875, 4.18701171875, 4.5284423828125, 4.869873046875, 5.2113037109375, 5.552734375, 5.8941650390625, 6.235595703125, 6.5770263671875, 6.91845703125, 7.2598876953125, 7.601318359375, 7.9427490234375, 8.2841796875, 8.6256103515625, 8.967041015625, 9.3084716796875, 9.64990234375, 9.9913330078125, 10.332763671875, 10.6741943359375, 11.015625]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 4.0, 5.0, 9.0, 11.0, 8.0, 28.0, 38.0, 94.0, 128.0, 201.0, 382.0, 558.0, 689.0, 709.0, 490.0, 288.0, 168.0, 101.0, 74.0, 26.0, 24.0, 15.0, 9.0, 6.0, 2.0, 2.0, 4.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3916015625, -1.3492279052734375, -1.306854248046875, -1.2644805908203125, -1.22210693359375, -1.1797332763671875, -1.137359619140625, -1.0949859619140625, -1.0526123046875, -1.0102386474609375, -0.967864990234375, -0.9254913330078125, -0.88311767578125, -0.8407440185546875, -0.798370361328125, -0.7559967041015625, -0.713623046875, -0.6712493896484375, -0.628875732421875, -0.5865020751953125, -0.54412841796875, -0.5017547607421875, -0.459381103515625, -0.4170074462890625, -0.3746337890625, -0.3322601318359375, -0.289886474609375, -0.2475128173828125, -0.20513916015625, -0.1627655029296875, -0.120391845703125, -0.0780181884765625, -0.03564453125, 0.0067291259765625, 0.049102783203125, 0.0914764404296875, 0.13385009765625, 0.1762237548828125, 0.218597412109375, 0.2609710693359375, 0.3033447265625, 0.3457183837890625, 0.388092041015625, 0.4304656982421875, 0.47283935546875, 0.5152130126953125, 0.557586669921875, 0.5999603271484375, 0.642333984375, 0.6847076416015625, 0.727081298828125, 0.7694549560546875, 0.81182861328125, 0.8542022705078125, 0.896575927734375, 0.9389495849609375, 0.9813232421875, 1.0236968994140625, 1.066070556640625, 1.1084442138671875, 1.15081787109375, 1.1931915283203125, 1.235565185546875, 1.2779388427734375, 1.3203125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 8.0, 9.0, 13.0, 14.0, 16.0, 28.0, 25.0, 34.0, 36.0, 41.0, 31.0, 44.0, 50.0, 51.0, 57.0, 66.0, 73.0, 56.0, 56.0, 43.0, 41.0, 36.0, 38.0, 23.0, 20.0, 21.0, 19.0, 13.0, 12.0, 8.0, 10.0, 4.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.906385064125061, -1.8349493741989136, -1.7635135650634766, -1.692077875137329, -1.6206421852111816, -1.5492063760757446, -1.4777706861495972, -1.4063348770141602, -1.3348991870880127, -1.2634634971618652, -1.1920276880264282, -1.1205919981002808, -1.0491561889648438, -0.9777204990386963, -0.9062848091125488, -0.8348490595817566, -0.7634133100509644, -0.6919775605201721, -0.6205418109893799, -0.5491061210632324, -0.4776703715324402, -0.40623462200164795, -0.3347989022731781, -0.26336318254470825, -0.19192743301391602, -0.12049169838428497, -0.04905596375465393, 0.022379770874977112, 0.09381550550460815, 0.1652512550354004, 0.23668697476387024, 0.3081226944923401, 0.3795585632324219, 0.4509943127632141, 0.5224300622940063, 0.5938657522201538, 0.665301501750946, 0.7367372512817383, 0.8081729412078857, 0.879608690738678, 0.9510444402694702, 1.0224801301956177, 1.0939159393310547, 1.1653516292572021, 1.2367873191833496, 1.3082231283187866, 1.379658818244934, 1.451094627380371, 1.5225303173065186, 1.593966007232666, 1.665401816368103, 1.7368375062942505, 1.8082733154296875, 1.879709005355835, 1.9511446952819824, 2.02258038520813, 2.0940160751342773, 2.165451765060425, 2.2368874549865723, 2.308323383331299, 2.3797590732574463, 2.4511947631835938, 2.522630453109741, 2.5940661430358887, 2.6655020713806152]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 7.0, 2.0, 9.0, 8.0, 15.0, 13.0, 16.0, 15.0, 25.0, 25.0, 27.0, 30.0, 33.0, 57.0, 51.0, 48.0, 55.0, 50.0, 50.0, 44.0, 39.0, 49.0, 27.0, 45.0, 36.0, 36.0, 34.0, 32.0, 25.0, 19.0, 14.0, 19.0, 10.0, 7.0, 9.0, 3.0, 7.0, 4.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9667867422103882, -1.9001915454864502, -1.8335963487625122, -1.7670011520385742, -1.7004058361053467, -1.6338107585906982, -1.5672154426574707, -1.5006202459335327, -1.4340250492095947, -1.3674298524856567, -1.3008346557617188, -1.2342394590377808, -1.1676442623138428, -1.1010489463806152, -1.0344537496566772, -0.9678585529327393, -0.9012633562088013, -0.8346681594848633, -0.7680729627609253, -0.7014777064323425, -0.6348825097084045, -0.5682873129844666, -0.5016920566558838, -0.4350968599319458, -0.3685016632080078, -0.3019064664840698, -0.23531123995780945, -0.16871602833271027, -0.10212081670761108, -0.035525619983673096, 0.03106960654258728, 0.09766483306884766, 0.1642601490020752, 0.23085536062717438, 0.29745057225227356, 0.36404579877853394, 0.4306409955024719, 0.4972361922264099, 0.5638314485549927, 0.6304266452789307, 0.6970218420028687, 0.7636170387268066, 0.8302122354507446, 0.8968074917793274, 0.9634026885032654, 1.0299978256225586, 1.0965931415557861, 1.1631883382797241, 1.229783535003662, 1.2963787317276, 1.362973928451538, 1.429569125175476, 1.496164321899414, 1.5627596378326416, 1.6293548345565796, 1.6959500312805176, 1.7625452280044556, 1.8291404247283936, 1.8957356214523315, 1.9623308181762695, 2.028926134109497, 2.0955212116241455, 2.162116527557373, 2.2287116050720215, 2.295306921005249]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 3.0, 8.0, 8.0, 12.0, 11.0, 20.0, 29.0, 30.0, 36.0, 67.0, 85.0, 115.0, 171.0, 226.0, 386.0, 715.0, 1910.0, 9943.0, 71602.0, 365747.0, 460142.0, 116285.0, 16042.0, 2762.0, 864.0, 435.0, 281.0, 161.0, 124.0, 72.0, 83.0, 46.0, 32.0, 29.0, 17.0, 14.0, 12.0, 14.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8046875, -0.7796401977539062, -0.7545928955078125, -0.7295455932617188, -0.704498291015625, -0.6794509887695312, -0.6544036865234375, -0.6293563842773438, -0.60430908203125, -0.5792617797851562, -0.5542144775390625, -0.5291671752929688, -0.504119873046875, -0.47907257080078125, -0.4540252685546875, -0.42897796630859375, -0.4039306640625, -0.37888336181640625, -0.3538360595703125, -0.32878875732421875, -0.303741455078125, -0.27869415283203125, -0.2536468505859375, -0.22859954833984375, -0.20355224609375, -0.17850494384765625, -0.1534576416015625, -0.12841033935546875, -0.103363037109375, -0.07831573486328125, -0.0532684326171875, -0.02822113037109375, -0.003173828125, 0.02187347412109375, 0.0469207763671875, 0.07196807861328125, 0.097015380859375, 0.12206268310546875, 0.1471099853515625, 0.17215728759765625, 0.19720458984375, 0.22225189208984375, 0.2472991943359375, 0.27234649658203125, 0.297393798828125, 0.32244110107421875, 0.3474884033203125, 0.37253570556640625, 0.3975830078125, 0.42263031005859375, 0.4476776123046875, 0.47272491455078125, 0.497772216796875, 0.5228195190429688, 0.5478668212890625, 0.5729141235351562, 0.59796142578125, 0.6230087280273438, 0.6480560302734375, 0.6731033325195312, 0.698150634765625, 0.7231979370117188, 0.7482452392578125, 0.7732925415039062, 0.79833984375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 3.0, 10.0, 9.0, 11.0, 15.0, 9.0, 20.0, 32.0, 21.0, 25.0, 28.0, 36.0, 45.0, 62.0, 40.0, 53.0, 52.0, 39.0, 53.0, 46.0, 42.0, 42.0, 39.0, 41.0, 32.0, 36.0, 22.0, 32.0, 23.0, 18.0, 8.0, 17.0, 12.0, 2.0, 8.0, 5.0, 3.0, 4.0, 6.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3330078125, -1.289947509765625, -1.24688720703125, -1.203826904296875, -1.1607666015625, -1.117706298828125, -1.07464599609375, -1.031585693359375, -0.988525390625, -0.945465087890625, -0.90240478515625, -0.859344482421875, -0.8162841796875, -0.773223876953125, -0.73016357421875, -0.687103271484375, -0.64404296875, -0.600982666015625, -0.55792236328125, -0.514862060546875, -0.4718017578125, -0.428741455078125, -0.38568115234375, -0.342620849609375, -0.299560546875, -0.256500244140625, -0.21343994140625, -0.170379638671875, -0.1273193359375, -0.084259033203125, -0.04119873046875, 0.001861572265625, 0.044921875, 0.087982177734375, 0.13104248046875, 0.174102783203125, 0.2171630859375, 0.260223388671875, 0.30328369140625, 0.346343994140625, 0.389404296875, 0.432464599609375, 0.47552490234375, 0.518585205078125, 0.5616455078125, 0.604705810546875, 0.64776611328125, 0.690826416015625, 0.73388671875, 0.776947021484375, 0.82000732421875, 0.863067626953125, 0.9061279296875, 0.949188232421875, 0.99224853515625, 1.035308837890625, 1.078369140625, 1.121429443359375, 1.16448974609375, 1.207550048828125, 1.2506103515625, 1.293670654296875, 1.33673095703125, 1.379791259765625, 1.4228515625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 8.0, 3.0, 11.0, 16.0, 15.0, 38.0, 58.0, 84.0, 141.0, 215.0, 350.0, 688.0, 1218.0, 2161.0, 4078.0, 7482.0, 14136.0, 25559.0, 45258.0, 76199.0, 119278.0, 160538.0, 175492.0, 151090.0, 108558.0, 67749.0, 39812.0, 22081.0, 12131.0, 6443.0, 3381.0, 1925.0, 1011.0, 564.0, 308.0, 197.0, 103.0, 62.0, 40.0, 23.0, 16.0, 13.0, 9.0, 9.0, 1.0, 6.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2398681640625, -0.23289108276367188, -0.22591400146484375, -0.21893692016601562, -0.2119598388671875, -0.20498275756835938, -0.19800567626953125, -0.19102859497070312, -0.184051513671875, -0.17707443237304688, -0.17009735107421875, -0.16312026977539062, -0.1561431884765625, -0.14916610717773438, -0.14218902587890625, -0.13521194458007812, -0.12823486328125, -0.12125778198242188, -0.11428070068359375, -0.10730361938476562, -0.1003265380859375, -0.09334945678710938, -0.08637237548828125, -0.07939529418945312, -0.072418212890625, -0.06544113159179688, -0.05846405029296875, -0.051486968994140625, -0.0445098876953125, -0.037532806396484375, -0.03055572509765625, -0.023578643798828125, -0.0166015625, -0.009624481201171875, -0.00264739990234375, 0.004329681396484375, 0.0113067626953125, 0.018283843994140625, 0.02526092529296875, 0.032238006591796875, 0.039215087890625, 0.046192169189453125, 0.05316925048828125, 0.060146331787109375, 0.0671234130859375, 0.07410049438476562, 0.08107757568359375, 0.08805465698242188, 0.09503173828125, 0.10200881958007812, 0.10898590087890625, 0.11596298217773438, 0.1229400634765625, 0.12991714477539062, 0.13689422607421875, 0.14387130737304688, 0.150848388671875, 0.15782546997070312, 0.16480255126953125, 0.17177963256835938, 0.1787567138671875, 0.18573379516601562, 0.19271087646484375, 0.19968795776367188, 0.2066650390625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 6.0, 2.0, 4.0, 2.0, 1.0, 9.0, 6.0, 9.0, 15.0, 18.0, 12.0, 25.0, 26.0, 27.0, 23.0, 23.0, 34.0, 31.0, 51.0, 44.0, 44.0, 47.0, 62.0, 44.0, 36.0, 54.0, 39.0, 49.0, 38.0, 22.0, 35.0, 20.0, 24.0, 18.0, 26.0, 16.0, 16.0, 18.0, 6.0, 8.0, 5.0, 5.0, 4.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 3.0], "bins": [-3.669921875, -3.570465087890625, -3.47100830078125, -3.371551513671875, -3.2720947265625, -3.172637939453125, -3.07318115234375, -2.973724365234375, -2.874267578125, -2.774810791015625, -2.67535400390625, -2.575897216796875, -2.4764404296875, -2.376983642578125, -2.27752685546875, -2.178070068359375, -2.07861328125, -1.979156494140625, -1.87969970703125, -1.780242919921875, -1.6807861328125, -1.581329345703125, -1.48187255859375, -1.382415771484375, -1.282958984375, -1.183502197265625, -1.08404541015625, -0.984588623046875, -0.8851318359375, -0.785675048828125, -0.68621826171875, -0.586761474609375, -0.4873046875, -0.387847900390625, -0.28839111328125, -0.188934326171875, -0.0894775390625, 0.009979248046875, 0.10943603515625, 0.208892822265625, 0.308349609375, 0.407806396484375, 0.50726318359375, 0.606719970703125, 0.7061767578125, 0.805633544921875, 0.90509033203125, 1.004547119140625, 1.10400390625, 1.203460693359375, 1.30291748046875, 1.402374267578125, 1.5018310546875, 1.601287841796875, 1.70074462890625, 1.800201416015625, 1.899658203125, 1.999114990234375, 2.09857177734375, 2.198028564453125, 2.2974853515625, 2.396942138671875, 2.49639892578125, 2.595855712890625, 2.6953125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 3.0, 6.0, 14.0, 14.0, 19.0, 32.0, 53.0, 125.0, 202.0, 321.0, 619.0, 1483.0, 4097.0, 21763.0, 285432.0, 662079.0, 60275.0, 7835.0, 2309.0, 934.0, 457.0, 222.0, 107.0, 54.0, 39.0, 23.0, 15.0, 6.0, 1.0, 7.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.3564453125, -0.3466033935546875, -0.336761474609375, -0.3269195556640625, -0.31707763671875, -0.3072357177734375, -0.297393798828125, -0.2875518798828125, -0.2777099609375, -0.2678680419921875, -0.258026123046875, -0.2481842041015625, -0.23834228515625, -0.2285003662109375, -0.218658447265625, -0.2088165283203125, -0.198974609375, -0.1891326904296875, -0.179290771484375, -0.1694488525390625, -0.15960693359375, -0.1497650146484375, -0.139923095703125, -0.1300811767578125, -0.1202392578125, -0.1103973388671875, -0.100555419921875, -0.0907135009765625, -0.08087158203125, -0.0710296630859375, -0.061187744140625, -0.0513458251953125, -0.04150390625, -0.0316619873046875, -0.021820068359375, -0.0119781494140625, -0.00213623046875, 0.0077056884765625, 0.017547607421875, 0.0273895263671875, 0.0372314453125, 0.0470733642578125, 0.056915283203125, 0.0667572021484375, 0.07659912109375, 0.0864410400390625, 0.096282958984375, 0.1061248779296875, 0.115966796875, 0.1258087158203125, 0.135650634765625, 0.1454925537109375, 0.15533447265625, 0.1651763916015625, 0.175018310546875, 0.1848602294921875, 0.1947021484375, 0.2045440673828125, 0.214385986328125, 0.2242279052734375, 0.23406982421875, 0.2439117431640625, 0.253753662109375, 0.2635955810546875, 0.2734375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 5.0, 5.0, 3.0, 3.0, 9.0, 16.0, 20.0, 28.0, 44.0, 63.0, 78.0, 81.0, 84.0, 86.0, 122.0, 93.0, 73.0, 63.0, 36.0, 36.0, 18.0, 16.0, 9.0, 4.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.0001289844512939453, -0.00012620538473129272, -0.00012342631816864014, -0.00012064725160598755, -0.00011786818504333496, -0.00011508911848068237, -0.00011231005191802979, -0.0001095309853553772, -0.00010675191879272461, -0.00010397285223007202, -0.00010119378566741943, -9.841471910476685e-05, -9.563565254211426e-05, -9.285658597946167e-05, -9.007751941680908e-05, -8.72984528541565e-05, -8.45193862915039e-05, -8.174031972885132e-05, -7.896125316619873e-05, -7.618218660354614e-05, -7.340312004089355e-05, -7.062405347824097e-05, -6.784498691558838e-05, -6.506592035293579e-05, -6.22868537902832e-05, -5.9507787227630615e-05, -5.672872066497803e-05, -5.394965410232544e-05, -5.117058753967285e-05, -4.8391520977020264e-05, -4.5612454414367676e-05, -4.283338785171509e-05, -4.00543212890625e-05, -3.727525472640991e-05, -3.4496188163757324e-05, -3.1717121601104736e-05, -2.893805503845215e-05, -2.615898847579956e-05, -2.3379921913146973e-05, -2.0600855350494385e-05, -1.7821788787841797e-05, -1.5042722225189209e-05, -1.2263655662536621e-05, -9.484589099884033e-06, -6.705522537231445e-06, -3.926455974578857e-06, -1.1473894119262695e-06, 1.6316771507263184e-06, 4.410743713378906e-06, 7.189810276031494e-06, 9.968876838684082e-06, 1.274794340133667e-05, 1.5527009963989258e-05, 1.8306076526641846e-05, 2.1085143089294434e-05, 2.386420965194702e-05, 2.664327621459961e-05, 2.9422342777252197e-05, 3.2201409339904785e-05, 3.498047590255737e-05, 3.775954246520996e-05, 4.053860902786255e-05, 4.331767559051514e-05, 4.6096742153167725e-05, 4.887580871582031e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 5.0, 3.0, 5.0, 12.0, 14.0, 26.0, 20.0, 30.0, 40.0, 51.0, 80.0, 127.0, 161.0, 272.0, 453.0, 728.0, 1314.0, 2554.0, 5177.0, 10612.0, 23390.0, 55728.0, 147592.0, 368378.0, 266296.0, 94650.0, 37809.0, 16354.0, 7731.0, 3858.0, 2016.0, 1112.0, 704.0, 413.0, 261.0, 175.0, 115.0, 91.0, 62.0, 38.0, 33.0, 16.0, 15.0, 13.0, 9.0, 4.0, 4.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.180419921875, -0.1752338409423828, -0.17004776000976562, -0.16486167907714844, -0.15967559814453125, -0.15448951721191406, -0.14930343627929688, -0.1441173553466797, -0.1389312744140625, -0.1337451934814453, -0.12855911254882812, -0.12337303161621094, -0.11818695068359375, -0.11300086975097656, -0.10781478881835938, -0.10262870788574219, -0.097442626953125, -0.09225654602050781, -0.08707046508789062, -0.08188438415527344, -0.07669830322265625, -0.07151222229003906, -0.06632614135742188, -0.06114006042480469, -0.0559539794921875, -0.05076789855957031, -0.045581817626953125, -0.04039573669433594, -0.03520965576171875, -0.030023574829101562, -0.024837493896484375, -0.019651412963867188, -0.01446533203125, -0.009279251098632812, -0.004093170166015625, 0.0010929107666015625, 0.00627899169921875, 0.011465072631835938, 0.016651153564453125, 0.021837234497070312, 0.0270233154296875, 0.03220939636230469, 0.037395477294921875, 0.04258155822753906, 0.04776763916015625, 0.05295372009277344, 0.058139801025390625, 0.06332588195800781, 0.068511962890625, 0.07369804382324219, 0.07888412475585938, 0.08407020568847656, 0.08925628662109375, 0.09444236755371094, 0.09962844848632812, 0.10481452941894531, 0.1100006103515625, 0.11518669128417969, 0.12037277221679688, 0.12555885314941406, 0.13074493408203125, 0.13593101501464844, 0.14111709594726562, 0.1463031768798828, 0.1514892578125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 6.0, 7.0, 6.0, 5.0, 5.0, 8.0, 10.0, 14.0, 20.0, 21.0, 19.0, 24.0, 25.0, 35.0, 50.0, 57.0, 81.0, 67.0, 84.0, 94.0, 71.0, 43.0, 44.0, 39.0, 20.0, 30.0, 21.0, 21.0, 13.0, 7.0, 13.0, 8.0, 13.0, 7.0, 5.0, 1.0, 3.0, 4.0, 1.0, 1.0, 6.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.05023193359375, -0.04827690124511719, -0.046321868896484375, -0.04436683654785156, -0.04241180419921875, -0.04045677185058594, -0.038501739501953125, -0.03654670715332031, -0.0345916748046875, -0.03263664245605469, -0.030681610107421875, -0.028726577758789062, -0.02677154541015625, -0.024816513061523438, -0.022861480712890625, -0.020906448364257812, -0.018951416015625, -0.016996383666992188, -0.015041351318359375, -0.013086318969726562, -0.01113128662109375, -0.009176254272460938, -0.007221221923828125, -0.0052661895751953125, -0.0033111572265625, -0.0013561248779296875, 0.000598907470703125, 0.0025539398193359375, 0.00450897216796875, 0.0064640045166015625, 0.008419036865234375, 0.010374069213867188, 0.0123291015625, 0.014284133911132812, 0.016239166259765625, 0.018194198608398438, 0.02014923095703125, 0.022104263305664062, 0.024059295654296875, 0.026014328002929688, 0.0279693603515625, 0.029924392700195312, 0.031879425048828125, 0.03383445739746094, 0.03578948974609375, 0.03774452209472656, 0.039699554443359375, 0.04165458679199219, 0.043609619140625, 0.04556465148925781, 0.047519683837890625, 0.04947471618652344, 0.05142974853515625, 0.05338478088378906, 0.055339813232421875, 0.05729484558105469, 0.0592498779296875, 0.06120491027832031, 0.06315994262695312, 0.06511497497558594, 0.06707000732421875, 0.06902503967285156, 0.07098007202148438, 0.07293510437011719, 0.07489013671875]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 10.0, 5.0, 17.0, 30.0, 40.0, 47.0, 49.0, 70.0, 77.0, 82.0, 102.0, 112.0, 89.0, 69.0, 61.0, 44.0, 31.0, 27.0, 16.0, 12.0, 9.0, 9.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.2007575035095215, -2.1314151287078857, -2.062072515487671, -1.9927300214767456, -1.9233875274658203, -1.8540451526641846, -1.7847026586532593, -1.715360164642334, -1.6460176706314087, -1.5766751766204834, -1.507332682609558, -1.4379901885986328, -1.368647813796997, -1.2993052005767822, -1.2299628257751465, -1.1606203317642212, -1.091277837753296, -1.0219353437423706, -0.9525928497314453, -0.8832504153251648, -0.8139079213142395, -0.7445654273033142, -0.6752229928970337, -0.6058804988861084, -0.5365380048751831, -0.4671955108642578, -0.3978530466556549, -0.328510582447052, -0.2591680884361267, -0.18982559442520142, -0.12048313021659851, -0.051140666007995605, 0.018201589584350586, 0.08754406869411469, 0.15688654780387878, 0.22622902691364288, 0.295571506023407, 0.3649140000343323, 0.4342564642429352, 0.5035989284515381, 0.5729414224624634, 0.6422839164733887, 0.711626410484314, 0.7809688448905945, 0.8503113389015198, 0.9196538329124451, 0.9889962673187256, 1.0583387613296509, 1.1276812553405762, 1.1970237493515015, 1.2663662433624268, 1.335708737373352, 1.4050512313842773, 1.474393606185913, 1.5437361001968384, 1.6130785942077637, 1.682421088218689, 1.7517635822296143, 1.8211060762405396, 1.8904485702514648, 1.9597909450531006, 2.0291335582733154, 2.098475933074951, 2.167818546295166, 2.2371609210968018]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 9.0, 8.0, 7.0, 8.0, 13.0, 10.0, 21.0, 20.0, 28.0, 25.0, 35.0, 37.0, 31.0, 47.0, 43.0, 51.0, 55.0, 64.0, 38.0, 46.0, 48.0, 41.0, 39.0, 40.0, 24.0, 45.0, 28.0, 35.0, 19.0, 20.0, 10.0, 17.0, 9.0, 6.0, 8.0, 2.0, 5.0, 3.0, 4.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2035744190216064, -1.1631237268447876, -1.1226730346679688, -1.0822222232818604, -1.0417715311050415, -1.0013208389282227, -0.9608701467514038, -0.9204193949699402, -0.8799686431884766, -0.8395179510116577, -0.7990671992301941, -0.7586165070533752, -0.7181657552719116, -0.6777150630950928, -0.6372643709182739, -0.5968136191368103, -0.5563629269599915, -0.5159122347831726, -0.475461483001709, -0.43501079082489014, -0.3945600390434265, -0.35410934686660767, -0.31365862488746643, -0.2732079029083252, -0.23275718092918396, -0.19230645895004272, -0.1518557369709015, -0.11140502989292145, -0.07095430791378021, -0.030503585934638977, 0.009947121143341064, 0.0503978431224823, 0.09084856510162354, 0.13129928708076477, 0.171750009059906, 0.21220071613788605, 0.2526514530181885, 0.2931021451950073, 0.33355286717414856, 0.3740035891532898, 0.41445431113243103, 0.45490503311157227, 0.4953557550907135, 0.5358064770698547, 0.5762571692466736, 0.6167079210281372, 0.657158613204956, 0.6976093053817749, 0.7380600571632385, 0.7785107493400574, 0.818961501121521, 0.8594121932983398, 0.8998629450798035, 0.9403136372566223, 0.9807643890380859, 1.0212150812149048, 1.0616657733917236, 1.1021164655685425, 1.1425671577453613, 1.1830179691314697, 1.2234686613082886, 1.2639193534851074, 1.3043700456619263, 1.3448207378387451, 1.3852715492248535]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 6.0, 5.0, 10.0, 14.0, 17.0, 26.0, 36.0, 34.0, 50.0, 88.0, 142.0, 178.0, 248.0, 432.0, 785.0, 1532.0, 2908.0, 6152.0, 13912.0, 31817.0, 74644.0, 157924.0, 257753.0, 243782.0, 140816.0, 64595.0, 27409.0, 12193.0, 5215.0, 2603.0, 1293.0, 698.0, 395.0, 291.0, 176.0, 98.0, 66.0, 60.0, 46.0, 22.0, 22.0, 15.0, 14.0, 9.0, 11.0, 5.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-1.7646484375, -1.7075653076171875, -1.650482177734375, -1.5933990478515625, -1.53631591796875, -1.4792327880859375, -1.422149658203125, -1.3650665283203125, -1.3079833984375, -1.2509002685546875, -1.193817138671875, -1.1367340087890625, -1.07965087890625, -1.0225677490234375, -0.965484619140625, -0.9084014892578125, -0.851318359375, -0.7942352294921875, -0.737152099609375, -0.6800689697265625, -0.62298583984375, -0.5659027099609375, -0.508819580078125, -0.4517364501953125, -0.3946533203125, -0.3375701904296875, -0.280487060546875, -0.2234039306640625, -0.16632080078125, -0.1092376708984375, -0.052154541015625, 0.0049285888671875, 0.06201171875, 0.1190948486328125, 0.176177978515625, 0.2332611083984375, 0.29034423828125, 0.3474273681640625, 0.404510498046875, 0.4615936279296875, 0.5186767578125, 0.5757598876953125, 0.632843017578125, 0.6899261474609375, 0.74700927734375, 0.8040924072265625, 0.861175537109375, 0.9182586669921875, 0.975341796875, 1.0324249267578125, 1.089508056640625, 1.1465911865234375, 1.20367431640625, 1.2607574462890625, 1.317840576171875, 1.3749237060546875, 1.4320068359375, 1.4890899658203125, 1.546173095703125, 1.6032562255859375, 1.66033935546875, 1.7174224853515625, 1.774505615234375, 1.8315887451171875, 1.888671875]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 4.0, 5.0, 8.0, 5.0, 4.0, 6.0, 9.0, 13.0, 19.0, 15.0, 16.0, 22.0, 23.0, 27.0, 28.0, 49.0, 40.0, 52.0, 45.0, 46.0, 45.0, 43.0, 44.0, 43.0, 44.0, 53.0, 36.0, 34.0, 33.0, 34.0, 34.0, 27.0, 18.0, 19.0, 12.0, 10.0, 10.0, 8.0, 6.0, 3.0, 5.0, 8.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.013671875, -1.94561767578125, -1.8775634765625, -1.80950927734375, -1.741455078125, -1.67340087890625, -1.6053466796875, -1.53729248046875, -1.46923828125, -1.40118408203125, -1.3331298828125, -1.26507568359375, -1.197021484375, -1.12896728515625, -1.0609130859375, -0.99285888671875, -0.9248046875, -0.85675048828125, -0.7886962890625, -0.72064208984375, -0.652587890625, -0.58453369140625, -0.5164794921875, -0.44842529296875, -0.38037109375, -0.31231689453125, -0.2442626953125, -0.17620849609375, -0.108154296875, -0.04010009765625, 0.0279541015625, 0.09600830078125, 0.1640625, 0.23211669921875, 0.3001708984375, 0.36822509765625, 0.436279296875, 0.50433349609375, 0.5723876953125, 0.64044189453125, 0.70849609375, 0.77655029296875, 0.8446044921875, 0.91265869140625, 0.980712890625, 1.04876708984375, 1.1168212890625, 1.18487548828125, 1.2529296875, 1.32098388671875, 1.3890380859375, 1.45709228515625, 1.525146484375, 1.59320068359375, 1.6612548828125, 1.72930908203125, 1.79736328125, 1.86541748046875, 1.9334716796875, 2.00152587890625, 2.069580078125, 2.13763427734375, 2.2056884765625, 2.27374267578125, 2.341796875]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 6.0, 3.0, 6.0, 13.0, 5.0, 8.0, 15.0, 22.0, 36.0, 39.0, 76.0, 101.0, 145.0, 170.0, 290.0, 469.0, 764.0, 1428.0, 2767.0, 6105.0, 15479.0, 41232.0, 113805.0, 270560.0, 326952.0, 166923.0, 61738.0, 22641.0, 8605.0, 3706.0, 1794.0, 995.0, 569.0, 362.0, 215.0, 140.0, 104.0, 79.0, 55.0, 37.0, 27.0, 16.0, 24.0, 11.0, 9.0, 4.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.544921875, -2.46588134765625, -2.3868408203125, -2.30780029296875, -2.228759765625, -2.14971923828125, -2.0706787109375, -1.99163818359375, -1.91259765625, -1.83355712890625, -1.7545166015625, -1.67547607421875, -1.596435546875, -1.51739501953125, -1.4383544921875, -1.35931396484375, -1.2802734375, -1.20123291015625, -1.1221923828125, -1.04315185546875, -0.964111328125, -0.88507080078125, -0.8060302734375, -0.72698974609375, -0.64794921875, -0.56890869140625, -0.4898681640625, -0.41082763671875, -0.331787109375, -0.25274658203125, -0.1737060546875, -0.09466552734375, -0.015625, 0.06341552734375, 0.1424560546875, 0.22149658203125, 0.300537109375, 0.37957763671875, 0.4586181640625, 0.53765869140625, 0.61669921875, 0.69573974609375, 0.7747802734375, 0.85382080078125, 0.932861328125, 1.01190185546875, 1.0909423828125, 1.16998291015625, 1.2490234375, 1.32806396484375, 1.4071044921875, 1.48614501953125, 1.565185546875, 1.64422607421875, 1.7232666015625, 1.80230712890625, 1.88134765625, 1.96038818359375, 2.0394287109375, 2.11846923828125, 2.197509765625, 2.27655029296875, 2.3555908203125, 2.43463134765625, 2.513671875]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 7.0, 4.0, 3.0, 2.0, 5.0, 1.0, 1.0, 8.0, 7.0, 12.0, 21.0, 24.0, 16.0, 22.0, 30.0, 27.0, 21.0, 35.0, 41.0, 35.0, 41.0, 44.0, 53.0, 69.0, 50.0, 43.0, 46.0, 35.0, 35.0, 39.0, 31.0, 27.0, 26.0, 29.0, 15.0, 18.0, 16.0, 14.0, 11.0, 7.0, 13.0, 6.0, 7.0, 7.0, 5.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-2.576171875, -2.49822998046875, -2.4202880859375, -2.34234619140625, -2.264404296875, -2.18646240234375, -2.1085205078125, -2.03057861328125, -1.95263671875, -1.87469482421875, -1.7967529296875, -1.71881103515625, -1.640869140625, -1.56292724609375, -1.4849853515625, -1.40704345703125, -1.3291015625, -1.25115966796875, -1.1732177734375, -1.09527587890625, -1.017333984375, -0.93939208984375, -0.8614501953125, -0.78350830078125, -0.70556640625, -0.62762451171875, -0.5496826171875, -0.47174072265625, -0.393798828125, -0.31585693359375, -0.2379150390625, -0.15997314453125, -0.08203125, -0.00408935546875, 0.0738525390625, 0.15179443359375, 0.229736328125, 0.30767822265625, 0.3856201171875, 0.46356201171875, 0.54150390625, 0.61944580078125, 0.6973876953125, 0.77532958984375, 0.853271484375, 0.93121337890625, 1.0091552734375, 1.08709716796875, 1.1650390625, 1.24298095703125, 1.3209228515625, 1.39886474609375, 1.476806640625, 1.55474853515625, 1.6326904296875, 1.71063232421875, 1.78857421875, 1.86651611328125, 1.9444580078125, 2.02239990234375, 2.100341796875, 2.17828369140625, 2.2562255859375, 2.33416748046875, 2.412109375]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 4.0, 2.0, 4.0, 0.0, 5.0, 11.0, 18.0, 18.0, 32.0, 49.0, 53.0, 91.0, 142.0, 244.0, 367.0, 565.0, 927.0, 1509.0, 2603.0, 4828.0, 9381.0, 19168.0, 41420.0, 87205.0, 168266.0, 280173.0, 209335.0, 114369.0, 55321.0, 25878.0, 12256.0, 6031.0, 3435.0, 1872.0, 1099.0, 668.0, 439.0, 260.0, 171.0, 104.0, 73.0, 49.0, 37.0, 23.0, 17.0, 21.0, 8.0, 4.0, 4.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.40673828125, -0.3925628662109375, -0.378387451171875, -0.3642120361328125, -0.35003662109375, -0.3358612060546875, -0.321685791015625, -0.3075103759765625, -0.2933349609375, -0.2791595458984375, -0.264984130859375, -0.2508087158203125, -0.23663330078125, -0.2224578857421875, -0.208282470703125, -0.1941070556640625, -0.179931640625, -0.1657562255859375, -0.151580810546875, -0.1374053955078125, -0.12322998046875, -0.1090545654296875, -0.094879150390625, -0.0807037353515625, -0.0665283203125, -0.0523529052734375, -0.038177490234375, -0.0240020751953125, -0.00982666015625, 0.0043487548828125, 0.018524169921875, 0.0326995849609375, 0.046875, 0.0610504150390625, 0.075225830078125, 0.0894012451171875, 0.10357666015625, 0.1177520751953125, 0.131927490234375, 0.1461029052734375, 0.1602783203125, 0.1744537353515625, 0.188629150390625, 0.2028045654296875, 0.21697998046875, 0.2311553955078125, 0.245330810546875, 0.2595062255859375, 0.273681640625, 0.2878570556640625, 0.302032470703125, 0.3162078857421875, 0.33038330078125, 0.3445587158203125, 0.358734130859375, 0.3729095458984375, 0.3870849609375, 0.4012603759765625, 0.415435791015625, 0.4296112060546875, 0.44378662109375, 0.4579620361328125, 0.472137451171875, 0.4863128662109375, 0.50048828125]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 8.0, 6.0, 11.0, 9.0, 15.0, 23.0, 29.0, 34.0, 53.0, 54.0, 59.0, 82.0, 93.0, 95.0, 60.0, 67.0, 60.0, 46.0, 38.0, 37.0, 36.0, 22.0, 14.0, 13.0, 10.0, 6.0, 5.0, 2.0, 5.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0001385211944580078, -0.0001342184841632843, -0.0001299157738685608, -0.00012561306357383728, -0.00012131035327911377, -0.00011700764298439026, -0.00011270493268966675, -0.00010840222239494324, -0.00010409951210021973, -9.979680180549622e-05, -9.54940915107727e-05, -9.11913812160492e-05, -8.688867092132568e-05, -8.258596062660217e-05, -7.828325033187866e-05, -7.398054003715515e-05, -6.967782974243164e-05, -6.537511944770813e-05, -6.107240915298462e-05, -5.676969885826111e-05, -5.24669885635376e-05, -4.816427826881409e-05, -4.3861567974090576e-05, -3.9558857679367065e-05, -3.5256147384643555e-05, -3.0953437089920044e-05, -2.6650726795196533e-05, -2.2348016500473022e-05, -1.8045306205749512e-05, -1.3742595911026001e-05, -9.43988561630249e-06, -5.1371753215789795e-06, -8.344650268554688e-07, 3.468245267868042e-06, 7.770955562591553e-06, 1.2073665857315063e-05, 1.6376376152038574e-05, 2.0679086446762085e-05, 2.4981796741485596e-05, 2.9284507036209106e-05, 3.358721733093262e-05, 3.788992762565613e-05, 4.219263792037964e-05, 4.649534821510315e-05, 5.079805850982666e-05, 5.510076880455017e-05, 5.940347909927368e-05, 6.370618939399719e-05, 6.80088996887207e-05, 7.231160998344421e-05, 7.661432027816772e-05, 8.091703057289124e-05, 8.521974086761475e-05, 8.952245116233826e-05, 9.382516145706177e-05, 9.812787175178528e-05, 0.00010243058204650879, 0.0001067332923412323, 0.00011103600263595581, 0.00011533871293067932, 0.00011964142322540283, 0.00012394413352012634, 0.00012824684381484985, 0.00013254955410957336, 0.00013685226440429688]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 5.0, 1.0, 10.0, 9.0, 12.0, 7.0, 19.0, 26.0, 37.0, 70.0, 79.0, 122.0, 131.0, 241.0, 326.0, 448.0, 671.0, 935.0, 1332.0, 2002.0, 3383.0, 5713.0, 10462.0, 20945.0, 45634.0, 101756.0, 204778.0, 308229.0, 176868.0, 85111.0, 38010.0, 17991.0, 9030.0, 5045.0, 3098.0, 1937.0, 1217.0, 858.0, 625.0, 446.0, 253.0, 202.0, 119.0, 104.0, 65.0, 58.0, 36.0, 33.0, 20.0, 17.0, 16.0, 10.0, 12.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0], "bins": [-0.53369140625, -0.5161285400390625, -0.498565673828125, -0.4810028076171875, -0.46343994140625, -0.4458770751953125, -0.428314208984375, -0.4107513427734375, -0.3931884765625, -0.3756256103515625, -0.358062744140625, -0.3404998779296875, -0.32293701171875, -0.3053741455078125, -0.287811279296875, -0.2702484130859375, -0.252685546875, -0.2351226806640625, -0.217559814453125, -0.1999969482421875, -0.18243408203125, -0.1648712158203125, -0.147308349609375, -0.1297454833984375, -0.1121826171875, -0.0946197509765625, -0.077056884765625, -0.0594940185546875, -0.04193115234375, -0.0243682861328125, -0.006805419921875, 0.0107574462890625, 0.0283203125, 0.0458831787109375, 0.063446044921875, 0.0810089111328125, 0.09857177734375, 0.1161346435546875, 0.133697509765625, 0.1512603759765625, 0.1688232421875, 0.1863861083984375, 0.203948974609375, 0.2215118408203125, 0.23907470703125, 0.2566375732421875, 0.274200439453125, 0.2917633056640625, 0.309326171875, 0.3268890380859375, 0.344451904296875, 0.3620147705078125, 0.37957763671875, 0.3971405029296875, 0.414703369140625, 0.4322662353515625, 0.4498291015625, 0.4673919677734375, 0.484954833984375, 0.5025177001953125, 0.52008056640625, 0.5376434326171875, 0.555206298828125, 0.5727691650390625, 0.59033203125]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 4.0, 1.0, 8.0, 5.0, 9.0, 19.0, 20.0, 32.0, 55.0, 61.0, 87.0, 99.0, 120.0, 104.0, 103.0, 71.0, 59.0, 29.0, 35.0, 20.0, 16.0, 10.0, 5.0, 6.0, 5.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.6435546875, -0.6226577758789062, -0.6017608642578125, -0.5808639526367188, -0.559967041015625, -0.5390701293945312, -0.5181732177734375, -0.49727630615234375, -0.47637939453125, -0.45548248291015625, -0.4345855712890625, -0.41368865966796875, -0.392791748046875, -0.37189483642578125, -0.3509979248046875, -0.33010101318359375, -0.3092041015625, -0.28830718994140625, -0.2674102783203125, -0.24651336669921875, -0.225616455078125, -0.20471954345703125, -0.1838226318359375, -0.16292572021484375, -0.14202880859375, -0.12113189697265625, -0.1002349853515625, -0.07933807373046875, -0.058441162109375, -0.03754425048828125, -0.0166473388671875, 0.00424957275390625, 0.025146484375, 0.04604339599609375, 0.0669403076171875, 0.08783721923828125, 0.108734130859375, 0.12963104248046875, 0.1505279541015625, 0.17142486572265625, 0.19232177734375, 0.21321868896484375, 0.2341156005859375, 0.25501251220703125, 0.275909423828125, 0.29680633544921875, 0.3177032470703125, 0.33860015869140625, 0.3594970703125, 0.38039398193359375, 0.4012908935546875, 0.42218780517578125, 0.443084716796875, 0.46398162841796875, 0.4848785400390625, 0.5057754516601562, 0.52667236328125, 0.5475692749023438, 0.5684661865234375, 0.5893630981445312, 0.610260009765625, 0.6311569213867188, 0.6520538330078125, 0.6729507446289062, 0.69384765625]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 3.0, 3.0, 6.0, 21.0, 40.0, 81.0, 117.0, 126.0, 185.0, 148.0, 107.0, 78.0, 47.0, 20.0, 10.0, 7.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.285005569458008, -7.029697895050049, -6.774389743804932, -6.519082069396973, -6.2637739181518555, -6.0084662437438965, -5.7531585693359375, -5.49785041809082, -5.242542743682861, -4.987235069274902, -4.731926918029785, -4.476619243621826, -4.221311569213867, -3.96600341796875, -3.710695743560791, -3.455387830734253, -3.200079917907715, -2.9447720050811768, -2.6894640922546387, -2.4341564178466797, -2.1788485050201416, -1.9235405921936035, -1.668232798576355, -1.4129250049591064, -1.1576170921325684, -0.902309238910675, -0.6470013856887817, -0.3916935324668884, -0.13638567924499512, 0.11892223358154297, 0.3742300271987915, 0.62953782081604, 0.8848447799682617, 1.1401526927947998, 1.3954604864120483, 1.6507682800292969, 1.906076192855835, 2.161384105682373, 2.416691780090332, 2.67199969291687, 2.927307605743408, 3.1826155185699463, 3.4379234313964844, 3.6932311058044434, 3.9485390186309814, 4.2038469314575195, 4.4591546058654785, 4.7144622802734375, 4.969770431518555, 5.225078105926514, 5.480386257171631, 5.73569393157959, 5.991002082824707, 6.246309757232666, 6.501617431640625, 6.756925582885742, 7.012233257293701, 7.26754093170166, 7.522849082946777, 7.778156757354736, 8.033464431762695, 8.288772583007812, 8.54408073425293, 8.79938793182373, 9.054696083068848]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 6.0, 13.0, 5.0, 4.0, 13.0, 14.0, 12.0, 15.0, 24.0, 24.0, 16.0, 17.0, 33.0, 20.0, 27.0, 26.0, 44.0, 47.0, 41.0, 40.0, 37.0, 31.0, 35.0, 38.0, 46.0, 37.0, 37.0, 35.0, 27.0, 28.0, 20.0, 24.0, 26.0, 21.0, 14.0, 18.0, 13.0, 12.0, 11.0, 9.0, 11.0, 9.0, 6.0, 4.0, 3.0, 2.0, 1.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0], "bins": [-3.366345167160034, -3.260174512863159, -3.154003858566284, -3.047833204269409, -2.941662549972534, -2.835491895675659, -2.729321002960205, -2.62315034866333, -2.516979694366455, -2.41080904006958, -2.304638385772705, -2.19846773147583, -2.092297077178955, -1.98612642288208, -1.8799556493759155, -1.7737849950790405, -1.667614459991455, -1.56144380569458, -1.455273151397705, -1.34910249710083, -1.242931842803955, -1.13676118850708, -1.0305904150009155, -0.9244197607040405, -0.8182491064071655, -0.7120784521102905, -0.6059077978134155, -0.49973708391189575, -0.39356642961502075, -0.28739577531814575, -0.18122506141662598, -0.07505440711975098, 0.031116247177124023, 0.13728691637516022, 0.2434575855731964, 0.3496282696723938, 0.4557989239692688, 0.5619695782661438, 0.6681402921676636, 0.7743109464645386, 0.8804816007614136, 0.9866522550582886, 1.0928229093551636, 1.1989936828613281, 1.3051643371582031, 1.4113349914550781, 1.5175056457519531, 1.6236763000488281, 1.7298469543457031, 1.8360176086425781, 1.9421882629394531, 2.048358917236328, 2.154529571533203, 2.260700225830078, 2.366870880126953, 2.473041534423828, 2.579212188720703, 2.685382843017578, 2.791553497314453, 2.897724151611328, 3.003894805908203, 3.110065460205078, 3.216236114501953, 3.322406768798828, 3.4285776615142822]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 11.0, 10.0, 13.0, 14.0, 31.0, 38.0, 43.0, 64.0, 64.0, 114.0, 167.0, 229.0, 319.0, 431.0, 599.0, 917.0, 1168.0, 1654.0, 2193.0, 2835.0, 3676.0, 6302.0, 1011250.0, 5148.0, 3358.0, 2514.0, 2022.0, 1480.0, 1071.0, 770.0, 586.0, 400.0, 307.0, 243.0, 185.0, 113.0, 83.0, 51.0, 47.0, 25.0, 16.0, 11.0, 11.0, 4.0, 7.0, 3.0, 7.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.26330828666687, -3.1592674255371094, -3.0552265644073486, -2.951185703277588, -2.847144603729248, -2.7431039810180664, -2.6390628814697266, -2.535022020339966, -2.430981159210205, -2.3269402980804443, -2.2228994369506836, -2.118858575820923, -2.014817714691162, -1.9107767343521118, -1.8067357540130615, -1.7026948928833008, -1.59865403175354, -1.4946131706237793, -1.3905723094940186, -1.2865313291549683, -1.1824904680252075, -1.0784496068954468, -0.9744086861610413, -0.8703677654266357, -0.766326904296875, -0.6622860431671143, -0.5582451224327087, -0.4542042315006256, -0.3501633405685425, -0.24612247943878174, -0.14208155870437622, -0.0380406379699707, 0.06599998474121094, 0.17004087567329407, 0.2740817666053772, 0.3781226575374603, 0.48216354846954346, 0.5862044095993042, 0.6902453303337097, 0.7942862510681152, 0.898327112197876, 1.0023679733276367, 1.1064088344573975, 1.2104498147964478, 1.3144906759262085, 1.4185315370559692, 1.5225725173950195, 1.6266133785247803, 1.730654239654541, 1.8346951007843018, 1.9387359619140625, 2.0427768230438232, 2.146817684173584, 2.250858783721924, 2.3548996448516846, 2.4589405059814453, 2.562981367111206, 2.667022228240967, 2.7710630893707275, 2.8751039505004883, 2.979145050048828, 3.0831856727600098, 3.1872267723083496, 3.2912676334381104, 3.395308494567871]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 5.0, 5.0, 13.0, 23.0, 140.0, 170.0, 749.0, 8554.0, 51386280.0, 71409.0, 3279.0, 414.0, 154.0, 77.0, 36.0, 24.0, 14.0, 3.0, 6.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.0625, -32.083946228027344, -31.105396270751953, -30.12684440612793, -29.148292541503906, -28.16973876953125, -27.191186904907227, -26.212635040283203, -25.23408317565918, -24.255531311035156, -23.276979446411133, -22.29842758178711, -21.319873809814453, -20.341323852539062, -19.362770080566406, -18.384218215942383, -17.40566635131836, -16.427114486694336, -15.448562622070312, -14.470009803771973, -13.49145793914795, -12.512906074523926, -11.534353256225586, -10.555801391601562, -9.577249526977539, -8.598697662353516, -7.620145320892334, -6.641592979431152, -5.663041114807129, -4.6844892501831055, -3.705936908721924, -2.727384567260742, -1.7488346099853516, -0.770282506942749, 0.20826959609985352, 1.186821699142456, 2.1653738021850586, 3.143925666809082, 4.122478008270264, 5.101030349731445, 6.079582214355469, 7.058134078979492, 8.036685943603516, 9.015238761901855, 9.993790626525879, 10.972342491149902, 11.950895309448242, 12.929447174072266, 13.907999038696289, 14.886550903320312, 15.865102767944336, 16.84365463256836, 17.822208404541016, 18.800758361816406, 19.779312133789062, 20.757863998413086, 21.73641586303711, 22.714967727661133, 23.693519592285156, 24.67207145690918, 25.650623321533203, 26.62917709350586, 27.607728958129883, 28.586280822753906, 29.56483268737793]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [3.0, 8.0, 3.0, 7.0, 16.0, 16.0, 27.0, 34.0, 61.0, 85.0, 150.0, 226.0, 410.0, 622.0, 914.0, 1522.0, 2483.0, 4066.0, 6650.0, 10406.0, 16729.0, 26531.0, 41004.0, 62175.0, 94163.0, 134846.0, 185562.0, 241687.0, 295806.0, 459630.0, 3334492.0, 343414.0, 280776.0, 223590.0, 168171.0, 120737.0, 82970.0, 54733.0, 35771.0, 22803.0, 14297.0, 8963.0, 5612.0, 3498.0, 2114.0, 1365.0, 823.0, 549.0, 337.0, 217.0, 135.0, 86.0, 49.0, 33.0, 22.0, 20.0, 12.0, 9.0, 5.0, 3.0, 4.0, 2.0, 0.0, 2.0], "bins": [-0.7099609375, -0.6865692138671875, -0.663177490234375, -0.6397857666015625, -0.61639404296875, -0.5930023193359375, -0.569610595703125, -0.5462188720703125, -0.5228271484375, -0.4994354248046875, -0.476043701171875, -0.4526519775390625, -0.42926025390625, -0.4058685302734375, -0.382476806640625, -0.3590850830078125, -0.335693359375, -0.3123016357421875, -0.288909912109375, -0.2655181884765625, -0.24212646484375, -0.2187347412109375, -0.195343017578125, -0.1719512939453125, -0.1485595703125, -0.1251678466796875, -0.101776123046875, -0.0783843994140625, -0.05499267578125, -0.0316009521484375, -0.008209228515625, 0.0151824951171875, 0.03857421875, 0.0619659423828125, 0.085357666015625, 0.1087493896484375, 0.13214111328125, 0.1555328369140625, 0.178924560546875, 0.2023162841796875, 0.2257080078125, 0.2490997314453125, 0.272491455078125, 0.2958831787109375, 0.31927490234375, 0.3426666259765625, 0.366058349609375, 0.3894500732421875, 0.412841796875, 0.4362335205078125, 0.459625244140625, 0.4830169677734375, 0.50640869140625, 0.5298004150390625, 0.553192138671875, 0.5765838623046875, 0.5999755859375, 0.6233673095703125, 0.646759033203125, 0.6701507568359375, 0.69354248046875, 0.7169342041015625, 0.740325927734375, 0.7637176513671875, 0.787109375]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 1.0, 9.0, 10.0, 15.0, 20.0, 22.0, 20.0, 29.0, 35.0, 24.0, 33.0, 35.0, 30.0, 42.0, 50.0, 57.0, 66.0, 1033.0, 94.0, 43.0, 39.0, 36.0, 42.0, 35.0, 32.0, 24.0, 27.0, 23.0, 12.0, 27.0, 15.0, 11.0, 9.0, 6.0, 3.0, 5.0, 3.0, 1.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.390625, -18.8614501953125, -18.332275390625, -17.8031005859375, -17.27392578125, -16.7447509765625, -16.215576171875, -15.6864013671875, -15.1572265625, -14.6280517578125, -14.098876953125, -13.5697021484375, -13.04052734375, -12.5113525390625, -11.982177734375, -11.4530029296875, -10.923828125, -10.3946533203125, -9.865478515625, -9.3363037109375, -8.80712890625, -8.2779541015625, -7.748779296875, -7.2196044921875, -6.6904296875, -6.1612548828125, -5.632080078125, -5.1029052734375, -4.57373046875, -4.0445556640625, -3.515380859375, -2.9862060546875, -2.45703125, -1.9278564453125, -1.398681640625, -0.8695068359375, -0.34033203125, 0.1888427734375, 0.718017578125, 1.2471923828125, 1.7763671875, 2.3055419921875, 2.834716796875, 3.3638916015625, 3.89306640625, 4.4222412109375, 4.951416015625, 5.4805908203125, 6.009765625, 6.5389404296875, 7.068115234375, 7.5972900390625, 8.12646484375, 8.6556396484375, 9.184814453125, 9.7139892578125, 10.2431640625, 10.7723388671875, 11.301513671875, 11.8306884765625, 12.35986328125, 12.8890380859375, 13.418212890625, 13.9473876953125, 14.4765625]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [5.0, 4.0, 5.0, 16.0, 22.0, 34.0, 43.0, 53.0, 107.0, 147.0, 239.0, 339.0, 532.0, 878.0, 1371.0, 2234.0, 3434.0, 5259.0, 8410.0, 12714.0, 19250.0, 28754.0, 42415.0, 60073.0, 85048.0, 115853.0, 152440.0, 191797.0, 230935.0, 266041.0, 729750.0, 2976170.0, 285683.0, 245544.0, 210004.0, 169120.0, 130857.0, 97507.0, 70399.0, 49210.0, 33682.0, 23002.0, 15077.0, 9795.0, 6425.0, 4026.0, 2500.0, 1630.0, 989.0, 577.0, 413.0, 258.0, 161.0, 94.0, 56.0, 31.0, 17.0, 10.0, 7.0, 2.0, 5.0, 0.0, 2.0, 1.0], "bins": [-0.5390625, -0.5217971801757812, -0.5045318603515625, -0.48726654052734375, -0.470001220703125, -0.45273590087890625, -0.4354705810546875, -0.41820526123046875, -0.40093994140625, -0.38367462158203125, -0.3664093017578125, -0.34914398193359375, -0.331878662109375, -0.31461334228515625, -0.2973480224609375, -0.28008270263671875, -0.2628173828125, -0.24555206298828125, -0.2282867431640625, -0.21102142333984375, -0.193756103515625, -0.17649078369140625, -0.1592254638671875, -0.14196014404296875, -0.12469482421875, -0.10742950439453125, -0.0901641845703125, -0.07289886474609375, -0.055633544921875, -0.03836822509765625, -0.0211029052734375, -0.00383758544921875, 0.013427734375, 0.03069305419921875, 0.0479583740234375, 0.06522369384765625, 0.082489013671875, 0.09975433349609375, 0.1170196533203125, 0.13428497314453125, 0.15155029296875, 0.16881561279296875, 0.1860809326171875, 0.20334625244140625, 0.220611572265625, 0.23787689208984375, 0.2551422119140625, 0.27240753173828125, 0.2896728515625, 0.30693817138671875, 0.3242034912109375, 0.34146881103515625, 0.358734130859375, 0.37599945068359375, 0.3932647705078125, 0.41053009033203125, 0.42779541015625, 0.44506072998046875, 0.4623260498046875, 0.47959136962890625, 0.496856689453125, 0.5141220092773438, 0.5313873291015625, 0.5486526489257812, 0.56591796875]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 6.0, 6.0, 9.0, 11.0, 13.0, 17.0, 13.0, 20.0, 30.0, 26.0, 38.0, 25.0, 39.0, 40.0, 38.0, 39.0, 48.0, 53.0, 959.0, 157.0, 41.0, 46.0, 60.0, 30.0, 41.0, 32.0, 28.0, 29.0, 23.0, 23.0, 18.0, 18.0, 12.0, 10.0, 8.0, 2.0, 4.0, 3.0, 2.0, 8.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.7734375, -15.3448486328125, -14.916259765625, -14.4876708984375, -14.05908203125, -13.6304931640625, -13.201904296875, -12.7733154296875, -12.3447265625, -11.9161376953125, -11.487548828125, -11.0589599609375, -10.63037109375, -10.2017822265625, -9.773193359375, -9.3446044921875, -8.916015625, -8.4874267578125, -8.058837890625, -7.6302490234375, -7.20166015625, -6.7730712890625, -6.344482421875, -5.9158935546875, -5.4873046875, -5.0587158203125, -4.630126953125, -4.2015380859375, -3.77294921875, -3.3443603515625, -2.915771484375, -2.4871826171875, -2.05859375, -1.6300048828125, -1.201416015625, -0.7728271484375, -0.34423828125, 0.0843505859375, 0.512939453125, 0.9415283203125, 1.3701171875, 1.7987060546875, 2.227294921875, 2.6558837890625, 3.08447265625, 3.5130615234375, 3.941650390625, 4.3702392578125, 4.798828125, 5.2274169921875, 5.656005859375, 6.0845947265625, 6.51318359375, 6.9417724609375, 7.370361328125, 7.7989501953125, 8.2275390625, 8.6561279296875, 9.084716796875, 9.5133056640625, 9.94189453125, 10.3704833984375, 10.799072265625, 11.2276611328125, 11.65625]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 5.0, 5.0, 6.0, 5.0, 5.0, 12.0, 15.0, 17.0, 17.0, 30.0, 37.0, 40.0, 55.0, 68.0, 91.0, 110.0, 132.0, 208.0, 250.0, 365.0, 559.0, 1071.0, 2421.0, 5463.0, 12925.0, 29548.0, 64871.0, 137997.0, 5725529.0, 167886.0, 77461.0, 35559.0, 15577.0, 6629.0, 2945.0, 1327.0, 656.0, 385.0, 285.0, 186.0, 155.0, 107.0, 81.0, 89.0, 51.0, 55.0, 43.0, 27.0, 17.0, 17.0, 7.0, 8.0, 7.0, 8.0, 7.0, 1.0, 2.0, 3.0, 4.0, 3.0, 3.0], "bins": [-3.0390625, -2.94293212890625, -2.8468017578125, -2.75067138671875, -2.654541015625, -2.55841064453125, -2.4622802734375, -2.36614990234375, -2.27001953125, -2.17388916015625, -2.0777587890625, -1.98162841796875, -1.885498046875, -1.78936767578125, -1.6932373046875, -1.59710693359375, -1.5009765625, -1.40484619140625, -1.3087158203125, -1.21258544921875, -1.116455078125, -1.02032470703125, -0.9241943359375, -0.82806396484375, -0.73193359375, -0.63580322265625, -0.5396728515625, -0.44354248046875, -0.347412109375, -0.25128173828125, -0.1551513671875, -0.05902099609375, 0.037109375, 0.13323974609375, 0.2293701171875, 0.32550048828125, 0.421630859375, 0.51776123046875, 0.6138916015625, 0.71002197265625, 0.80615234375, 0.90228271484375, 0.9984130859375, 1.09454345703125, 1.190673828125, 1.28680419921875, 1.3829345703125, 1.47906494140625, 1.5751953125, 1.67132568359375, 1.7674560546875, 1.86358642578125, 1.959716796875, 2.05584716796875, 2.1519775390625, 2.24810791015625, 2.34423828125, 2.44036865234375, 2.5364990234375, 2.63262939453125, 2.728759765625, 2.82489013671875, 2.9210205078125, 3.01715087890625, 3.11328125]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 2.0, 4.0, 9.0, 7.0, 10.0, 15.0, 10.0, 13.0, 17.0, 16.0, 16.0, 31.0, 30.0, 31.0, 24.0, 38.0, 32.0, 30.0, 40.0, 27.0, 31.0, 87.0, 1001.0, 58.0, 35.0, 34.0, 33.0, 36.0, 32.0, 28.0, 22.0, 18.0, 28.0, 24.0, 17.0, 17.0, 15.0, 13.0, 14.0, 12.0, 9.0, 8.0, 5.0, 6.0, 10.0, 9.0, 5.0, 5.0, 4.0, 5.0, 6.0, 0.0, 1.0, 1.0], "bins": [-10.125, -9.8126220703125, -9.500244140625, -9.1878662109375, -8.87548828125, -8.5631103515625, -8.250732421875, -7.9383544921875, -7.6259765625, -7.3135986328125, -7.001220703125, -6.6888427734375, -6.37646484375, -6.0640869140625, -5.751708984375, -5.4393310546875, -5.126953125, -4.8145751953125, -4.502197265625, -4.1898193359375, -3.87744140625, -3.5650634765625, -3.252685546875, -2.9403076171875, -2.6279296875, -2.3155517578125, -2.003173828125, -1.6907958984375, -1.37841796875, -1.0660400390625, -0.753662109375, -0.4412841796875, -0.12890625, 0.1834716796875, 0.495849609375, 0.8082275390625, 1.12060546875, 1.4329833984375, 1.745361328125, 2.0577392578125, 2.3701171875, 2.6824951171875, 2.994873046875, 3.3072509765625, 3.61962890625, 3.9320068359375, 4.244384765625, 4.5567626953125, 4.869140625, 5.1815185546875, 5.493896484375, 5.8062744140625, 6.11865234375, 6.4310302734375, 6.743408203125, 7.0557861328125, 7.3681640625, 7.6805419921875, 7.992919921875, 8.3052978515625, 8.61767578125, 8.9300537109375, 9.242431640625, 9.5548095703125, 9.8671875]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 13.0, 37.0, 101.0, 298.0, 342.0, 122.0, 54.0, 20.0, 11.0, 5.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-133.92686462402344, -130.41455078125, -126.90223693847656, -123.38992309570312, -119.87760925292969, -116.36529541015625, -112.85298156738281, -109.34066009521484, -105.8283462524414, -102.31603240966797, -98.80371856689453, -95.2914047241211, -91.77909088134766, -88.26676940917969, -84.75445556640625, -81.24214172363281, -77.72982788085938, -74.21751403808594, -70.7052001953125, -67.19288635253906, -63.68056869506836, -60.16825485229492, -56.655941009521484, -53.14362335205078, -49.631317138671875, -46.11900329589844, -42.606689453125, -39.09437561035156, -35.58205795288086, -32.06974411010742, -28.557430267333984, -25.045114517211914, -21.532798767089844, -18.020484924316406, -14.508169174194336, -10.995855331420898, -7.4835405349731445, -3.9712257385253906, -0.4589118957519531, 3.053403854370117, 6.565717697143555, 10.078032493591309, 13.590347290039062, 17.1026611328125, 20.614974975585938, 24.127290725708008, 27.639604568481445, 31.151920318603516, 34.66423416137695, 38.17654800415039, 41.68886184692383, 45.20117950439453, 48.71349334716797, 52.225807189941406, 55.738121032714844, 59.25043487548828, 62.76274871826172, 66.27506256103516, 69.7873764038086, 73.29969024658203, 76.81200408935547, 80.32432556152344, 83.83663940429688, 87.34895324707031, 90.86126708984375]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 4.0, 1.0, 0.0, 6.0, 5.0, 7.0, 4.0, 3.0, 9.0, 16.0, 20.0, 16.0, 26.0, 36.0, 45.0, 67.0, 58.0, 73.0, 118.0, 89.0, 80.0, 75.0, 53.0, 49.0, 32.0, 27.0, 19.0, 11.0, 18.0, 8.0, 10.0, 5.0, 3.0, 5.0, 2.0, 3.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-158.6954345703125, -154.61233520507812, -150.5292205810547, -146.44610595703125, -142.36300659179688, -138.2799072265625, -134.19679260253906, -130.11367797851562, -126.03057861328125, -121.94747161865234, -117.86436462402344, -113.78125762939453, -109.69815063476562, -105.61504364013672, -101.53193664550781, -97.4488296508789, -93.36572265625, -89.2826156616211, -85.19950866699219, -81.11640167236328, -77.03329467773438, -72.95018768310547, -68.86708068847656, -64.78397369384766, -60.70086669921875, -56.617759704589844, -52.53465270996094, -48.45154571533203, -44.368438720703125, -40.28533172607422, -36.20222473144531, -32.119117736816406, -28.036026000976562, -23.952919006347656, -19.86981201171875, -15.786705017089844, -11.703598022460938, -7.620491027832031, -3.537384033203125, 0.5457229614257812, 4.6288299560546875, 8.711936950683594, 12.7950439453125, 16.878150939941406, 20.961257934570312, 25.04436492919922, 29.127471923828125, 33.21057891845703, 37.29368591308594, 41.376792907714844, 45.45989990234375, 49.543006896972656, 53.62611389160156, 57.70922088623047, 61.792327880859375, 65.87543487548828, 69.95854187011719, 74.0416488647461, 78.124755859375, 82.2078628540039, 86.29096984863281, 90.37407684326172, 94.45718383789062, 98.54029083251953, 102.62339782714844]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 4.0, 9.0, 7.0, 19.0, 11.0, 23.0, 39.0, 42.0, 56.0, 78.0, 90.0, 119.0, 213.0, 308.0, 448.0, 740.0, 1167.0, 1925.0, 3541.0, 7069.0, 18122.0, 82595.0, 3913789.0, 120008.0, 23635.0, 9148.0, 4489.0, 2370.0, 1391.0, 837.0, 591.0, 383.0, 293.0, 168.0, 153.0, 97.0, 79.0, 67.0, 57.0, 25.0, 14.0, 13.0, 12.0, 11.0, 10.0, 9.0, 3.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.140625, -0.13602638244628906, -0.13142776489257812, -0.1268291473388672, -0.12223052978515625, -0.11763191223144531, -0.11303329467773438, -0.10843467712402344, -0.1038360595703125, -0.09923744201660156, -0.09463882446289062, -0.09004020690917969, -0.08544158935546875, -0.08084297180175781, -0.07624435424804688, -0.07164573669433594, -0.067047119140625, -0.06244850158691406, -0.057849884033203125, -0.05325126647949219, -0.04865264892578125, -0.04405403137207031, -0.039455413818359375, -0.03485679626464844, -0.0302581787109375, -0.025659561157226562, -0.021060943603515625, -0.016462326049804688, -0.01186370849609375, -0.0072650909423828125, -0.002666473388671875, 0.0019321441650390625, 0.00653076171875, 0.011129379272460938, 0.015727996826171875, 0.020326614379882812, 0.02492523193359375, 0.029523849487304688, 0.034122467041015625, 0.03872108459472656, 0.0433197021484375, 0.04791831970214844, 0.052516937255859375, 0.05711555480957031, 0.06171417236328125, 0.06631278991699219, 0.07091140747070312, 0.07551002502441406, 0.080108642578125, 0.08470726013183594, 0.08930587768554688, 0.09390449523925781, 0.09850311279296875, 0.10310173034667969, 0.10770034790039062, 0.11229896545410156, 0.1168975830078125, 0.12149620056152344, 0.12609481811523438, 0.1306934356689453, 0.13529205322265625, 0.1398906707763672, 0.14448928833007812, 0.14908790588378906, 0.1536865234375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 8.0, 3.0, 2.0, 2.0, 4.0, 5.0, 5.0, 4.0, 6.0, 5.0, 5.0, 10.0, 8.0, 10.0, 22.0, 135.0, 625.0, 27.0, 14.0, 20.0, 12.0, 13.0, 5.0, 9.0, 5.0, 6.0, 4.0, 3.0, 1.0, 4.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.1231689453125, -0.11947822570800781, -0.11578750610351562, -0.11209678649902344, -0.10840606689453125, -0.10471534729003906, -0.10102462768554688, -0.09733390808105469, -0.0936431884765625, -0.08995246887207031, -0.08626174926757812, -0.08257102966308594, -0.07888031005859375, -0.07518959045410156, -0.07149887084960938, -0.06780815124511719, -0.064117431640625, -0.06042671203613281, -0.056735992431640625, -0.05304527282714844, -0.04935455322265625, -0.04566383361816406, -0.041973114013671875, -0.03828239440917969, -0.0345916748046875, -0.030900955200195312, -0.027210235595703125, -0.023519515991210938, -0.01982879638671875, -0.016138076782226562, -0.012447357177734375, -0.008756637573242188, -0.00506591796875, -0.0013751983642578125, 0.002315521240234375, 0.0060062408447265625, 0.00969696044921875, 0.013387680053710938, 0.017078399658203125, 0.020769119262695312, 0.0244598388671875, 0.028150558471679688, 0.031841278076171875, 0.03553199768066406, 0.03922271728515625, 0.04291343688964844, 0.046604156494140625, 0.05029487609863281, 0.053985595703125, 0.05767631530761719, 0.061367034912109375, 0.06505775451660156, 0.06874847412109375, 0.07243919372558594, 0.07612991333007812, 0.07982063293457031, 0.0835113525390625, 0.08720207214355469, 0.09089279174804688, 0.09458351135253906, 0.09827423095703125, 0.10196495056152344, 0.10565567016601562, 0.10934638977050781, 0.113037109375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 6.0, 5.0, 6.0, 11.0, 15.0, 21.0, 25.0, 30.0, 61.0, 68.0, 131.0, 175.0, 338.0, 627.0, 1438.0, 3565.0, 10267.0, 39697.0, 287368.0, 3442156.0, 345825.0, 44402.0, 11215.0, 3789.0, 1492.0, 666.0, 316.0, 212.0, 91.0, 90.0, 48.0, 36.0, 22.0, 15.0, 25.0, 9.0, 4.0, 8.0, 6.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1573486328125, -0.1525115966796875, -0.147674560546875, -0.1428375244140625, -0.13800048828125, -0.1331634521484375, -0.128326416015625, -0.1234893798828125, -0.11865234375, -0.1138153076171875, -0.108978271484375, -0.1041412353515625, -0.09930419921875, -0.0944671630859375, -0.089630126953125, -0.0847930908203125, -0.0799560546875, -0.0751190185546875, -0.070281982421875, -0.0654449462890625, -0.06060791015625, -0.0557708740234375, -0.050933837890625, -0.0460968017578125, -0.041259765625, -0.0364227294921875, -0.031585693359375, -0.0267486572265625, -0.02191162109375, -0.0170745849609375, -0.012237548828125, -0.0074005126953125, -0.0025634765625, 0.0022735595703125, 0.007110595703125, 0.0119476318359375, 0.01678466796875, 0.0216217041015625, 0.026458740234375, 0.0312957763671875, 0.0361328125, 0.0409698486328125, 0.045806884765625, 0.0506439208984375, 0.05548095703125, 0.0603179931640625, 0.065155029296875, 0.0699920654296875, 0.0748291015625, 0.0796661376953125, 0.084503173828125, 0.0893402099609375, 0.09417724609375, 0.0990142822265625, 0.103851318359375, 0.1086883544921875, 0.113525390625, 0.1183624267578125, 0.123199462890625, 0.1280364990234375, 0.13287353515625, 0.1377105712890625, 0.142547607421875, 0.1473846435546875, 0.1522216796875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 8.0, 5.0, 2.0, 4.0, 2.0, 9.0, 15.0, 18.0, 26.0, 24.0, 42.0, 43.0, 108.0, 164.0, 312.0, 784.0, 1344.0, 504.0, 229.0, 137.0, 86.0, 42.0, 46.0, 25.0, 20.0, 22.0, 10.0, 13.0, 7.0, 4.0, 1.0, 8.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.091796875, -0.08895301818847656, -0.08610916137695312, -0.08326530456542969, -0.08042144775390625, -0.07757759094238281, -0.07473373413085938, -0.07188987731933594, -0.0690460205078125, -0.06620216369628906, -0.06335830688476562, -0.06051445007324219, -0.05767059326171875, -0.05482673645019531, -0.051982879638671875, -0.04913902282714844, -0.046295166015625, -0.04345130920410156, -0.040607452392578125, -0.03776359558105469, -0.03491973876953125, -0.03207588195800781, -0.029232025146484375, -0.026388168334960938, -0.0235443115234375, -0.020700454711914062, -0.017856597900390625, -0.015012741088867188, -0.01216888427734375, -0.009325027465820312, -0.006481170654296875, -0.0036373138427734375, -0.00079345703125, 0.0020503997802734375, 0.004894256591796875, 0.0077381134033203125, 0.01058197021484375, 0.013425827026367188, 0.016269683837890625, 0.019113540649414062, 0.0219573974609375, 0.024801254272460938, 0.027645111083984375, 0.030488967895507812, 0.03333282470703125, 0.03617668151855469, 0.039020538330078125, 0.04186439514160156, 0.044708251953125, 0.04755210876464844, 0.050395965576171875, 0.05323982238769531, 0.05608367919921875, 0.05892753601074219, 0.061771392822265625, 0.06461524963378906, 0.0674591064453125, 0.07030296325683594, 0.07314682006835938, 0.07599067687988281, 0.07883453369140625, 0.08167839050292969, 0.08452224731445312, 0.08736610412597656, 0.0902099609375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 30.0, 156.0, 574.0, 209.0, 23.0, 4.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.0225844383239746, -0.9930246472358704, -0.9634647965431213, -0.9339050054550171, -0.9043452143669128, -0.8747854232788086, -0.8452255725860596, -0.8156657814979553, -0.7861059904098511, -0.7565461993217468, -0.7269863486289978, -0.6974265575408936, -0.6678667664527893, -0.6383069753646851, -0.608747124671936, -0.5791873335838318, -0.5496275424957275, -0.5200677514076233, -0.49050793051719666, -0.46094810962677, -0.43138831853866577, -0.40182849764823914, -0.3722686767578125, -0.34270888566970825, -0.31314903497695923, -0.2835892140865326, -0.25402942299842834, -0.2244696021080017, -0.19490981101989746, -0.16534999012947083, -0.13579018414020538, -0.10623037815093994, -0.0766705870628357, -0.04711078107357025, -0.01755097135901451, 0.01200883835554123, 0.04156864434480667, 0.07112845778465271, 0.10068826377391815, 0.1302480697631836, 0.15980787575244904, 0.18936768174171448, 0.21892748773097992, 0.24848729372024536, 0.278047114610672, 0.30760693550109863, 0.3371667265892029, 0.36672651767730713, 0.39628633856773376, 0.4258461594581604, 0.45540595054626465, 0.4849657714366913, 0.5145255923271179, 0.5440853834152222, 0.5736451745033264, 0.6032049655914307, 0.6327648162841797, 0.6623246073722839, 0.691884458065033, 0.7214442491531372, 0.7510040402412415, 0.7805638313293457, 0.8101236820220947, 0.839683473110199, 0.8692432641983032]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 10.0, 11.0, 11.0, 10.0, 16.0, 24.0, 33.0, 35.0, 46.0, 48.0, 57.0, 74.0, 61.0, 71.0, 82.0, 53.0, 61.0, 57.0, 42.0, 44.0, 40.0, 30.0, 26.0, 15.0, 9.0, 6.0, 9.0, 3.0, 2.0, 7.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34378623962402344, -0.33228981494903564, -0.32079336047172546, -0.3092969059944153, -0.2978004813194275, -0.2863040566444397, -0.2748076021671295, -0.26331114768981934, -0.25181472301483154, -0.24031828343868256, -0.22882184386253357, -0.21732540428638458, -0.2058289647102356, -0.1943325251340866, -0.18283608555793762, -0.17133964598178864, -0.15984320640563965, -0.14834676682949066, -0.13685032725334167, -0.1253538876771927, -0.1138574481010437, -0.10236100852489471, -0.09086456894874573, -0.07936812937259674, -0.06787168979644775, -0.05637525022029877, -0.04487881064414978, -0.03338237106800079, -0.021885931491851807, -0.01038949191570282, 0.001106947660446167, 0.012603387236595154, 0.02409982681274414, 0.03559626638889313, 0.047092705965042114, 0.0585891455411911, 0.07008558511734009, 0.08158202469348907, 0.09307846426963806, 0.10457490384578705, 0.11607134342193604, 0.12756778299808502, 0.139064222574234, 0.150560662150383, 0.16205710172653198, 0.17355354130268097, 0.18504998087882996, 0.19654642045497894, 0.20804286003112793, 0.21953929960727692, 0.2310357391834259, 0.2425321787595749, 0.2540286183357239, 0.26552504301071167, 0.27702149748802185, 0.28851795196533203, 0.3000143766403198, 0.3115108013153076, 0.3230072557926178, 0.334503710269928, 0.34600013494491577, 0.35749655961990356, 0.36899301409721375, 0.3804894685745239, 0.3919858932495117]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 4.0, 5.0, 8.0, 11.0, 14.0, 23.0, 29.0, 34.0, 43.0, 63.0, 93.0, 108.0, 150.0, 226.0, 291.0, 365.0, 512.0, 709.0, 988.0, 1295.0, 1854.0, 2637.0, 3790.0, 5719.0, 9156.0, 15429.0, 30174.0, 222880.0, 671474.0, 33854.0, 16934.0, 9614.0, 6141.0, 4060.0, 2721.0, 1942.0, 1373.0, 1048.0, 743.0, 526.0, 417.0, 316.0, 185.0, 163.0, 112.0, 77.0, 70.0, 57.0, 35.0, 26.0, 19.0, 19.0, 6.0, 8.0, 7.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.360107421875, -0.3481330871582031, -0.33615875244140625, -0.3241844177246094, -0.3122100830078125, -0.3002357482910156, -0.28826141357421875, -0.2762870788574219, -0.264312744140625, -0.2523384094238281, -0.24036407470703125, -0.22838973999023438, -0.2164154052734375, -0.20444107055664062, -0.19246673583984375, -0.18049240112304688, -0.16851806640625, -0.15654373168945312, -0.14456939697265625, -0.13259506225585938, -0.1206207275390625, -0.10864639282226562, -0.09667205810546875, -0.08469772338867188, -0.072723388671875, -0.060749053955078125, -0.04877471923828125, -0.036800384521484375, -0.0248260498046875, -0.012851715087890625, -0.00087738037109375, 0.011096954345703125, 0.0230712890625, 0.035045623779296875, 0.04701995849609375, 0.058994293212890625, 0.0709686279296875, 0.08294296264648438, 0.09491729736328125, 0.10689163208007812, 0.118865966796875, 0.13084030151367188, 0.14281463623046875, 0.15478897094726562, 0.1667633056640625, 0.17873764038085938, 0.19071197509765625, 0.20268630981445312, 0.21466064453125, 0.22663497924804688, 0.23860931396484375, 0.2505836486816406, 0.2625579833984375, 0.2745323181152344, 0.28650665283203125, 0.2984809875488281, 0.310455322265625, 0.3224296569824219, 0.33440399169921875, 0.3463783264160156, 0.3583526611328125, 0.3703269958496094, 0.38230133056640625, 0.3942756652832031, 0.40625]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 3.0, 1.0, 2.0, 5.0, 4.0, 4.0, 4.0, 5.0, 8.0, 5.0, 9.0, 9.0, 11.0, 34.0, 438.0, 313.0, 23.0, 15.0, 19.0, 17.0, 6.0, 7.0, 9.0, 7.0, 5.0, 1.0, 3.0, 3.0, 4.0, 4.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.12188720703125, -0.1182088851928711, -0.11453056335449219, -0.11085224151611328, -0.10717391967773438, -0.10349559783935547, -0.09981727600097656, -0.09613895416259766, -0.09246063232421875, -0.08878231048583984, -0.08510398864746094, -0.08142566680908203, -0.07774734497070312, -0.07406902313232422, -0.07039070129394531, -0.0667123794555664, -0.0630340576171875, -0.059355735778808594, -0.05567741394042969, -0.05199909210205078, -0.048320770263671875, -0.04464244842529297, -0.04096412658691406, -0.037285804748535156, -0.03360748291015625, -0.029929161071777344, -0.026250839233398438, -0.02257251739501953, -0.018894195556640625, -0.015215873718261719, -0.011537551879882812, -0.007859230041503906, -0.004180908203125, -0.0005025863647460938, 0.0031757354736328125, 0.006854057312011719, 0.010532379150390625, 0.014210700988769531, 0.017889022827148438, 0.021567344665527344, 0.02524566650390625, 0.028923988342285156, 0.03260231018066406, 0.03628063201904297, 0.039958953857421875, 0.04363727569580078, 0.04731559753417969, 0.050993919372558594, 0.0546722412109375, 0.058350563049316406, 0.06202888488769531, 0.06570720672607422, 0.06938552856445312, 0.07306385040283203, 0.07674217224121094, 0.08042049407958984, 0.08409881591796875, 0.08777713775634766, 0.09145545959472656, 0.09513378143310547, 0.09881210327148438, 0.10249042510986328, 0.10616874694824219, 0.1098470687866211, 0.113525390625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 7.0, 4.0, 8.0, 18.0, 14.0, 22.0, 43.0, 49.0, 61.0, 100.0, 126.0, 157.0, 235.0, 437.0, 696.0, 1402.0, 3123.0, 7631.0, 22706.0, 85057.0, 388808.0, 410027.0, 89256.0, 23657.0, 8164.0, 3218.0, 1435.0, 717.0, 452.0, 267.0, 180.0, 144.0, 93.0, 55.0, 59.0, 43.0, 30.0, 18.0, 10.0, 11.0, 5.0, 7.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.356689453125, -0.34588623046875, -0.3350830078125, -0.32427978515625, -0.3134765625, -0.30267333984375, -0.2918701171875, -0.28106689453125, -0.270263671875, -0.25946044921875, -0.2486572265625, -0.23785400390625, -0.22705078125, -0.21624755859375, -0.2054443359375, -0.19464111328125, -0.183837890625, -0.17303466796875, -0.1622314453125, -0.15142822265625, -0.140625, -0.12982177734375, -0.1190185546875, -0.10821533203125, -0.097412109375, -0.08660888671875, -0.0758056640625, -0.06500244140625, -0.05419921875, -0.04339599609375, -0.0325927734375, -0.02178955078125, -0.010986328125, -0.00018310546875, 0.0106201171875, 0.02142333984375, 0.0322265625, 0.04302978515625, 0.0538330078125, 0.06463623046875, 0.075439453125, 0.08624267578125, 0.0970458984375, 0.10784912109375, 0.11865234375, 0.12945556640625, 0.1402587890625, 0.15106201171875, 0.161865234375, 0.17266845703125, 0.1834716796875, 0.19427490234375, 0.205078125, 0.21588134765625, 0.2266845703125, 0.23748779296875, 0.248291015625, 0.25909423828125, 0.2698974609375, 0.28070068359375, 0.29150390625, 0.30230712890625, 0.3131103515625, 0.32391357421875, 0.334716796875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 8.0, 6.0, 15.0, 11.0, 15.0, 13.0, 21.0, 23.0, 27.0, 34.0, 30.0, 33.0, 21.0, 37.0, 53.0, 30.0, 43.0, 51.0, 45.0, 47.0, 47.0, 50.0, 42.0, 39.0, 27.0, 35.0, 26.0, 30.0, 37.0, 22.0, 16.0, 15.0, 13.0, 14.0, 5.0, 3.0, 7.0, 3.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4921875, -0.47589111328125, -0.4595947265625, -0.44329833984375, -0.427001953125, -0.41070556640625, -0.3944091796875, -0.37811279296875, -0.36181640625, -0.34552001953125, -0.3292236328125, -0.31292724609375, -0.296630859375, -0.28033447265625, -0.2640380859375, -0.24774169921875, -0.2314453125, -0.21514892578125, -0.1988525390625, -0.18255615234375, -0.166259765625, -0.14996337890625, -0.1336669921875, -0.11737060546875, -0.10107421875, -0.08477783203125, -0.0684814453125, -0.05218505859375, -0.035888671875, -0.01959228515625, -0.0032958984375, 0.01300048828125, 0.029296875, 0.04559326171875, 0.0618896484375, 0.07818603515625, 0.094482421875, 0.11077880859375, 0.1270751953125, 0.14337158203125, 0.15966796875, 0.17596435546875, 0.1922607421875, 0.20855712890625, 0.224853515625, 0.24114990234375, 0.2574462890625, 0.27374267578125, 0.2900390625, 0.30633544921875, 0.3226318359375, 0.33892822265625, 0.355224609375, 0.37152099609375, 0.3878173828125, 0.40411376953125, 0.42041015625, 0.43670654296875, 0.4530029296875, 0.46929931640625, 0.485595703125, 0.50189208984375, 0.5181884765625, 0.53448486328125, 0.55078125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 6.0, 6.0, 4.0, 5.0, 12.0, 13.0, 17.0, 19.0, 33.0, 37.0, 79.0, 131.0, 235.0, 504.0, 1300.0, 3837.0, 26158.0, 960750.0, 47496.0, 5168.0, 1509.0, 594.0, 249.0, 149.0, 87.0, 45.0, 33.0, 21.0, 16.0, 13.0, 9.0, 2.0, 5.0, 7.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4794921875, -1.435455322265625, -1.39141845703125, -1.347381591796875, -1.3033447265625, -1.259307861328125, -1.21527099609375, -1.171234130859375, -1.127197265625, -1.083160400390625, -1.03912353515625, -0.995086669921875, -0.9510498046875, -0.907012939453125, -0.86297607421875, -0.818939208984375, -0.77490234375, -0.730865478515625, -0.68682861328125, -0.642791748046875, -0.5987548828125, -0.554718017578125, -0.51068115234375, -0.466644287109375, -0.422607421875, -0.378570556640625, -0.33453369140625, -0.290496826171875, -0.2464599609375, -0.202423095703125, -0.15838623046875, -0.114349365234375, -0.0703125, -0.026275634765625, 0.01776123046875, 0.061798095703125, 0.1058349609375, 0.149871826171875, 0.19390869140625, 0.237945556640625, 0.281982421875, 0.326019287109375, 0.37005615234375, 0.414093017578125, 0.4581298828125, 0.502166748046875, 0.54620361328125, 0.590240478515625, 0.63427734375, 0.678314208984375, 0.72235107421875, 0.766387939453125, 0.8104248046875, 0.854461669921875, 0.89849853515625, 0.942535400390625, 0.986572265625, 1.030609130859375, 1.07464599609375, 1.118682861328125, 1.1627197265625, 1.206756591796875, 1.25079345703125, 1.294830322265625, 1.3388671875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 4.0, 7.0, 5.0, 4.0, 15.0, 14.0, 30.0, 37.0, 59.0, 79.0, 137.0, 168.0, 154.0, 88.0, 63.0, 56.0, 32.0, 10.0, 13.0, 7.0, 6.0, 5.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.412101745605469e-05, -5.2012503147125244e-05, -4.99039888381958e-05, -4.779547452926636e-05, -4.5686960220336914e-05, -4.357844591140747e-05, -4.146993160247803e-05, -3.9361417293548584e-05, -3.725290298461914e-05, -3.51443886756897e-05, -3.3035874366760254e-05, -3.092736005783081e-05, -2.8818845748901367e-05, -2.6710331439971924e-05, -2.460181713104248e-05, -2.2493302822113037e-05, -2.0384788513183594e-05, -1.827627420425415e-05, -1.6167759895324707e-05, -1.4059245586395264e-05, -1.195073127746582e-05, -9.842216968536377e-06, -7.733702659606934e-06, -5.62518835067749e-06, -3.516674041748047e-06, -1.4081597328186035e-06, 7.003545761108398e-07, 2.808868885040283e-06, 4.9173831939697266e-06, 7.02589750289917e-06, 9.134411811828613e-06, 1.1242926120758057e-05, 1.33514404296875e-05, 1.5459954738616943e-05, 1.7568469047546387e-05, 1.967698335647583e-05, 2.1785497665405273e-05, 2.3894011974334717e-05, 2.600252628326416e-05, 2.8111040592193604e-05, 3.0219554901123047e-05, 3.232806921005249e-05, 3.4436583518981934e-05, 3.654509782791138e-05, 3.865361213684082e-05, 4.0762126445770264e-05, 4.287064075469971e-05, 4.497915506362915e-05, 4.7087669372558594e-05, 4.919618368148804e-05, 5.130469799041748e-05, 5.3413212299346924e-05, 5.552172660827637e-05, 5.763024091720581e-05, 5.9738755226135254e-05, 6.18472695350647e-05, 6.395578384399414e-05, 6.606429815292358e-05, 6.817281246185303e-05, 7.028132677078247e-05, 7.238984107971191e-05, 7.449835538864136e-05, 7.66068696975708e-05, 7.871538400650024e-05, 8.082389831542969e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 7.0, 8.0, 16.0, 15.0, 31.0, 61.0, 117.0, 277.0, 747.0, 3315.0, 36645.0, 965318.0, 37241.0, 3424.0, 784.0, 286.0, 131.0, 51.0, 27.0, 12.0, 13.0, 6.0, 5.0, 9.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.3291015625, -1.2894287109375, -1.249755859375, -1.2100830078125, -1.17041015625, -1.1307373046875, -1.091064453125, -1.0513916015625, -1.01171875, -0.9720458984375, -0.932373046875, -0.8927001953125, -0.85302734375, -0.8133544921875, -0.773681640625, -0.7340087890625, -0.6943359375, -0.6546630859375, -0.614990234375, -0.5753173828125, -0.53564453125, -0.4959716796875, -0.456298828125, -0.4166259765625, -0.376953125, -0.3372802734375, -0.297607421875, -0.2579345703125, -0.21826171875, -0.1785888671875, -0.138916015625, -0.0992431640625, -0.0595703125, -0.0198974609375, 0.019775390625, 0.0594482421875, 0.09912109375, 0.1387939453125, 0.178466796875, 0.2181396484375, 0.2578125, 0.2974853515625, 0.337158203125, 0.3768310546875, 0.41650390625, 0.4561767578125, 0.495849609375, 0.5355224609375, 0.5751953125, 0.6148681640625, 0.654541015625, 0.6942138671875, 0.73388671875, 0.7735595703125, 0.813232421875, 0.8529052734375, 0.892578125, 0.9322509765625, 0.971923828125, 1.0115966796875, 1.05126953125, 1.0909423828125, 1.130615234375, 1.1702880859375, 1.2099609375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 3.0, 5.0, 8.0, 8.0, 11.0, 14.0, 18.0, 30.0, 27.0, 51.0, 82.0, 145.0, 161.0, 146.0, 73.0, 59.0, 46.0, 34.0, 17.0, 12.0, 6.0, 11.0, 4.0, 9.0, 8.0, 2.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.791015625, -0.765869140625, -0.74072265625, -0.715576171875, -0.6904296875, -0.665283203125, -0.64013671875, -0.614990234375, -0.58984375, -0.564697265625, -0.53955078125, -0.514404296875, -0.4892578125, -0.464111328125, -0.43896484375, -0.413818359375, -0.388671875, -0.363525390625, -0.33837890625, -0.313232421875, -0.2880859375, -0.262939453125, -0.23779296875, -0.212646484375, -0.1875, -0.162353515625, -0.13720703125, -0.112060546875, -0.0869140625, -0.061767578125, -0.03662109375, -0.011474609375, 0.013671875, 0.038818359375, 0.06396484375, 0.089111328125, 0.1142578125, 0.139404296875, 0.16455078125, 0.189697265625, 0.21484375, 0.239990234375, 0.26513671875, 0.290283203125, 0.3154296875, 0.340576171875, 0.36572265625, 0.390869140625, 0.416015625, 0.441162109375, 0.46630859375, 0.491455078125, 0.5166015625, 0.541748046875, 0.56689453125, 0.592041015625, 0.6171875, 0.642333984375, 0.66748046875, 0.692626953125, 0.7177734375, 0.742919921875, 0.76806640625, 0.793212890625, 0.818359375]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 12.0, 36.0, 346.0, 506.0, 79.0, 17.0, 4.0, 3.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.117149353027344, -19.61482810974121, -19.11250877380371, -18.610187530517578, -18.107868194580078, -17.605546951293945, -17.103227615356445, -16.600906372070312, -16.098587036132812, -15.596266746520996, -15.09394645690918, -14.591626167297363, -14.089305877685547, -13.58698558807373, -13.084665298461914, -12.582344055175781, -12.080023765563965, -11.577703475952148, -11.075383186340332, -10.573062896728516, -10.0707426071167, -9.568422317504883, -9.06610107421875, -8.56378173828125, -8.061460494995117, -7.559140205383301, -7.056819915771484, -6.554499626159668, -6.052179336547852, -5.549859046936035, -5.0475382804870605, -4.545217990875244, -4.042898178100586, -3.5405778884887695, -3.038257598876953, -2.5359370708465576, -2.033616781234741, -1.5312964916229248, -1.0289759635925293, -0.5266556739807129, -0.024335384368896484, 0.4779849648475647, 0.9803053140640259, 1.4826257228851318, 1.9849460124969482, 2.4872663021087646, 2.98958683013916, 3.4919071197509766, 3.994227409362793, 4.496547698974609, 4.998867988586426, 5.501188278198242, 6.003508567810059, 6.505828857421875, 7.00814962387085, 7.510469913482666, 8.01279067993164, 8.515110969543457, 9.017431259155273, 9.51975154876709, 10.022071838378906, 10.524392127990723, 11.026712417602539, 11.529033660888672, 12.031352996826172]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 4.0, 5.0, 2.0, 1.0, 3.0, 3.0, 2.0, 5.0, 5.0, 6.0, 7.0, 18.0, 13.0, 24.0, 44.0, 70.0, 125.0, 171.0, 144.0, 128.0, 80.0, 46.0, 32.0, 22.0, 10.0, 3.0, 7.0, 2.0, 4.0, 4.0, 3.0, 3.0, 3.0, 5.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.919219970703125, -9.588475227355957, -9.257730484008789, -8.926985740661621, -8.596240997314453, -8.265496253967285, -7.934751510620117, -7.604006767272949, -7.273262023925781, -6.942517280578613, -6.611772537231445, -6.281027793884277, -5.950283050537109, -5.619538307189941, -5.288793563842773, -4.9580488204956055, -4.627304553985596, -4.296559810638428, -3.9658150672912598, -3.635070323944092, -3.304325580596924, -2.973580837249756, -2.642836332321167, -2.312091588973999, -1.981346845626831, -1.650602102279663, -1.3198573589324951, -0.9891127347946167, -0.6583679914474487, -0.32762324810028076, 0.0031213760375976562, 0.3338661193847656, 0.6646108627319336, 0.9953556060791016, 1.3261003494262695, 1.656844973564148, 1.987589716911316, 2.3183345794677734, 2.6490790843963623, 2.9798238277435303, 3.3105685710906982, 3.641313314437866, 3.972058057785034, 4.302802562713623, 4.633547306060791, 4.964292049407959, 5.295036792755127, 5.625781536102295, 5.956526279449463, 6.287271022796631, 6.618015766143799, 6.948760509490967, 7.279505252838135, 7.610249996185303, 7.9409942626953125, 8.27173900604248, 8.602483749389648, 8.933228492736816, 9.263973236083984, 9.594717979431152, 9.92546272277832, 10.256207466125488, 10.586952209472656, 10.917696952819824, 11.248441696166992]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 2.0, 5.0, 4.0, 5.0, 11.0, 16.0, 15.0, 30.0, 30.0, 64.0, 66.0, 110.0, 165.0, 222.0, 348.0, 484.0, 796.0, 1290.0, 2146.0, 3692.0, 7497.0, 16859.0, 50524.0, 582868.0, 3408596.0, 77910.0, 21714.0, 8859.0, 4306.0, 2256.0, 1273.0, 784.0, 465.0, 284.0, 207.0, 130.0, 96.0, 56.0, 42.0, 13.0, 18.0, 13.0, 6.0, 4.0, 6.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.8486328125, -0.8263778686523438, -0.8041229248046875, -0.7818679809570312, -0.759613037109375, -0.7373580932617188, -0.7151031494140625, -0.6928482055664062, -0.67059326171875, -0.6483383178710938, -0.6260833740234375, -0.6038284301757812, -0.581573486328125, -0.5593185424804688, -0.5370635986328125, -0.5148086547851562, -0.4925537109375, -0.47029876708984375, -0.4480438232421875, -0.42578887939453125, -0.403533935546875, -0.38127899169921875, -0.3590240478515625, -0.33676910400390625, -0.31451416015625, -0.29225921630859375, -0.2700042724609375, -0.24774932861328125, -0.225494384765625, -0.20323944091796875, -0.1809844970703125, -0.15872955322265625, -0.136474609375, -0.11421966552734375, -0.0919647216796875, -0.06970977783203125, -0.047454833984375, -0.02519989013671875, -0.0029449462890625, 0.01930999755859375, 0.04156494140625, 0.06381988525390625, 0.0860748291015625, 0.10832977294921875, 0.130584716796875, 0.15283966064453125, 0.1750946044921875, 0.19734954833984375, 0.2196044921875, 0.24185943603515625, 0.2641143798828125, 0.28636932373046875, 0.308624267578125, 0.33087921142578125, 0.3531341552734375, 0.37538909912109375, 0.39764404296875, 0.41989898681640625, 0.4421539306640625, 0.46440887451171875, 0.486663818359375, 0.5089187622070312, 0.5311737060546875, 0.5534286499023438, 0.57568359375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 3.0, 5.0, 4.0, 6.0, 13.0, 4.0, 5.0, 12.0, 7.0, 9.0, 24.0, 60.0, 203.0, 299.0, 146.0, 64.0, 30.0, 15.0, 4.0, 14.0, 15.0, 10.0, 8.0, 6.0, 5.0, 5.0, 2.0, 1.0, 5.0, 5.0, 1.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10882568359375, -0.10584354400634766, -0.10286140441894531, -0.09987926483154297, -0.09689712524414062, -0.09391498565673828, -0.09093284606933594, -0.0879507064819336, -0.08496856689453125, -0.0819864273071289, -0.07900428771972656, -0.07602214813232422, -0.07304000854492188, -0.07005786895751953, -0.06707572937011719, -0.06409358978271484, -0.0611114501953125, -0.058129310607910156, -0.05514717102050781, -0.05216503143310547, -0.049182891845703125, -0.04620075225830078, -0.04321861267089844, -0.040236473083496094, -0.03725433349609375, -0.034272193908691406, -0.03129005432128906, -0.02830791473388672, -0.025325775146484375, -0.02234363555908203, -0.019361495971679688, -0.016379356384277344, -0.013397216796875, -0.010415077209472656, -0.0074329376220703125, -0.004450798034667969, -0.001468658447265625, 0.0015134811401367188, 0.0044956207275390625, 0.007477760314941406, 0.01045989990234375, 0.013442039489746094, 0.016424179077148438, 0.01940631866455078, 0.022388458251953125, 0.02537059783935547, 0.028352737426757812, 0.031334877014160156, 0.0343170166015625, 0.037299156188964844, 0.04028129577636719, 0.04326343536376953, 0.046245574951171875, 0.04922771453857422, 0.05220985412597656, 0.055191993713378906, 0.05817413330078125, 0.061156272888183594, 0.06413841247558594, 0.06712055206298828, 0.07010269165039062, 0.07308483123779297, 0.07606697082519531, 0.07904911041259766, 0.08203125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 3.0, 6.0, 6.0, 7.0, 10.0, 24.0, 29.0, 58.0, 67.0, 118.0, 200.0, 371.0, 672.0, 1369.0, 3443.0, 10994.0, 52197.0, 686389.0, 3264172.0, 142782.0, 21203.0, 5862.0, 2164.0, 974.0, 479.0, 237.0, 137.0, 98.0, 67.0, 50.0, 35.0, 22.0, 12.0, 11.0, 4.0, 6.0, 4.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53857421875, -0.522369384765625, -0.50616455078125, -0.489959716796875, -0.4737548828125, -0.457550048828125, -0.44134521484375, -0.425140380859375, -0.408935546875, -0.392730712890625, -0.37652587890625, -0.360321044921875, -0.3441162109375, -0.327911376953125, -0.31170654296875, -0.295501708984375, -0.279296875, -0.263092041015625, -0.24688720703125, -0.230682373046875, -0.2144775390625, -0.198272705078125, -0.18206787109375, -0.165863037109375, -0.149658203125, -0.133453369140625, -0.11724853515625, -0.101043701171875, -0.0848388671875, -0.068634033203125, -0.05242919921875, -0.036224365234375, -0.02001953125, -0.003814697265625, 0.01239013671875, 0.028594970703125, 0.0447998046875, 0.061004638671875, 0.07720947265625, 0.093414306640625, 0.109619140625, 0.125823974609375, 0.14202880859375, 0.158233642578125, 0.1744384765625, 0.190643310546875, 0.20684814453125, 0.223052978515625, 0.2392578125, 0.255462646484375, 0.27166748046875, 0.287872314453125, 0.3040771484375, 0.320281982421875, 0.33648681640625, 0.352691650390625, 0.368896484375, 0.385101318359375, 0.40130615234375, 0.417510986328125, 0.4337158203125, 0.449920654296875, 0.46612548828125, 0.482330322265625, 0.49853515625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 6.0, 6.0, 3.0, 10.0, 9.0, 14.0, 16.0, 29.0, 46.0, 86.0, 111.0, 220.0, 365.0, 1033.0, 1054.0, 477.0, 241.0, 105.0, 86.0, 54.0, 28.0, 19.0, 18.0, 7.0, 6.0, 6.0, 4.0, 6.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.14013671875, -0.13634967803955078, -0.13256263732910156, -0.12877559661865234, -0.12498855590820312, -0.1212015151977539, -0.11741447448730469, -0.11362743377685547, -0.10984039306640625, -0.10605335235595703, -0.10226631164550781, -0.0984792709350586, -0.09469223022460938, -0.09090518951416016, -0.08711814880371094, -0.08333110809326172, -0.0795440673828125, -0.07575702667236328, -0.07196998596191406, -0.06818294525146484, -0.06439590454101562, -0.060608863830566406, -0.05682182312011719, -0.05303478240966797, -0.04924774169921875, -0.04546070098876953, -0.04167366027832031, -0.037886619567871094, -0.034099578857421875, -0.030312538146972656, -0.026525497436523438, -0.02273845672607422, -0.018951416015625, -0.015164375305175781, -0.011377334594726562, -0.007590293884277344, -0.003803253173828125, -1.621246337890625e-05, 0.0037708282470703125, 0.007557868957519531, 0.01134490966796875, 0.015131950378417969, 0.018918991088867188, 0.022706031799316406, 0.026493072509765625, 0.030280113220214844, 0.03406715393066406, 0.03785419464111328, 0.0416412353515625, 0.04542827606201172, 0.04921531677246094, 0.053002357482910156, 0.056789398193359375, 0.060576438903808594, 0.06436347961425781, 0.06815052032470703, 0.07193756103515625, 0.07572460174560547, 0.07951164245605469, 0.0832986831665039, 0.08708572387695312, 0.09087276458740234, 0.09465980529785156, 0.09844684600830078, 0.10223388671875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [10.0, 196.0, 742.0, 45.0, 11.0, 6.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26927781105041504, -0.14243300259113312, -0.015588194131851196, 0.11125659942626953, 0.23810142278671265, 0.36494624614715576, 0.4917910099029541, 0.6186358332633972, 0.7454806566238403, 0.8723254799842834, 0.9991703033447266, 1.126015067100525, 1.2528598308563232, 1.3797047138214111, 1.5065494775772095, 1.6333942413330078, 1.7602391242980957, 1.887083888053894, 2.0139286518096924, 2.1407735347747803, 2.267618417739868, 2.394463062286377, 2.521307945251465, 2.6481528282165527, 2.7749977111816406, 2.9018425941467285, 3.0286872386932373, 3.155532121658325, 3.282377004623413, 3.409221649169922, 3.5360665321350098, 3.6629114151000977, 3.7897562980651855, 3.9166011810302734, 4.043446063995361, 4.170290946960449, 4.297135353088379, 4.423980236053467, 4.550825119018555, 4.677670001983643, 4.8045148849487305, 4.931359767913818, 5.058204650878906, 5.185049057006836, 5.311893939971924, 5.438738822937012, 5.5655837059021, 5.6924285888671875, 5.819272994995117, 5.946117877960205, 6.072962760925293, 6.199807167053223, 6.3266520500183105, 6.453496932983398, 6.580341815948486, 6.707186698913574, 6.834031581878662, 6.96087646484375, 7.087721347808838, 7.214566230773926, 7.3414106369018555, 7.468255519866943, 7.595100402832031, 7.721945285797119, 7.848790168762207]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 2.0, 10.0, 1.0, 10.0, 6.0, 16.0, 21.0, 24.0, 26.0, 24.0, 36.0, 52.0, 52.0, 76.0, 81.0, 70.0, 66.0, 72.0, 62.0, 75.0, 54.0, 38.0, 38.0, 21.0, 14.0, 12.0, 8.0, 9.0, 5.0, 6.0, 1.0, 6.0, 4.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8020894527435303, -0.7790535092353821, -0.7560175657272339, -0.7329816222190857, -0.7099456787109375, -0.6869097352027893, -0.6638737916946411, -0.6408379077911377, -0.6178019046783447, -0.5947659611701965, -0.5717300176620483, -0.5486940741539001, -0.525658130645752, -0.5026221871376038, -0.47958627343177795, -0.45655032992362976, -0.43351441621780396, -0.41047847270965576, -0.38744252920150757, -0.3644065856933594, -0.3413706421852112, -0.318334698677063, -0.2952987849712372, -0.272262841463089, -0.2492268979549408, -0.2261909544467926, -0.2031550109386444, -0.1801190823316574, -0.15708313882350922, -0.13404719531536102, -0.11101126670837402, -0.08797532320022583, -0.06493937969207764, -0.04190343990921974, -0.018867500126361847, 0.0041684359312057495, 0.027204379439353943, 0.050240322947502136, 0.07327625155448914, 0.09631219506263733, 0.11934813857078552, 0.14238408207893372, 0.1654200255870819, 0.1884559541940689, 0.2114918977022171, 0.2345278412103653, 0.2575637698173523, 0.2805997133255005, 0.3036356568336487, 0.3266716003417969, 0.34970754384994507, 0.37274348735809326, 0.39577943086624146, 0.41881537437438965, 0.44185128808021545, 0.46488723158836365, 0.48792317509651184, 0.5109590888023376, 0.5339950323104858, 0.557030975818634, 0.5800669193267822, 0.6031028628349304, 0.6261388063430786, 0.6491747498512268, 0.672210693359375]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 5.0, 9.0, 3.0, 8.0, 13.0, 21.0, 24.0, 36.0, 62.0, 85.0, 141.0, 177.0, 256.0, 458.0, 681.0, 1082.0, 1811.0, 3147.0, 5799.0, 10969.0, 23399.0, 73340.0, 624329.0, 229924.0, 38290.0, 15967.0, 7896.0, 4334.0, 2462.0, 1368.0, 844.0, 533.0, 350.0, 257.0, 154.0, 99.0, 70.0, 39.0, 37.0, 24.0, 16.0, 7.0, 9.0, 13.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4541015625, -0.43933868408203125, -0.4245758056640625, -0.40981292724609375, -0.395050048828125, -0.38028717041015625, -0.3655242919921875, -0.35076141357421875, -0.33599853515625, -0.32123565673828125, -0.3064727783203125, -0.29170989990234375, -0.276947021484375, -0.26218414306640625, -0.2474212646484375, -0.23265838623046875, -0.2178955078125, -0.20313262939453125, -0.1883697509765625, -0.17360687255859375, -0.158843994140625, -0.14408111572265625, -0.1293182373046875, -0.11455535888671875, -0.09979248046875, -0.08502960205078125, -0.0702667236328125, -0.05550384521484375, -0.040740966796875, -0.02597808837890625, -0.0112152099609375, 0.00354766845703125, 0.018310546875, 0.03307342529296875, 0.0478363037109375, 0.06259918212890625, 0.077362060546875, 0.09212493896484375, 0.1068878173828125, 0.12165069580078125, 0.13641357421875, 0.15117645263671875, 0.1659393310546875, 0.18070220947265625, 0.195465087890625, 0.21022796630859375, 0.2249908447265625, 0.23975372314453125, 0.2545166015625, 0.26927947998046875, 0.2840423583984375, 0.29880523681640625, 0.313568115234375, 0.32833099365234375, 0.3430938720703125, 0.35785675048828125, 0.37261962890625, 0.38738250732421875, 0.4021453857421875, 0.41690826416015625, 0.431671142578125, 0.44643402099609375, 0.4611968994140625, 0.47595977783203125, 0.49072265625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 7.0, 13.0, 5.0, 6.0, 7.0, 5.0, 11.0, 24.0, 51.0, 98.0, 200.0, 217.0, 134.0, 86.0, 35.0, 14.0, 18.0, 12.0, 11.0, 5.0, 8.0, 2.0, 10.0, 3.0, 3.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1082763671875, -0.10529422760009766, -0.10231208801269531, -0.09932994842529297, -0.09634780883789062, -0.09336566925048828, -0.09038352966308594, -0.0874013900756836, -0.08441925048828125, -0.0814371109008789, -0.07845497131347656, -0.07547283172607422, -0.07249069213867188, -0.06950855255126953, -0.06652641296386719, -0.06354427337646484, -0.0605621337890625, -0.057579994201660156, -0.05459785461425781, -0.05161571502685547, -0.048633575439453125, -0.04565143585205078, -0.04266929626464844, -0.039687156677246094, -0.03670501708984375, -0.033722877502441406, -0.030740737915039062, -0.02775859832763672, -0.024776458740234375, -0.02179431915283203, -0.018812179565429688, -0.015830039978027344, -0.012847900390625, -0.009865760803222656, -0.0068836212158203125, -0.0039014816284179688, -0.000919342041015625, 0.0020627975463867188, 0.0050449371337890625, 0.008027076721191406, 0.01100921630859375, 0.013991355895996094, 0.016973495483398438, 0.01995563507080078, 0.022937774658203125, 0.02591991424560547, 0.028902053833007812, 0.031884193420410156, 0.0348663330078125, 0.037848472595214844, 0.04083061218261719, 0.04381275177001953, 0.046794891357421875, 0.04977703094482422, 0.05275917053222656, 0.055741310119628906, 0.05872344970703125, 0.061705589294433594, 0.06468772888183594, 0.06766986846923828, 0.07065200805664062, 0.07363414764404297, 0.07661628723144531, 0.07959842681884766, 0.08258056640625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 2.0, 2.0, 6.0, 8.0, 6.0, 15.0, 22.0, 24.0, 36.0, 36.0, 57.0, 90.0, 133.0, 220.0, 312.0, 564.0, 1127.0, 2568.0, 6794.0, 20761.0, 78357.0, 344449.0, 443789.0, 107001.0, 27194.0, 8587.0, 3239.0, 1334.0, 686.0, 382.0, 230.0, 154.0, 100.0, 65.0, 52.0, 38.0, 29.0, 20.0, 16.0, 17.0, 11.0, 6.0, 3.0, 8.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2841796875, -0.27407073974609375, -0.2639617919921875, -0.25385284423828125, -0.243743896484375, -0.23363494873046875, -0.2235260009765625, -0.21341705322265625, -0.20330810546875, -0.19319915771484375, -0.1830902099609375, -0.17298126220703125, -0.162872314453125, -0.15276336669921875, -0.1426544189453125, -0.13254547119140625, -0.1224365234375, -0.11232757568359375, -0.1022186279296875, -0.09210968017578125, -0.082000732421875, -0.07189178466796875, -0.0617828369140625, -0.05167388916015625, -0.04156494140625, -0.03145599365234375, -0.0213470458984375, -0.01123809814453125, -0.001129150390625, 0.00897979736328125, 0.0190887451171875, 0.02919769287109375, 0.039306640625, 0.04941558837890625, 0.0595245361328125, 0.06963348388671875, 0.079742431640625, 0.08985137939453125, 0.0999603271484375, 0.11006927490234375, 0.12017822265625, 0.13028717041015625, 0.1403961181640625, 0.15050506591796875, 0.160614013671875, 0.17072296142578125, 0.1808319091796875, 0.19094085693359375, 0.2010498046875, 0.21115875244140625, 0.2212677001953125, 0.23137664794921875, 0.241485595703125, 0.25159454345703125, 0.2617034912109375, 0.27181243896484375, 0.28192138671875, 0.29203033447265625, 0.3021392822265625, 0.31224822998046875, 0.322357177734375, 0.33246612548828125, 0.3425750732421875, 0.35268402099609375, 0.36279296875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 2.0, 2.0, 8.0, 7.0, 5.0, 6.0, 8.0, 8.0, 15.0, 17.0, 17.0, 16.0, 25.0, 24.0, 34.0, 38.0, 38.0, 29.0, 39.0, 27.0, 46.0, 52.0, 36.0, 46.0, 47.0, 43.0, 39.0, 38.0, 38.0, 35.0, 27.0, 32.0, 16.0, 27.0, 20.0, 14.0, 17.0, 10.0, 12.0, 4.0, 8.0, 7.0, 8.0, 3.0, 7.0, 1.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.263916015625, -0.25514984130859375, -0.2463836669921875, -0.23761749267578125, -0.228851318359375, -0.22008514404296875, -0.2113189697265625, -0.20255279541015625, -0.19378662109375, -0.18502044677734375, -0.1762542724609375, -0.16748809814453125, -0.158721923828125, -0.14995574951171875, -0.1411895751953125, -0.13242340087890625, -0.1236572265625, -0.11489105224609375, -0.1061248779296875, -0.09735870361328125, -0.088592529296875, -0.07982635498046875, -0.0710601806640625, -0.06229400634765625, -0.05352783203125, -0.04476165771484375, -0.0359954833984375, -0.02722930908203125, -0.018463134765625, -0.00969696044921875, -0.0009307861328125, 0.00783538818359375, 0.0166015625, 0.02536773681640625, 0.0341339111328125, 0.04290008544921875, 0.051666259765625, 0.06043243408203125, 0.0691986083984375, 0.07796478271484375, 0.08673095703125, 0.09549713134765625, 0.1042633056640625, 0.11302947998046875, 0.121795654296875, 0.13056182861328125, 0.1393280029296875, 0.14809417724609375, 0.1568603515625, 0.16562652587890625, 0.1743927001953125, 0.18315887451171875, 0.191925048828125, 0.20069122314453125, 0.2094573974609375, 0.21822357177734375, 0.22698974609375, 0.23575592041015625, 0.2445220947265625, 0.25328826904296875, 0.262054443359375, 0.27082061767578125, 0.2795867919921875, 0.28835296630859375, 0.297119140625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 1.0, 3.0, 4.0, 2.0, 4.0, 5.0, 3.0, 10.0, 11.0, 14.0, 19.0, 33.0, 43.0, 52.0, 75.0, 126.0, 219.0, 374.0, 757.0, 1781.0, 5006.0, 29857.0, 794822.0, 196999.0, 12581.0, 3059.0, 1233.0, 616.0, 320.0, 179.0, 104.0, 69.0, 49.0, 34.0, 20.0, 23.0, 15.0, 10.0, 5.0, 4.0, 5.0, 6.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.89404296875, -0.8650131225585938, -0.8359832763671875, -0.8069534301757812, -0.777923583984375, -0.7488937377929688, -0.7198638916015625, -0.6908340454101562, -0.66180419921875, -0.6327743530273438, -0.6037445068359375, -0.5747146606445312, -0.545684814453125, -0.5166549682617188, -0.4876251220703125, -0.45859527587890625, -0.4295654296875, -0.40053558349609375, -0.3715057373046875, -0.34247589111328125, -0.313446044921875, -0.28441619873046875, -0.2553863525390625, -0.22635650634765625, -0.19732666015625, -0.16829681396484375, -0.1392669677734375, -0.11023712158203125, -0.081207275390625, -0.05217742919921875, -0.0231475830078125, 0.00588226318359375, 0.034912109375, 0.06394195556640625, 0.0929718017578125, 0.12200164794921875, 0.151031494140625, 0.18006134033203125, 0.2090911865234375, 0.23812103271484375, 0.26715087890625, 0.29618072509765625, 0.3252105712890625, 0.35424041748046875, 0.383270263671875, 0.41230010986328125, 0.4413299560546875, 0.47035980224609375, 0.4993896484375, 0.5284194946289062, 0.5574493408203125, 0.5864791870117188, 0.615509033203125, 0.6445388793945312, 0.6735687255859375, 0.7025985717773438, 0.73162841796875, 0.7606582641601562, 0.7896881103515625, 0.8187179565429688, 0.847747802734375, 0.8767776489257812, 0.9058074951171875, 0.9348373413085938, 0.9638671875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 7.0, 4.0, 1.0, 7.0, 8.0, 1.0, 11.0, 11.0, 19.0, 36.0, 63.0, 123.0, 201.0, 199.0, 151.0, 60.0, 37.0, 19.0, 9.0, 9.0, 8.0, 6.0, 5.0, 6.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.322166442871094e-05, -8.989870548248291e-05, -8.657574653625488e-05, -8.325278759002686e-05, -7.992982864379883e-05, -7.66068696975708e-05, -7.328391075134277e-05, -6.996095180511475e-05, -6.663799285888672e-05, -6.331503391265869e-05, -5.9992074966430664e-05, -5.666911602020264e-05, -5.334615707397461e-05, -5.002319812774658e-05, -4.6700239181518555e-05, -4.337728023529053e-05, -4.00543212890625e-05, -3.673136234283447e-05, -3.3408403396606445e-05, -3.0085444450378418e-05, -2.676248550415039e-05, -2.3439526557922363e-05, -2.0116567611694336e-05, -1.679360866546631e-05, -1.3470649719238281e-05, -1.0147690773010254e-05, -6.8247318267822266e-06, -3.5017728805541992e-06, -1.7881393432617188e-07, 3.1441450119018555e-06, 6.467103958129883e-06, 9.79006290435791e-06, 1.3113021850585938e-05, 1.6435980796813965e-05, 1.9758939743041992e-05, 2.308189868927002e-05, 2.6404857635498047e-05, 2.9727816581726074e-05, 3.30507755279541e-05, 3.637373447418213e-05, 3.9696693420410156e-05, 4.3019652366638184e-05, 4.634261131286621e-05, 4.966557025909424e-05, 5.2988529205322266e-05, 5.631148815155029e-05, 5.963444709777832e-05, 6.295740604400635e-05, 6.628036499023438e-05, 6.96033239364624e-05, 7.292628288269043e-05, 7.624924182891846e-05, 7.957220077514648e-05, 8.289515972137451e-05, 8.621811866760254e-05, 8.954107761383057e-05, 9.28640365600586e-05, 9.618699550628662e-05, 9.950995445251465e-05, 0.00010283291339874268, 0.0001061558723449707, 0.00010947883129119873, 0.00011280179023742676, 0.00011612474918365479, 0.00011944770812988281]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 2.0, 8.0, 6.0, 6.0, 14.0, 20.0, 32.0, 71.0, 97.0, 158.0, 283.0, 629.0, 1418.0, 4760.0, 25319.0, 375155.0, 594842.0, 35905.0, 6265.0, 1882.0, 780.0, 379.0, 204.0, 96.0, 76.0, 51.0, 25.0, 21.0, 7.0, 10.0, 3.0, 6.0, 6.0, 4.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.66650390625, -0.6463546752929688, -0.6262054443359375, -0.6060562133789062, -0.585906982421875, -0.5657577514648438, -0.5456085205078125, -0.5254592895507812, -0.50531005859375, -0.48516082763671875, -0.4650115966796875, -0.44486236572265625, -0.424713134765625, -0.40456390380859375, -0.3844146728515625, -0.36426544189453125, -0.3441162109375, -0.32396697998046875, -0.3038177490234375, -0.28366851806640625, -0.263519287109375, -0.24337005615234375, -0.2232208251953125, -0.20307159423828125, -0.18292236328125, -0.16277313232421875, -0.1426239013671875, -0.12247467041015625, -0.102325439453125, -0.08217620849609375, -0.0620269775390625, -0.04187774658203125, -0.021728515625, -0.00157928466796875, 0.0185699462890625, 0.03871917724609375, 0.058868408203125, 0.07901763916015625, 0.0991668701171875, 0.11931610107421875, 0.13946533203125, 0.15961456298828125, 0.1797637939453125, 0.19991302490234375, 0.220062255859375, 0.24021148681640625, 0.2603607177734375, 0.28050994873046875, 0.3006591796875, 0.32080841064453125, 0.3409576416015625, 0.36110687255859375, 0.381256103515625, 0.40140533447265625, 0.4215545654296875, 0.44170379638671875, 0.46185302734375, 0.48200225830078125, 0.5021514892578125, 0.5223007202148438, 0.542449951171875, 0.5625991821289062, 0.5827484130859375, 0.6028976440429688, 0.623046875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 3.0, 7.0, 14.0, 15.0, 12.0, 20.0, 19.0, 50.0, 72.0, 96.0, 191.0, 167.0, 115.0, 75.0, 41.0, 31.0, 21.0, 16.0, 16.0, 8.0, 3.0, 5.0, 7.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58251953125, -0.5648956298828125, -0.547271728515625, -0.5296478271484375, -0.51202392578125, -0.4944000244140625, -0.476776123046875, -0.4591522216796875, -0.4415283203125, -0.4239044189453125, -0.406280517578125, -0.3886566162109375, -0.37103271484375, -0.3534088134765625, -0.335784912109375, -0.3181610107421875, -0.300537109375, -0.2829132080078125, -0.265289306640625, -0.2476654052734375, -0.23004150390625, -0.2124176025390625, -0.194793701171875, -0.1771697998046875, -0.1595458984375, -0.1419219970703125, -0.124298095703125, -0.1066741943359375, -0.08905029296875, -0.0714263916015625, -0.053802490234375, -0.0361785888671875, -0.0185546875, -0.0009307861328125, 0.016693115234375, 0.0343170166015625, 0.05194091796875, 0.0695648193359375, 0.087188720703125, 0.1048126220703125, 0.1224365234375, 0.1400604248046875, 0.157684326171875, 0.1753082275390625, 0.19293212890625, 0.2105560302734375, 0.228179931640625, 0.2458038330078125, 0.263427734375, 0.2810516357421875, 0.298675537109375, 0.3162994384765625, 0.33392333984375, 0.3515472412109375, 0.369171142578125, 0.3867950439453125, 0.4044189453125, 0.4220428466796875, 0.439666748046875, 0.4572906494140625, 0.47491455078125, 0.4925384521484375, 0.510162353515625, 0.5277862548828125, 0.54541015625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 27.0, 161.0, 507.0, 251.0, 37.0, 12.0, 7.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.829008102416992, -9.59841251373291, -9.367816925048828, -9.137221336364746, -8.906625747680664, -8.676031112670898, -8.445435523986816, -8.214839935302734, -7.984244346618652, -7.75364875793457, -7.523053169250488, -7.2924580574035645, -7.061862468719482, -6.8312668800354, -6.600671291351318, -6.3700761795043945, -6.1394805908203125, -5.9088850021362305, -5.678289413452148, -5.447694301605225, -5.217098712921143, -4.9865031242370605, -4.7559075355529785, -4.525312423706055, -4.2947163581848145, -4.064120769500732, -3.8335254192352295, -3.6029298305511475, -3.3723344802856445, -3.1417388916015625, -2.9111433029174805, -2.6805479526519775, -2.4499526023864746, -2.2193570137023926, -1.9887616634368896, -1.7581660747528076, -1.5275707244873047, -1.2969751358032227, -1.0663796663284302, -0.8357841968536377, -0.6051887273788452, -0.37459325790405273, -0.14399775862693787, 0.086597740650177, 0.3171932101249695, 0.5477887392044067, 0.7783842086791992, 1.0089796781539917, 1.2395751476287842, 1.4701706171035767, 1.7007660865783691, 1.9313616752624512, 2.161957025527954, 2.392552614212036, 2.623147964477539, 2.853743553161621, 3.084339141845703, 3.314934730529785, 3.545530080795288, 3.77612566947937, 4.006721019744873, 4.237316608428955, 4.467912197113037, 4.698507308959961, 4.929102897644043]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 5.0, 6.0, 7.0, 15.0, 18.0, 21.0, 27.0, 40.0, 54.0, 58.0, 74.0, 82.0, 118.0, 78.0, 82.0, 67.0, 59.0, 43.0, 47.0, 27.0, 16.0, 15.0, 9.0, 5.0, 8.0, 5.0, 2.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.269229412078857, -4.146988868713379, -4.024747848510742, -3.9025070667266846, -3.780266284942627, -3.6580257415771484, -3.535784959793091, -3.413544178009033, -3.2913033962249756, -3.169062614440918, -3.0468218326568604, -2.9245810508728027, -2.802340507507324, -2.6800994873046875, -2.557858943939209, -2.4356181621551514, -2.3133773803710938, -2.191136598587036, -2.0688958168029785, -1.9466551542282104, -1.8244143724441528, -1.7021735906600952, -1.5799329280853271, -1.4576921463012695, -1.335451364517212, -1.2132105827331543, -1.0909698009490967, -0.9687291383743286, -0.846488356590271, -0.7242475748062134, -0.6020068526268005, -0.4797661304473877, -0.3575253486633301, -0.23528459668159485, -0.11304384469985962, 0.00919690728187561, 0.13143765926361084, 0.25367844104766846, 0.3759191632270813, 0.49815988540649414, 0.6204006671905518, 0.7426414489746094, 0.8648821711540222, 0.9871228933334351, 1.1093636751174927, 1.2316044569015503, 1.3538451194763184, 1.476085901260376, 1.5983266830444336, 1.7205674648284912, 1.8428082466125488, 1.965048909187317, 2.087289810180664, 2.2095303535461426, 2.3317711353302, 2.454011917114258, 2.5762526988983154, 2.698493480682373, 2.8207342624664307, 2.9429750442504883, 3.065215587615967, 3.1874566078186035, 3.309697151184082, 3.4319379329681396, 3.5541787147521973]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 11.0, 7.0, 11.0, 3.0, 11.0, 11.0, 13.0, 21.0, 29.0, 39.0, 30.0, 59.0, 58.0, 91.0, 130.0, 217.0, 324.0, 463.0, 671.0, 1053.0, 1996.0, 4381.0, 15669.0, 153986.0, 3943980.0, 54535.0, 9175.0, 3278.0, 1510.0, 928.0, 526.0, 375.0, 256.0, 157.0, 97.0, 68.0, 28.0, 27.0, 9.0, 11.0, 10.0, 12.0, 8.0, 1.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.5810546875, -1.5387115478515625, -1.496368408203125, -1.4540252685546875, -1.41168212890625, -1.3693389892578125, -1.326995849609375, -1.2846527099609375, -1.2423095703125, -1.1999664306640625, -1.157623291015625, -1.1152801513671875, -1.07293701171875, -1.0305938720703125, -0.988250732421875, -0.9459075927734375, -0.903564453125, -0.8612213134765625, -0.818878173828125, -0.7765350341796875, -0.73419189453125, -0.6918487548828125, -0.649505615234375, -0.6071624755859375, -0.5648193359375, -0.5224761962890625, -0.480133056640625, -0.4377899169921875, -0.39544677734375, -0.3531036376953125, -0.310760498046875, -0.2684173583984375, -0.22607421875, -0.1837310791015625, -0.141387939453125, -0.0990447998046875, -0.05670166015625, -0.0143585205078125, 0.027984619140625, 0.0703277587890625, 0.1126708984375, 0.1550140380859375, 0.197357177734375, 0.2397003173828125, 0.28204345703125, 0.3243865966796875, 0.366729736328125, 0.4090728759765625, 0.451416015625, 0.4937591552734375, 0.536102294921875, 0.5784454345703125, 0.62078857421875, 0.6631317138671875, 0.705474853515625, 0.7478179931640625, 0.7901611328125, 0.8325042724609375, 0.874847412109375, 0.9171905517578125, 0.95953369140625, 1.0018768310546875, 1.044219970703125, 1.0865631103515625, 1.12890625]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 6.0, 2.0, 7.0, 7.0, 7.0, 12.0, 14.0, 25.0, 60.0, 126.0, 185.0, 165.0, 164.0, 91.0, 43.0, 26.0, 17.0, 9.0, 6.0, 7.0, 8.0, 2.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1197509765625, -0.11653423309326172, -0.11331748962402344, -0.11010074615478516, -0.10688400268554688, -0.1036672592163086, -0.10045051574707031, -0.09723377227783203, -0.09401702880859375, -0.09080028533935547, -0.08758354187011719, -0.0843667984008789, -0.08115005493164062, -0.07793331146240234, -0.07471656799316406, -0.07149982452392578, -0.0682830810546875, -0.06506633758544922, -0.06184959411621094, -0.058632850646972656, -0.055416107177734375, -0.052199363708496094, -0.04898262023925781, -0.04576587677001953, -0.04254913330078125, -0.03933238983154297, -0.03611564636230469, -0.032898902893066406, -0.029682159423828125, -0.026465415954589844, -0.023248672485351562, -0.02003192901611328, -0.016815185546875, -0.013598442077636719, -0.010381698608398438, -0.007164955139160156, -0.003948211669921875, -0.0007314682006835938, 0.0024852752685546875, 0.005702018737792969, 0.00891876220703125, 0.012135505676269531, 0.015352249145507812, 0.018568992614746094, 0.021785736083984375, 0.025002479553222656, 0.028219223022460938, 0.03143596649169922, 0.0346527099609375, 0.03786945343017578, 0.04108619689941406, 0.044302940368652344, 0.047519683837890625, 0.050736427307128906, 0.05395317077636719, 0.05716991424560547, 0.06038665771484375, 0.06360340118408203, 0.06682014465332031, 0.0700368881225586, 0.07325363159179688, 0.07647037506103516, 0.07968711853027344, 0.08290386199951172, 0.08612060546875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 3.0, 2.0, 4.0, 8.0, 6.0, 15.0, 30.0, 38.0, 68.0, 151.0, 463.0, 3551.0, 132918.0, 4039292.0, 15871.0, 1288.0, 324.0, 102.0, 52.0, 29.0, 16.0, 12.0, 12.0, 6.0, 7.0, 1.0, 2.0, 1.0, 0.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.15234375, -2.0975341796875, -2.042724609375, -1.9879150390625, -1.93310546875, -1.8782958984375, -1.823486328125, -1.7686767578125, -1.7138671875, -1.6590576171875, -1.604248046875, -1.5494384765625, -1.49462890625, -1.4398193359375, -1.385009765625, -1.3302001953125, -1.275390625, -1.2205810546875, -1.165771484375, -1.1109619140625, -1.05615234375, -1.0013427734375, -0.946533203125, -0.8917236328125, -0.8369140625, -0.7821044921875, -0.727294921875, -0.6724853515625, -0.61767578125, -0.5628662109375, -0.508056640625, -0.4532470703125, -0.3984375, -0.3436279296875, -0.288818359375, -0.2340087890625, -0.17919921875, -0.1243896484375, -0.069580078125, -0.0147705078125, 0.0400390625, 0.0948486328125, 0.149658203125, 0.2044677734375, 0.25927734375, 0.3140869140625, 0.368896484375, 0.4237060546875, 0.478515625, 0.5333251953125, 0.588134765625, 0.6429443359375, 0.69775390625, 0.7525634765625, 0.807373046875, 0.8621826171875, 0.9169921875, 0.9718017578125, 1.026611328125, 1.0814208984375, 1.13623046875, 1.1910400390625, 1.245849609375, 1.3006591796875, 1.35546875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 2.0, 4.0, 9.0, 16.0, 20.0, 12.0, 35.0, 62.0, 115.0, 226.0, 491.0, 1346.0, 945.0, 381.0, 154.0, 83.0, 51.0, 41.0, 26.0, 13.0, 5.0, 8.0, 4.0, 3.0, 5.0, 5.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10430908203125, -0.10027217864990234, -0.09623527526855469, -0.09219837188720703, -0.08816146850585938, -0.08412456512451172, -0.08008766174316406, -0.0760507583618164, -0.07201385498046875, -0.0679769515991211, -0.06394004821777344, -0.05990314483642578, -0.055866241455078125, -0.05182933807373047, -0.04779243469238281, -0.043755531311035156, -0.0397186279296875, -0.035681724548339844, -0.03164482116699219, -0.02760791778564453, -0.023571014404296875, -0.01953411102294922, -0.015497207641601562, -0.011460304260253906, -0.00742340087890625, -0.0033864974975585938, 0.0006504058837890625, 0.004687309265136719, 0.008724212646484375, 0.012761116027832031, 0.016798019409179688, 0.020834922790527344, 0.024871826171875, 0.028908729553222656, 0.03294563293457031, 0.03698253631591797, 0.041019439697265625, 0.04505634307861328, 0.04909324645996094, 0.053130149841308594, 0.05716705322265625, 0.061203956604003906, 0.06524085998535156, 0.06927776336669922, 0.07331466674804688, 0.07735157012939453, 0.08138847351074219, 0.08542537689208984, 0.0894622802734375, 0.09349918365478516, 0.09753608703613281, 0.10157299041748047, 0.10560989379882812, 0.10964679718017578, 0.11368370056152344, 0.1177206039428711, 0.12175750732421875, 0.1257944107055664, 0.12983131408691406, 0.13386821746826172, 0.13790512084960938, 0.14194202423095703, 0.1459789276123047, 0.15001583099365234, 0.154052734375]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 7.0, 17.0, 67.0, 293.0, 462.0, 129.0, 29.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8766725659370422, -0.8288012742996216, -0.7809299230575562, -0.7330585718154907, -0.6851872801780701, -0.6373159885406494, -0.589444637298584, -0.5415732860565186, -0.4937019944190979, -0.44583067297935486, -0.3979593515396118, -0.3500880300998688, -0.30221670866012573, -0.2543453872203827, -0.20647406578063965, -0.1586027443408966, -0.11073142290115356, -0.06286010146141052, -0.01498878002166748, 0.03288254141807556, 0.0807538628578186, 0.12862518429756165, 0.1764965057373047, 0.22436782717704773, 0.27223914861679077, 0.3201104700565338, 0.36798179149627686, 0.4158531129360199, 0.46372443437576294, 0.5115957260131836, 0.559467077255249, 0.6073384284973145, 0.6552097797393799, 0.7030811309814453, 0.750952422618866, 0.7988237142562866, 0.846695065498352, 0.8945664167404175, 0.9424377083778381, 0.9903090000152588, 1.0381803512573242, 1.0860517024993896, 1.133923053741455, 1.181794285774231, 1.2296656370162964, 1.2775369882583618, 1.3254082202911377, 1.3732795715332031, 1.4211509227752686, 1.469022274017334, 1.5168936252593994, 1.5647648572921753, 1.6126362085342407, 1.6605075597763062, 1.708378791809082, 1.7562501430511475, 1.804121494293213, 1.8519928455352783, 1.8998641967773438, 1.9477354288101196, 1.995606780052185, 2.043478012084961, 2.0913493633270264, 2.139220714569092, 2.1870920658111572]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 7.0, 5.0, 7.0, 5.0, 14.0, 14.0, 27.0, 18.0, 30.0, 40.0, 40.0, 54.0, 56.0, 67.0, 73.0, 73.0, 65.0, 61.0, 64.0, 46.0, 41.0, 36.0, 23.0, 32.0, 22.0, 18.0, 14.0, 19.0, 11.0, 6.0, 7.0, 1.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.4359545111656189, -0.42113929986953735, -0.4063240587711334, -0.3915088474750519, -0.37669363617897034, -0.3618783950805664, -0.34706318378448486, -0.3322479724884033, -0.3174327313899994, -0.30261752009391785, -0.2878022789955139, -0.2729870676994324, -0.25817185640335083, -0.2433566153049469, -0.22854140400886536, -0.21372617781162262, -0.19891096651554108, -0.18409574031829834, -0.1692805290222168, -0.15446530282497406, -0.13965007662773132, -0.12483485788106918, -0.11001963913440704, -0.0952044129371643, -0.08038919419050217, -0.06557397544384003, -0.05075874924659729, -0.03594353049993515, -0.021128308027982712, -0.0063130855560302734, 0.008502133190631866, 0.023317359387874603, 0.03813257813453674, 0.05294780060648918, 0.06776302307844162, 0.08257824182510376, 0.0973934680223465, 0.11220868676900864, 0.12702390551567078, 0.1418391317129135, 0.15665435791015625, 0.171469584107399, 0.18628479540348053, 0.20110002160072327, 0.215915247797966, 0.23073047399520874, 0.24554568529129028, 0.2603608965873718, 0.27517610788345337, 0.2899913191795349, 0.30480656027793884, 0.3196217715740204, 0.33443698287010193, 0.34925222396850586, 0.3640674352645874, 0.37888264656066895, 0.3936978876590729, 0.4085130989551544, 0.42332834005355835, 0.4381435513496399, 0.45295876264572144, 0.46777400374412537, 0.4825892150402069, 0.49740445613861084, 0.5122196674346924]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 4.0, 3.0, 6.0, 7.0, 19.0, 15.0, 23.0, 43.0, 83.0, 110.0, 197.0, 363.0, 785.0, 1870.0, 5541.0, 26539.0, 475706.0, 500497.0, 27502.0, 5677.0, 1871.0, 752.0, 394.0, 199.0, 137.0, 76.0, 37.0, 38.0, 19.0, 12.0, 12.0, 4.0, 2.0, 6.0, 3.0, 0.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.70947265625, -0.6865921020507812, -0.6637115478515625, -0.6408309936523438, -0.617950439453125, -0.5950698852539062, -0.5721893310546875, -0.5493087768554688, -0.52642822265625, -0.5035476684570312, -0.4806671142578125, -0.45778656005859375, -0.434906005859375, -0.41202545166015625, -0.3891448974609375, -0.36626434326171875, -0.3433837890625, -0.32050323486328125, -0.2976226806640625, -0.27474212646484375, -0.251861572265625, -0.22898101806640625, -0.2061004638671875, -0.18321990966796875, -0.16033935546875, -0.13745880126953125, -0.1145782470703125, -0.09169769287109375, -0.068817138671875, -0.04593658447265625, -0.0230560302734375, -0.00017547607421875, 0.022705078125, 0.04558563232421875, 0.0684661865234375, 0.09134674072265625, 0.114227294921875, 0.13710784912109375, 0.1599884033203125, 0.18286895751953125, 0.20574951171875, 0.22863006591796875, 0.2515106201171875, 0.27439117431640625, 0.297271728515625, 0.32015228271484375, 0.3430328369140625, 0.36591339111328125, 0.3887939453125, 0.41167449951171875, 0.4345550537109375, 0.45743560791015625, 0.480316162109375, 0.5031967163085938, 0.5260772705078125, 0.5489578247070312, 0.57183837890625, 0.5947189331054688, 0.6175994873046875, 0.6404800415039062, 0.663360595703125, 0.6862411499023438, 0.7091217041015625, 0.7320022583007812, 0.7548828125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 7.0, 1.0, 2.0, 12.0, 6.0, 8.0, 8.0, 17.0, 30.0, 73.0, 134.0, 196.0, 195.0, 122.0, 88.0, 45.0, 23.0, 9.0, 8.0, 6.0, 8.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.115966796875, -0.1129159927368164, -0.10986518859863281, -0.10681438446044922, -0.10376358032226562, -0.10071277618408203, -0.09766197204589844, -0.09461116790771484, -0.09156036376953125, -0.08850955963134766, -0.08545875549316406, -0.08240795135498047, -0.07935714721679688, -0.07630634307861328, -0.07325553894042969, -0.0702047348022461, -0.0671539306640625, -0.0641031265258789, -0.06105232238769531, -0.05800151824951172, -0.054950714111328125, -0.05189990997314453, -0.04884910583496094, -0.045798301696777344, -0.04274749755859375, -0.039696693420410156, -0.03664588928222656, -0.03359508514404297, -0.030544281005859375, -0.02749347686767578, -0.024442672729492188, -0.021391868591308594, -0.018341064453125, -0.015290260314941406, -0.012239456176757812, -0.009188652038574219, -0.006137847900390625, -0.0030870437622070312, -3.62396240234375e-05, 0.0030145645141601562, 0.00606536865234375, 0.009116172790527344, 0.012166976928710938, 0.015217781066894531, 0.018268585205078125, 0.02131938934326172, 0.024370193481445312, 0.027420997619628906, 0.0304718017578125, 0.033522605895996094, 0.03657341003417969, 0.03962421417236328, 0.042675018310546875, 0.04572582244873047, 0.04877662658691406, 0.051827430725097656, 0.05487823486328125, 0.057929039001464844, 0.06097984313964844, 0.06403064727783203, 0.06708145141601562, 0.07013225555419922, 0.07318305969238281, 0.0762338638305664, 0.07928466796875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 4.0, 0.0, 5.0, 8.0, 7.0, 11.0, 13.0, 12.0, 16.0, 24.0, 30.0, 31.0, 73.0, 70.0, 127.0, 192.0, 258.0, 516.0, 1122.0, 2882.0, 10504.0, 56342.0, 395847.0, 487000.0, 74321.0, 12946.0, 3336.0, 1261.0, 603.0, 313.0, 202.0, 142.0, 88.0, 55.0, 51.0, 34.0, 25.0, 19.0, 20.0, 13.0, 10.0, 7.0, 4.0, 3.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3720703125, -0.3592720031738281, -0.34647369384765625, -0.3336753845214844, -0.3208770751953125, -0.3080787658691406, -0.29528045654296875, -0.2824821472167969, -0.269683837890625, -0.2568855285644531, -0.24408721923828125, -0.23128890991210938, -0.2184906005859375, -0.20569229125976562, -0.19289398193359375, -0.18009567260742188, -0.16729736328125, -0.15449905395507812, -0.14170074462890625, -0.12890243530273438, -0.1161041259765625, -0.10330581665039062, -0.09050750732421875, -0.07770919799804688, -0.064910888671875, -0.052112579345703125, -0.03931427001953125, -0.026515960693359375, -0.0137176513671875, -0.000919342041015625, 0.01187896728515625, 0.024677276611328125, 0.0374755859375, 0.050273895263671875, 0.06307220458984375, 0.07587051391601562, 0.0886688232421875, 0.10146713256835938, 0.11426544189453125, 0.12706375122070312, 0.139862060546875, 0.15266036987304688, 0.16545867919921875, 0.17825698852539062, 0.1910552978515625, 0.20385360717773438, 0.21665191650390625, 0.22945022583007812, 0.24224853515625, 0.2550468444824219, 0.26784515380859375, 0.2806434631347656, 0.2934417724609375, 0.3062400817871094, 0.31903839111328125, 0.3318367004394531, 0.344635009765625, 0.3574333190917969, 0.37023162841796875, 0.3830299377441406, 0.3958282470703125, 0.4086265563964844, 0.42142486572265625, 0.4342231750488281, 0.447021484375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 9.0, 3.0, 6.0, 7.0, 4.0, 10.0, 8.0, 16.0, 21.0, 16.0, 30.0, 37.0, 31.0, 42.0, 47.0, 43.0, 58.0, 56.0, 66.0, 51.0, 64.0, 51.0, 43.0, 43.0, 40.0, 26.0, 29.0, 27.0, 20.0, 16.0, 18.0, 16.0, 11.0, 15.0, 4.0, 5.0, 4.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25634765625, -0.2475433349609375, -0.238739013671875, -0.2299346923828125, -0.22113037109375, -0.2123260498046875, -0.203521728515625, -0.1947174072265625, -0.1859130859375, -0.1771087646484375, -0.168304443359375, -0.1595001220703125, -0.15069580078125, -0.1418914794921875, -0.133087158203125, -0.1242828369140625, -0.115478515625, -0.1066741943359375, -0.097869873046875, -0.0890655517578125, -0.08026123046875, -0.0714569091796875, -0.062652587890625, -0.0538482666015625, -0.0450439453125, -0.0362396240234375, -0.027435302734375, -0.0186309814453125, -0.00982666015625, -0.0010223388671875, 0.007781982421875, 0.0165863037109375, 0.025390625, 0.0341949462890625, 0.042999267578125, 0.0518035888671875, 0.06060791015625, 0.0694122314453125, 0.078216552734375, 0.0870208740234375, 0.0958251953125, 0.1046295166015625, 0.113433837890625, 0.1222381591796875, 0.13104248046875, 0.1398468017578125, 0.148651123046875, 0.1574554443359375, 0.166259765625, 0.1750640869140625, 0.183868408203125, 0.1926727294921875, 0.20147705078125, 0.2102813720703125, 0.219085693359375, 0.2278900146484375, 0.2366943359375, 0.2454986572265625, 0.254302978515625, 0.2631072998046875, 0.27191162109375, 0.2807159423828125, 0.289520263671875, 0.2983245849609375, 0.30712890625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 0.0, 4.0, 10.0, 16.0, 15.0, 26.0, 42.0, 76.0, 145.0, 282.0, 681.0, 2126.0, 11524.0, 100782.0, 760168.0, 152364.0, 15890.0, 2874.0, 837.0, 328.0, 166.0, 66.0, 37.0, 23.0, 17.0, 18.0, 12.0, 6.0, 8.0, 5.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29345703125, -0.2828178405761719, -0.27217864990234375, -0.2615394592285156, -0.2509002685546875, -0.24026107788085938, -0.22962188720703125, -0.21898269653320312, -0.208343505859375, -0.19770431518554688, -0.18706512451171875, -0.17642593383789062, -0.1657867431640625, -0.15514755249023438, -0.14450836181640625, -0.13386917114257812, -0.12322998046875, -0.11259078979492188, -0.10195159912109375, -0.09131240844726562, -0.0806732177734375, -0.07003402709960938, -0.05939483642578125, -0.048755645751953125, -0.038116455078125, -0.027477264404296875, -0.01683807373046875, -0.006198883056640625, 0.0044403076171875, 0.015079498291015625, 0.02571868896484375, 0.036357879638671875, 0.0469970703125, 0.057636260986328125, 0.06827545166015625, 0.07891464233398438, 0.0895538330078125, 0.10019302368164062, 0.11083221435546875, 0.12147140502929688, 0.132110595703125, 0.14274978637695312, 0.15338897705078125, 0.16402816772460938, 0.1746673583984375, 0.18530654907226562, 0.19594573974609375, 0.20658493041992188, 0.21722412109375, 0.22786331176757812, 0.23850250244140625, 0.24914169311523438, 0.2597808837890625, 0.2704200744628906, 0.28105926513671875, 0.2916984558105469, 0.302337646484375, 0.3129768371582031, 0.32361602783203125, 0.3342552185058594, 0.3448944091796875, 0.3555335998535156, 0.36617279052734375, 0.3768119812011719, 0.387451171875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 0.0, 3.0, 2.0, 4.0, 12.0, 10.0, 13.0, 20.0, 20.0, 41.0, 49.0, 39.0, 74.0, 115.0, 153.0, 133.0, 94.0, 47.0, 47.0, 39.0, 29.0, 15.0, 16.0, 8.0, 9.0, 8.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.747245788574219e-05, -6.365403532981873e-05, -5.9835612773895264e-05, -5.60171902179718e-05, -5.219876766204834e-05, -4.838034510612488e-05, -4.4561922550201416e-05, -4.0743499994277954e-05, -3.692507743835449e-05, -3.310665488243103e-05, -2.928823232650757e-05, -2.5469809770584106e-05, -2.1651387214660645e-05, -1.7832964658737183e-05, -1.401454210281372e-05, -1.0196119546890259e-05, -6.377696990966797e-06, -2.559274435043335e-06, 1.259148120880127e-06, 5.077570676803589e-06, 8.89599323272705e-06, 1.2714415788650513e-05, 1.6532838344573975e-05, 2.0351260900497437e-05, 2.41696834564209e-05, 2.798810601234436e-05, 3.180652856826782e-05, 3.5624951124191284e-05, 3.9443373680114746e-05, 4.326179623603821e-05, 4.708021879196167e-05, 5.089864134788513e-05, 5.4717063903808594e-05, 5.8535486459732056e-05, 6.235390901565552e-05, 6.617233157157898e-05, 6.999075412750244e-05, 7.38091766834259e-05, 7.762759923934937e-05, 8.144602179527283e-05, 8.526444435119629e-05, 8.908286690711975e-05, 9.290128946304321e-05, 9.671971201896667e-05, 0.00010053813457489014, 0.0001043565571308136, 0.00010817497968673706, 0.00011199340224266052, 0.00011581182479858398, 0.00011963024735450745, 0.0001234486699104309, 0.00012726709246635437, 0.00013108551502227783, 0.0001349039375782013, 0.00013872236013412476, 0.00014254078269004822, 0.00014635920524597168, 0.00015017762780189514, 0.0001539960503578186, 0.00015781447291374207, 0.00016163289546966553, 0.000165451318025589, 0.00016926974058151245, 0.0001730881631374359, 0.00017690658569335938]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 2.0, 12.0, 19.0, 21.0, 44.0, 74.0, 127.0, 288.0, 666.0, 1751.0, 10037.0, 103243.0, 807136.0, 111404.0, 10490.0, 1973.0, 651.0, 307.0, 112.0, 80.0, 43.0, 30.0, 18.0, 14.0, 1.0, 5.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50244140625, -0.4893951416015625, -0.476348876953125, -0.4633026123046875, -0.45025634765625, -0.4372100830078125, -0.424163818359375, -0.4111175537109375, -0.3980712890625, -0.3850250244140625, -0.371978759765625, -0.3589324951171875, -0.34588623046875, -0.3328399658203125, -0.319793701171875, -0.3067474365234375, -0.293701171875, -0.2806549072265625, -0.267608642578125, -0.2545623779296875, -0.24151611328125, -0.2284698486328125, -0.215423583984375, -0.2023773193359375, -0.1893310546875, -0.1762847900390625, -0.163238525390625, -0.1501922607421875, -0.13714599609375, -0.1240997314453125, -0.111053466796875, -0.0980072021484375, -0.0849609375, -0.0719146728515625, -0.058868408203125, -0.0458221435546875, -0.03277587890625, -0.0197296142578125, -0.006683349609375, 0.0063629150390625, 0.0194091796875, 0.0324554443359375, 0.045501708984375, 0.0585479736328125, 0.07159423828125, 0.0846405029296875, 0.097686767578125, 0.1107330322265625, 0.123779296875, 0.1368255615234375, 0.149871826171875, 0.1629180908203125, 0.17596435546875, 0.1890106201171875, 0.202056884765625, 0.2151031494140625, 0.2281494140625, 0.2411956787109375, 0.254241943359375, 0.2672882080078125, 0.28033447265625, 0.2933807373046875, 0.306427001953125, 0.3194732666015625, 0.33251953125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 11.0, 16.0, 17.0, 24.0, 36.0, 59.0, 88.0, 115.0, 157.0, 159.0, 103.0, 65.0, 42.0, 34.0, 26.0, 21.0, 12.0, 7.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2393798828125, -0.23268890380859375, -0.2259979248046875, -0.21930694580078125, -0.212615966796875, -0.20592498779296875, -0.1992340087890625, -0.19254302978515625, -0.18585205078125, -0.17916107177734375, -0.1724700927734375, -0.16577911376953125, -0.159088134765625, -0.15239715576171875, -0.1457061767578125, -0.13901519775390625, -0.13232421875, -0.12563323974609375, -0.1189422607421875, -0.11225128173828125, -0.105560302734375, -0.09886932373046875, -0.0921783447265625, -0.08548736572265625, -0.07879638671875, -0.07210540771484375, -0.0654144287109375, -0.05872344970703125, -0.052032470703125, -0.04534149169921875, -0.0386505126953125, -0.03195953369140625, -0.0252685546875, -0.01857757568359375, -0.0118865966796875, -0.00519561767578125, 0.001495361328125, 0.00818634033203125, 0.0148773193359375, 0.02156829833984375, 0.02825927734375, 0.03495025634765625, 0.0416412353515625, 0.04833221435546875, 0.055023193359375, 0.06171417236328125, 0.0684051513671875, 0.07509613037109375, 0.081787109375, 0.08847808837890625, 0.0951690673828125, 0.10186004638671875, 0.108551025390625, 0.11524200439453125, 0.1219329833984375, 0.12862396240234375, 0.13531494140625, 0.14200592041015625, 0.1486968994140625, 0.15538787841796875, 0.162078857421875, 0.16876983642578125, 0.1754608154296875, 0.18215179443359375, 0.1888427734375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 10.0, 24.0, 87.0, 255.0, 368.0, 172.0, 59.0, 12.0, 7.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.41822624206543, -4.277159690856934, -4.1360931396484375, -3.9950265884399414, -3.8539600372314453, -3.712893486022949, -3.571826934814453, -3.430760383605957, -3.289693832397461, -3.148627281188965, -3.0075607299804688, -2.8664941787719727, -2.7254276275634766, -2.5843610763549805, -2.4432945251464844, -2.3022279739379883, -2.161161422729492, -2.020094871520996, -1.8790283203125, -1.737961769104004, -1.5968952178955078, -1.4558286666870117, -1.3147621154785156, -1.1736955642700195, -1.0326290130615234, -0.8915624618530273, -0.7504959106445312, -0.6094293594360352, -0.46836280822753906, -0.32729625701904297, -0.18622970581054688, -0.04516315460205078, 0.09590339660644531, 0.2369699478149414, 0.3780364990234375, 0.5191030502319336, 0.6601696014404297, 0.8012361526489258, 0.9423027038574219, 1.083369255065918, 1.224435806274414, 1.3655023574829102, 1.5065689086914062, 1.6476354598999023, 1.7887020111083984, 1.9297685623168945, 2.0708351135253906, 2.2119016647338867, 2.352968215942383, 2.494034767150879, 2.635101318359375, 2.776167869567871, 2.917234420776367, 3.0583009719848633, 3.1993675231933594, 3.3404340744018555, 3.4815006256103516, 3.6225671768188477, 3.7636337280273438, 3.90470027923584, 4.045766830444336, 4.186833381652832, 4.327899932861328, 4.468966484069824, 4.61003303527832]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 6.0, 3.0, 8.0, 14.0, 15.0, 16.0, 13.0, 35.0, 28.0, 38.0, 48.0, 56.0, 59.0, 52.0, 66.0, 76.0, 60.0, 64.0, 48.0, 45.0, 46.0, 45.0, 40.0, 27.0, 25.0, 15.0, 15.0, 15.0, 9.0, 2.0, 5.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1233720779418945, -2.0433895587921143, -1.963407278060913, -1.8834248781204224, -1.8034424781799316, -1.7234599590301514, -1.6434775590896606, -1.56349515914917, -1.4835127592086792, -1.4035303592681885, -1.3235479593276978, -1.243565559387207, -1.1635830402374268, -1.0836007595062256, -1.0036182403564453, -0.9236358404159546, -0.8436534404754639, -0.7636710405349731, -0.6836886405944824, -0.6037061810493469, -0.5237237811088562, -0.4437413811683655, -0.36375895142555237, -0.28377652168273926, -0.20379412174224854, -0.12381170690059662, -0.0438292920589447, 0.036153122782707214, 0.11613553762435913, 0.19611793756484985, 0.27610036730766296, 0.3560827970504761, 0.4360651969909668, 0.5160475969314575, 0.5960299968719482, 0.6760124564170837, 0.7559948563575745, 0.8359772562980652, 0.9159597158432007, 0.9959421157836914, 1.0759245157241821, 1.1559069156646729, 1.2358893156051636, 1.3158717155456543, 1.3958542346954346, 1.4758365154266357, 1.555819034576416, 1.6358014345169067, 1.7157838344573975, 1.7957662343978882, 1.875748634338379, 1.9557310342788696, 2.0357134342193604, 2.1156959533691406, 2.195678234100342, 2.275660753250122, 2.3556432723999023, 2.4356257915496826, 2.515608072280884, 2.595590591430664, 2.6755728721618652, 2.7555553913116455, 2.8355376720428467, 2.915520191192627, 2.995502471923828]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 5.0, 10.0, 8.0, 14.0, 13.0, 30.0, 44.0, 67.0, 123.0, 303.0, 911.0, 4727.0, 3453818.0, 729406.0, 3737.0, 655.0, 199.0, 89.0, 55.0, 32.0, 12.0, 14.0, 7.0, 0.0, 1.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.615234375, -3.52001953125, -3.4248046875, -3.32958984375, -3.234375, -3.13916015625, -3.0439453125, -2.94873046875, -2.853515625, -2.75830078125, -2.6630859375, -2.56787109375, -2.47265625, -2.37744140625, -2.2822265625, -2.18701171875, -2.091796875, -1.99658203125, -1.9013671875, -1.80615234375, -1.7109375, -1.61572265625, -1.5205078125, -1.42529296875, -1.330078125, -1.23486328125, -1.1396484375, -1.04443359375, -0.94921875, -0.85400390625, -0.7587890625, -0.66357421875, -0.568359375, -0.47314453125, -0.3779296875, -0.28271484375, -0.1875, -0.09228515625, 0.0029296875, 0.09814453125, 0.193359375, 0.28857421875, 0.3837890625, 0.47900390625, 0.57421875, 0.66943359375, 0.7646484375, 0.85986328125, 0.955078125, 1.05029296875, 1.1455078125, 1.24072265625, 1.3359375, 1.43115234375, 1.5263671875, 1.62158203125, 1.716796875, 1.81201171875, 1.9072265625, 2.00244140625, 2.09765625, 2.19287109375, 2.2880859375, 2.38330078125, 2.478515625]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 3.0, 5.0, 5.0, 14.0, 18.0, 16.0, 51.0, 63.0, 113.0, 134.0, 159.0, 119.0, 99.0, 67.0, 46.0, 27.0, 26.0, 11.0, 9.0, 3.0, 4.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.12939453125, -0.12602615356445312, -0.12265777587890625, -0.11928939819335938, -0.1159210205078125, -0.11255264282226562, -0.10918426513671875, -0.10581588745117188, -0.102447509765625, -0.09907913208007812, -0.09571075439453125, -0.09234237670898438, -0.0889739990234375, -0.08560562133789062, -0.08223724365234375, -0.07886886596679688, -0.07550048828125, -0.07213211059570312, -0.06876373291015625, -0.06539535522460938, -0.0620269775390625, -0.058658599853515625, -0.05529022216796875, -0.051921844482421875, -0.048553466796875, -0.045185089111328125, -0.04181671142578125, -0.038448333740234375, -0.0350799560546875, -0.031711578369140625, -0.02834320068359375, -0.024974822998046875, -0.0216064453125, -0.018238067626953125, -0.01486968994140625, -0.011501312255859375, -0.0081329345703125, -0.004764556884765625, -0.00139617919921875, 0.001972198486328125, 0.005340576171875, 0.008708953857421875, 0.01207733154296875, 0.015445709228515625, 0.0188140869140625, 0.022182464599609375, 0.02555084228515625, 0.028919219970703125, 0.03228759765625, 0.035655975341796875, 0.03902435302734375, 0.042392730712890625, 0.0457611083984375, 0.049129486083984375, 0.05249786376953125, 0.055866241455078125, 0.059234619140625, 0.06260299682617188, 0.06597137451171875, 0.06933975219726562, 0.0727081298828125, 0.07607650756835938, 0.07944488525390625, 0.08281326293945312, 0.086181640625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 5.0, 4.0, 9.0, 11.0, 19.0, 30.0, 48.0, 60.0, 88.0, 173.0, 317.0, 698.0, 1612.0, 3963.0, 13022.0, 63875.0, 1028269.0, 2945906.0, 109376.0, 18116.0, 5144.0, 1869.0, 819.0, 381.0, 180.0, 107.0, 60.0, 45.0, 28.0, 15.0, 5.0, 8.0, 7.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.395263671875, -0.3806953430175781, -0.36612701416015625, -0.3515586853027344, -0.3369903564453125, -0.3224220275878906, -0.30785369873046875, -0.2932853698730469, -0.278717041015625, -0.2641487121582031, -0.24958038330078125, -0.23501205444335938, -0.2204437255859375, -0.20587539672851562, -0.19130706787109375, -0.17673873901367188, -0.16217041015625, -0.14760208129882812, -0.13303375244140625, -0.11846542358398438, -0.1038970947265625, -0.08932876586914062, -0.07476043701171875, -0.060192108154296875, -0.045623779296875, -0.031055450439453125, -0.01648712158203125, -0.001918792724609375, 0.0126495361328125, 0.027217864990234375, 0.04178619384765625, 0.056354522705078125, 0.0709228515625, 0.08549118041992188, 0.10005950927734375, 0.11462783813476562, 0.1291961669921875, 0.14376449584960938, 0.15833282470703125, 0.17290115356445312, 0.187469482421875, 0.20203781127929688, 0.21660614013671875, 0.23117446899414062, 0.2457427978515625, 0.2603111267089844, 0.27487945556640625, 0.2894477844238281, 0.30401611328125, 0.3185844421386719, 0.33315277099609375, 0.3477210998535156, 0.3622894287109375, 0.3768577575683594, 0.39142608642578125, 0.4059944152832031, 0.420562744140625, 0.4351310729980469, 0.44969940185546875, 0.4642677307128906, 0.4788360595703125, 0.4934043884277344, 0.5079727172851562, 0.5225410461425781, 0.537109375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 5.0, 11.0, 5.0, 12.0, 18.0, 16.0, 20.0, 24.0, 54.0, 99.0, 137.0, 258.0, 501.0, 1303.0, 796.0, 311.0, 182.0, 87.0, 79.0, 33.0, 34.0, 16.0, 11.0, 11.0, 8.0, 13.0, 5.0, 2.0, 4.0, 6.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.125, -0.12169170379638672, -0.11838340759277344, -0.11507511138916016, -0.11176681518554688, -0.1084585189819336, -0.10515022277832031, -0.10184192657470703, -0.09853363037109375, -0.09522533416748047, -0.09191703796386719, -0.0886087417602539, -0.08530044555664062, -0.08199214935302734, -0.07868385314941406, -0.07537555694580078, -0.0720672607421875, -0.06875896453857422, -0.06545066833496094, -0.062142372131347656, -0.058834075927734375, -0.055525779724121094, -0.05221748352050781, -0.04890918731689453, -0.04560089111328125, -0.04229259490966797, -0.03898429870605469, -0.035676002502441406, -0.032367706298828125, -0.029059410095214844, -0.025751113891601562, -0.02244281768798828, -0.019134521484375, -0.01582622528076172, -0.012517929077148438, -0.009209632873535156, -0.005901336669921875, -0.0025930404663085938, 0.0007152557373046875, 0.004023551940917969, 0.00733184814453125, 0.010640144348144531, 0.013948440551757812, 0.017256736755371094, 0.020565032958984375, 0.023873329162597656, 0.027181625366210938, 0.03048992156982422, 0.0337982177734375, 0.03710651397705078, 0.04041481018066406, 0.043723106384277344, 0.047031402587890625, 0.050339698791503906, 0.05364799499511719, 0.05695629119873047, 0.06026458740234375, 0.06357288360595703, 0.06688117980957031, 0.0701894760131836, 0.07349777221679688, 0.07680606842041016, 0.08011436462402344, 0.08342266082763672, 0.08673095703125]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 4.0, 12.0, 52.0, 244.0, 453.0, 199.0, 40.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9817826747894287, -0.9313123822212219, -0.8808420300483704, -0.8303717374801636, -0.779901385307312, -0.7294310927391052, -0.6789608001708984, -0.6284904479980469, -0.5780200958251953, -0.5275498032569885, -0.47707945108413696, -0.4266091585159302, -0.3761388063430786, -0.3256685137748718, -0.27519819140434265, -0.22472786903381348, -0.1742575764656067, -0.12378725409507751, -0.07331693917512894, -0.02284662425518036, 0.027623698115348816, 0.0780940055847168, 0.12856432795524597, 0.17903465032577515, 0.22950497269630432, 0.2799752950668335, 0.33044561743736267, 0.38091593980789185, 0.43138623237609863, 0.4818565547466278, 0.532326877117157, 0.5827971696853638, 0.6332675218582153, 0.6837378144264221, 0.7342081665992737, 0.7846784591674805, 0.835148811340332, 0.8856191039085388, 0.9360893964767456, 0.9865597486495972, 1.0370301008224487, 1.0875004529953003, 1.1379706859588623, 1.1884410381317139, 1.2389113903045654, 1.289381742477417, 1.339851975440979, 1.3903223276138306, 1.4407925605773926, 1.4912629127502441, 1.5417331457138062, 1.5922034978866577, 1.6426738500595093, 1.6931440830230713, 1.7436144351959229, 1.7940847873687744, 1.844555139541626, 1.8950254917144775, 1.9454957246780396, 1.9959660768508911, 2.046436309814453, 2.0969066619873047, 2.1473770141601562, 2.197847366333008, 2.2483177185058594]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 4.0, 4.0, 6.0, 7.0, 8.0, 10.0, 15.0, 7.0, 17.0, 17.0, 29.0, 27.0, 36.0, 30.0, 43.0, 35.0, 42.0, 49.0, 43.0, 46.0, 44.0, 46.0, 50.0, 53.0, 41.0, 37.0, 41.0, 35.0, 23.0, 27.0, 32.0, 17.0, 17.0, 15.0, 10.0, 13.0, 6.0, 10.0, 5.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35060304403305054, -0.3394174873828888, -0.32823196053504944, -0.3170464038848877, -0.30586087703704834, -0.2946753203868866, -0.28348976373672485, -0.2723042368888855, -0.26111871004104614, -0.2499331682920456, -0.23874762654304504, -0.2275620698928833, -0.21637654304504395, -0.2051909863948822, -0.19400544464588165, -0.1828199028968811, -0.17163434624671936, -0.1604488044977188, -0.14926326274871826, -0.13807770609855652, -0.12689217925071716, -0.11570663005113602, -0.10452108085155487, -0.09333553910255432, -0.08214999735355377, -0.07096445560455322, -0.059778910130262375, -0.04859336465597153, -0.03740782290697098, -0.02622228115797043, -0.015036731958389282, -0.003851190209388733, 0.007334351539611816, 0.018519895151257515, 0.029705438762903214, 0.04089098423719406, 0.05207652598619461, 0.06326206773519516, 0.0744476169347763, 0.08563315868377686, 0.0968187004327774, 0.10800424218177795, 0.1191897839307785, 0.13037532567977905, 0.1415608823299408, 0.15274640917778015, 0.1639319658279419, 0.17511750757694244, 0.186303049325943, 0.19748859107494354, 0.2086741328239441, 0.21985968947410583, 0.2310452163219452, 0.24223077297210693, 0.2534162998199463, 0.26460185647010803, 0.2757874131202698, 0.2869729697704315, 0.2981584966182709, 0.3093440532684326, 0.320529580116272, 0.3317151367664337, 0.34290069341659546, 0.3540862202644348, 0.36527174711227417]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 6.0, 6.0, 1.0, 3.0, 7.0, 5.0, 8.0, 25.0, 41.0, 53.0, 81.0, 132.0, 247.0, 519.0, 1131.0, 2864.0, 10720.0, 111481.0, 805033.0, 101050.0, 10165.0, 2777.0, 1092.0, 492.0, 255.0, 132.0, 87.0, 54.0, 31.0, 17.0, 10.0, 6.0, 5.0, 8.0, 3.0, 4.0, 1.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.6884765625, -0.6679153442382812, -0.6473541259765625, -0.6267929077148438, -0.606231689453125, -0.5856704711914062, -0.5651092529296875, -0.5445480346679688, -0.52398681640625, -0.5034255981445312, -0.4828643798828125, -0.46230316162109375, -0.441741943359375, -0.42118072509765625, -0.4006195068359375, -0.38005828857421875, -0.3594970703125, -0.33893585205078125, -0.3183746337890625, -0.29781341552734375, -0.277252197265625, -0.25669097900390625, -0.2361297607421875, -0.21556854248046875, -0.19500732421875, -0.17444610595703125, -0.1538848876953125, -0.13332366943359375, -0.112762451171875, -0.09220123291015625, -0.0716400146484375, -0.05107879638671875, -0.030517578125, -0.00995635986328125, 0.0106048583984375, 0.03116607666015625, 0.051727294921875, 0.07228851318359375, 0.0928497314453125, 0.11341094970703125, 0.13397216796875, 0.15453338623046875, 0.1750946044921875, 0.19565582275390625, 0.216217041015625, 0.23677825927734375, 0.2573394775390625, 0.27790069580078125, 0.2984619140625, 0.31902313232421875, 0.3395843505859375, 0.36014556884765625, 0.380706787109375, 0.40126800537109375, 0.4218292236328125, 0.44239044189453125, 0.46295166015625, 0.48351287841796875, 0.5040740966796875, 0.5246353149414062, 0.545196533203125, 0.5657577514648438, 0.5863189697265625, 0.6068801879882812, 0.62744140625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 6.0, 4.0, 7.0, 7.0, 14.0, 16.0, 31.0, 65.0, 102.0, 128.0, 163.0, 136.0, 119.0, 64.0, 53.0, 38.0, 19.0, 10.0, 5.0, 4.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.12322998046875, -0.12003898620605469, -0.11684799194335938, -0.11365699768066406, -0.11046600341796875, -0.10727500915527344, -0.10408401489257812, -0.10089302062988281, -0.0977020263671875, -0.09451103210449219, -0.09132003784179688, -0.08812904357910156, -0.08493804931640625, -0.08174705505371094, -0.07855606079101562, -0.07536506652832031, -0.072174072265625, -0.06898307800292969, -0.06579208374023438, -0.06260108947753906, -0.05941009521484375, -0.05621910095214844, -0.053028106689453125, -0.04983711242675781, -0.0466461181640625, -0.04345512390136719, -0.040264129638671875, -0.03707313537597656, -0.03388214111328125, -0.030691146850585938, -0.027500152587890625, -0.024309158325195312, -0.0211181640625, -0.017927169799804688, -0.014736175537109375, -0.011545181274414062, -0.00835418701171875, -0.0051631927490234375, -0.001972198486328125, 0.0012187957763671875, 0.0044097900390625, 0.0076007843017578125, 0.010791778564453125, 0.013982772827148438, 0.01717376708984375, 0.020364761352539062, 0.023555755615234375, 0.026746749877929688, 0.029937744140625, 0.03312873840332031, 0.036319732666015625, 0.03951072692871094, 0.04270172119140625, 0.04589271545410156, 0.049083709716796875, 0.05227470397949219, 0.0554656982421875, 0.05865669250488281, 0.061847686767578125, 0.06503868103027344, 0.06822967529296875, 0.07142066955566406, 0.07461166381835938, 0.07780265808105469, 0.08099365234375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 5.0, 6.0, 7.0, 14.0, 12.0, 24.0, 32.0, 42.0, 54.0, 66.0, 106.0, 159.0, 236.0, 421.0, 838.0, 1828.0, 5755.0, 22517.0, 108711.0, 450827.0, 358395.0, 74482.0, 16300.0, 4372.0, 1592.0, 671.0, 364.0, 214.0, 130.0, 112.0, 70.0, 46.0, 38.0, 28.0, 24.0, 13.0, 15.0, 9.0, 10.0, 3.0, 8.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3046875, -0.29376220703125, -0.2828369140625, -0.27191162109375, -0.260986328125, -0.25006103515625, -0.2391357421875, -0.22821044921875, -0.21728515625, -0.20635986328125, -0.1954345703125, -0.18450927734375, -0.173583984375, -0.16265869140625, -0.1517333984375, -0.14080810546875, -0.1298828125, -0.11895751953125, -0.1080322265625, -0.09710693359375, -0.086181640625, -0.07525634765625, -0.0643310546875, -0.05340576171875, -0.04248046875, -0.03155517578125, -0.0206298828125, -0.00970458984375, 0.001220703125, 0.01214599609375, 0.0230712890625, 0.03399658203125, 0.044921875, 0.05584716796875, 0.0667724609375, 0.07769775390625, 0.088623046875, 0.09954833984375, 0.1104736328125, 0.12139892578125, 0.13232421875, 0.14324951171875, 0.1541748046875, 0.16510009765625, 0.176025390625, 0.18695068359375, 0.1978759765625, 0.20880126953125, 0.2197265625, 0.23065185546875, 0.2415771484375, 0.25250244140625, 0.263427734375, 0.27435302734375, 0.2852783203125, 0.29620361328125, 0.30712890625, 0.31805419921875, 0.3289794921875, 0.33990478515625, 0.350830078125, 0.36175537109375, 0.3726806640625, 0.38360595703125, 0.39453125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 7.0, 5.0, 7.0, 11.0, 23.0, 19.0, 19.0, 18.0, 33.0, 32.0, 39.0, 37.0, 37.0, 37.0, 54.0, 49.0, 65.0, 52.0, 38.0, 54.0, 47.0, 41.0, 40.0, 44.0, 39.0, 19.0, 18.0, 19.0, 24.0, 15.0, 15.0, 12.0, 11.0, 11.0, 3.0, 7.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28369140625, -0.2737236022949219, -0.26375579833984375, -0.2537879943847656, -0.2438201904296875, -0.23385238647460938, -0.22388458251953125, -0.21391677856445312, -0.203948974609375, -0.19398117065429688, -0.18401336669921875, -0.17404556274414062, -0.1640777587890625, -0.15410995483398438, -0.14414215087890625, -0.13417434692382812, -0.12420654296875, -0.11423873901367188, -0.10427093505859375, -0.09430313110351562, -0.0843353271484375, -0.07436752319335938, -0.06439971923828125, -0.054431915283203125, -0.044464111328125, -0.034496307373046875, -0.02452850341796875, -0.014560699462890625, -0.0045928955078125, 0.005374908447265625, 0.01534271240234375, 0.025310516357421875, 0.0352783203125, 0.045246124267578125, 0.05521392822265625, 0.06518173217773438, 0.0751495361328125, 0.08511734008789062, 0.09508514404296875, 0.10505294799804688, 0.115020751953125, 0.12498855590820312, 0.13495635986328125, 0.14492416381835938, 0.1548919677734375, 0.16485977172851562, 0.17482757568359375, 0.18479537963867188, 0.19476318359375, 0.20473098754882812, 0.21469879150390625, 0.22466659545898438, 0.2346343994140625, 0.24460220336914062, 0.25457000732421875, 0.2645378112792969, 0.274505615234375, 0.2844734191894531, 0.29444122314453125, 0.3044090270996094, 0.3143768310546875, 0.3243446350097656, 0.33431243896484375, 0.3442802429199219, 0.354248046875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 11.0, 6.0, 13.0, 23.0, 49.0, 66.0, 141.0, 326.0, 936.0, 3898.0, 27676.0, 244591.0, 662489.0, 94067.0, 11067.0, 2069.0, 612.0, 274.0, 108.0, 58.0, 28.0, 18.0, 12.0, 11.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.302490234375, -0.29415321350097656, -0.2858161926269531, -0.2774791717529297, -0.26914215087890625, -0.2608051300048828, -0.2524681091308594, -0.24413108825683594, -0.2357940673828125, -0.22745704650878906, -0.21912002563476562, -0.2107830047607422, -0.20244598388671875, -0.1941089630126953, -0.18577194213867188, -0.17743492126464844, -0.169097900390625, -0.16076087951660156, -0.15242385864257812, -0.1440868377685547, -0.13574981689453125, -0.1274127960205078, -0.11907577514648438, -0.11073875427246094, -0.1024017333984375, -0.09406471252441406, -0.08572769165039062, -0.07739067077636719, -0.06905364990234375, -0.06071662902832031, -0.052379608154296875, -0.04404258728027344, -0.03570556640625, -0.027368545532226562, -0.019031524658203125, -0.010694503784179688, -0.00235748291015625, 0.0059795379638671875, 0.014316558837890625, 0.022653579711914062, 0.0309906005859375, 0.03932762145996094, 0.047664642333984375, 0.05600166320800781, 0.06433868408203125, 0.07267570495605469, 0.08101272583007812, 0.08934974670410156, 0.097686767578125, 0.10602378845214844, 0.11436080932617188, 0.12269783020019531, 0.13103485107421875, 0.1393718719482422, 0.14770889282226562, 0.15604591369628906, 0.1643829345703125, 0.17271995544433594, 0.18105697631835938, 0.1893939971923828, 0.19773101806640625, 0.2060680389404297, 0.21440505981445312, 0.22274208068847656, 0.2310791015625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 2.0, 2.0, 7.0, 8.0, 8.0, 18.0, 21.0, 27.0, 32.0, 41.0, 48.0, 78.0, 163.0, 163.0, 122.0, 71.0, 38.0, 30.0, 23.0, 28.0, 24.0, 16.0, 7.0, 6.0, 6.0, 6.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.255243301391602e-05, -7.902737706899643e-05, -7.550232112407684e-05, -7.197726517915726e-05, -6.845220923423767e-05, -6.492715328931808e-05, -6.14020973443985e-05, -5.787704139947891e-05, -5.4351985454559326e-05, -5.082692950963974e-05, -4.7301873564720154e-05, -4.377681761980057e-05, -4.025176167488098e-05, -3.6726705729961395e-05, -3.320164978504181e-05, -2.9676593840122223e-05, -2.6151537895202637e-05, -2.262648195028305e-05, -1.9101426005363464e-05, -1.5576370060443878e-05, -1.2051314115524292e-05, -8.526258170604706e-06, -5.00120222568512e-06, -1.4761462807655334e-06, 2.0489096641540527e-06, 5.573965609073639e-06, 9.099021553993225e-06, 1.2624077498912811e-05, 1.6149133443832397e-05, 1.9674189388751984e-05, 2.319924533367157e-05, 2.6724301278591156e-05, 3.0249357223510742e-05, 3.377441316843033e-05, 3.7299469113349915e-05, 4.08245250582695e-05, 4.434958100318909e-05, 4.787463694810867e-05, 5.139969289302826e-05, 5.4924748837947845e-05, 5.844980478286743e-05, 6.197486072778702e-05, 6.54999166727066e-05, 6.902497261762619e-05, 7.255002856254578e-05, 7.607508450746536e-05, 7.960014045238495e-05, 8.312519639730453e-05, 8.665025234222412e-05, 9.017530828714371e-05, 9.37003642320633e-05, 9.722542017698288e-05, 0.00010075047612190247, 0.00010427553206682205, 0.00010780058801174164, 0.00011132564395666122, 0.00011485069990158081, 0.0001183757558465004, 0.00012190081179141998, 0.00012542586773633957, 0.00012895092368125916, 0.00013247597962617874, 0.00013600103557109833, 0.00013952609151601791, 0.0001430511474609375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 3.0, 11.0, 18.0, 28.0, 27.0, 60.0, 59.0, 145.0, 311.0, 593.0, 1664.0, 6569.0, 41228.0, 322749.0, 587047.0, 73523.0, 10701.0, 2227.0, 801.0, 359.0, 175.0, 95.0, 57.0, 38.0, 20.0, 14.0, 9.0, 11.0, 6.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.39501953125, -0.3856468200683594, -0.37627410888671875, -0.3669013977050781, -0.3575286865234375, -0.3481559753417969, -0.33878326416015625, -0.3294105529785156, -0.320037841796875, -0.3106651306152344, -0.30129241943359375, -0.2919197082519531, -0.2825469970703125, -0.2731742858886719, -0.26380157470703125, -0.2544288635253906, -0.24505615234375, -0.23568344116210938, -0.22631072998046875, -0.21693801879882812, -0.2075653076171875, -0.19819259643554688, -0.18881988525390625, -0.17944717407226562, -0.170074462890625, -0.16070175170898438, -0.15132904052734375, -0.14195632934570312, -0.1325836181640625, -0.12321090698242188, -0.11383819580078125, -0.10446548461914062, -0.0950927734375, -0.08572006225585938, -0.07634735107421875, -0.06697463989257812, -0.0576019287109375, -0.048229217529296875, -0.03885650634765625, -0.029483795166015625, -0.020111083984375, -0.010738372802734375, -0.00136566162109375, 0.008007049560546875, 0.0173797607421875, 0.026752471923828125, 0.03612518310546875, 0.045497894287109375, 0.05487060546875, 0.06424331665039062, 0.07361602783203125, 0.08298873901367188, 0.0923614501953125, 0.10173416137695312, 0.11110687255859375, 0.12047958374023438, 0.129852294921875, 0.13922500610351562, 0.14859771728515625, 0.15797042846679688, 0.1673431396484375, 0.17671585083007812, 0.18608856201171875, 0.19546127319335938, 0.204833984375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 5.0, 3.0, 6.0, 11.0, 9.0, 11.0, 12.0, 11.0, 18.0, 12.0, 19.0, 38.0, 39.0, 43.0, 45.0, 69.0, 74.0, 80.0, 88.0, 68.0, 82.0, 51.0, 42.0, 26.0, 26.0, 26.0, 13.0, 15.0, 13.0, 11.0, 7.0, 9.0, 5.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.1380615234375, -0.1341991424560547, -0.13033676147460938, -0.12647438049316406, -0.12261199951171875, -0.11874961853027344, -0.11488723754882812, -0.11102485656738281, -0.1071624755859375, -0.10330009460449219, -0.09943771362304688, -0.09557533264160156, -0.09171295166015625, -0.08785057067871094, -0.08398818969726562, -0.08012580871582031, -0.076263427734375, -0.07240104675292969, -0.06853866577148438, -0.06467628479003906, -0.06081390380859375, -0.05695152282714844, -0.053089141845703125, -0.04922676086425781, -0.0453643798828125, -0.04150199890136719, -0.037639617919921875, -0.03377723693847656, -0.02991485595703125, -0.026052474975585938, -0.022190093994140625, -0.018327713012695312, -0.01446533203125, -0.010602951049804688, -0.006740570068359375, -0.0028781890869140625, 0.00098419189453125, 0.0048465728759765625, 0.008708953857421875, 0.012571334838867188, 0.0164337158203125, 0.020296096801757812, 0.024158477783203125, 0.028020858764648438, 0.03188323974609375, 0.03574562072753906, 0.039608001708984375, 0.04347038269042969, 0.047332763671875, 0.05119514465332031, 0.055057525634765625, 0.05891990661621094, 0.06278228759765625, 0.06664466857910156, 0.07050704956054688, 0.07436943054199219, 0.0782318115234375, 0.08209419250488281, 0.08595657348632812, 0.08981895446777344, 0.09368133544921875, 0.09754371643066406, 0.10140609741210938, 0.10526847839355469, 0.109130859375]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 12.0, 24.0, 39.0, 74.0, 162.0, 217.0, 221.0, 119.0, 60.0, 35.0, 21.0, 12.0, 6.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.002054691314697, -3.9129621982574463, -3.8238697052001953, -3.7347772121429443, -3.6456847190856934, -3.5565922260284424, -3.4674997329711914, -3.3784074783325195, -3.2893147468566895, -3.2002222537994385, -3.1111297607421875, -3.0220372676849365, -2.9329447746276855, -2.8438522815704346, -2.7547597885131836, -2.6656675338745117, -2.5765750408172607, -2.4874825477600098, -2.398390054702759, -2.309297561645508, -2.220205068588257, -2.131112575531006, -2.042020320892334, -1.9529277086257935, -1.8638352155685425, -1.7747427225112915, -1.6856502294540405, -1.596557855606079, -1.5074653625488281, -1.4183728694915771, -1.3292803764343262, -1.2401878833770752, -1.1510956287384033, -1.0620031356811523, -0.9729106426239014, -0.8838182091712952, -0.7947257161140442, -0.7056332230567932, -0.616540789604187, -0.527448296546936, -0.43835580348968506, -0.3492633104324341, -0.2601708471775055, -0.1710783839225769, -0.08198589086532593, 0.007106602191925049, 0.09619903564453125, 0.18529152870178223, 0.2743840217590332, 0.3634765148162842, 0.45256897807121277, 0.5416614413261414, 0.6307539343833923, 0.7198464274406433, 0.8089388608932495, 0.8980313539505005, 0.9871238470077515, 1.0762163400650024, 1.1653088331222534, 1.2544012069702148, 1.3434937000274658, 1.4325861930847168, 1.5216786861419678, 1.6107711791992188, 1.6998636722564697]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 4.0, 3.0, 5.0, 10.0, 9.0, 14.0, 8.0, 11.0, 19.0, 19.0, 20.0, 23.0, 23.0, 39.0, 31.0, 28.0, 38.0, 40.0, 52.0, 57.0, 54.0, 55.0, 49.0, 52.0, 33.0, 37.0, 34.0, 29.0, 34.0, 28.0, 20.0, 18.0, 18.0, 12.0, 18.0, 7.0, 12.0, 6.0, 7.0, 13.0, 7.0, 5.0, 2.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-2.007315158843994, -1.9458867311477661, -1.884458303451538, -1.82302987575531, -1.761601448059082, -1.700173020362854, -1.638744592666626, -1.577316164970398, -1.51588773727417, -1.454459309577942, -1.3930308818817139, -1.3316024541854858, -1.2701740264892578, -1.2087455987930298, -1.1473171710968018, -1.0858887434005737, -1.0244603157043457, -0.9630318880081177, -0.9016034603118896, -0.8401750326156616, -0.7787466049194336, -0.7173181772232056, -0.6558897495269775, -0.5944613218307495, -0.533033013343811, -0.471604585647583, -0.410176157951355, -0.34874773025512695, -0.2873193025588989, -0.2258909046649933, -0.16446247696876526, -0.10303404927253723, -0.041605591773986816, 0.019822832196950912, 0.08125125616788864, 0.14267967641353607, 0.2041081041097641, 0.26553651690483093, 0.32696494460105896, 0.388393372297287, 0.449821799993515, 0.5112501978874207, 0.5726786255836487, 0.6341070532798767, 0.6955354809761047, 0.7569639086723328, 0.8183923363685608, 0.8798207640647888, 0.9412491917610168, 1.0026775598526, 1.0641059875488281, 1.1255344152450562, 1.1869628429412842, 1.2483912706375122, 1.3098196983337402, 1.3712481260299683, 1.4326765537261963, 1.4941049814224243, 1.5555334091186523, 1.6169618368148804, 1.6783902645111084, 1.7398186922073364, 1.8012471199035645, 1.8626755475997925, 1.9241039752960205]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 1.0, 1.0, 2.0, 4.0, 6.0, 7.0, 20.0, 14.0, 18.0, 55.0, 83.0, 134.0, 301.0, 569.0, 1464.0, 5282.0, 52702.0, 4005849.0, 118130.0, 7058.0, 1555.0, 549.0, 222.0, 110.0, 58.0, 29.0, 16.0, 11.0, 10.0, 7.0, 4.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.060546875, -1.0315780639648438, -1.0026092529296875, -0.9736404418945312, -0.944671630859375, -0.9157028198242188, -0.8867340087890625, -0.8577651977539062, -0.82879638671875, -0.7998275756835938, -0.7708587646484375, -0.7418899536132812, -0.712921142578125, -0.6839523315429688, -0.6549835205078125, -0.6260147094726562, -0.5970458984375, -0.5680770874023438, -0.5391082763671875, -0.5101394653320312, -0.481170654296875, -0.45220184326171875, -0.4232330322265625, -0.39426422119140625, -0.36529541015625, -0.33632659912109375, -0.3073577880859375, -0.27838897705078125, -0.249420166015625, -0.22045135498046875, -0.1914825439453125, -0.16251373291015625, -0.133544921875, -0.10457611083984375, -0.0756072998046875, -0.04663848876953125, -0.017669677734375, 0.01129913330078125, 0.0402679443359375, 0.06923675537109375, 0.09820556640625, 0.12717437744140625, 0.1561431884765625, 0.18511199951171875, 0.214080810546875, 0.24304962158203125, 0.2720184326171875, 0.30098724365234375, 0.3299560546875, 0.35892486572265625, 0.3878936767578125, 0.41686248779296875, 0.445831298828125, 0.47480010986328125, 0.5037689208984375, 0.5327377319335938, 0.56170654296875, 0.5906753540039062, 0.6196441650390625, 0.6486129760742188, 0.677581787109375, 0.7065505981445312, 0.7355194091796875, 0.7644882202148438, 0.79345703125]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 1.0, 7.0, 9.0, 6.0, 7.0, 21.0, 26.0, 45.0, 55.0, 68.0, 87.0, 108.0, 94.0, 110.0, 93.0, 68.0, 63.0, 52.0, 26.0, 18.0, 18.0, 5.0, 6.0, 2.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1240234375, -0.12079906463623047, -0.11757469177246094, -0.1143503189086914, -0.11112594604492188, -0.10790157318115234, -0.10467720031738281, -0.10145282745361328, -0.09822845458984375, -0.09500408172607422, -0.09177970886230469, -0.08855533599853516, -0.08533096313476562, -0.0821065902709961, -0.07888221740722656, -0.07565784454345703, -0.0724334716796875, -0.06920909881591797, -0.06598472595214844, -0.0627603530883789, -0.059535980224609375, -0.056311607360839844, -0.05308723449707031, -0.04986286163330078, -0.04663848876953125, -0.04341411590576172, -0.04018974304199219, -0.036965370178222656, -0.033740997314453125, -0.030516624450683594, -0.027292251586914062, -0.02406787872314453, -0.020843505859375, -0.01761913299560547, -0.014394760131835938, -0.011170387268066406, -0.007946014404296875, -0.004721641540527344, -0.0014972686767578125, 0.0017271041870117188, 0.00495147705078125, 0.008175849914550781, 0.011400222778320312, 0.014624595642089844, 0.017848968505859375, 0.021073341369628906, 0.024297714233398438, 0.02752208709716797, 0.0307464599609375, 0.03397083282470703, 0.03719520568847656, 0.040419578552246094, 0.043643951416015625, 0.046868324279785156, 0.05009269714355469, 0.05331707000732422, 0.05654144287109375, 0.05976581573486328, 0.06299018859863281, 0.06621456146240234, 0.06943893432617188, 0.0726633071899414, 0.07588768005371094, 0.07911205291748047, 0.08233642578125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 1.0, 5.0, 7.0, 5.0, 13.0, 22.0, 23.0, 43.0, 61.0, 130.0, 246.0, 554.0, 1441.0, 4666.0, 21573.0, 205492.0, 3623568.0, 299221.0, 27808.0, 5933.0, 1832.0, 733.0, 372.0, 213.0, 129.0, 71.0, 51.0, 21.0, 16.0, 18.0, 3.0, 10.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25537109375, -0.242950439453125, -0.23052978515625, -0.218109130859375, -0.2056884765625, -0.193267822265625, -0.18084716796875, -0.168426513671875, -0.156005859375, -0.143585205078125, -0.13116455078125, -0.118743896484375, -0.1063232421875, -0.093902587890625, -0.08148193359375, -0.069061279296875, -0.056640625, -0.044219970703125, -0.03179931640625, -0.019378662109375, -0.0069580078125, 0.005462646484375, 0.01788330078125, 0.030303955078125, 0.042724609375, 0.055145263671875, 0.06756591796875, 0.079986572265625, 0.0924072265625, 0.104827880859375, 0.11724853515625, 0.129669189453125, 0.14208984375, 0.154510498046875, 0.16693115234375, 0.179351806640625, 0.1917724609375, 0.204193115234375, 0.21661376953125, 0.229034423828125, 0.241455078125, 0.253875732421875, 0.26629638671875, 0.278717041015625, 0.2911376953125, 0.303558349609375, 0.31597900390625, 0.328399658203125, 0.3408203125, 0.353240966796875, 0.36566162109375, 0.378082275390625, 0.3905029296875, 0.402923583984375, 0.41534423828125, 0.427764892578125, 0.440185546875, 0.452606201171875, 0.46502685546875, 0.477447509765625, 0.4898681640625, 0.502288818359375, 0.51470947265625, 0.527130126953125, 0.53955078125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 4.0, 7.0, 7.0, 21.0, 23.0, 40.0, 69.0, 117.0, 340.0, 823.0, 1600.0, 533.0, 228.0, 93.0, 63.0, 27.0, 30.0, 13.0, 12.0, 12.0, 5.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0924072265625, -0.0882720947265625, -0.084136962890625, -0.0800018310546875, -0.07586669921875, -0.0717315673828125, -0.067596435546875, -0.0634613037109375, -0.059326171875, -0.0551910400390625, -0.051055908203125, -0.0469207763671875, -0.04278564453125, -0.0386505126953125, -0.034515380859375, -0.0303802490234375, -0.0262451171875, -0.0221099853515625, -0.017974853515625, -0.0138397216796875, -0.00970458984375, -0.0055694580078125, -0.001434326171875, 0.0027008056640625, 0.0068359375, 0.0109710693359375, 0.015106201171875, 0.0192413330078125, 0.02337646484375, 0.0275115966796875, 0.031646728515625, 0.0357818603515625, 0.0399169921875, 0.0440521240234375, 0.048187255859375, 0.0523223876953125, 0.05645751953125, 0.0605926513671875, 0.064727783203125, 0.0688629150390625, 0.072998046875, 0.0771331787109375, 0.081268310546875, 0.0854034423828125, 0.08953857421875, 0.0936737060546875, 0.097808837890625, 0.1019439697265625, 0.1060791015625, 0.1102142333984375, 0.114349365234375, 0.1184844970703125, 0.12261962890625, 0.1267547607421875, 0.130889892578125, 0.1350250244140625, 0.13916015625, 0.1432952880859375, 0.147430419921875, 0.1515655517578125, 0.15570068359375, 0.1598358154296875, 0.163970947265625, 0.1681060791015625, 0.1722412109375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 18.0, 64.0, 182.0, 336.0, 248.0, 123.0, 27.0, 6.0, 5.0, 0.0, 1.0, 1.0], "bins": [-1.9848458766937256, -1.949238896369934, -1.9136319160461426, -1.8780250549316406, -1.8424180746078491, -1.8068110942840576, -1.7712041139602661, -1.7355971336364746, -1.6999902725219727, -1.6643832921981812, -1.6287763118743896, -1.5931694507598877, -1.5575624704360962, -1.5219554901123047, -1.4863485097885132, -1.4507415294647217, -1.4151345491409302, -1.3795275688171387, -1.3439205884933472, -1.3083137273788452, -1.2727067470550537, -1.2370997667312622, -1.2014927864074707, -1.1658858060836792, -1.1302788257598877, -1.0946718454360962, -1.0590648651123047, -1.0234580039978027, -0.9878510236740112, -0.9522440433502197, -0.9166370630264282, -0.8810300827026367, -0.8454233407974243, -0.8098163604736328, -0.7742094397544861, -0.7386024594306946, -0.7029955387115479, -0.6673885583877563, -0.6317815780639648, -0.5961745977401733, -0.5605676770210266, -0.5249606966972351, -0.4893537759780884, -0.4537467956542969, -0.41813984513282776, -0.38253289461135864, -0.34692591428756714, -0.311318963766098, -0.2757120132446289, -0.2401050627231598, -0.20449809730052948, -0.16889113187789917, -0.13328418135643005, -0.09767723083496094, -0.06207026541233063, -0.026463299989700317, 0.009143650531768799, 0.04475060850381851, 0.08035756647586823, 0.11596452444791794, 0.15157148241996765, 0.18717843294143677, 0.22278539836406708, 0.2583923637866974, 0.2939993143081665]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 0.0, 4.0, 6.0, 3.0, 7.0, 6.0, 5.0, 14.0, 14.0, 9.0, 15.0, 13.0, 27.0, 21.0, 23.0, 32.0, 24.0, 28.0, 32.0, 43.0, 43.0, 35.0, 43.0, 52.0, 37.0, 42.0, 47.0, 31.0, 29.0, 55.0, 33.0, 35.0, 31.0, 19.0, 20.0, 22.0, 17.0, 15.0, 20.0, 11.0, 11.0, 10.0, 4.0, 6.0, 3.0, 2.0, 1.0, 6.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.30326271057128906, -0.29452818632125854, -0.28579363226890564, -0.2770591080188751, -0.2683245837688446, -0.2595900297164917, -0.2508555054664612, -0.24212098121643066, -0.23338644206523895, -0.22465190291404724, -0.21591737866401672, -0.207182839512825, -0.1984483003616333, -0.18971377611160278, -0.18097923696041107, -0.17224469780921936, -0.16351017355918884, -0.15477563440799713, -0.1460411101579666, -0.1373065710067749, -0.12857204675674438, -0.11983750760555267, -0.11110296845436096, -0.10236843675374985, -0.09363390505313873, -0.08489937335252762, -0.0761648416519165, -0.06743030250072479, -0.05869577080011368, -0.049961239099502563, -0.04122670367360115, -0.03249216824769974, -0.023757636547088623, -0.01502310298383236, -0.006288569420576096, 0.002445964142680168, 0.011180497705936432, 0.019915029406547546, 0.02864956483244896, 0.03738410025835037, 0.04611863195896149, 0.0548531636595726, 0.06358769536018372, 0.07232223451137543, 0.08105676621198654, 0.08979129791259766, 0.09852583706378937, 0.10726036876440048, 0.1159949004650116, 0.12472943216562271, 0.13346396386623383, 0.14219850301742554, 0.15093302726745605, 0.15966756641864777, 0.16840210556983948, 0.17713662981987, 0.1858711689710617, 0.19460570812225342, 0.20334023237228394, 0.21207477152347565, 0.22080931067466736, 0.22954383492469788, 0.2382783740758896, 0.2470129132270813, 0.2557474374771118]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 5.0, 6.0, 9.0, 13.0, 20.0, 23.0, 29.0, 39.0, 43.0, 70.0, 87.0, 113.0, 205.0, 262.0, 426.0, 578.0, 909.0, 1593.0, 2875.0, 5930.0, 14329.0, 39528.0, 123089.0, 342894.0, 333473.0, 117216.0, 37875.0, 13789.0, 5841.0, 2848.0, 1561.0, 939.0, 596.0, 388.0, 259.0, 188.0, 127.0, 114.0, 72.0, 43.0, 39.0, 26.0, 29.0, 17.0, 9.0, 6.0, 9.0, 4.0, 1.0, 6.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0], "bins": [-0.206787109375, -0.20032119750976562, -0.19385528564453125, -0.18738937377929688, -0.1809234619140625, -0.17445755004882812, -0.16799163818359375, -0.16152572631835938, -0.155059814453125, -0.14859390258789062, -0.14212799072265625, -0.13566207885742188, -0.1291961669921875, -0.12273025512695312, -0.11626434326171875, -0.10979843139648438, -0.10333251953125, -0.09686660766601562, -0.09040069580078125, -0.08393478393554688, -0.0774688720703125, -0.07100296020507812, -0.06453704833984375, -0.058071136474609375, -0.051605224609375, -0.045139312744140625, -0.03867340087890625, -0.032207489013671875, -0.0257415771484375, -0.019275665283203125, -0.01280975341796875, -0.006343841552734375, 0.0001220703125, 0.006587982177734375, 0.01305389404296875, 0.019519805908203125, 0.0259857177734375, 0.032451629638671875, 0.03891754150390625, 0.045383453369140625, 0.051849365234375, 0.058315277099609375, 0.06478118896484375, 0.07124710083007812, 0.0777130126953125, 0.08417892456054688, 0.09064483642578125, 0.09711074829101562, 0.10357666015625, 0.11004257202148438, 0.11650848388671875, 0.12297439575195312, 0.1294403076171875, 0.13590621948242188, 0.14237213134765625, 0.14883804321289062, 0.155303955078125, 0.16176986694335938, 0.16823577880859375, 0.17470169067382812, 0.1811676025390625, 0.18763351440429688, 0.19409942626953125, 0.20056533813476562, 0.20703125]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 6.0, 2.0, 7.0, 10.0, 18.0, 22.0, 28.0, 49.0, 55.0, 55.0, 93.0, 102.0, 113.0, 105.0, 75.0, 57.0, 61.0, 52.0, 36.0, 19.0, 11.0, 10.0, 3.0, 2.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.11529541015625, -0.11228752136230469, -0.10927963256835938, -0.10627174377441406, -0.10326385498046875, -0.10025596618652344, -0.09724807739257812, -0.09424018859863281, -0.0912322998046875, -0.08822441101074219, -0.08521652221679688, -0.08220863342285156, -0.07920074462890625, -0.07619285583496094, -0.07318496704101562, -0.07017707824707031, -0.067169189453125, -0.06416130065917969, -0.061153411865234375, -0.05814552307128906, -0.05513763427734375, -0.05212974548339844, -0.049121856689453125, -0.04611396789550781, -0.0431060791015625, -0.04009819030761719, -0.037090301513671875, -0.03408241271972656, -0.03107452392578125, -0.028066635131835938, -0.025058746337890625, -0.022050857543945312, -0.01904296875, -0.016035079956054688, -0.013027191162109375, -0.010019302368164062, -0.00701141357421875, -0.0040035247802734375, -0.000995635986328125, 0.0020122528076171875, 0.0050201416015625, 0.008028030395507812, 0.011035919189453125, 0.014043807983398438, 0.01705169677734375, 0.020059585571289062, 0.023067474365234375, 0.026075363159179688, 0.029083251953125, 0.03209114074707031, 0.035099029541015625, 0.03810691833496094, 0.04111480712890625, 0.04412269592285156, 0.047130584716796875, 0.05013847351074219, 0.0531463623046875, 0.05615425109863281, 0.059162139892578125, 0.06217002868652344, 0.06517791748046875, 0.06818580627441406, 0.07119369506835938, 0.07420158386230469, 0.07720947265625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 6.0, 6.0, 9.0, 6.0, 13.0, 24.0, 31.0, 41.0, 68.0, 92.0, 141.0, 194.0, 320.0, 562.0, 1082.0, 2410.0, 6438.0, 18827.0, 66395.0, 242935.0, 431743.0, 199201.0, 52718.0, 15341.0, 5518.0, 2127.0, 940.0, 463.0, 284.0, 200.0, 124.0, 107.0, 59.0, 38.0, 25.0, 29.0, 9.0, 10.0, 12.0, 2.0, 2.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.264404296875, -0.25672149658203125, -0.2490386962890625, -0.24135589599609375, -0.233673095703125, -0.22599029541015625, -0.2183074951171875, -0.21062469482421875, -0.20294189453125, -0.19525909423828125, -0.1875762939453125, -0.17989349365234375, -0.172210693359375, -0.16452789306640625, -0.1568450927734375, -0.14916229248046875, -0.1414794921875, -0.13379669189453125, -0.1261138916015625, -0.11843109130859375, -0.110748291015625, -0.10306549072265625, -0.0953826904296875, -0.08769989013671875, -0.08001708984375, -0.07233428955078125, -0.0646514892578125, -0.05696868896484375, -0.049285888671875, -0.04160308837890625, -0.0339202880859375, -0.02623748779296875, -0.0185546875, -0.01087188720703125, -0.0031890869140625, 0.00449371337890625, 0.012176513671875, 0.01985931396484375, 0.0275421142578125, 0.03522491455078125, 0.04290771484375, 0.05059051513671875, 0.0582733154296875, 0.06595611572265625, 0.073638916015625, 0.08132171630859375, 0.0890045166015625, 0.09668731689453125, 0.1043701171875, 0.11205291748046875, 0.1197357177734375, 0.12741851806640625, 0.135101318359375, 0.14278411865234375, 0.1504669189453125, 0.15814971923828125, 0.16583251953125, 0.17351531982421875, 0.1811981201171875, 0.18888092041015625, 0.196563720703125, 0.20424652099609375, 0.2119293212890625, 0.21961212158203125, 0.227294921875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 3.0, 0.0, 7.0, 8.0, 5.0, 15.0, 14.0, 15.0, 17.0, 26.0, 32.0, 26.0, 30.0, 40.0, 44.0, 43.0, 46.0, 56.0, 39.0, 49.0, 62.0, 56.0, 50.0, 39.0, 36.0, 38.0, 39.0, 25.0, 32.0, 23.0, 21.0, 14.0, 9.0, 18.0, 5.0, 6.0, 2.0, 3.0, 10.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.347412109375, -0.3372688293457031, -0.32712554931640625, -0.3169822692871094, -0.3068389892578125, -0.2966957092285156, -0.28655242919921875, -0.2764091491699219, -0.266265869140625, -0.2561225891113281, -0.24597930908203125, -0.23583602905273438, -0.2256927490234375, -0.21554946899414062, -0.20540618896484375, -0.19526290893554688, -0.18511962890625, -0.17497634887695312, -0.16483306884765625, -0.15468978881835938, -0.1445465087890625, -0.13440322875976562, -0.12425994873046875, -0.11411666870117188, -0.103973388671875, -0.09383010864257812, -0.08368682861328125, -0.07354354858398438, -0.0634002685546875, -0.053256988525390625, -0.04311370849609375, -0.032970428466796875, -0.0228271484375, -0.012683868408203125, -0.00254058837890625, 0.007602691650390625, 0.0177459716796875, 0.027889251708984375, 0.03803253173828125, 0.048175811767578125, 0.058319091796875, 0.06846237182617188, 0.07860565185546875, 0.08874893188476562, 0.0988922119140625, 0.10903549194335938, 0.11917877197265625, 0.12932205200195312, 0.13946533203125, 0.14960861206054688, 0.15975189208984375, 0.16989517211914062, 0.1800384521484375, 0.19018173217773438, 0.20032501220703125, 0.21046829223632812, 0.220611572265625, 0.23075485229492188, 0.24089813232421875, 0.2510414123535156, 0.2611846923828125, 0.2713279724121094, 0.28147125244140625, 0.2916145324707031, 0.3017578125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 4.0, 1.0, 3.0, 6.0, 9.0, 12.0, 18.0, 24.0, 36.0, 43.0, 84.0, 136.0, 261.0, 551.0, 1277.0, 3695.0, 14257.0, 80399.0, 512021.0, 367417.0, 53066.0, 10189.0, 2892.0, 1091.0, 474.0, 226.0, 132.0, 70.0, 54.0, 32.0, 14.0, 15.0, 13.0, 12.0, 4.0, 3.0, 5.0, 1.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1351318359375, -0.13114452362060547, -0.12715721130371094, -0.1231698989868164, -0.11918258666992188, -0.11519527435302734, -0.11120796203613281, -0.10722064971923828, -0.10323333740234375, -0.09924602508544922, -0.09525871276855469, -0.09127140045166016, -0.08728408813476562, -0.0832967758178711, -0.07930946350097656, -0.07532215118408203, -0.0713348388671875, -0.06734752655029297, -0.06336021423339844, -0.059372901916503906, -0.055385589599609375, -0.051398277282714844, -0.04741096496582031, -0.04342365264892578, -0.03943634033203125, -0.03544902801513672, -0.03146171569824219, -0.027474403381347656, -0.023487091064453125, -0.019499778747558594, -0.015512466430664062, -0.011525154113769531, -0.007537841796875, -0.0035505294799804688, 0.0004367828369140625, 0.004424095153808594, 0.008411407470703125, 0.012398719787597656, 0.016386032104492188, 0.02037334442138672, 0.02436065673828125, 0.02834796905517578, 0.03233528137207031, 0.036322593688964844, 0.040309906005859375, 0.044297218322753906, 0.04828453063964844, 0.05227184295654297, 0.0562591552734375, 0.06024646759033203, 0.06423377990722656, 0.0682210922241211, 0.07220840454101562, 0.07619571685791016, 0.08018302917480469, 0.08417034149169922, 0.08815765380859375, 0.09214496612548828, 0.09613227844238281, 0.10011959075927734, 0.10410690307617188, 0.1080942153930664, 0.11208152770996094, 0.11606884002685547, 0.12005615234375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 6.0, 4.0, 4.0, 7.0, 3.0, 9.0, 9.0, 15.0, 12.0, 20.0, 23.0, 16.0, 18.0, 25.0, 44.0, 46.0, 60.0, 73.0, 94.0, 79.0, 69.0, 59.0, 66.0, 36.0, 37.0, 36.0, 20.0, 19.0, 18.0, 10.0, 13.0, 8.0, 7.0, 14.0, 9.0, 5.0, 7.0, 0.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.587671279907227e-05, -7.366389036178589e-05, -7.145106792449951e-05, -6.923824548721313e-05, -6.702542304992676e-05, -6.481260061264038e-05, -6.2599778175354e-05, -6.038695573806763e-05, -5.817413330078125e-05, -5.596131086349487e-05, -5.3748488426208496e-05, -5.153566598892212e-05, -4.932284355163574e-05, -4.7110021114349365e-05, -4.489719867706299e-05, -4.268437623977661e-05, -4.0471553802490234e-05, -3.825873136520386e-05, -3.604590892791748e-05, -3.3833086490631104e-05, -3.1620264053344727e-05, -2.940744161605835e-05, -2.7194619178771973e-05, -2.4981796741485596e-05, -2.276897430419922e-05, -2.0556151866912842e-05, -1.8343329429626465e-05, -1.6130506992340088e-05, -1.3917684555053711e-05, -1.1704862117767334e-05, -9.492039680480957e-06, -7.27921724319458e-06, -5.066394805908203e-06, -2.853572368621826e-06, -6.407499313354492e-07, 1.5720725059509277e-06, 3.7848949432373047e-06, 5.997717380523682e-06, 8.210539817810059e-06, 1.0423362255096436e-05, 1.2636184692382812e-05, 1.484900712966919e-05, 1.7061829566955566e-05, 1.9274652004241943e-05, 2.148747444152832e-05, 2.3700296878814697e-05, 2.5913119316101074e-05, 2.812594175338745e-05, 3.0338764190673828e-05, 3.2551586627960205e-05, 3.476440906524658e-05, 3.697723150253296e-05, 3.9190053939819336e-05, 4.140287637710571e-05, 4.361569881439209e-05, 4.582852125167847e-05, 4.8041343688964844e-05, 5.025416612625122e-05, 5.24669885635376e-05, 5.4679811000823975e-05, 5.689263343811035e-05, 5.910545587539673e-05, 6.13182783126831e-05, 6.353110074996948e-05, 6.574392318725586e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 5.0, 6.0, 8.0, 11.0, 14.0, 20.0, 35.0, 54.0, 101.0, 212.0, 467.0, 1086.0, 3206.0, 11644.0, 63118.0, 448481.0, 441872.0, 61378.0, 11520.0, 3246.0, 1103.0, 479.0, 190.0, 127.0, 62.0, 40.0, 22.0, 23.0, 12.0, 5.0, 5.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.16845703125, -0.16402339935302734, -0.1595897674560547, -0.15515613555908203, -0.15072250366210938, -0.14628887176513672, -0.14185523986816406, -0.1374216079711914, -0.13298797607421875, -0.1285543441772461, -0.12412071228027344, -0.11968708038330078, -0.11525344848632812, -0.11081981658935547, -0.10638618469238281, -0.10195255279541016, -0.0975189208984375, -0.09308528900146484, -0.08865165710449219, -0.08421802520751953, -0.07978439331054688, -0.07535076141357422, -0.07091712951660156, -0.0664834976196289, -0.06204986572265625, -0.057616233825683594, -0.05318260192871094, -0.04874897003173828, -0.044315338134765625, -0.03988170623779297, -0.03544807434082031, -0.031014442443847656, -0.026580810546875, -0.022147178649902344, -0.017713546752929688, -0.013279914855957031, -0.008846282958984375, -0.004412651062011719, 2.09808349609375e-05, 0.004454612731933594, 0.00888824462890625, 0.013321876525878906, 0.017755508422851562, 0.02218914031982422, 0.026622772216796875, 0.03105640411376953, 0.03549003601074219, 0.039923667907714844, 0.0443572998046875, 0.048790931701660156, 0.05322456359863281, 0.05765819549560547, 0.062091827392578125, 0.06652545928955078, 0.07095909118652344, 0.0753927230834961, 0.07982635498046875, 0.0842599868774414, 0.08869361877441406, 0.09312725067138672, 0.09756088256835938, 0.10199451446533203, 0.10642814636230469, 0.11086177825927734, 0.11529541015625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 0.0, 4.0, 11.0, 9.0, 10.0, 10.0, 19.0, 29.0, 32.0, 38.0, 54.0, 82.0, 70.0, 101.0, 109.0, 81.0, 79.0, 66.0, 41.0, 43.0, 29.0, 18.0, 17.0, 16.0, 10.0, 5.0, 5.0, 0.0, 5.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0927734375, -0.08970928192138672, -0.08664512634277344, -0.08358097076416016, -0.08051681518554688, -0.0774526596069336, -0.07438850402832031, -0.07132434844970703, -0.06826019287109375, -0.06519603729248047, -0.06213188171386719, -0.059067726135253906, -0.056003570556640625, -0.052939414978027344, -0.04987525939941406, -0.04681110382080078, -0.0437469482421875, -0.04068279266357422, -0.03761863708496094, -0.034554481506347656, -0.031490325927734375, -0.028426170349121094, -0.025362014770507812, -0.02229785919189453, -0.01923370361328125, -0.01616954803466797, -0.013105392456054688, -0.010041236877441406, -0.006977081298828125, -0.003912925720214844, -0.0008487701416015625, 0.0022153854370117188, 0.005279541015625, 0.008343696594238281, 0.011407852172851562, 0.014472007751464844, 0.017536163330078125, 0.020600318908691406, 0.023664474487304688, 0.02672863006591797, 0.02979278564453125, 0.03285694122314453, 0.03592109680175781, 0.038985252380371094, 0.042049407958984375, 0.045113563537597656, 0.04817771911621094, 0.05124187469482422, 0.0543060302734375, 0.05737018585205078, 0.06043434143066406, 0.06349849700927734, 0.06656265258789062, 0.0696268081665039, 0.07269096374511719, 0.07575511932373047, 0.07881927490234375, 0.08188343048095703, 0.08494758605957031, 0.0880117416381836, 0.09107589721679688, 0.09414005279541016, 0.09720420837402344, 0.10026836395263672, 0.10333251953125]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 7.0, 9.0, 12.0, 23.0, 79.0, 149.0, 240.0, 236.0, 136.0, 52.0, 36.0, 11.0, 7.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.505434036254883, -3.4200596809387207, -3.3346853256225586, -3.2493109703063965, -3.1639363765716553, -3.078562021255493, -2.993187665939331, -2.907813310623169, -2.8224387168884277, -2.7370643615722656, -2.6516900062561035, -2.5663156509399414, -2.4809410572052, -2.395566701889038, -2.310192346572876, -2.224817991256714, -2.1394436359405518, -2.0540692806243896, -1.968694806098938, -1.8833204507827759, -1.7979459762573242, -1.712571620941162, -1.627197265625, -1.541822910308838, -1.4564484357833862, -1.3710740804672241, -1.2856996059417725, -1.2003252506256104, -1.1149508953094482, -1.0295764207839966, -0.9442020654678345, -0.8588276505470276, -0.7734529972076416, -0.6880785822868347, -0.6027041673660278, -0.5173298120498657, -0.43195539712905884, -0.34658098220825195, -0.26120662689208984, -0.17583221197128296, -0.09045779705047607, -0.005083397030830383, 0.08029100298881531, 0.1656653881072998, 0.2510398030281067, 0.3364142179489136, 0.4217885732650757, 0.5071629881858826, 0.5925374031066895, 0.6779118180274963, 0.7632862329483032, 0.8486605882644653, 0.9340350031852722, 1.019409418106079, 1.1047837734222412, 1.1901581287384033, 1.275532603263855, 1.360906958580017, 1.4462814331054688, 1.5316557884216309, 1.617030143737793, 1.7024046182632446, 1.7877789735794067, 1.8731534481048584, 1.9585278034210205]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 5.0, 2.0, 2.0, 6.0, 6.0, 5.0, 7.0, 12.0, 14.0, 18.0, 12.0, 20.0, 17.0, 19.0, 28.0, 28.0, 31.0, 26.0, 51.0, 37.0, 39.0, 43.0, 56.0, 38.0, 38.0, 40.0, 56.0, 49.0, 31.0, 34.0, 35.0, 28.0, 25.0, 27.0, 21.0, 19.0, 17.0, 13.0, 10.0, 5.0, 9.0, 3.0, 11.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.6746662855148315, -1.6245983839035034, -1.5745306015014648, -1.5244626998901367, -1.4743949174880981, -1.42432701587677, -1.3742592334747314, -1.3241913318634033, -1.2741234302520752, -1.224055528640747, -1.1739877462387085, -1.1239198446273804, -1.0738520622253418, -1.0237841606140137, -0.9737163186073303, -0.923648476600647, -0.8735806345939636, -0.8235127925872803, -0.7734449505805969, -0.7233771085739136, -0.6733092069625854, -0.6232413649559021, -0.5731735229492188, -0.5231056213378906, -0.47303780913352966, -0.4229699671268463, -0.3729020953178406, -0.3228342533111572, -0.2727664113044739, -0.22269853949546814, -0.1726306974887848, -0.12256282567977905, -0.0724949836730957, -0.022427130490541458, 0.027640722692012787, 0.07770857214927673, 0.12777642905712128, 0.17784428596496582, 0.22791212797164917, 0.2779799997806549, 0.32804784178733826, 0.3781156837940216, 0.42818355560302734, 0.4782513976097107, 0.528319239616394, 0.5783871412277222, 0.6284549236297607, 0.6785228252410889, 0.7285906672477722, 0.7786585092544556, 0.8287263512611389, 0.8787941932678223, 0.9288620948791504, 0.9789299368858337, 1.028997778892517, 1.0790656805038452, 1.1291334629058838, 1.179201364517212, 1.2292691469192505, 1.2793370485305786, 1.3294048309326172, 1.3794727325439453, 1.4295406341552734, 1.479608416557312, 1.5296763181686401]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 0.0, 6.0, 4.0, 10.0, 16.0, 16.0, 20.0, 19.0, 33.0, 47.0, 62.0, 137.0, 170.0, 261.0, 486.0, 959.0, 2253.0, 5825.0, 21995.0, 185691.0, 3841487.0, 109864.0, 16740.0, 4673.0, 1791.0, 802.0, 407.0, 202.0, 111.0, 85.0, 34.0, 34.0, 13.0, 7.0, 7.0, 7.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.466064453125, -0.4539299011230469, -0.44179534912109375, -0.4296607971191406, -0.4175262451171875, -0.4053916931152344, -0.39325714111328125, -0.3811225891113281, -0.368988037109375, -0.3568534851074219, -0.34471893310546875, -0.3325843811035156, -0.3204498291015625, -0.3083152770996094, -0.29618072509765625, -0.2840461730957031, -0.27191162109375, -0.2597770690917969, -0.24764251708984375, -0.23550796508789062, -0.2233734130859375, -0.21123886108398438, -0.19910430908203125, -0.18696975708007812, -0.174835205078125, -0.16270065307617188, -0.15056610107421875, -0.13843154907226562, -0.1262969970703125, -0.11416244506835938, -0.10202789306640625, -0.08989334106445312, -0.0777587890625, -0.06562423706054688, -0.05348968505859375, -0.041355133056640625, -0.0292205810546875, -0.017086029052734375, -0.00495147705078125, 0.007183074951171875, 0.019317626953125, 0.031452178955078125, 0.04358673095703125, 0.055721282958984375, 0.0678558349609375, 0.07999038696289062, 0.09212493896484375, 0.10425949096679688, 0.11639404296875, 0.12852859497070312, 0.14066314697265625, 0.15279769897460938, 0.1649322509765625, 0.17706680297851562, 0.18920135498046875, 0.20133590698242188, 0.213470458984375, 0.22560501098632812, 0.23773956298828125, 0.24987411499023438, 0.2620086669921875, 0.2741432189941406, 0.28627777099609375, 0.2984123229980469, 0.310546875]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 6.0, 6.0, 13.0, 17.0, 18.0, 42.0, 41.0, 56.0, 78.0, 86.0, 81.0, 94.0, 83.0, 82.0, 72.0, 49.0, 44.0, 31.0, 32.0, 25.0, 19.0, 9.0, 4.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1136474609375, -0.11069679260253906, -0.10774612426757812, -0.10479545593261719, -0.10184478759765625, -0.09889411926269531, -0.09594345092773438, -0.09299278259277344, -0.0900421142578125, -0.08709144592285156, -0.08414077758789062, -0.08119010925292969, -0.07823944091796875, -0.07528877258300781, -0.07233810424804688, -0.06938743591308594, -0.066436767578125, -0.06348609924316406, -0.060535430908203125, -0.05758476257324219, -0.05463409423828125, -0.05168342590332031, -0.048732757568359375, -0.04578208923339844, -0.0428314208984375, -0.03988075256347656, -0.036930084228515625, -0.03397941589355469, -0.03102874755859375, -0.028078079223632812, -0.025127410888671875, -0.022176742553710938, -0.01922607421875, -0.016275405883789062, -0.013324737548828125, -0.010374069213867188, -0.00742340087890625, -0.0044727325439453125, -0.001522064208984375, 0.0014286041259765625, 0.0043792724609375, 0.0073299407958984375, 0.010280609130859375, 0.013231277465820312, 0.01618194580078125, 0.019132614135742188, 0.022083282470703125, 0.025033950805664062, 0.027984619140625, 0.030935287475585938, 0.033885955810546875, 0.03683662414550781, 0.03978729248046875, 0.04273796081542969, 0.045688629150390625, 0.04863929748535156, 0.0515899658203125, 0.05454063415527344, 0.057491302490234375, 0.06044197082519531, 0.06339263916015625, 0.06634330749511719, 0.06929397583007812, 0.07224464416503906, 0.0751953125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 7.0, 8.0, 24.0, 31.0, 33.0, 79.0, 140.0, 295.0, 573.0, 1343.0, 3790.0, 13065.0, 73207.0, 1736699.0, 2261935.0, 81962.0, 14442.0, 3959.0, 1466.0, 622.0, 277.0, 128.0, 86.0, 51.0, 24.0, 14.0, 12.0, 5.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.369873046875, -0.36147117614746094, -0.3530693054199219, -0.3446674346923828, -0.33626556396484375, -0.3278636932373047, -0.3194618225097656, -0.31105995178222656, -0.3026580810546875, -0.29425621032714844, -0.2858543395996094, -0.2774524688720703, -0.26905059814453125, -0.2606487274169922, -0.2522468566894531, -0.24384498596191406, -0.235443115234375, -0.22704124450683594, -0.21863937377929688, -0.2102375030517578, -0.20183563232421875, -0.1934337615966797, -0.18503189086914062, -0.17663002014160156, -0.1682281494140625, -0.15982627868652344, -0.15142440795898438, -0.1430225372314453, -0.13462066650390625, -0.1262187957763672, -0.11781692504882812, -0.10941505432128906, -0.10101318359375, -0.09261131286621094, -0.08420944213867188, -0.07580757141113281, -0.06740570068359375, -0.05900382995605469, -0.050601959228515625, -0.04220008850097656, -0.0337982177734375, -0.025396347045898438, -0.016994476318359375, -0.008592605590820312, -0.00019073486328125, 0.008211135864257812, 0.016613006591796875, 0.025014877319335938, 0.033416748046875, 0.04181861877441406, 0.050220489501953125, 0.05862236022949219, 0.06702423095703125, 0.07542610168457031, 0.08382797241210938, 0.09222984313964844, 0.1006317138671875, 0.10903358459472656, 0.11743545532226562, 0.1258373260498047, 0.13423919677734375, 0.1426410675048828, 0.15104293823242188, 0.15944480895996094, 0.1678466796875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 4.0, 4.0, 5.0, 6.0, 12.0, 23.0, 18.0, 48.0, 58.0, 114.0, 252.0, 619.0, 1568.0, 675.0, 305.0, 137.0, 67.0, 55.0, 32.0, 29.0, 14.0, 4.0, 4.0, 6.0, 2.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.088623046875, -0.08598136901855469, -0.08333969116210938, -0.08069801330566406, -0.07805633544921875, -0.07541465759277344, -0.07277297973632812, -0.07013130187988281, -0.0674896240234375, -0.06484794616699219, -0.062206268310546875, -0.05956459045410156, -0.05692291259765625, -0.05428123474121094, -0.051639556884765625, -0.04899787902832031, -0.046356201171875, -0.04371452331542969, -0.041072845458984375, -0.03843116760253906, -0.03578948974609375, -0.03314781188964844, -0.030506134033203125, -0.027864456176757812, -0.0252227783203125, -0.022581100463867188, -0.019939422607421875, -0.017297744750976562, -0.01465606689453125, -0.012014389038085938, -0.009372711181640625, -0.0067310333251953125, -0.00408935546875, -0.0014476776123046875, 0.001194000244140625, 0.0038356781005859375, 0.00647735595703125, 0.009119033813476562, 0.011760711669921875, 0.014402389526367188, 0.0170440673828125, 0.019685745239257812, 0.022327423095703125, 0.024969100952148438, 0.02761077880859375, 0.030252456665039062, 0.032894134521484375, 0.03553581237792969, 0.038177490234375, 0.04081916809082031, 0.043460845947265625, 0.04610252380371094, 0.04874420166015625, 0.05138587951660156, 0.054027557373046875, 0.05666923522949219, 0.0593109130859375, 0.06195259094238281, 0.06459426879882812, 0.06723594665527344, 0.06987762451171875, 0.07251930236816406, 0.07516098022460938, 0.07780265808105469, 0.0804443359375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 7.0, 13.0, 82.0, 196.0, 333.0, 237.0, 109.0, 23.0, 8.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.5152854919433594, -1.4864425659179688, -1.4575996398925781, -1.4287567138671875, -1.3999139070510864, -1.3710709810256958, -1.3422280550003052, -1.3133851289749146, -1.284542202949524, -1.2556992769241333, -1.2268563508987427, -1.1980135440826416, -1.169170618057251, -1.1403276920318604, -1.1114847660064697, -1.082641839981079, -1.053799033164978, -1.0249561071395874, -0.9961132407188416, -0.9672703146934509, -0.9384273886680603, -0.9095845222473145, -0.8807415962219238, -0.8518986701965332, -0.8230557441711426, -0.794212818145752, -0.7653699517250061, -0.7365270256996155, -0.7076840996742249, -0.678841233253479, -0.6499983072280884, -0.6211553812026978, -0.5923125743865967, -0.563469648361206, -0.5346267819404602, -0.5057838559150696, -0.47694095969200134, -0.4480980634689331, -0.4192551374435425, -0.39041224122047424, -0.36156928539276123, -0.332726389169693, -0.30388346314430237, -0.27504056692123413, -0.2461976706981659, -0.21735475957393646, -0.18851184844970703, -0.1596689522266388, -0.13082605600357056, -0.10198315232992172, -0.07314024865627289, -0.04429733753204346, -0.015454433858394623, 0.013388469815254211, 0.04223138093948364, 0.07107427716255188, 0.09991718828678131, 0.12876009941101074, 0.15760299563407898, 0.1864459067583084, 0.21528881788253784, 0.24413171410560608, 0.2729746103286743, 0.30181753635406494, 0.3306604325771332]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 7.0, 3.0, 7.0, 9.0, 11.0, 17.0, 11.0, 19.0, 29.0, 26.0, 30.0, 33.0, 48.0, 38.0, 32.0, 43.0, 45.0, 51.0, 48.0, 45.0, 49.0, 41.0, 48.0, 38.0, 39.0, 39.0, 30.0, 26.0, 30.0, 17.0, 27.0, 9.0, 13.0, 11.0, 5.0, 5.0, 6.0, 0.0, 7.0, 3.0, 1.0, 2.0, 3.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23657631874084473, -0.22934478521347046, -0.222113236784935, -0.21488170325756073, -0.20765015482902527, -0.200418621301651, -0.19318708777427673, -0.18595553934574127, -0.1787239909172058, -0.17149245738983154, -0.16426090896129608, -0.15702937543392181, -0.14979782700538635, -0.14256629347801208, -0.13533475995063782, -0.12810321152210236, -0.12087167799472809, -0.11364013701677322, -0.10640859603881836, -0.09917706251144409, -0.09194551408290863, -0.08471398055553436, -0.0774824395775795, -0.07025089859962463, -0.06301935762166977, -0.055787816643714905, -0.04855627566576004, -0.041324738413095474, -0.03409319743514061, -0.026861656457185745, -0.01963011920452118, -0.012398578226566315, -0.00516703724861145, 0.0020645027980208397, 0.00929604284465313, 0.016527581959962845, 0.02375912293791771, 0.030990663915872574, 0.03822220116853714, 0.045453742146492004, 0.05268528312444687, 0.05991682410240173, 0.0671483650803566, 0.07437990605831146, 0.08161143958568573, 0.08884298801422119, 0.09607452154159546, 0.10330606251955032, 0.11053760349750519, 0.11776914447546005, 0.12500068545341492, 0.13223221898078918, 0.13946376740932465, 0.1466953009366989, 0.15392684936523438, 0.16115838289260864, 0.1683899164199829, 0.17562144994735718, 0.18285299837589264, 0.1900845319032669, 0.19731608033180237, 0.20454761385917664, 0.2117791473865509, 0.21901069581508636, 0.22624224424362183]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 7.0, 10.0, 8.0, 12.0, 19.0, 32.0, 45.0, 83.0, 71.0, 132.0, 196.0, 334.0, 576.0, 1023.0, 1889.0, 4092.0, 10874.0, 35040.0, 134277.0, 423411.0, 315671.0, 83350.0, 23070.0, 7712.0, 3074.0, 1408.0, 844.0, 481.0, 264.0, 176.0, 125.0, 68.0, 42.0, 49.0, 26.0, 13.0, 15.0, 10.0, 7.0, 4.0, 4.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.25634765625, -0.24898719787597656, -0.24162673950195312, -0.2342662811279297, -0.22690582275390625, -0.2195453643798828, -0.21218490600585938, -0.20482444763183594, -0.1974639892578125, -0.19010353088378906, -0.18274307250976562, -0.1753826141357422, -0.16802215576171875, -0.1606616973876953, -0.15330123901367188, -0.14594078063964844, -0.138580322265625, -0.13121986389160156, -0.12385940551757812, -0.11649894714355469, -0.10913848876953125, -0.10177803039550781, -0.09441757202148438, -0.08705711364746094, -0.0796966552734375, -0.07233619689941406, -0.06497573852539062, -0.05761528015136719, -0.05025482177734375, -0.04289436340332031, -0.035533905029296875, -0.028173446655273438, -0.02081298828125, -0.013452529907226562, -0.006092071533203125, 0.0012683868408203125, 0.00862884521484375, 0.015989303588867188, 0.023349761962890625, 0.030710220336914062, 0.0380706787109375, 0.04543113708496094, 0.052791595458984375, 0.06015205383300781, 0.06751251220703125, 0.07487297058105469, 0.08223342895507812, 0.08959388732910156, 0.096954345703125, 0.10431480407714844, 0.11167526245117188, 0.11903572082519531, 0.12639617919921875, 0.1337566375732422, 0.14111709594726562, 0.14847755432128906, 0.1558380126953125, 0.16319847106933594, 0.17055892944335938, 0.1779193878173828, 0.18527984619140625, 0.1926403045654297, 0.20000076293945312, 0.20736122131347656, 0.2147216796875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 8.0, 5.0, 15.0, 17.0, 27.0, 41.0, 47.0, 49.0, 100.0, 94.0, 86.0, 92.0, 86.0, 69.0, 68.0, 39.0, 46.0, 36.0, 25.0, 22.0, 15.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1195068359375, -0.11644935607910156, -0.11339187622070312, -0.11033439636230469, -0.10727691650390625, -0.10421943664550781, -0.10116195678710938, -0.09810447692871094, -0.0950469970703125, -0.09198951721191406, -0.08893203735351562, -0.08587455749511719, -0.08281707763671875, -0.07975959777832031, -0.07670211791992188, -0.07364463806152344, -0.070587158203125, -0.06752967834472656, -0.06447219848632812, -0.06141471862792969, -0.05835723876953125, -0.05529975891113281, -0.052242279052734375, -0.04918479919433594, -0.0461273193359375, -0.04306983947753906, -0.040012359619140625, -0.03695487976074219, -0.03389739990234375, -0.030839920043945312, -0.027782440185546875, -0.024724960327148438, -0.02166748046875, -0.018610000610351562, -0.015552520751953125, -0.012495040893554688, -0.00943756103515625, -0.0063800811767578125, -0.003322601318359375, -0.0002651214599609375, 0.0027923583984375, 0.0058498382568359375, 0.008907318115234375, 0.011964797973632812, 0.01502227783203125, 0.018079757690429688, 0.021137237548828125, 0.024194717407226562, 0.027252197265625, 0.030309677124023438, 0.033367156982421875, 0.03642463684082031, 0.03948211669921875, 0.04253959655761719, 0.045597076416015625, 0.04865455627441406, 0.0517120361328125, 0.05476951599121094, 0.057826995849609375, 0.06088447570800781, 0.06394195556640625, 0.06699943542480469, 0.07005691528320312, 0.07311439514160156, 0.076171875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 4.0, 4.0, 5.0, 12.0, 12.0, 24.0, 25.0, 37.0, 68.0, 97.0, 160.0, 238.0, 467.0, 974.0, 2543.0, 8963.0, 43455.0, 266133.0, 545444.0, 146201.0, 24511.0, 5761.0, 1824.0, 761.0, 372.0, 197.0, 100.0, 60.0, 42.0, 27.0, 12.0, 10.0, 4.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.261474609375, -0.2525596618652344, -0.24364471435546875, -0.23472976684570312, -0.2258148193359375, -0.21689987182617188, -0.20798492431640625, -0.19906997680664062, -0.190155029296875, -0.18124008178710938, -0.17232513427734375, -0.16341018676757812, -0.1544952392578125, -0.14558029174804688, -0.13666534423828125, -0.12775039672851562, -0.11883544921875, -0.10992050170898438, -0.10100555419921875, -0.09209060668945312, -0.0831756591796875, -0.07426071166992188, -0.06534576416015625, -0.056430816650390625, -0.047515869140625, -0.038600921630859375, -0.02968597412109375, -0.020771026611328125, -0.0118560791015625, -0.002941131591796875, 0.00597381591796875, 0.014888763427734375, 0.0238037109375, 0.032718658447265625, 0.04163360595703125, 0.050548553466796875, 0.0594635009765625, 0.06837844848632812, 0.07729339599609375, 0.08620834350585938, 0.095123291015625, 0.10403823852539062, 0.11295318603515625, 0.12186813354492188, 0.1307830810546875, 0.13969802856445312, 0.14861297607421875, 0.15752792358398438, 0.16644287109375, 0.17535781860351562, 0.18427276611328125, 0.19318771362304688, 0.2021026611328125, 0.21101760864257812, 0.21993255615234375, 0.22884750366210938, 0.237762451171875, 0.24667739868164062, 0.25559234619140625, 0.2645072937011719, 0.2734222412109375, 0.2823371887207031, 0.29125213623046875, 0.3001670837402344, 0.30908203125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 5.0, 4.0, 7.0, 6.0, 6.0, 3.0, 7.0, 9.0, 6.0, 15.0, 14.0, 19.0, 21.0, 22.0, 26.0, 27.0, 23.0, 35.0, 38.0, 36.0, 47.0, 48.0, 53.0, 47.0, 56.0, 54.0, 38.0, 49.0, 36.0, 28.0, 44.0, 32.0, 32.0, 16.0, 18.0, 15.0, 20.0, 10.0, 11.0, 6.0, 8.0, 3.0, 2.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.273193359375, -0.2650909423828125, -0.256988525390625, -0.2488861083984375, -0.24078369140625, -0.2326812744140625, -0.224578857421875, -0.2164764404296875, -0.2083740234375, -0.2002716064453125, -0.192169189453125, -0.1840667724609375, -0.17596435546875, -0.1678619384765625, -0.159759521484375, -0.1516571044921875, -0.1435546875, -0.1354522705078125, -0.127349853515625, -0.1192474365234375, -0.11114501953125, -0.1030426025390625, -0.094940185546875, -0.0868377685546875, -0.0787353515625, -0.0706329345703125, -0.062530517578125, -0.0544281005859375, -0.04632568359375, -0.0382232666015625, -0.030120849609375, -0.0220184326171875, -0.013916015625, -0.0058135986328125, 0.002288818359375, 0.0103912353515625, 0.01849365234375, 0.0265960693359375, 0.034698486328125, 0.0428009033203125, 0.0509033203125, 0.0590057373046875, 0.067108154296875, 0.0752105712890625, 0.08331298828125, 0.0914154052734375, 0.099517822265625, 0.1076202392578125, 0.11572265625, 0.1238250732421875, 0.131927490234375, 0.1400299072265625, 0.14813232421875, 0.1562347412109375, 0.164337158203125, 0.1724395751953125, 0.1805419921875, 0.1886444091796875, 0.196746826171875, 0.2048492431640625, 0.21295166015625, 0.2210540771484375, 0.229156494140625, 0.2372589111328125, 0.245361328125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 10.0, 6.0, 8.0, 16.0, 46.0, 97.0, 268.0, 1165.0, 10481.0, 249260.0, 750335.0, 33620.0, 2535.0, 477.0, 125.0, 55.0, 21.0, 11.0, 6.0, 2.0, 6.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.156982421875, -0.15099143981933594, -0.14500045776367188, -0.1390094757080078, -0.13301849365234375, -0.1270275115966797, -0.12103652954101562, -0.11504554748535156, -0.1090545654296875, -0.10306358337402344, -0.09707260131835938, -0.09108161926269531, -0.08509063720703125, -0.07909965515136719, -0.07310867309570312, -0.06711769104003906, -0.061126708984375, -0.05513572692871094, -0.049144744873046875, -0.04315376281738281, -0.03716278076171875, -0.031171798706054688, -0.025180816650390625, -0.019189834594726562, -0.0131988525390625, -0.0072078704833984375, -0.001216888427734375, 0.0047740936279296875, 0.01076507568359375, 0.016756057739257812, 0.022747039794921875, 0.028738021850585938, 0.03472900390625, 0.04071998596191406, 0.046710968017578125, 0.05270195007324219, 0.05869293212890625, 0.06468391418457031, 0.07067489624023438, 0.07666587829589844, 0.0826568603515625, 0.08864784240722656, 0.09463882446289062, 0.10062980651855469, 0.10662078857421875, 0.11261177062988281, 0.11860275268554688, 0.12459373474121094, 0.130584716796875, 0.13657569885253906, 0.14256668090820312, 0.1485576629638672, 0.15454864501953125, 0.1605396270751953, 0.16653060913085938, 0.17252159118652344, 0.1785125732421875, 0.18450355529785156, 0.19049453735351562, 0.1964855194091797, 0.20247650146484375, 0.2084674835205078, 0.21445846557617188, 0.22044944763183594, 0.2264404296875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 4.0, 7.0, 9.0, 8.0, 16.0, 21.0, 17.0, 22.0, 33.0, 42.0, 64.0, 76.0, 107.0, 135.0, 128.0, 83.0, 43.0, 45.0, 34.0, 19.0, 22.0, 14.0, 11.0, 15.0, 8.0, 2.0, 4.0, 1.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.033348083496094e-05, -6.787572056055069e-05, -6.541796028614044e-05, -6.29602000117302e-05, -6.0502439737319946e-05, -5.80446794629097e-05, -5.558691918849945e-05, -5.31291589140892e-05, -5.0671398639678955e-05, -4.821363836526871e-05, -4.575587809085846e-05, -4.329811781644821e-05, -4.0840357542037964e-05, -3.8382597267627716e-05, -3.592483699321747e-05, -3.346707671880722e-05, -3.100931644439697e-05, -2.8551556169986725e-05, -2.6093795895576477e-05, -2.363603562116623e-05, -2.117827534675598e-05, -1.8720515072345734e-05, -1.6262754797935486e-05, -1.3804994523525238e-05, -1.134723424911499e-05, -8.889473974704742e-06, -6.431713700294495e-06, -3.973953425884247e-06, -1.516193151473999e-06, 9.415671229362488e-07, 3.3993273973464966e-06, 5.857087671756744e-06, 8.314847946166992e-06, 1.077260822057724e-05, 1.3230368494987488e-05, 1.5688128769397736e-05, 1.8145889043807983e-05, 2.060364931821823e-05, 2.306140959262848e-05, 2.5519169867038727e-05, 2.7976930141448975e-05, 3.0434690415859222e-05, 3.289245069026947e-05, 3.535021096467972e-05, 3.7807971239089966e-05, 4.0265731513500214e-05, 4.272349178791046e-05, 4.518125206232071e-05, 4.763901233673096e-05, 5.0096772611141205e-05, 5.255453288555145e-05, 5.50122931599617e-05, 5.747005343437195e-05, 5.9927813708782196e-05, 6.238557398319244e-05, 6.484333425760269e-05, 6.730109453201294e-05, 6.975885480642319e-05, 7.221661508083344e-05, 7.467437535524368e-05, 7.713213562965393e-05, 7.958989590406418e-05, 8.204765617847443e-05, 8.450541645288467e-05, 8.696317672729492e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 4.0, 3.0, 7.0, 8.0, 18.0, 26.0, 27.0, 37.0, 67.0, 103.0, 183.0, 326.0, 639.0, 1376.0, 3797.0, 14460.0, 77141.0, 528948.0, 357151.0, 49018.0, 9992.0, 2891.0, 1105.0, 512.0, 260.0, 196.0, 98.0, 56.0, 32.0, 27.0, 17.0, 8.0, 8.0, 3.0, 4.0, 3.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10211181640625, -0.0984487533569336, -0.09478569030761719, -0.09112262725830078, -0.08745956420898438, -0.08379650115966797, -0.08013343811035156, -0.07647037506103516, -0.07280731201171875, -0.06914424896240234, -0.06548118591308594, -0.06181812286376953, -0.058155059814453125, -0.05449199676513672, -0.05082893371582031, -0.047165870666503906, -0.0435028076171875, -0.039839744567871094, -0.03617668151855469, -0.03251361846923828, -0.028850555419921875, -0.02518749237060547, -0.021524429321289062, -0.017861366271972656, -0.01419830322265625, -0.010535240173339844, -0.0068721771240234375, -0.0032091140747070312, 0.000453948974609375, 0.004117012023925781, 0.0077800750732421875, 0.011443138122558594, 0.015106201171875, 0.018769264221191406, 0.022432327270507812, 0.02609539031982422, 0.029758453369140625, 0.03342151641845703, 0.03708457946777344, 0.040747642517089844, 0.04441070556640625, 0.048073768615722656, 0.05173683166503906, 0.05539989471435547, 0.059062957763671875, 0.06272602081298828, 0.06638908386230469, 0.0700521469116211, 0.0737152099609375, 0.0773782730102539, 0.08104133605957031, 0.08470439910888672, 0.08836746215820312, 0.09203052520751953, 0.09569358825683594, 0.09935665130615234, 0.10301971435546875, 0.10668277740478516, 0.11034584045410156, 0.11400890350341797, 0.11767196655273438, 0.12133502960205078, 0.12499809265136719, 0.1286611557006836, 0.13232421875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 8.0, 5.0, 20.0, 23.0, 34.0, 68.0, 96.0, 174.0, 154.0, 171.0, 107.0, 68.0, 27.0, 22.0, 15.0, 10.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1771240234375, -0.1718120574951172, -0.16650009155273438, -0.16118812561035156, -0.15587615966796875, -0.15056419372558594, -0.14525222778320312, -0.1399402618408203, -0.1346282958984375, -0.1293163299560547, -0.12400436401367188, -0.11869239807128906, -0.11338043212890625, -0.10806846618652344, -0.10275650024414062, -0.09744453430175781, -0.092132568359375, -0.08682060241699219, -0.08150863647460938, -0.07619667053222656, -0.07088470458984375, -0.06557273864746094, -0.060260772705078125, -0.05494880676269531, -0.0496368408203125, -0.04432487487792969, -0.039012908935546875, -0.03370094299316406, -0.02838897705078125, -0.023077011108398438, -0.017765045166015625, -0.012453079223632812, -0.00714111328125, -0.0018291473388671875, 0.003482818603515625, 0.008794784545898438, 0.01410675048828125, 0.019418716430664062, 0.024730682373046875, 0.030042648315429688, 0.0353546142578125, 0.04066658020019531, 0.045978546142578125, 0.05129051208496094, 0.05660247802734375, 0.06191444396972656, 0.06722640991210938, 0.07253837585449219, 0.077850341796875, 0.08316230773925781, 0.08847427368164062, 0.09378623962402344, 0.09909820556640625, 0.10441017150878906, 0.10972213745117188, 0.11503410339355469, 0.1203460693359375, 0.1256580352783203, 0.13097000122070312, 0.13628196716308594, 0.14159393310546875, 0.14690589904785156, 0.15221786499023438, 0.1575298309326172, 0.162841796875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 22.0, 59.0, 147.0, 297.0, 281.0, 124.0, 45.0, 18.0, 8.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1073718070983887, -1.0068485736846924, -0.9063252210617065, -0.8058019876480103, -0.7052786946296692, -0.6047554016113281, -0.5042321681976318, -0.40370887517929077, -0.3031855821609497, -0.20266230404376984, -0.10213902592658997, -0.001615762710571289, 0.09890753030776978, 0.19943082332611084, 0.29995405673980713, 0.4004773497581482, 0.5010006427764893, 0.6015239357948303, 0.7020472288131714, 0.8025704622268677, 0.9030937552452087, 1.0036170482635498, 1.104140281677246, 1.2046635150909424, 1.3051868677139282, 1.4057101011276245, 1.5062334537506104, 1.6067566871643066, 1.707279920578003, 1.8078032732009888, 1.908326506614685, 2.008849859237671, 2.109373092651367, 2.2098963260650635, 2.3104195594787598, 2.410943031311035, 2.5114662647247314, 2.6119894981384277, 2.712512731552124, 2.8130359649658203, 2.9135594367980957, 3.014082670211792, 3.1146059036254883, 3.2151293754577637, 3.31565260887146, 3.4161758422851562, 3.5166990756988525, 3.617222309112549, 3.717745542526245, 3.8182687759399414, 3.9187920093536377, 4.019315242767334, 4.119838714599609, 4.220361709594727, 4.320885181427002, 4.421408653259277, 4.5219316482543945, 4.62245512008667, 4.722978115081787, 4.8235015869140625, 4.92402458190918, 5.024548053741455, 5.1250715255737305, 5.225594520568848, 5.326117992401123]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 3.0, 5.0, 10.0, 8.0, 14.0, 18.0, 14.0, 23.0, 26.0, 28.0, 34.0, 45.0, 52.0, 61.0, 64.0, 47.0, 53.0, 63.0, 49.0, 61.0, 52.0, 46.0, 37.0, 36.0, 27.0, 28.0, 18.0, 16.0, 19.0, 14.0, 3.0, 6.0, 5.0, 1.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.7119643688201904, -1.65807044506073, -1.604176640510559, -1.5502827167510986, -1.4963887929916382, -1.4424949884414673, -1.3886010646820068, -1.334707260131836, -1.2808133363723755, -1.226919412612915, -1.1730256080627441, -1.1191316843032837, -1.0652377605438232, -1.0113439559936523, -0.9574500322341919, -0.9035561680793762, -0.8496622443199158, -0.7957683801651001, -0.7418744564056396, -0.687980592250824, -0.6340867280960083, -0.5801928043365479, -0.5262989401817322, -0.4724050760269165, -0.41851118206977844, -0.3646172881126404, -0.3107234239578247, -0.25682953000068665, -0.20293565094470978, -0.1490417718887329, -0.09514787793159485, -0.041254013776779175, 0.012639880180358887, 0.06653375923633575, 0.12042764574289322, 0.17432153224945068, 0.22821541130542755, 0.2821092903614044, 0.3360031843185425, 0.38989704847335815, 0.4437909424304962, 0.4976848363876343, 0.55157870054245, 0.6054725646972656, 0.6593664884567261, 0.7132603526115417, 0.7671542167663574, 0.8210481405258179, 0.8749420046806335, 0.9288358688354492, 0.9827297925949097, 1.0366237163543701, 1.090517520904541, 1.1444114446640015, 1.198305368423462, 1.2521991729736328, 1.3060930967330933, 1.3599870204925537, 1.4138808250427246, 1.467774748802185, 1.5216686725616455, 1.5755624771118164, 1.6294564008712769, 1.6833503246307373, 1.7372441291809082]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 2.0, 3.0, 2.0, 1.0, 4.0, 6.0, 5.0, 7.0, 6.0, 13.0, 18.0, 24.0, 31.0, 49.0, 71.0, 92.0, 151.0, 302.0, 516.0, 1004.0, 2202.0, 6194.0, 25647.0, 273121.0, 3742627.0, 118084.0, 16520.0, 4465.0, 1591.0, 701.0, 345.0, 197.0, 99.0, 68.0, 40.0, 31.0, 23.0, 8.0, 5.0, 7.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.427978515625, -0.4165229797363281, -0.40506744384765625, -0.3936119079589844, -0.3821563720703125, -0.3707008361816406, -0.35924530029296875, -0.3477897644042969, -0.336334228515625, -0.3248786926269531, -0.31342315673828125, -0.3019676208496094, -0.2905120849609375, -0.2790565490722656, -0.26760101318359375, -0.2561454772949219, -0.24468994140625, -0.23323440551757812, -0.22177886962890625, -0.21032333374023438, -0.1988677978515625, -0.18741226196289062, -0.17595672607421875, -0.16450119018554688, -0.153045654296875, -0.14159011840820312, -0.13013458251953125, -0.11867904663085938, -0.1072235107421875, -0.09576797485351562, -0.08431243896484375, -0.07285690307617188, -0.0614013671875, -0.049945831298828125, -0.03849029541015625, -0.027034759521484375, -0.0155792236328125, -0.004123687744140625, 0.00733184814453125, 0.018787384033203125, 0.030242919921875, 0.041698455810546875, 0.05315399169921875, 0.06460952758789062, 0.0760650634765625, 0.08752059936523438, 0.09897613525390625, 0.11043167114257812, 0.12188720703125, 0.13334274291992188, 0.14479827880859375, 0.15625381469726562, 0.1677093505859375, 0.17916488647460938, 0.19062042236328125, 0.20207595825195312, 0.213531494140625, 0.22498703002929688, 0.23644256591796875, 0.24789810180664062, 0.2593536376953125, 0.2708091735839844, 0.28226470947265625, 0.2937202453613281, 0.30517578125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 9.0, 17.0, 17.0, 24.0, 40.0, 43.0, 46.0, 62.0, 96.0, 93.0, 76.0, 73.0, 78.0, 70.0, 52.0, 50.0, 34.0, 31.0, 20.0, 26.0, 19.0, 8.0, 3.0, 4.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.10858154296875, -0.10570144653320312, -0.10282135009765625, -0.09994125366210938, -0.0970611572265625, -0.09418106079101562, -0.09130096435546875, -0.08842086791992188, -0.085540771484375, -0.08266067504882812, -0.07978057861328125, -0.07690048217773438, -0.0740203857421875, -0.07114028930664062, -0.06826019287109375, -0.06538009643554688, -0.0625, -0.059619903564453125, -0.05673980712890625, -0.053859710693359375, -0.0509796142578125, -0.048099517822265625, -0.04521942138671875, -0.042339324951171875, -0.039459228515625, -0.036579132080078125, -0.03369903564453125, -0.030818939208984375, -0.0279388427734375, -0.025058746337890625, -0.02217864990234375, -0.019298553466796875, -0.01641845703125, -0.013538360595703125, -0.01065826416015625, -0.007778167724609375, -0.0048980712890625, -0.002017974853515625, 0.00086212158203125, 0.003742218017578125, 0.006622314453125, 0.009502410888671875, 0.01238250732421875, 0.015262603759765625, 0.0181427001953125, 0.021022796630859375, 0.02390289306640625, 0.026782989501953125, 0.0296630859375, 0.032543182373046875, 0.03542327880859375, 0.038303375244140625, 0.0411834716796875, 0.044063568115234375, 0.04694366455078125, 0.049823760986328125, 0.052703857421875, 0.055583953857421875, 0.05846405029296875, 0.061344146728515625, 0.0642242431640625, 0.06710433959960938, 0.06998443603515625, 0.07286453247070312, 0.07574462890625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 1.0, 1.0, 6.0, 7.0, 9.0, 15.0, 24.0, 40.0, 51.0, 107.0, 188.0, 357.0, 821.0, 1975.0, 7270.0, 42733.0, 875462.0, 3153177.0, 94617.0, 12295.0, 2940.0, 1035.0, 481.0, 263.0, 150.0, 94.0, 52.0, 44.0, 27.0, 11.0, 15.0, 7.0, 4.0, 7.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.235107421875, -0.22576522827148438, -0.21642303466796875, -0.20708084106445312, -0.1977386474609375, -0.18839645385742188, -0.17905426025390625, -0.16971206665039062, -0.160369873046875, -0.15102767944335938, -0.14168548583984375, -0.13234329223632812, -0.1230010986328125, -0.11365890502929688, -0.10431671142578125, -0.09497451782226562, -0.08563232421875, -0.07629013061523438, -0.06694793701171875, -0.057605743408203125, -0.0482635498046875, -0.038921356201171875, -0.02957916259765625, -0.020236968994140625, -0.010894775390625, -0.001552581787109375, 0.00778961181640625, 0.017131805419921875, 0.0264739990234375, 0.035816192626953125, 0.04515838623046875, 0.054500579833984375, 0.0638427734375, 0.07318496704101562, 0.08252716064453125, 0.09186935424804688, 0.1012115478515625, 0.11055374145507812, 0.11989593505859375, 0.12923812866210938, 0.138580322265625, 0.14792251586914062, 0.15726470947265625, 0.16660690307617188, 0.1759490966796875, 0.18529129028320312, 0.19463348388671875, 0.20397567749023438, 0.21331787109375, 0.22266006469726562, 0.23200225830078125, 0.24134445190429688, 0.2506866455078125, 0.2600288391113281, 0.26937103271484375, 0.2787132263183594, 0.288055419921875, 0.2973976135253906, 0.30673980712890625, 0.3160820007324219, 0.3254241943359375, 0.3347663879394531, 0.34410858154296875, 0.3534507751464844, 0.36279296875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 8.0, 4.0, 5.0, 16.0, 25.0, 27.0, 63.0, 118.0, 272.0, 766.0, 1636.0, 651.0, 234.0, 95.0, 62.0, 28.0, 28.0, 13.0, 12.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11785888671875, -0.11303424835205078, -0.10820960998535156, -0.10338497161865234, -0.09856033325195312, -0.0937356948852539, -0.08891105651855469, -0.08408641815185547, -0.07926177978515625, -0.07443714141845703, -0.06961250305175781, -0.0647878646850586, -0.059963226318359375, -0.055138587951660156, -0.05031394958496094, -0.04548931121826172, -0.0406646728515625, -0.03584003448486328, -0.031015396118164062, -0.026190757751464844, -0.021366119384765625, -0.016541481018066406, -0.011716842651367188, -0.006892204284667969, -0.00206756591796875, 0.0027570724487304688, 0.0075817108154296875, 0.012406349182128906, 0.017230987548828125, 0.022055625915527344, 0.026880264282226562, 0.03170490264892578, 0.036529541015625, 0.04135417938232422, 0.04617881774902344, 0.051003456115722656, 0.055828094482421875, 0.060652732849121094, 0.06547737121582031, 0.07030200958251953, 0.07512664794921875, 0.07995128631591797, 0.08477592468261719, 0.0896005630493164, 0.09442520141601562, 0.09924983978271484, 0.10407447814941406, 0.10889911651611328, 0.1137237548828125, 0.11854839324951172, 0.12337303161621094, 0.12819766998291016, 0.13302230834960938, 0.1378469467163086, 0.1426715850830078, 0.14749622344970703, 0.15232086181640625, 0.15714550018310547, 0.1619701385498047, 0.1667947769165039, 0.17161941528320312, 0.17644405364990234, 0.18126869201660156, 0.18609333038330078, 0.19091796875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 21.0, 55.0, 173.0, 318.0, 255.0, 124.0, 39.0, 12.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7482775449752808, -1.7084803581237793, -1.6686832904815674, -1.628886103630066, -1.5890889167785645, -1.549291729927063, -1.5094945430755615, -1.4696974754333496, -1.4299002885818481, -1.3901031017303467, -1.3503060340881348, -1.3105088472366333, -1.2707116603851318, -1.2309144735336304, -1.191117286682129, -1.151320219039917, -1.1115230321884155, -1.071725845336914, -1.0319287776947021, -0.9921315908432007, -0.9523344039916992, -0.9125372171401978, -0.8727400898933411, -0.8329429626464844, -0.7931457757949829, -0.7533485889434814, -0.7135514616966248, -0.6737543344497681, -0.6339571475982666, -0.5941599607467651, -0.5543628334999084, -0.5145657062530518, -0.47476840019226074, -0.43497124314308167, -0.3951740860939026, -0.3553769290447235, -0.31557977199554443, -0.27578261494636536, -0.23598545789718628, -0.1961883008480072, -0.15639114379882812, -0.11659398674964905, -0.07679682970046997, -0.036999672651290894, 0.0027974843978881836, 0.04259464144706726, 0.08239179849624634, 0.12218895554542542, 0.1619861125946045, 0.20178326964378357, 0.24158042669296265, 0.2813775837421417, 0.3211747407913208, 0.3609718978404999, 0.40076905488967896, 0.44056621193885803, 0.4803633689880371, 0.5201605558395386, 0.5599576830863953, 0.599754810333252, 0.6395519971847534, 0.6793491840362549, 0.7191463112831116, 0.7589434385299683, 0.7987406253814697]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 4.0, 4.0, 6.0, 7.0, 7.0, 12.0, 11.0, 19.0, 18.0, 20.0, 25.0, 19.0, 41.0, 39.0, 47.0, 47.0, 40.0, 52.0, 49.0, 46.0, 53.0, 50.0, 48.0, 44.0, 44.0, 37.0, 35.0, 36.0, 33.0, 23.0, 21.0, 18.0, 15.0, 7.0, 7.0, 3.0, 6.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.41998982429504395, -0.4070392847061157, -0.3940887153148651, -0.3811381757259369, -0.3681876063346863, -0.35523706674575806, -0.34228652715682983, -0.3293359577655792, -0.3163853883743286, -0.3034348487854004, -0.2904842793941498, -0.27753373980522156, -0.26458317041397095, -0.2516326308250427, -0.2386820763349533, -0.2257315218448639, -0.21278098225593567, -0.19983042776584625, -0.18687987327575684, -0.1739293336868286, -0.160978764295578, -0.14802822470664978, -0.13507767021656036, -0.12212711572647095, -0.10917656123638153, -0.09622600674629211, -0.0832754522562027, -0.07032490521669388, -0.05737435072660446, -0.044423796236515045, -0.031473249197006226, -0.01852269470691681, -0.005572140216827393, 0.007378412410616875, 0.020328965038061142, 0.03327951580286026, 0.046230070292949677, 0.05918062478303909, 0.07213117182254791, 0.08508172631263733, 0.09803228080272675, 0.11098283529281616, 0.12393338978290558, 0.136883944272995, 0.14983448386192322, 0.16278505325317383, 0.17573559284210205, 0.18868614733219147, 0.20163670182228088, 0.2145872563123703, 0.22753781080245972, 0.24048835039138794, 0.25343891978263855, 0.2663894593715668, 0.2793400287628174, 0.2922905683517456, 0.30524110794067383, 0.31819164752960205, 0.33114221692085266, 0.3440927565097809, 0.3570433259010315, 0.3699938654899597, 0.38294440507888794, 0.39589497447013855, 0.40884554386138916]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 1.0, 3.0, 6.0, 10.0, 11.0, 22.0, 34.0, 83.0, 98.0, 188.0, 353.0, 651.0, 1222.0, 2873.0, 9090.0, 41408.0, 258474.0, 579825.0, 122730.0, 21990.0, 5512.0, 2004.0, 884.0, 462.0, 251.0, 145.0, 90.0, 47.0, 33.0, 15.0, 17.0, 4.0, 8.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.377685546875, -0.3663444519042969, -0.35500335693359375, -0.3436622619628906, -0.3323211669921875, -0.3209800720214844, -0.30963897705078125, -0.2982978820800781, -0.286956787109375, -0.2756156921386719, -0.26427459716796875, -0.2529335021972656, -0.2415924072265625, -0.23025131225585938, -0.21891021728515625, -0.20756912231445312, -0.19622802734375, -0.18488693237304688, -0.17354583740234375, -0.16220474243164062, -0.1508636474609375, -0.13952255249023438, -0.12818145751953125, -0.11684036254882812, -0.105499267578125, -0.09415817260742188, -0.08281707763671875, -0.07147598266601562, -0.0601348876953125, -0.048793792724609375, -0.03745269775390625, -0.026111602783203125, -0.0147705078125, -0.003429412841796875, 0.00791168212890625, 0.019252777099609375, 0.0305938720703125, 0.041934967041015625, 0.05327606201171875, 0.06461715698242188, 0.075958251953125, 0.08729934692382812, 0.09864044189453125, 0.10998153686523438, 0.1213226318359375, 0.13266372680664062, 0.14400482177734375, 0.15534591674804688, 0.16668701171875, 0.17802810668945312, 0.18936920166015625, 0.20071029663085938, 0.2120513916015625, 0.22339248657226562, 0.23473358154296875, 0.24607467651367188, 0.257415771484375, 0.2687568664550781, 0.28009796142578125, 0.2914390563964844, 0.3027801513671875, 0.3141212463378906, 0.32546234130859375, 0.3368034362792969, 0.34814453125]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 6.0, 5.0, 9.0, 17.0, 23.0, 33.0, 43.0, 49.0, 66.0, 83.0, 93.0, 89.0, 81.0, 78.0, 68.0, 55.0, 44.0, 51.0, 29.0, 26.0, 20.0, 15.0, 6.0, 3.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.11236572265625, -0.10947513580322266, -0.10658454895019531, -0.10369396209716797, -0.10080337524414062, -0.09791278839111328, -0.09502220153808594, -0.0921316146850586, -0.08924102783203125, -0.0863504409790039, -0.08345985412597656, -0.08056926727294922, -0.07767868041992188, -0.07478809356689453, -0.07189750671386719, -0.06900691986083984, -0.0661163330078125, -0.06322574615478516, -0.06033515930175781, -0.05744457244873047, -0.054553985595703125, -0.05166339874267578, -0.04877281188964844, -0.045882225036621094, -0.04299163818359375, -0.040101051330566406, -0.03721046447753906, -0.03431987762451172, -0.031429290771484375, -0.02853870391845703, -0.025648117065429688, -0.022757530212402344, -0.019866943359375, -0.016976356506347656, -0.014085769653320312, -0.011195182800292969, -0.008304595947265625, -0.005414009094238281, -0.0025234222412109375, 0.00036716461181640625, 0.00325775146484375, 0.006148338317871094, 0.009038925170898438, 0.011929512023925781, 0.014820098876953125, 0.01771068572998047, 0.020601272583007812, 0.023491859436035156, 0.0263824462890625, 0.029273033142089844, 0.03216361999511719, 0.03505420684814453, 0.037944793701171875, 0.04083538055419922, 0.04372596740722656, 0.046616554260253906, 0.04950714111328125, 0.052397727966308594, 0.05528831481933594, 0.05817890167236328, 0.061069488525390625, 0.06396007537841797, 0.06685066223144531, 0.06974124908447266, 0.0726318359375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 6.0, 6.0, 10.0, 22.0, 36.0, 49.0, 83.0, 129.0, 235.0, 478.0, 1060.0, 2778.0, 8247.0, 30071.0, 132551.0, 447009.0, 321778.0, 77098.0, 18452.0, 5132.0, 1805.0, 725.0, 344.0, 175.0, 104.0, 65.0, 40.0, 25.0, 13.0, 11.0, 7.0, 5.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.258544921875, -0.2509002685546875, -0.243255615234375, -0.2356109619140625, -0.22796630859375, -0.2203216552734375, -0.212677001953125, -0.2050323486328125, -0.1973876953125, -0.1897430419921875, -0.182098388671875, -0.1744537353515625, -0.16680908203125, -0.1591644287109375, -0.151519775390625, -0.1438751220703125, -0.13623046875, -0.1285858154296875, -0.120941162109375, -0.1132965087890625, -0.10565185546875, -0.0980072021484375, -0.090362548828125, -0.0827178955078125, -0.0750732421875, -0.0674285888671875, -0.059783935546875, -0.0521392822265625, -0.04449462890625, -0.0368499755859375, -0.029205322265625, -0.0215606689453125, -0.013916015625, -0.0062713623046875, 0.001373291015625, 0.0090179443359375, 0.01666259765625, 0.0243072509765625, 0.031951904296875, 0.0395965576171875, 0.0472412109375, 0.0548858642578125, 0.062530517578125, 0.0701751708984375, 0.07781982421875, 0.0854644775390625, 0.093109130859375, 0.1007537841796875, 0.1083984375, 0.1160430908203125, 0.123687744140625, 0.1313323974609375, 0.13897705078125, 0.1466217041015625, 0.154266357421875, 0.1619110107421875, 0.1695556640625, 0.1772003173828125, 0.184844970703125, 0.1924896240234375, 0.20013427734375, 0.2077789306640625, 0.215423583984375, 0.2230682373046875, 0.230712890625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 5.0, 4.0, 7.0, 9.0, 9.0, 12.0, 15.0, 17.0, 13.0, 26.0, 32.0, 32.0, 34.0, 53.0, 48.0, 56.0, 48.0, 57.0, 57.0, 44.0, 55.0, 55.0, 52.0, 40.0, 54.0, 33.0, 18.0, 25.0, 26.0, 15.0, 13.0, 9.0, 11.0, 5.0, 3.0, 9.0, 1.0, 7.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2158203125, -0.2062225341796875, -0.196624755859375, -0.1870269775390625, -0.17742919921875, -0.1678314208984375, -0.158233642578125, -0.1486358642578125, -0.1390380859375, -0.1294403076171875, -0.119842529296875, -0.1102447509765625, -0.10064697265625, -0.0910491943359375, -0.081451416015625, -0.0718536376953125, -0.062255859375, -0.0526580810546875, -0.043060302734375, -0.0334625244140625, -0.02386474609375, -0.0142669677734375, -0.004669189453125, 0.0049285888671875, 0.0145263671875, 0.0241241455078125, 0.033721923828125, 0.0433197021484375, 0.05291748046875, 0.0625152587890625, 0.072113037109375, 0.0817108154296875, 0.09130859375, 0.1009063720703125, 0.110504150390625, 0.1201019287109375, 0.12969970703125, 0.1392974853515625, 0.148895263671875, 0.1584930419921875, 0.1680908203125, 0.1776885986328125, 0.187286376953125, 0.1968841552734375, 0.20648193359375, 0.2160797119140625, 0.225677490234375, 0.2352752685546875, 0.244873046875, 0.2544708251953125, 0.264068603515625, 0.2736663818359375, 0.28326416015625, 0.2928619384765625, 0.302459716796875, 0.3120574951171875, 0.3216552734375, 0.3312530517578125, 0.340850830078125, 0.3504486083984375, 0.36004638671875, 0.3696441650390625, 0.379241943359375, 0.3888397216796875, 0.3984375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 5.0, 4.0, 6.0, 8.0, 12.0, 16.0, 17.0, 55.0, 60.0, 80.0, 230.0, 492.0, 1308.0, 4885.0, 31375.0, 543214.0, 434261.0, 26100.0, 4309.0, 1217.0, 434.0, 193.0, 104.0, 60.0, 28.0, 24.0, 18.0, 11.0, 8.0, 4.0, 2.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1741943359375, -0.16856765747070312, -0.16294097900390625, -0.15731430053710938, -0.1516876220703125, -0.14606094360351562, -0.14043426513671875, -0.13480758666992188, -0.129180908203125, -0.12355422973632812, -0.11792755126953125, -0.11230087280273438, -0.1066741943359375, -0.10104751586914062, -0.09542083740234375, -0.08979415893554688, -0.08416748046875, -0.07854080200195312, -0.07291412353515625, -0.06728744506835938, -0.0616607666015625, -0.056034088134765625, -0.05040740966796875, -0.044780731201171875, -0.039154052734375, -0.033527374267578125, -0.02790069580078125, -0.022274017333984375, -0.0166473388671875, -0.011020660400390625, -0.00539398193359375, 0.000232696533203125, 0.005859375, 0.011486053466796875, 0.01711273193359375, 0.022739410400390625, 0.0283660888671875, 0.033992767333984375, 0.03961944580078125, 0.045246124267578125, 0.050872802734375, 0.056499481201171875, 0.06212615966796875, 0.06775283813476562, 0.0733795166015625, 0.07900619506835938, 0.08463287353515625, 0.09025955200195312, 0.09588623046875, 0.10151290893554688, 0.10713958740234375, 0.11276626586914062, 0.1183929443359375, 0.12401962280273438, 0.12964630126953125, 0.13527297973632812, 0.140899658203125, 0.14652633666992188, 0.15215301513671875, 0.15777969360351562, 0.1634063720703125, 0.16903305053710938, 0.17465972900390625, 0.18028640747070312, 0.1859130859375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 4.0, 4.0, 7.0, 8.0, 10.0, 8.0, 15.0, 17.0, 22.0, 31.0, 30.0, 71.0, 117.0, 141.0, 138.0, 102.0, 86.0, 48.0, 34.0, 20.0, 14.0, 22.0, 21.0, 10.0, 7.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.842613220214844e-05, -6.590224802494049e-05, -6.337836384773254e-05, -6.08544796705246e-05, -5.833059549331665e-05, -5.5806711316108704e-05, -5.328282713890076e-05, -5.075894296169281e-05, -4.823505878448486e-05, -4.5711174607276917e-05, -4.318729043006897e-05, -4.066340625286102e-05, -3.8139522075653076e-05, -3.561563789844513e-05, -3.309175372123718e-05, -3.0567869544029236e-05, -2.804398536682129e-05, -2.5520101189613342e-05, -2.2996217012405396e-05, -2.047233283519745e-05, -1.7948448657989502e-05, -1.5424564480781555e-05, -1.2900680303573608e-05, -1.0376796126365662e-05, -7.852911949157715e-06, -5.329027771949768e-06, -2.8051435947418213e-06, -2.812594175338745e-07, 2.2426247596740723e-06, 4.766508936882019e-06, 7.290393114089966e-06, 9.814277291297913e-06, 1.233816146850586e-05, 1.4862045645713806e-05, 1.7385929822921753e-05, 1.99098140001297e-05, 2.2433698177337646e-05, 2.4957582354545593e-05, 2.748146653175354e-05, 3.0005350708961487e-05, 3.2529234886169434e-05, 3.505311906337738e-05, 3.757700324058533e-05, 4.0100887417793274e-05, 4.262477159500122e-05, 4.514865577220917e-05, 4.7672539949417114e-05, 5.019642412662506e-05, 5.272030830383301e-05, 5.5244192481040955e-05, 5.77680766582489e-05, 6.029196083545685e-05, 6.28158450126648e-05, 6.533972918987274e-05, 6.786361336708069e-05, 7.038749754428864e-05, 7.291138172149658e-05, 7.543526589870453e-05, 7.795915007591248e-05, 8.048303425312042e-05, 8.300691843032837e-05, 8.553080260753632e-05, 8.805468678474426e-05, 9.057857096195221e-05, 9.310245513916016e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 6.0, 5.0, 11.0, 14.0, 9.0, 20.0, 25.0, 53.0, 94.0, 124.0, 209.0, 357.0, 788.0, 1621.0, 4190.0, 14382.0, 82731.0, 644509.0, 254851.0, 32089.0, 7429.0, 2659.0, 1117.0, 510.0, 310.0, 164.0, 86.0, 73.0, 34.0, 24.0, 18.0, 9.0, 13.0, 4.0, 7.0, 4.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1329345703125, -0.12874794006347656, -0.12456130981445312, -0.12037467956542969, -0.11618804931640625, -0.11200141906738281, -0.10781478881835938, -0.10362815856933594, -0.0994415283203125, -0.09525489807128906, -0.09106826782226562, -0.08688163757324219, -0.08269500732421875, -0.07850837707519531, -0.07432174682617188, -0.07013511657714844, -0.065948486328125, -0.06176185607910156, -0.057575225830078125, -0.05338859558105469, -0.04920196533203125, -0.04501533508300781, -0.040828704833984375, -0.03664207458496094, -0.0324554443359375, -0.028268814086914062, -0.024082183837890625, -0.019895553588867188, -0.01570892333984375, -0.011522293090820312, -0.007335662841796875, -0.0031490325927734375, 0.00103759765625, 0.0052242279052734375, 0.009410858154296875, 0.013597488403320312, 0.01778411865234375, 0.021970748901367188, 0.026157379150390625, 0.030344009399414062, 0.0345306396484375, 0.03871726989746094, 0.042903900146484375, 0.04709053039550781, 0.05127716064453125, 0.05546379089355469, 0.059650421142578125, 0.06383705139160156, 0.068023681640625, 0.07221031188964844, 0.07639694213867188, 0.08058357238769531, 0.08477020263671875, 0.08895683288574219, 0.09314346313476562, 0.09733009338378906, 0.1015167236328125, 0.10570335388183594, 0.10988998413085938, 0.11407661437988281, 0.11826324462890625, 0.12244987487792969, 0.12663650512695312, 0.13082313537597656, 0.135009765625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 4.0, 8.0, 10.0, 6.0, 27.0, 31.0, 47.0, 96.0, 128.0, 157.0, 139.0, 121.0, 66.0, 67.0, 29.0, 19.0, 24.0, 4.0, 3.0, 0.0, 4.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10101318359375, -0.09693622589111328, -0.09285926818847656, -0.08878231048583984, -0.08470535278320312, -0.0806283950805664, -0.07655143737792969, -0.07247447967529297, -0.06839752197265625, -0.06432056427001953, -0.06024360656738281, -0.056166648864746094, -0.052089691162109375, -0.048012733459472656, -0.04393577575683594, -0.03985881805419922, -0.0357818603515625, -0.03170490264892578, -0.027627944946289062, -0.023550987243652344, -0.019474029541015625, -0.015397071838378906, -0.011320114135742188, -0.007243156433105469, -0.00316619873046875, 0.0009107589721679688, 0.0049877166748046875, 0.009064674377441406, 0.013141632080078125, 0.017218589782714844, 0.021295547485351562, 0.02537250518798828, 0.029449462890625, 0.03352642059326172, 0.03760337829589844, 0.041680335998535156, 0.045757293701171875, 0.049834251403808594, 0.05391120910644531, 0.05798816680908203, 0.06206512451171875, 0.06614208221435547, 0.07021903991699219, 0.0742959976196289, 0.07837295532226562, 0.08244991302490234, 0.08652687072753906, 0.09060382843017578, 0.0946807861328125, 0.09875774383544922, 0.10283470153808594, 0.10691165924072266, 0.11098861694335938, 0.1150655746459961, 0.11914253234863281, 0.12321949005126953, 0.12729644775390625, 0.13137340545654297, 0.1354503631591797, 0.1395273208618164, 0.14360427856445312, 0.14768123626708984, 0.15175819396972656, 0.15583515167236328, 0.159912109375]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 1.0, 6.0, 5.0, 12.0, 19.0, 24.0, 43.0, 64.0, 121.0, 109.0, 146.0, 142.0, 97.0, 86.0, 48.0, 32.0, 21.0, 9.0, 8.0, 2.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.149479627609253, -1.1032607555389404, -1.057041883468628, -1.0108230113983154, -0.9646040797233582, -0.9183852076530457, -0.8721662759780884, -0.8259474039077759, -0.7797285318374634, -0.7335096597671509, -0.6872907876968384, -0.6410718560218811, -0.5948529839515686, -0.5486341118812561, -0.5024151802062988, -0.45619630813598633, -0.40997743606567383, -0.36375856399536133, -0.31753966212272644, -0.27132076025009155, -0.22510188817977905, -0.17888300120830536, -0.13266411423683167, -0.08644521236419678, -0.04022634029388428, 0.0059925466775894165, 0.05221143364906311, 0.0984303206205368, 0.1446492075920105, 0.1908680945634842, 0.23708698153495789, 0.2833058834075928, 0.3295247554779053, 0.3757436275482178, 0.42196252942085266, 0.46818143129348755, 0.5144003033638, 0.5606191754341125, 0.6068381071090698, 0.6530569791793823, 0.6992758512496948, 0.7454947233200073, 0.7917135953903198, 0.8379325270652771, 0.8841513991355896, 0.9303702712059021, 0.9765892028808594, 1.0228080749511719, 1.0690269470214844, 1.1152458190917969, 1.1614646911621094, 1.2076835632324219, 1.2539024353027344, 1.3001214265823364, 1.346340298652649, 1.3925591707229614, 1.438778042793274, 1.4849969148635864, 1.531215786933899, 1.5774346590042114, 1.6236536502838135, 1.669872522354126, 1.7160913944244385, 1.762310266494751, 1.8085291385650635]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 6.0, 5.0, 9.0, 11.0, 8.0, 8.0, 14.0, 13.0, 18.0, 19.0, 20.0, 32.0, 29.0, 37.0, 42.0, 35.0, 32.0, 49.0, 49.0, 41.0, 38.0, 44.0, 55.0, 46.0, 43.0, 52.0, 34.0, 27.0, 33.0, 21.0, 27.0, 24.0, 16.0, 18.0, 14.0, 9.0, 8.0, 10.0, 7.0, 4.0, 1.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.705547571182251, -1.65894615650177, -1.612344741821289, -1.5657432079315186, -1.5191417932510376, -1.4725403785705566, -1.4259389638900757, -1.3793375492095947, -1.3327360153198242, -1.2861346006393433, -1.2395331859588623, -1.1929316520690918, -1.1463302373886108, -1.0997288227081299, -1.053127408027649, -1.006525993347168, -0.9599245190620422, -0.9133231043815613, -0.8667216300964355, -0.8201202154159546, -0.7735187411308289, -0.7269173264503479, -0.6803158521652222, -0.6337144374847412, -0.5871130228042603, -0.5405116081237793, -0.49391013383865356, -0.4473087191581726, -0.4007072448730469, -0.3541058301925659, -0.3075043857097626, -0.26090294122695923, -0.2143014669418335, -0.16770002245903015, -0.1210985854268074, -0.07449714839458466, -0.02789570391178131, 0.018705740571022034, 0.06530717015266418, 0.11190861463546753, 0.15851005911827087, 0.20511150360107422, 0.25171294808387756, 0.2983143925666809, 0.34491580724716187, 0.3915172815322876, 0.43811869621276855, 0.4847201406955719, 0.5313215851783752, 0.5779229998588562, 0.6245244741439819, 0.6711258888244629, 0.7177273631095886, 0.7643287777900696, 0.8109302520751953, 0.8575316667556763, 0.9041330814361572, 0.9507344961166382, 0.9973359704017639, 1.0439374446868896, 1.0905388593673706, 1.1371402740478516, 1.1837416887283325, 1.2303431034088135, 1.276944637298584]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 6.0, 10.0, 3.0, 4.0, 13.0, 13.0, 16.0, 36.0, 37.0, 54.0, 68.0, 99.0, 187.0, 351.0, 622.0, 1223.0, 2665.0, 7349.0, 27075.0, 215813.0, 3771273.0, 136014.0, 21094.0, 6126.0, 2260.0, 946.0, 428.0, 214.0, 125.0, 67.0, 45.0, 21.0, 10.0, 5.0, 8.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.325927734375, -0.3172168731689453, -0.3085060119628906, -0.29979515075683594, -0.29108428955078125, -0.28237342834472656, -0.2736625671386719, -0.2649517059326172, -0.2562408447265625, -0.2475299835205078, -0.23881912231445312, -0.23010826110839844, -0.22139739990234375, -0.21268653869628906, -0.20397567749023438, -0.1952648162841797, -0.186553955078125, -0.1778430938720703, -0.16913223266601562, -0.16042137145996094, -0.15171051025390625, -0.14299964904785156, -0.13428878784179688, -0.1255779266357422, -0.1168670654296875, -0.10815620422363281, -0.09944534301757812, -0.09073448181152344, -0.08202362060546875, -0.07331275939941406, -0.06460189819335938, -0.05589103698730469, -0.04718017578125, -0.03846931457519531, -0.029758453369140625, -0.021047592163085938, -0.01233673095703125, -0.0036258697509765625, 0.005084991455078125, 0.013795852661132812, 0.0225067138671875, 0.031217575073242188, 0.039928436279296875, 0.04863929748535156, 0.05735015869140625, 0.06606101989746094, 0.07477188110351562, 0.08348274230957031, 0.092193603515625, 0.10090446472167969, 0.10961532592773438, 0.11832618713378906, 0.12703704833984375, 0.13574790954589844, 0.14445877075195312, 0.1531696319580078, 0.1618804931640625, 0.1705913543701172, 0.17930221557617188, 0.18801307678222656, 0.19672393798828125, 0.20543479919433594, 0.21414566040039062, 0.2228565216064453, 0.2315673828125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 9.0, 9.0, 10.0, 18.0, 18.0, 21.0, 36.0, 41.0, 60.0, 49.0, 75.0, 80.0, 70.0, 63.0, 74.0, 71.0, 56.0, 47.0, 40.0, 50.0, 23.0, 28.0, 19.0, 10.0, 8.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10504150390625, -0.10227012634277344, -0.09949874877929688, -0.09672737121582031, -0.09395599365234375, -0.09118461608886719, -0.08841323852539062, -0.08564186096191406, -0.0828704833984375, -0.08009910583496094, -0.07732772827148438, -0.07455635070800781, -0.07178497314453125, -0.06901359558105469, -0.06624221801757812, -0.06347084045410156, -0.060699462890625, -0.05792808532714844, -0.055156707763671875, -0.05238533020019531, -0.04961395263671875, -0.04684257507324219, -0.044071197509765625, -0.04129981994628906, -0.0385284423828125, -0.03575706481933594, -0.032985687255859375, -0.030214309692382812, -0.02744293212890625, -0.024671554565429688, -0.021900177001953125, -0.019128799438476562, -0.016357421875, -0.013586044311523438, -0.010814666748046875, -0.008043289184570312, -0.00527191162109375, -0.0025005340576171875, 0.000270843505859375, 0.0030422210693359375, 0.0058135986328125, 0.008584976196289062, 0.011356353759765625, 0.014127731323242188, 0.01689910888671875, 0.019670486450195312, 0.022441864013671875, 0.025213241577148438, 0.027984619140625, 0.030755996704101562, 0.033527374267578125, 0.03629875183105469, 0.03907012939453125, 0.04184150695800781, 0.044612884521484375, 0.04738426208496094, 0.0501556396484375, 0.05292701721191406, 0.055698394775390625, 0.05846977233886719, 0.06124114990234375, 0.06401252746582031, 0.06678390502929688, 0.06955528259277344, 0.07232666015625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 8.0, 2.0, 7.0, 7.0, 17.0, 33.0, 42.0, 70.0, 183.0, 326.0, 746.0, 2039.0, 7123.0, 36687.0, 463111.0, 3503983.0, 153659.0, 19180.0, 4453.0, 1445.0, 573.0, 296.0, 124.0, 73.0, 39.0, 21.0, 14.0, 7.0, 6.0, 8.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1756591796875, -0.16812705993652344, -0.16059494018554688, -0.1530628204345703, -0.14553070068359375, -0.1379985809326172, -0.13046646118164062, -0.12293434143066406, -0.1154022216796875, -0.10787010192871094, -0.10033798217773438, -0.09280586242675781, -0.08527374267578125, -0.07774162292480469, -0.07020950317382812, -0.06267738342285156, -0.055145263671875, -0.04761314392089844, -0.040081024169921875, -0.03254890441894531, -0.02501678466796875, -0.017484664916992188, -0.009952545166015625, -0.0024204254150390625, 0.0051116943359375, 0.012643814086914062, 0.020175933837890625, 0.027708053588867188, 0.03524017333984375, 0.04277229309082031, 0.050304412841796875, 0.05783653259277344, 0.06536865234375, 0.07290077209472656, 0.08043289184570312, 0.08796501159667969, 0.09549713134765625, 0.10302925109863281, 0.11056137084960938, 0.11809349060058594, 0.1256256103515625, 0.13315773010253906, 0.14068984985351562, 0.1482219696044922, 0.15575408935546875, 0.1632862091064453, 0.17081832885742188, 0.17835044860839844, 0.185882568359375, 0.19341468811035156, 0.20094680786132812, 0.2084789276123047, 0.21601104736328125, 0.2235431671142578, 0.23107528686523438, 0.23860740661621094, 0.2461395263671875, 0.25367164611816406, 0.2612037658691406, 0.2687358856201172, 0.27626800537109375, 0.2838001251220703, 0.2913322448730469, 0.29886436462402344, 0.306396484375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 5.0, 0.0, 2.0, 4.0, 7.0, 5.0, 18.0, 13.0, 28.0, 51.0, 89.0, 195.0, 479.0, 1504.0, 1055.0, 315.0, 127.0, 74.0, 38.0, 25.0, 14.0, 15.0, 10.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08538818359375, -0.08208370208740234, -0.07877922058105469, -0.07547473907470703, -0.07217025756835938, -0.06886577606201172, -0.06556129455566406, -0.062256813049316406, -0.05895233154296875, -0.055647850036621094, -0.05234336853027344, -0.04903888702392578, -0.045734405517578125, -0.04242992401123047, -0.03912544250488281, -0.035820960998535156, -0.0325164794921875, -0.029211997985839844, -0.025907516479492188, -0.02260303497314453, -0.019298553466796875, -0.01599407196044922, -0.012689590454101562, -0.009385108947753906, -0.00608062744140625, -0.0027761459350585938, 0.0005283355712890625, 0.0038328170776367188, 0.007137298583984375, 0.010441780090332031, 0.013746261596679688, 0.017050743103027344, 0.020355224609375, 0.023659706115722656, 0.026964187622070312, 0.03026866912841797, 0.033573150634765625, 0.03687763214111328, 0.04018211364746094, 0.043486595153808594, 0.04679107666015625, 0.050095558166503906, 0.05340003967285156, 0.05670452117919922, 0.060009002685546875, 0.06331348419189453, 0.06661796569824219, 0.06992244720458984, 0.0732269287109375, 0.07653141021728516, 0.07983589172363281, 0.08314037322998047, 0.08644485473632812, 0.08974933624267578, 0.09305381774902344, 0.0963582992553711, 0.09966278076171875, 0.1029672622680664, 0.10627174377441406, 0.10957622528076172, 0.11288070678710938, 0.11618518829345703, 0.11948966979980469, 0.12279415130615234, 0.1260986328125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 6.0, 19.0, 77.0, 146.0, 248.0, 246.0, 146.0, 67.0, 32.0, 10.0, 7.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31054216623306274, -0.2850634753704071, -0.2595847547054291, -0.23410606384277344, -0.2086273580789566, -0.18314865231513977, -0.15766996145248413, -0.1321912556886673, -0.10671254992485046, -0.08123384416103363, -0.055755145847797394, -0.030276447534561157, -0.004797741770744324, 0.02068096399307251, 0.04615965485572815, 0.07163836061954498, 0.09711706638336182, 0.12259577214717865, 0.14807447791099548, 0.17355316877365112, 0.19903187453746796, 0.2245105803012848, 0.24998927116394043, 0.27546799182891846, 0.3009466826915741, 0.32642537355422974, 0.35190409421920776, 0.3773827850818634, 0.40286147594451904, 0.42834019660949707, 0.4538188874721527, 0.47929757833480835, 0.5047763586044312, 0.5302550792694092, 0.5557337403297424, 0.5812124609947205, 0.6066911816596985, 0.6321698427200317, 0.6576485633850098, 0.6831272840499878, 0.7086060047149658, 0.7340847253799438, 0.7595633864402771, 0.7850421071052551, 0.8105208277702332, 0.8359994888305664, 0.8614782094955444, 0.8869569301605225, 0.9124355912208557, 0.9379143118858337, 0.963392972946167, 0.988871693611145, 1.014350414276123, 1.039829134941101, 1.065307855606079, 1.0907864570617676, 1.1162651777267456, 1.1417438983917236, 1.1672226190567017, 1.1927013397216797, 1.2181799411773682, 1.2436586618423462, 1.2691373825073242, 1.2946161031723022, 1.3200948238372803]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 5.0, 8.0, 6.0, 7.0, 9.0, 15.0, 17.0, 14.0, 11.0, 16.0, 17.0, 23.0, 22.0, 33.0, 31.0, 34.0, 44.0, 35.0, 49.0, 50.0, 42.0, 56.0, 47.0, 41.0, 49.0, 40.0, 33.0, 30.0, 31.0, 30.0, 33.0, 17.0, 23.0, 15.0, 15.0, 17.0, 12.0, 8.0, 2.0, 5.0, 4.0, 1.0, 5.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20412296056747437, -0.1965848058462143, -0.18904663622379303, -0.18150848150253296, -0.1739703118801117, -0.16643215715885162, -0.15889400243759155, -0.1513558328151703, -0.14381766319274902, -0.13627950847148895, -0.1287413388490677, -0.12120318412780762, -0.11366501450538635, -0.10612685978412628, -0.09858869761228561, -0.09105053544044495, -0.08351238071918488, -0.07597421854734421, -0.06843605637550354, -0.06089789792895317, -0.0533597357571125, -0.045821573585271835, -0.038283415138721466, -0.0307452529668808, -0.02320709079504013, -0.015668928623199463, -0.008130768314003944, -0.0005926080048084259, 0.006945554167032242, 0.01448371633887291, 0.02202187478542328, 0.029560036957263947, 0.037098199129104614, 0.04463636130094528, 0.05217452347278595, 0.05971268191933632, 0.06725084781646729, 0.07478900253772736, 0.08232716470956802, 0.08986532688140869, 0.09740348905324936, 0.10494165122509003, 0.1124798133969307, 0.12001797556877136, 0.12755613029003143, 0.1350942999124527, 0.14263245463371277, 0.15017062425613403, 0.1577087789773941, 0.16524693369865417, 0.17278510332107544, 0.1803232580423355, 0.18786142766475677, 0.19539958238601685, 0.2029377520084381, 0.21047590672969818, 0.21801406145095825, 0.22555221617221832, 0.2330903857946396, 0.24062854051589966, 0.24816671013832092, 0.2557048797607422, 0.26324301958084106, 0.27078118920326233, 0.2783193588256836]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 4.0, 9.0, 14.0, 16.0, 40.0, 58.0, 75.0, 109.0, 209.0, 262.0, 530.0, 927.0, 1849.0, 3996.0, 9714.0, 28754.0, 94770.0, 312146.0, 397775.0, 134595.0, 39738.0, 12976.0, 4975.0, 2235.0, 1173.0, 628.0, 350.0, 204.0, 145.0, 91.0, 64.0, 30.0, 26.0, 16.0, 15.0, 9.0, 6.0, 8.0, 4.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2247314453125, -0.21727561950683594, -0.20981979370117188, -0.2023639678955078, -0.19490814208984375, -0.1874523162841797, -0.17999649047851562, -0.17254066467285156, -0.1650848388671875, -0.15762901306152344, -0.15017318725585938, -0.1427173614501953, -0.13526153564453125, -0.1278057098388672, -0.12034988403320312, -0.11289405822753906, -0.105438232421875, -0.09798240661621094, -0.09052658081054688, -0.08307075500488281, -0.07561492919921875, -0.06815910339355469, -0.060703277587890625, -0.05324745178222656, -0.0457916259765625, -0.03833580017089844, -0.030879974365234375, -0.023424148559570312, -0.01596832275390625, -0.008512496948242188, -0.001056671142578125, 0.0063991546630859375, 0.01385498046875, 0.021310806274414062, 0.028766632080078125, 0.03622245788574219, 0.04367828369140625, 0.05113410949707031, 0.058589935302734375, 0.06604576110839844, 0.0735015869140625, 0.08095741271972656, 0.08841323852539062, 0.09586906433105469, 0.10332489013671875, 0.11078071594238281, 0.11823654174804688, 0.12569236755371094, 0.133148193359375, 0.14060401916503906, 0.14805984497070312, 0.1555156707763672, 0.16297149658203125, 0.1704273223876953, 0.17788314819335938, 0.18533897399902344, 0.1927947998046875, 0.20025062561035156, 0.20770645141601562, 0.2151622772216797, 0.22261810302734375, 0.2300739288330078, 0.23752975463867188, 0.24498558044433594, 0.25244140625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 14.0, 5.0, 14.0, 16.0, 22.0, 36.0, 32.0, 58.0, 58.0, 75.0, 63.0, 82.0, 69.0, 67.0, 75.0, 56.0, 50.0, 44.0, 43.0, 33.0, 23.0, 20.0, 16.0, 8.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10565185546875, -0.10288715362548828, -0.10012245178222656, -0.09735774993896484, -0.09459304809570312, -0.0918283462524414, -0.08906364440917969, -0.08629894256591797, -0.08353424072265625, -0.08076953887939453, -0.07800483703613281, -0.0752401351928711, -0.07247543334960938, -0.06971073150634766, -0.06694602966308594, -0.06418132781982422, -0.0614166259765625, -0.05865192413330078, -0.05588722229003906, -0.053122520446777344, -0.050357818603515625, -0.047593116760253906, -0.04482841491699219, -0.04206371307373047, -0.03929901123046875, -0.03653430938720703, -0.03376960754394531, -0.031004905700683594, -0.028240203857421875, -0.025475502014160156, -0.022710800170898438, -0.01994609832763672, -0.017181396484375, -0.014416694641113281, -0.011651992797851562, -0.008887290954589844, -0.006122589111328125, -0.0033578872680664062, -0.0005931854248046875, 0.0021715164184570312, 0.00493621826171875, 0.007700920104980469, 0.010465621948242188, 0.013230323791503906, 0.015995025634765625, 0.018759727478027344, 0.021524429321289062, 0.02428913116455078, 0.0270538330078125, 0.02981853485107422, 0.03258323669433594, 0.035347938537597656, 0.038112640380859375, 0.040877342224121094, 0.04364204406738281, 0.04640674591064453, 0.04917144775390625, 0.05193614959716797, 0.05470085144042969, 0.057465553283691406, 0.060230255126953125, 0.06299495697021484, 0.06575965881347656, 0.06852436065673828, 0.0712890625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 4.0, 7.0, 7.0, 16.0, 16.0, 20.0, 28.0, 30.0, 51.0, 73.0, 99.0, 148.0, 185.0, 302.0, 505.0, 768.0, 1515.0, 3334.0, 8080.0, 21790.0, 64469.0, 177732.0, 347298.0, 261332.0, 103074.0, 35495.0, 12355.0, 4863.0, 2116.0, 1076.0, 632.0, 374.0, 235.0, 158.0, 114.0, 78.0, 47.0, 37.0, 25.0, 17.0, 14.0, 14.0, 5.0, 5.0, 5.0, 1.0, 5.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1611328125, -0.1560535430908203, -0.15097427368164062, -0.14589500427246094, -0.14081573486328125, -0.13573646545410156, -0.13065719604492188, -0.1255779266357422, -0.1204986572265625, -0.11541938781738281, -0.11034011840820312, -0.10526084899902344, -0.10018157958984375, -0.09510231018066406, -0.09002304077148438, -0.08494377136230469, -0.079864501953125, -0.07478523254394531, -0.06970596313476562, -0.06462669372558594, -0.05954742431640625, -0.05446815490722656, -0.049388885498046875, -0.04430961608886719, -0.0392303466796875, -0.03415107727050781, -0.029071807861328125, -0.023992538452148438, -0.01891326904296875, -0.013833999633789062, -0.008754730224609375, -0.0036754608154296875, 0.00140380859375, 0.0064830780029296875, 0.011562347412109375, 0.016641616821289062, 0.02172088623046875, 0.026800155639648438, 0.031879425048828125, 0.03695869445800781, 0.0420379638671875, 0.04711723327636719, 0.052196502685546875, 0.05727577209472656, 0.06235504150390625, 0.06743431091308594, 0.07251358032226562, 0.07759284973144531, 0.082672119140625, 0.08775138854980469, 0.09283065795898438, 0.09790992736816406, 0.10298919677734375, 0.10806846618652344, 0.11314773559570312, 0.11822700500488281, 0.1233062744140625, 0.1283855438232422, 0.13346481323242188, 0.13854408264160156, 0.14362335205078125, 0.14870262145996094, 0.15378189086914062, 0.1588611602783203, 0.1639404296875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 4.0, 2.0, 8.0, 15.0, 6.0, 15.0, 12.0, 18.0, 21.0, 16.0, 20.0, 33.0, 36.0, 33.0, 33.0, 37.0, 37.0, 35.0, 43.0, 53.0, 47.0, 36.0, 48.0, 46.0, 33.0, 42.0, 43.0, 38.0, 32.0, 34.0, 24.0, 19.0, 6.0, 16.0, 10.0, 7.0, 16.0, 7.0, 8.0, 5.0, 2.0, 2.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.277587890625, -0.26958656311035156, -0.2615852355957031, -0.2535839080810547, -0.24558258056640625, -0.2375812530517578, -0.22957992553710938, -0.22157859802246094, -0.2135772705078125, -0.20557594299316406, -0.19757461547851562, -0.1895732879638672, -0.18157196044921875, -0.1735706329345703, -0.16556930541992188, -0.15756797790527344, -0.149566650390625, -0.14156532287597656, -0.13356399536132812, -0.1255626678466797, -0.11756134033203125, -0.10956001281738281, -0.10155868530273438, -0.09355735778808594, -0.0855560302734375, -0.07755470275878906, -0.06955337524414062, -0.06155204772949219, -0.05355072021484375, -0.04554939270019531, -0.037548065185546875, -0.029546737670898438, -0.02154541015625, -0.013544082641601562, -0.005542755126953125, 0.0024585723876953125, 0.01045989990234375, 0.018461227416992188, 0.026462554931640625, 0.03446388244628906, 0.0424652099609375, 0.05046653747558594, 0.058467864990234375, 0.06646919250488281, 0.07447052001953125, 0.08247184753417969, 0.09047317504882812, 0.09847450256347656, 0.106475830078125, 0.11447715759277344, 0.12247848510742188, 0.1304798126220703, 0.13848114013671875, 0.1464824676513672, 0.15448379516601562, 0.16248512268066406, 0.1704864501953125, 0.17848777770996094, 0.18648910522460938, 0.1944904327392578, 0.20249176025390625, 0.2104930877685547, 0.21849441528320312, 0.22649574279785156, 0.2344970703125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 2.0, 5.0, 8.0, 10.0, 24.0, 48.0, 94.0, 181.0, 380.0, 939.0, 2723.0, 10868.0, 61434.0, 543986.0, 373644.0, 42572.0, 8081.0, 2211.0, 715.0, 308.0, 139.0, 85.0, 40.0, 27.0, 14.0, 6.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11126708984375, -0.10679912567138672, -0.10233116149902344, -0.09786319732666016, -0.09339523315429688, -0.0889272689819336, -0.08445930480957031, -0.07999134063720703, -0.07552337646484375, -0.07105541229248047, -0.06658744812011719, -0.062119483947753906, -0.057651519775390625, -0.053183555603027344, -0.04871559143066406, -0.04424762725830078, -0.0397796630859375, -0.03531169891357422, -0.030843734741210938, -0.026375770568847656, -0.021907806396484375, -0.017439842224121094, -0.012971878051757812, -0.008503913879394531, -0.00403594970703125, 0.00043201446533203125, 0.0048999786376953125, 0.009367942810058594, 0.013835906982421875, 0.018303871154785156, 0.022771835327148438, 0.02723979949951172, 0.031707763671875, 0.03617572784423828, 0.04064369201660156, 0.045111656188964844, 0.049579620361328125, 0.054047584533691406, 0.05851554870605469, 0.06298351287841797, 0.06745147705078125, 0.07191944122314453, 0.07638740539550781, 0.0808553695678711, 0.08532333374023438, 0.08979129791259766, 0.09425926208496094, 0.09872722625732422, 0.1031951904296875, 0.10766315460205078, 0.11213111877441406, 0.11659908294677734, 0.12106704711914062, 0.1255350112915039, 0.1300029754638672, 0.13447093963623047, 0.13893890380859375, 0.14340686798095703, 0.1478748321533203, 0.1523427963256836, 0.15681076049804688, 0.16127872467041016, 0.16574668884277344, 0.17021465301513672, 0.1746826171875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 3.0, 1.0, 3.0, 11.0, 14.0, 10.0, 12.0, 22.0, 18.0, 23.0, 35.0, 43.0, 51.0, 108.0, 93.0, 108.0, 108.0, 71.0, 53.0, 38.0, 38.0, 29.0, 27.0, 20.0, 15.0, 12.0, 9.0, 9.0, 4.0, 7.0, 6.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.230043411254883e-05, -6.975512951612473e-05, -6.720982491970062e-05, -6.466452032327652e-05, -6.211921572685242e-05, -5.9573911130428314e-05, -5.702860653400421e-05, -5.448330193758011e-05, -5.1937997341156006e-05, -4.93926927447319e-05, -4.68473881483078e-05, -4.43020835518837e-05, -4.1756778955459595e-05, -3.921147435903549e-05, -3.666616976261139e-05, -3.4120865166187286e-05, -3.1575560569763184e-05, -2.903025597333908e-05, -2.6484951376914978e-05, -2.3939646780490875e-05, -2.1394342184066772e-05, -1.884903758764267e-05, -1.6303732991218567e-05, -1.3758428394794464e-05, -1.1213123798370361e-05, -8.667819201946259e-06, -6.122514605522156e-06, -3.577210009098053e-06, -1.0319054126739502e-06, 1.5133991837501526e-06, 4.058703780174255e-06, 6.604008376598358e-06, 9.149312973022461e-06, 1.1694617569446564e-05, 1.4239922165870667e-05, 1.678522676229477e-05, 1.9330531358718872e-05, 2.1875835955142975e-05, 2.4421140551567078e-05, 2.696644514799118e-05, 2.9511749744415283e-05, 3.2057054340839386e-05, 3.460235893726349e-05, 3.714766353368759e-05, 3.9692968130111694e-05, 4.22382727265358e-05, 4.47835773229599e-05, 4.7328881919384e-05, 4.9874186515808105e-05, 5.241949111223221e-05, 5.496479570865631e-05, 5.7510100305080414e-05, 6.0055404901504517e-05, 6.260070949792862e-05, 6.514601409435272e-05, 6.769131869077682e-05, 7.023662328720093e-05, 7.278192788362503e-05, 7.532723248004913e-05, 7.787253707647324e-05, 8.041784167289734e-05, 8.296314626932144e-05, 8.550845086574554e-05, 8.805375546216965e-05, 9.059906005859375e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 3.0, 8.0, 12.0, 11.0, 23.0, 22.0, 27.0, 37.0, 41.0, 64.0, 102.0, 179.0, 320.0, 559.0, 1092.0, 2309.0, 5470.0, 15569.0, 52849.0, 245615.0, 545436.0, 128936.0, 32111.0, 10299.0, 3841.0, 1631.0, 818.0, 491.0, 232.0, 161.0, 103.0, 61.0, 28.0, 28.0, 20.0, 14.0, 11.0, 13.0, 4.0, 3.0, 0.0, 4.0, 3.0, 1.0, 0.0, 3.0, 1.0, 2.0], "bins": [-0.11834716796875, -0.11508750915527344, -0.11182785034179688, -0.10856819152832031, -0.10530853271484375, -0.10204887390136719, -0.09878921508789062, -0.09552955627441406, -0.0922698974609375, -0.08901023864746094, -0.08575057983398438, -0.08249092102050781, -0.07923126220703125, -0.07597160339355469, -0.07271194458007812, -0.06945228576660156, -0.066192626953125, -0.06293296813964844, -0.059673309326171875, -0.05641365051269531, -0.05315399169921875, -0.04989433288574219, -0.046634674072265625, -0.04337501525878906, -0.0401153564453125, -0.03685569763183594, -0.033596038818359375, -0.030336380004882812, -0.02707672119140625, -0.023817062377929688, -0.020557403564453125, -0.017297744750976562, -0.0140380859375, -0.010778427124023438, -0.007518768310546875, -0.0042591094970703125, -0.00099945068359375, 0.0022602081298828125, 0.005519866943359375, 0.008779525756835938, 0.0120391845703125, 0.015298843383789062, 0.018558502197265625, 0.021818161010742188, 0.02507781982421875, 0.028337478637695312, 0.031597137451171875, 0.03485679626464844, 0.038116455078125, 0.04137611389160156, 0.044635772705078125, 0.04789543151855469, 0.05115509033203125, 0.05441474914550781, 0.057674407958984375, 0.06093406677246094, 0.0641937255859375, 0.06745338439941406, 0.07071304321289062, 0.07397270202636719, 0.07723236083984375, 0.08049201965332031, 0.08375167846679688, 0.08701133728027344, 0.09027099609375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 3.0, 15.0, 12.0, 10.0, 15.0, 25.0, 53.0, 49.0, 68.0, 86.0, 134.0, 131.0, 115.0, 93.0, 62.0, 50.0, 31.0, 13.0, 16.0, 6.0, 4.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.159423828125, -0.15544986724853516, -0.1514759063720703, -0.14750194549560547, -0.14352798461914062, -0.13955402374267578, -0.13558006286621094, -0.1316061019897461, -0.12763214111328125, -0.1236581802368164, -0.11968421936035156, -0.11571025848388672, -0.11173629760742188, -0.10776233673095703, -0.10378837585449219, -0.09981441497802734, -0.0958404541015625, -0.09186649322509766, -0.08789253234863281, -0.08391857147216797, -0.07994461059570312, -0.07597064971923828, -0.07199668884277344, -0.0680227279663086, -0.06404876708984375, -0.060074806213378906, -0.05610084533691406, -0.05212688446044922, -0.048152923583984375, -0.04417896270751953, -0.04020500183105469, -0.036231040954589844, -0.032257080078125, -0.028283119201660156, -0.024309158325195312, -0.02033519744873047, -0.016361236572265625, -0.012387275695800781, -0.008413314819335938, -0.004439353942871094, -0.00046539306640625, 0.0035085678100585938, 0.0074825286865234375, 0.011456489562988281, 0.015430450439453125, 0.01940441131591797, 0.023378372192382812, 0.027352333068847656, 0.0313262939453125, 0.035300254821777344, 0.03927421569824219, 0.04324817657470703, 0.047222137451171875, 0.05119609832763672, 0.05517005920410156, 0.059144020080566406, 0.06311798095703125, 0.0670919418334961, 0.07106590270996094, 0.07503986358642578, 0.07901382446289062, 0.08298778533935547, 0.08696174621582031, 0.09093570709228516, 0.09490966796875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 6.0, 11.0, 30.0, 72.0, 133.0, 234.0, 239.0, 145.0, 78.0, 34.0, 9.0, 6.0, 1.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3133618831634521, -1.232060194015503, -1.1507583856582642, -1.0694565773010254, -0.9881548881530762, -0.9068531394004822, -0.8255513906478882, -0.7442496418952942, -0.6629478931427002, -0.5816461443901062, -0.5003443956375122, -0.4190426468849182, -0.3377408981323242, -0.2564391493797302, -0.17513740062713623, -0.09383565187454224, -0.012533903121948242, 0.06876784563064575, 0.15006959438323975, 0.23137134313583374, 0.31267309188842773, 0.39397484064102173, 0.4752765893936157, 0.5565783381462097, 0.6378800868988037, 0.7191818356513977, 0.8004835844039917, 0.8817853331565857, 0.9630870819091797, 1.044388771057129, 1.1256905794143677, 1.2069923877716064, 1.2882943153381348, 1.369596004486084, 1.4508978128433228, 1.5321996212005615, 1.6135013103485107, 1.69480299949646, 1.7761048078536987, 1.8574066162109375, 1.9387083053588867, 2.020009994506836, 2.101311683654785, 2.1826136112213135, 2.2639153003692627, 2.345216989517212, 2.4265189170837402, 2.5078206062316895, 2.5891222953796387, 2.670423984527588, 2.751725673675537, 2.8330276012420654, 2.9143292903900146, 2.995630979537964, 3.076932907104492, 3.1582345962524414, 3.2395362854003906, 3.32083797454834, 3.402139663696289, 3.4834415912628174, 3.5647432804107666, 3.646044969558716, 3.727346897125244, 3.8086485862731934, 3.8899502754211426]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 5.0, 3.0, 8.0, 6.0, 16.0, 6.0, 12.0, 25.0, 26.0, 26.0, 26.0, 33.0, 30.0, 27.0, 27.0, 29.0, 37.0, 51.0, 49.0, 46.0, 46.0, 41.0, 44.0, 41.0, 45.0, 38.0, 32.0, 24.0, 36.0, 27.0, 16.0, 18.0, 21.0, 14.0, 14.0, 9.0, 10.0, 9.0, 5.0, 4.0, 5.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.3588221073150635, -1.3138513565063477, -1.2688804864883423, -1.2239097356796265, -1.178938865661621, -1.1339681148529053, -1.0889973640441895, -1.0440266132354736, -0.9990557432174683, -0.9540849328041077, -0.9091141223907471, -0.8641433715820312, -0.8191725611686707, -0.7742017507553101, -0.7292309999465942, -0.6842601895332336, -0.639289379119873, -0.5943185687065125, -0.5493477582931519, -0.504377007484436, -0.45940619707107544, -0.41443538665771484, -0.36946460604667664, -0.3244938254356384, -0.27952301502227783, -0.23455221951007843, -0.18958142399787903, -0.14461062848567963, -0.09963983297348022, -0.05466903746128082, -0.009698241949081421, 0.03527253866195679, 0.08024322986602783, 0.12521402537822723, 0.17018482089042664, 0.21515561640262604, 0.26012641191482544, 0.30509722232818604, 0.35006800293922424, 0.39503878355026245, 0.44000959396362305, 0.48498040437698364, 0.5299512147903442, 0.5749219655990601, 0.6198927760124207, 0.6648635864257812, 0.7098343372344971, 0.7548051476478577, 0.7997759580612183, 0.8447467684745789, 0.8897175788879395, 0.9346883296966553, 0.9796591401100159, 1.0246299505233765, 1.0696007013320923, 1.1145715713500977, 1.1595423221588135, 1.2045130729675293, 1.2494839429855347, 1.2944546937942505, 1.3394255638122559, 1.3843963146209717, 1.4293670654296875, 1.4743378162384033, 1.5193086862564087]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 5.0, 4.0, 9.0, 7.0, 11.0, 11.0, 21.0, 33.0, 46.0, 76.0, 97.0, 176.0, 237.0, 435.0, 797.0, 1538.0, 4005.0, 11420.0, 52770.0, 1684934.0, 2362533.0, 56290.0, 11832.0, 3956.0, 1517.0, 676.0, 368.0, 198.0, 110.0, 60.0, 40.0, 27.0, 10.0, 11.0, 13.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0], "bins": [-0.346923828125, -0.3386669158935547, -0.3304100036621094, -0.32215309143066406, -0.31389617919921875, -0.30563926696777344, -0.2973823547363281, -0.2891254425048828, -0.2808685302734375, -0.2726116180419922, -0.2643547058105469, -0.25609779357910156, -0.24784088134765625, -0.23958396911621094, -0.23132705688476562, -0.2230701446533203, -0.214813232421875, -0.2065563201904297, -0.19829940795898438, -0.19004249572753906, -0.18178558349609375, -0.17352867126464844, -0.16527175903320312, -0.1570148468017578, -0.1487579345703125, -0.1405010223388672, -0.13224411010742188, -0.12398719787597656, -0.11573028564453125, -0.10747337341308594, -0.09921646118164062, -0.09095954895019531, -0.08270263671875, -0.07444572448730469, -0.06618881225585938, -0.05793190002441406, -0.04967498779296875, -0.04141807556152344, -0.033161163330078125, -0.024904251098632812, -0.0166473388671875, -0.008390426635742188, -0.000133514404296875, 0.008123397827148438, 0.01638031005859375, 0.024637222290039062, 0.032894134521484375, 0.04115104675292969, 0.049407958984375, 0.05766487121582031, 0.06592178344726562, 0.07417869567871094, 0.08243560791015625, 0.09069252014160156, 0.09894943237304688, 0.10720634460449219, 0.1154632568359375, 0.12372016906738281, 0.13197708129882812, 0.14023399353027344, 0.14849090576171875, 0.15674781799316406, 0.16500473022460938, 0.1732616424560547, 0.1815185546875]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 6.0, 8.0, 6.0, 14.0, 16.0, 18.0, 22.0, 29.0, 32.0, 52.0, 56.0, 59.0, 76.0, 63.0, 65.0, 59.0, 59.0, 66.0, 55.0, 60.0, 43.0, 30.0, 42.0, 22.0, 14.0, 3.0, 6.0, 9.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1090087890625, -0.10617256164550781, -0.10333633422851562, -0.10050010681152344, -0.09766387939453125, -0.09482765197753906, -0.09199142456054688, -0.08915519714355469, -0.0863189697265625, -0.08348274230957031, -0.08064651489257812, -0.07781028747558594, -0.07497406005859375, -0.07213783264160156, -0.06930160522460938, -0.06646537780761719, -0.063629150390625, -0.06079292297363281, -0.057956695556640625, -0.05512046813964844, -0.05228424072265625, -0.04944801330566406, -0.046611785888671875, -0.04377555847167969, -0.0409393310546875, -0.03810310363769531, -0.035266876220703125, -0.03243064880371094, -0.02959442138671875, -0.026758193969726562, -0.023921966552734375, -0.021085739135742188, -0.01824951171875, -0.015413284301757812, -0.012577056884765625, -0.009740829467773438, -0.00690460205078125, -0.0040683746337890625, -0.001232147216796875, 0.0016040802001953125, 0.0044403076171875, 0.0072765350341796875, 0.010112762451171875, 0.012948989868164062, 0.01578521728515625, 0.018621444702148438, 0.021457672119140625, 0.024293899536132812, 0.027130126953125, 0.029966354370117188, 0.032802581787109375, 0.03563880920410156, 0.03847503662109375, 0.04131126403808594, 0.044147491455078125, 0.04698371887207031, 0.0498199462890625, 0.05265617370605469, 0.055492401123046875, 0.05832862854003906, 0.06116485595703125, 0.06400108337402344, 0.06683731079101562, 0.06967353820800781, 0.072509765625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 6.0, 7.0, 9.0, 20.0, 40.0, 92.0, 224.0, 613.0, 1562.0, 5945.0, 36917.0, 1093728.0, 2984976.0, 58307.0, 8268.0, 2154.0, 828.0, 349.0, 130.0, 60.0, 30.0, 13.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.298095703125, -0.2890892028808594, -0.28008270263671875, -0.2710762023925781, -0.2620697021484375, -0.2530632019042969, -0.24405670166015625, -0.23505020141601562, -0.226043701171875, -0.21703720092773438, -0.20803070068359375, -0.19902420043945312, -0.1900177001953125, -0.18101119995117188, -0.17200469970703125, -0.16299819946289062, -0.15399169921875, -0.14498519897460938, -0.13597869873046875, -0.12697219848632812, -0.1179656982421875, -0.10895919799804688, -0.09995269775390625, -0.09094619750976562, -0.081939697265625, -0.07293319702148438, -0.06392669677734375, -0.054920196533203125, -0.0459136962890625, -0.036907196044921875, -0.02790069580078125, -0.018894195556640625, -0.0098876953125, -0.000881195068359375, 0.00812530517578125, 0.017131805419921875, 0.0261383056640625, 0.035144805908203125, 0.04415130615234375, 0.053157806396484375, 0.062164306640625, 0.07117080688476562, 0.08017730712890625, 0.08918380737304688, 0.0981903076171875, 0.10719680786132812, 0.11620330810546875, 0.12520980834960938, 0.13421630859375, 0.14322280883789062, 0.15222930908203125, 0.16123580932617188, 0.1702423095703125, 0.17924880981445312, 0.18825531005859375, 0.19726181030273438, 0.206268310546875, 0.21527481079101562, 0.22428131103515625, 0.23328781127929688, 0.2422943115234375, 0.2513008117675781, 0.26030731201171875, 0.2693138122558594, 0.2783203125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 9.0, 4.0, 10.0, 5.0, 12.0, 19.0, 31.0, 55.0, 88.0, 177.0, 480.0, 1281.0, 1109.0, 387.0, 173.0, 72.0, 51.0, 24.0, 19.0, 22.0, 15.0, 5.0, 6.0, 6.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0904541015625, -0.08709716796875, -0.083740234375, -0.08038330078125, -0.0770263671875, -0.07366943359375, -0.0703125, -0.06695556640625, -0.0635986328125, -0.06024169921875, -0.056884765625, -0.05352783203125, -0.0501708984375, -0.04681396484375, -0.04345703125, -0.04010009765625, -0.0367431640625, -0.03338623046875, -0.030029296875, -0.02667236328125, -0.0233154296875, -0.01995849609375, -0.0166015625, -0.01324462890625, -0.0098876953125, -0.00653076171875, -0.003173828125, 0.00018310546875, 0.0035400390625, 0.00689697265625, 0.01025390625, 0.01361083984375, 0.0169677734375, 0.02032470703125, 0.023681640625, 0.02703857421875, 0.0303955078125, 0.03375244140625, 0.037109375, 0.04046630859375, 0.0438232421875, 0.04718017578125, 0.050537109375, 0.05389404296875, 0.0572509765625, 0.06060791015625, 0.06396484375, 0.06732177734375, 0.0706787109375, 0.07403564453125, 0.077392578125, 0.08074951171875, 0.0841064453125, 0.08746337890625, 0.0908203125, 0.09417724609375, 0.0975341796875, 0.10089111328125, 0.104248046875, 0.10760498046875, 0.1109619140625, 0.11431884765625, 0.11767578125, 0.12103271484375, 0.1243896484375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 5.0, 8.0, 21.0, 49.0, 121.0, 202.0, 266.0, 177.0, 105.0, 31.0, 12.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9393589496612549, -0.9111850261688232, -0.8830111622810364, -0.8548372983932495, -0.8266633749008179, -0.7984894514083862, -0.7703155875205994, -0.7421417236328125, -0.7139678001403809, -0.6857938766479492, -0.6576200127601624, -0.6294461488723755, -0.6012722253799438, -0.5730983018875122, -0.5449244379997253, -0.5167505741119385, -0.48857665061950684, -0.4604027569293976, -0.43222886323928833, -0.4040549695491791, -0.3758810758590698, -0.34770718216896057, -0.3195332884788513, -0.29135939478874207, -0.2631855010986328, -0.23501160740852356, -0.2068377137184143, -0.17866382002830505, -0.1504899263381958, -0.12231603264808655, -0.0941421389579773, -0.06596824526786804, -0.037794411182403564, -0.009620517492294312, 0.01855337619781494, 0.046727269887924194, 0.07490116357803345, 0.1030750572681427, 0.13124895095825195, 0.1594228446483612, 0.18759673833847046, 0.2157706320285797, 0.24394452571868896, 0.2721184194087982, 0.30029231309890747, 0.3284662067890167, 0.356640100479126, 0.38481399416923523, 0.4129878878593445, 0.44116178154945374, 0.469335675239563, 0.49750956892967224, 0.5256834626197815, 0.5538573265075684, 0.58203125, 0.6102051734924316, 0.6383790373802185, 0.6665529012680054, 0.694726824760437, 0.7229007482528687, 0.7510746121406555, 0.7792484760284424, 0.807422399520874, 0.8355963230133057, 0.8637701869010925]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 6.0, 3.0, 9.0, 7.0, 18.0, 13.0, 13.0, 15.0, 24.0, 27.0, 30.0, 34.0, 42.0, 31.0, 33.0, 36.0, 48.0, 45.0, 34.0, 48.0, 43.0, 32.0, 38.0, 37.0, 41.0, 31.0, 27.0, 36.0, 43.0, 30.0, 24.0, 21.0, 20.0, 11.0, 8.0, 10.0, 8.0, 5.0, 3.0, 3.0, 4.0, 1.0, 3.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 3.0], "bins": [-0.31077879667282104, -0.3014974594116211, -0.29221612215042114, -0.2829347550868988, -0.27365341782569885, -0.2643720805644989, -0.25509074330329895, -0.245809406042099, -0.23652805387973785, -0.2272467166185379, -0.21796536445617676, -0.2086840271949768, -0.19940268993377686, -0.1901213377714157, -0.18084000051021576, -0.17155864834785461, -0.16227731108665466, -0.1529959738254547, -0.14371462166309357, -0.13443328440189362, -0.12515193223953247, -0.11587059497833252, -0.10658925771713257, -0.09730791300535202, -0.08802656829357147, -0.07874522358179092, -0.06946387887001038, -0.060182541608810425, -0.05090119689702988, -0.04161985218524933, -0.03233851119875908, -0.02305717021226883, -0.013775825500488281, -0.004494482651352882, 0.0047868601977825165, 0.014068203046917915, 0.023349545896053314, 0.03263089060783386, 0.04191223159432411, 0.05119357258081436, 0.06047491729259491, 0.06975626200437546, 0.079037606716156, 0.08831894397735596, 0.0976002886891365, 0.10688163340091705, 0.116162970662117, 0.12544432282447815, 0.1347256600856781, 0.14400699734687805, 0.1532883495092392, 0.16256968677043915, 0.1718510389328003, 0.18113237619400024, 0.1904137134552002, 0.19969505071640015, 0.2089764028787613, 0.21825774013996124, 0.2275390923023224, 0.23682042956352234, 0.2461017668247223, 0.25538313388824463, 0.2646644711494446, 0.27394580841064453, 0.2832271456718445]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 2.0, 2.0, 2.0, 7.0, 6.0, 5.0, 9.0, 15.0, 15.0, 19.0, 30.0, 44.0, 64.0, 90.0, 174.0, 239.0, 387.0, 653.0, 1197.0, 2206.0, 4771.0, 11123.0, 29569.0, 91549.0, 340462.0, 398544.0, 109221.0, 34274.0, 12824.0, 5329.0, 2554.0, 1274.0, 748.0, 400.0, 256.0, 148.0, 93.0, 88.0, 56.0, 33.0, 26.0, 17.0, 11.0, 8.0, 9.0, 6.0, 5.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.238037109375, -0.23178482055664062, -0.22553253173828125, -0.21928024291992188, -0.2130279541015625, -0.20677566528320312, -0.20052337646484375, -0.19427108764648438, -0.188018798828125, -0.18176651000976562, -0.17551422119140625, -0.16926193237304688, -0.1630096435546875, -0.15675735473632812, -0.15050506591796875, -0.14425277709960938, -0.13800048828125, -0.13174819946289062, -0.12549591064453125, -0.11924362182617188, -0.1129913330078125, -0.10673904418945312, -0.10048675537109375, -0.09423446655273438, -0.087982177734375, -0.08172988891601562, -0.07547760009765625, -0.06922531127929688, -0.0629730224609375, -0.056720733642578125, -0.05046844482421875, -0.044216156005859375, -0.0379638671875, -0.031711578369140625, -0.02545928955078125, -0.019207000732421875, -0.0129547119140625, -0.006702423095703125, -0.00045013427734375, 0.005802154541015625, 0.012054443359375, 0.018306732177734375, 0.02455902099609375, 0.030811309814453125, 0.0370635986328125, 0.043315887451171875, 0.04956817626953125, 0.055820465087890625, 0.06207275390625, 0.06832504272460938, 0.07457733154296875, 0.08082962036132812, 0.0870819091796875, 0.09333419799804688, 0.09958648681640625, 0.10583877563476562, 0.112091064453125, 0.11834335327148438, 0.12459564208984375, 0.13084793090820312, 0.1371002197265625, 0.14335250854492188, 0.14960479736328125, 0.15585708618164062, 0.162109375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 2.0, 10.0, 6.0, 11.0, 15.0, 16.0, 20.0, 19.0, 35.0, 40.0, 60.0, 55.0, 70.0, 71.0, 61.0, 67.0, 59.0, 57.0, 64.0, 48.0, 56.0, 39.0, 46.0, 19.0, 13.0, 14.0, 6.0, 7.0, 6.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.10858154296875, -0.10579109191894531, -0.10300064086914062, -0.10021018981933594, -0.09741973876953125, -0.09462928771972656, -0.09183883666992188, -0.08904838562011719, -0.0862579345703125, -0.08346748352050781, -0.08067703247070312, -0.07788658142089844, -0.07509613037109375, -0.07230567932128906, -0.06951522827148438, -0.06672477722167969, -0.063934326171875, -0.06114387512207031, -0.058353424072265625, -0.05556297302246094, -0.05277252197265625, -0.04998207092285156, -0.047191619873046875, -0.04440116882324219, -0.0416107177734375, -0.03882026672363281, -0.036029815673828125, -0.03323936462402344, -0.03044891357421875, -0.027658462524414062, -0.024868011474609375, -0.022077560424804688, -0.019287109375, -0.016496658325195312, -0.013706207275390625, -0.010915756225585938, -0.00812530517578125, -0.0053348541259765625, -0.002544403076171875, 0.0002460479736328125, 0.0030364990234375, 0.0058269500732421875, 0.008617401123046875, 0.011407852172851562, 0.01419830322265625, 0.016988754272460938, 0.019779205322265625, 0.022569656372070312, 0.025360107421875, 0.028150558471679688, 0.030941009521484375, 0.03373146057128906, 0.03652191162109375, 0.03931236267089844, 0.042102813720703125, 0.04489326477050781, 0.0476837158203125, 0.05047416687011719, 0.053264617919921875, 0.05605506896972656, 0.05884552001953125, 0.06163597106933594, 0.06442642211914062, 0.06721687316894531, 0.07000732421875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 6.0, 7.0, 11.0, 18.0, 18.0, 31.0, 39.0, 67.0, 96.0, 132.0, 219.0, 400.0, 772.0, 1893.0, 6774.0, 38402.0, 326779.0, 584060.0, 72832.0, 11078.0, 2696.0, 1000.0, 468.0, 267.0, 170.0, 87.0, 63.0, 41.0, 35.0, 26.0, 22.0, 14.0, 6.0, 4.0, 7.0, 5.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.356689453125, -0.34734153747558594, -0.3379936218261719, -0.3286457061767578, -0.31929779052734375, -0.3099498748779297, -0.3006019592285156, -0.29125404357910156, -0.2819061279296875, -0.27255821228027344, -0.2632102966308594, -0.2538623809814453, -0.24451446533203125, -0.2351665496826172, -0.22581863403320312, -0.21647071838378906, -0.207122802734375, -0.19777488708496094, -0.18842697143554688, -0.1790790557861328, -0.16973114013671875, -0.1603832244873047, -0.15103530883789062, -0.14168739318847656, -0.1323394775390625, -0.12299156188964844, -0.11364364624023438, -0.10429573059082031, -0.09494781494140625, -0.08559989929199219, -0.07625198364257812, -0.06690406799316406, -0.05755615234375, -0.04820823669433594, -0.038860321044921875, -0.029512405395507812, -0.02016448974609375, -0.010816574096679688, -0.001468658447265625, 0.007879257202148438, 0.0172271728515625, 0.026575088500976562, 0.035923004150390625, 0.04527091979980469, 0.05461883544921875, 0.06396675109863281, 0.07331466674804688, 0.08266258239746094, 0.092010498046875, 0.10135841369628906, 0.11070632934570312, 0.12005424499511719, 0.12940216064453125, 0.1387500762939453, 0.14809799194335938, 0.15744590759277344, 0.1667938232421875, 0.17614173889160156, 0.18548965454101562, 0.1948375701904297, 0.20418548583984375, 0.2135334014892578, 0.22288131713867188, 0.23222923278808594, 0.2415771484375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 4.0, 5.0, 5.0, 5.0, 13.0, 14.0, 19.0, 22.0, 16.0, 25.0, 26.0, 38.0, 36.0, 36.0, 42.0, 44.0, 53.0, 47.0, 55.0, 45.0, 44.0, 42.0, 53.0, 46.0, 43.0, 50.0, 36.0, 28.0, 25.0, 16.0, 14.0, 13.0, 11.0, 7.0, 5.0, 5.0, 3.0, 2.0, 6.0, 3.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.26416015625, -0.2552604675292969, -0.24636077880859375, -0.23746109008789062, -0.2285614013671875, -0.21966171264648438, -0.21076202392578125, -0.20186233520507812, -0.192962646484375, -0.18406295776367188, -0.17516326904296875, -0.16626358032226562, -0.1573638916015625, -0.14846420288085938, -0.13956451416015625, -0.13066482543945312, -0.12176513671875, -0.11286544799804688, -0.10396575927734375, -0.09506607055664062, -0.0861663818359375, -0.07726669311523438, -0.06836700439453125, -0.059467315673828125, -0.050567626953125, -0.041667938232421875, -0.03276824951171875, -0.023868560791015625, -0.0149688720703125, -0.006069183349609375, 0.00283050537109375, 0.011730194091796875, 0.0206298828125, 0.029529571533203125, 0.03842926025390625, 0.047328948974609375, 0.0562286376953125, 0.06512832641601562, 0.07402801513671875, 0.08292770385742188, 0.091827392578125, 0.10072708129882812, 0.10962677001953125, 0.11852645874023438, 0.1274261474609375, 0.13632583618164062, 0.14522552490234375, 0.15412521362304688, 0.16302490234375, 0.17192459106445312, 0.18082427978515625, 0.18972396850585938, 0.1986236572265625, 0.20752334594726562, 0.21642303466796875, 0.22532272338867188, 0.234222412109375, 0.24312210083007812, 0.25202178955078125, 0.2609214782714844, 0.2698211669921875, 0.2787208557128906, 0.28762054443359375, 0.2965202331542969, 0.305419921875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 6.0, 13.0, 17.0, 42.0, 94.0, 272.0, 1763.0, 104284.0, 935661.0, 5692.0, 443.0, 146.0, 61.0, 28.0, 11.0, 7.0, 5.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.292236328125, -0.2801513671875, -0.26806640625, -0.2559814453125, -0.243896484375, -0.2318115234375, -0.2197265625, -0.2076416015625, -0.195556640625, -0.1834716796875, -0.17138671875, -0.1593017578125, -0.147216796875, -0.1351318359375, -0.123046875, -0.1109619140625, -0.098876953125, -0.0867919921875, -0.07470703125, -0.0626220703125, -0.050537109375, -0.0384521484375, -0.0263671875, -0.0142822265625, -0.002197265625, 0.0098876953125, 0.02197265625, 0.0340576171875, 0.046142578125, 0.0582275390625, 0.0703125, 0.0823974609375, 0.094482421875, 0.1065673828125, 0.11865234375, 0.1307373046875, 0.142822265625, 0.1549072265625, 0.1669921875, 0.1790771484375, 0.191162109375, 0.2032470703125, 0.21533203125, 0.2274169921875, 0.239501953125, 0.2515869140625, 0.263671875, 0.2757568359375, 0.287841796875, 0.2999267578125, 0.31201171875, 0.3240966796875, 0.336181640625, 0.3482666015625, 0.3603515625, 0.3724365234375, 0.384521484375, 0.3966064453125, 0.40869140625, 0.4207763671875, 0.432861328125, 0.4449462890625, 0.45703125, 0.4691162109375, 0.481201171875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 5.0, 5.0, 6.0, 7.0, 15.0, 15.0, 15.0, 25.0, 25.0, 35.0, 36.0, 51.0, 55.0, 73.0, 109.0, 114.0, 81.0, 76.0, 64.0, 42.0, 36.0, 26.0, 18.0, 11.0, 13.0, 13.0, 10.0, 6.0, 2.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.802248001098633e-05, -7.591862231492996e-05, -7.38147646188736e-05, -7.171090692281723e-05, -6.960704922676086e-05, -6.75031915307045e-05, -6.539933383464813e-05, -6.329547613859177e-05, -6.11916184425354e-05, -5.9087760746479034e-05, -5.698390305042267e-05, -5.48800453543663e-05, -5.2776187658309937e-05, -5.067232996225357e-05, -4.8568472266197205e-05, -4.646461457014084e-05, -4.436075687408447e-05, -4.225689917802811e-05, -4.015304148197174e-05, -3.8049183785915375e-05, -3.594532608985901e-05, -3.384146839380264e-05, -3.173761069774628e-05, -2.963375300168991e-05, -2.7529895305633545e-05, -2.542603760957718e-05, -2.3322179913520813e-05, -2.1218322217464447e-05, -1.911446452140808e-05, -1.7010606825351715e-05, -1.4906749129295349e-05, -1.2802891433238983e-05, -1.0699033737182617e-05, -8.595176041126251e-06, -6.491318345069885e-06, -4.387460649013519e-06, -2.2836029529571533e-06, -1.7974525690078735e-07, 1.9241124391555786e-06, 4.027970135211945e-06, 6.1318278312683105e-06, 8.235685527324677e-06, 1.0339543223381042e-05, 1.2443400919437408e-05, 1.4547258615493774e-05, 1.665111631155014e-05, 1.8754974007606506e-05, 2.0858831703662872e-05, 2.2962689399719238e-05, 2.5066547095775604e-05, 2.717040479183197e-05, 2.9274262487888336e-05, 3.13781201839447e-05, 3.348197788000107e-05, 3.5585835576057434e-05, 3.76896932721138e-05, 3.9793550968170166e-05, 4.189740866422653e-05, 4.40012663602829e-05, 4.6105124056339264e-05, 4.820898175239563e-05, 5.0312839448451996e-05, 5.241669714450836e-05, 5.452055484056473e-05, 5.6624412536621094e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 8.0, 2.0, 6.0, 7.0, 18.0, 28.0, 55.0, 82.0, 175.0, 495.0, 2383.0, 77130.0, 953512.0, 13060.0, 1049.0, 274.0, 121.0, 56.0, 42.0, 19.0, 17.0, 11.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.373046875, -0.3621673583984375, -0.351287841796875, -0.3404083251953125, -0.32952880859375, -0.3186492919921875, -0.307769775390625, -0.2968902587890625, -0.2860107421875, -0.2751312255859375, -0.264251708984375, -0.2533721923828125, -0.24249267578125, -0.2316131591796875, -0.220733642578125, -0.2098541259765625, -0.198974609375, -0.1880950927734375, -0.177215576171875, -0.1663360595703125, -0.15545654296875, -0.1445770263671875, -0.133697509765625, -0.1228179931640625, -0.1119384765625, -0.1010589599609375, -0.090179443359375, -0.0792999267578125, -0.06842041015625, -0.0575408935546875, -0.046661376953125, -0.0357818603515625, -0.02490234375, -0.0140228271484375, -0.003143310546875, 0.0077362060546875, 0.01861572265625, 0.0294952392578125, 0.040374755859375, 0.0512542724609375, 0.0621337890625, 0.0730133056640625, 0.083892822265625, 0.0947723388671875, 0.10565185546875, 0.1165313720703125, 0.127410888671875, 0.1382904052734375, 0.149169921875, 0.1600494384765625, 0.170928955078125, 0.1818084716796875, 0.19268798828125, 0.2035675048828125, 0.214447021484375, 0.2253265380859375, 0.2362060546875, 0.2470855712890625, 0.257965087890625, 0.2688446044921875, 0.27972412109375, 0.2906036376953125, 0.301483154296875, 0.3123626708984375, 0.3232421875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 9.0, 8.0, 16.0, 34.0, 57.0, 187.0, 386.0, 172.0, 61.0, 37.0, 25.0, 9.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3779296875, -0.3704566955566406, -0.36298370361328125, -0.3555107116699219, -0.3480377197265625, -0.3405647277832031, -0.33309173583984375, -0.3256187438964844, -0.318145751953125, -0.3106727600097656, -0.30319976806640625, -0.2957267761230469, -0.2882537841796875, -0.2807807922363281, -0.27330780029296875, -0.2658348083496094, -0.25836181640625, -0.2508888244628906, -0.24341583251953125, -0.23594284057617188, -0.2284698486328125, -0.22099685668945312, -0.21352386474609375, -0.20605087280273438, -0.198577880859375, -0.19110488891601562, -0.18363189697265625, -0.17615890502929688, -0.1686859130859375, -0.16121292114257812, -0.15373992919921875, -0.14626693725585938, -0.1387939453125, -0.13132095336914062, -0.12384796142578125, -0.11637496948242188, -0.1089019775390625, -0.10142898559570312, -0.09395599365234375, -0.08648300170898438, -0.079010009765625, -0.07153701782226562, -0.06406402587890625, -0.056591033935546875, -0.0491180419921875, -0.041645050048828125, -0.03417205810546875, -0.026699066162109375, -0.01922607421875, -0.011753082275390625, -0.00428009033203125, 0.003192901611328125, 0.0106658935546875, 0.018138885498046875, 0.02561187744140625, 0.033084869384765625, 0.040557861328125, 0.048030853271484375, 0.05550384521484375, 0.06297683715820312, 0.0704498291015625, 0.07792282104492188, 0.08539581298828125, 0.09286880493164062, 0.100341796875]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 2.0, 1.0, 3.0, 8.0, 12.0, 36.0, 71.0, 92.0, 160.0, 184.0, 191.0, 118.0, 66.0, 18.0, 17.0, 13.0, 5.0, 5.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.6501035690307617, -2.590501308441162, -2.5308990478515625, -2.471296787261963, -2.4116945266723633, -2.3520922660827637, -2.292490005493164, -2.2328879833221436, -2.173285722732544, -2.1136834621429443, -2.0540812015533447, -1.9944789409637451, -1.934876799583435, -1.8752745389938354, -1.8156722784042358, -1.7560700178146362, -1.6964677572250366, -1.636865496635437, -1.5772632360458374, -1.5176610946655273, -1.4580588340759277, -1.3984565734863281, -1.3388543128967285, -1.279252052307129, -1.2196497917175293, -1.1600475311279297, -1.10044527053833, -1.0408430099487305, -0.9812408685684204, -0.9216386079788208, -0.8620363473892212, -0.8024340867996216, -0.7428319454193115, -0.6832296848297119, -0.6236274838447571, -0.5640252232551575, -0.5044230222702026, -0.444820761680603, -0.3852185010910034, -0.3256162703037262, -0.266014039516449, -0.20641180872917175, -0.14680956304073334, -0.08720731735229492, -0.0276050865650177, 0.03199714422225952, 0.09159940481185913, 0.15120163559913635, 0.21080386638641357, 0.2704060971736908, 0.330008327960968, 0.3896105885505676, 0.44921281933784485, 0.5088150501251221, 0.5684173107147217, 0.6280195713043213, 0.6876217722892761, 0.7472240328788757, 0.8068262338638306, 0.8664284944534302, 0.9260307550430298, 0.9856329560279846, 1.0452351570129395, 1.104837417602539, 1.1644396781921387]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 4.0, 1.0, 4.0, 6.0, 6.0, 9.0, 7.0, 16.0, 17.0, 17.0, 22.0, 22.0, 22.0, 32.0, 30.0, 38.0, 36.0, 35.0, 29.0, 38.0, 51.0, 34.0, 41.0, 35.0, 47.0, 40.0, 27.0, 36.0, 24.0, 26.0, 28.0, 27.0, 28.0, 19.0, 23.0, 17.0, 16.0, 16.0, 12.0, 17.0, 13.0, 3.0, 8.0, 4.0, 8.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 3.0], "bins": [-1.2632848024368286, -1.226023554801941, -1.1887624263763428, -1.151501178741455, -1.1142399311065674, -1.0769786834716797, -1.039717435836792, -1.0024563074111938, -0.9651950597763062, -0.9279338121414185, -0.8906726241111755, -0.8534114360809326, -0.8161501884460449, -0.7788889408111572, -0.7416277527809143, -0.7043665647506714, -0.6671053171157837, -0.629844069480896, -0.5925828814506531, -0.5553216934204102, -0.5180604457855225, -0.48079922795295715, -0.44353801012039185, -0.40627679228782654, -0.36901557445526123, -0.3317543566226959, -0.2944931387901306, -0.2572319209575653, -0.219970703125, -0.1827094852924347, -0.14544826745986938, -0.10818704962730408, -0.07092595100402832, -0.03366473317146301, 0.003596484661102295, 0.0408577024936676, 0.07811892032623291, 0.11538013815879822, 0.15264135599136353, 0.18990257382392883, 0.22716379165649414, 0.26442500948905945, 0.30168622732162476, 0.33894744515419006, 0.37620866298675537, 0.4134698808193207, 0.450731098651886, 0.4879923164844513, 0.5252535343170166, 0.5625147819519043, 0.5997759699821472, 0.6370371580123901, 0.6742984056472778, 0.7115596532821655, 0.7488208413124084, 0.7860820293426514, 0.8233432769775391, 0.8606045246124268, 0.8978657126426697, 0.9351269006729126, 0.9723881483078003, 1.009649395942688, 1.0469105243682861, 1.0841717720031738, 1.1214330196380615]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 8.0, 10.0, 4.0, 6.0, 10.0, 19.0, 21.0, 29.0, 42.0, 50.0, 70.0, 105.0, 163.0, 267.0, 440.0, 696.0, 1275.0, 2391.0, 5196.0, 11996.0, 35396.0, 192521.0, 3571995.0, 300830.0, 45103.0, 14079.0, 5804.0, 2716.0, 1368.0, 689.0, 360.0, 229.0, 151.0, 79.0, 56.0, 35.0, 27.0, 10.0, 11.0, 10.0, 5.0, 5.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.2342529296875, -0.2281818389892578, -0.22211074829101562, -0.21603965759277344, -0.20996856689453125, -0.20389747619628906, -0.19782638549804688, -0.1917552947998047, -0.1856842041015625, -0.1796131134033203, -0.17354202270507812, -0.16747093200683594, -0.16139984130859375, -0.15532875061035156, -0.14925765991210938, -0.1431865692138672, -0.137115478515625, -0.1310443878173828, -0.12497329711914062, -0.11890220642089844, -0.11283111572265625, -0.10676002502441406, -0.10068893432617188, -0.09461784362792969, -0.0885467529296875, -0.08247566223144531, -0.07640457153320312, -0.07033348083496094, -0.06426239013671875, -0.05819129943847656, -0.052120208740234375, -0.04604911804199219, -0.03997802734375, -0.03390693664550781, -0.027835845947265625, -0.021764755249023438, -0.01569366455078125, -0.009622573852539062, -0.003551483154296875, 0.0025196075439453125, 0.0085906982421875, 0.014661788940429688, 0.020732879638671875, 0.026803970336914062, 0.03287506103515625, 0.03894615173339844, 0.045017242431640625, 0.05108833312988281, 0.057159423828125, 0.06323051452636719, 0.06930160522460938, 0.07537269592285156, 0.08144378662109375, 0.08751487731933594, 0.09358596801757812, 0.09965705871582031, 0.1057281494140625, 0.11179924011230469, 0.11787033081054688, 0.12394142150878906, 0.13001251220703125, 0.13608360290527344, 0.14215469360351562, 0.1482257843017578, 0.154296875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 8.0, 6.0, 10.0, 16.0, 23.0, 17.0, 35.0, 30.0, 48.0, 51.0, 54.0, 70.0, 75.0, 68.0, 58.0, 62.0, 68.0, 56.0, 50.0, 50.0, 39.0, 38.0, 25.0, 8.0, 17.0, 3.0, 3.0, 6.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11181640625, -0.10884952545166016, -0.10588264465332031, -0.10291576385498047, -0.09994888305664062, -0.09698200225830078, -0.09401512145996094, -0.0910482406616211, -0.08808135986328125, -0.0851144790649414, -0.08214759826660156, -0.07918071746826172, -0.07621383666992188, -0.07324695587158203, -0.07028007507324219, -0.06731319427490234, -0.0643463134765625, -0.061379432678222656, -0.05841255187988281, -0.05544567108154297, -0.052478790283203125, -0.04951190948486328, -0.04654502868652344, -0.043578147888183594, -0.04061126708984375, -0.037644386291503906, -0.03467750549316406, -0.03171062469482422, -0.028743743896484375, -0.02577686309814453, -0.022809982299804688, -0.019843101501464844, -0.016876220703125, -0.013909339904785156, -0.010942459106445312, -0.007975578308105469, -0.005008697509765625, -0.0020418167114257812, 0.0009250640869140625, 0.0038919448852539062, 0.00685882568359375, 0.009825706481933594, 0.012792587280273438, 0.01575946807861328, 0.018726348876953125, 0.02169322967529297, 0.024660110473632812, 0.027626991271972656, 0.0305938720703125, 0.033560752868652344, 0.03652763366699219, 0.03949451446533203, 0.042461395263671875, 0.04542827606201172, 0.04839515686035156, 0.051362037658691406, 0.05432891845703125, 0.057295799255371094, 0.06026268005371094, 0.06322956085205078, 0.06619644165039062, 0.06916332244873047, 0.07213020324707031, 0.07509708404541016, 0.07806396484375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 12.0, 10.0, 25.0, 69.0, 112.0, 249.0, 563.0, 1478.0, 4396.0, 20066.0, 211244.0, 3792200.0, 141614.0, 16151.0, 3900.0, 1245.0, 520.0, 229.0, 96.0, 56.0, 20.0, 16.0, 7.0, 4.0, 0.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.234375, -0.22583389282226562, -0.21729278564453125, -0.20875167846679688, -0.2002105712890625, -0.19166946411132812, -0.18312835693359375, -0.17458724975585938, -0.166046142578125, -0.15750503540039062, -0.14896392822265625, -0.14042282104492188, -0.1318817138671875, -0.12334060668945312, -0.11479949951171875, -0.10625839233398438, -0.09771728515625, -0.08917617797851562, -0.08063507080078125, -0.07209396362304688, -0.0635528564453125, -0.055011749267578125, -0.04647064208984375, -0.037929534912109375, -0.029388427734375, -0.020847320556640625, -0.01230621337890625, -0.003765106201171875, 0.0047760009765625, 0.013317108154296875, 0.02185821533203125, 0.030399322509765625, 0.0389404296875, 0.047481536865234375, 0.05602264404296875, 0.06456375122070312, 0.0731048583984375, 0.08164596557617188, 0.09018707275390625, 0.09872817993164062, 0.107269287109375, 0.11581039428710938, 0.12435150146484375, 0.13289260864257812, 0.1414337158203125, 0.14997482299804688, 0.15851593017578125, 0.16705703735351562, 0.17559814453125, 0.18413925170898438, 0.19268035888671875, 0.20122146606445312, 0.2097625732421875, 0.21830368041992188, 0.22684478759765625, 0.23538589477539062, 0.243927001953125, 0.2524681091308594, 0.26100921630859375, 0.2695503234863281, 0.2780914306640625, 0.2866325378417969, 0.29517364501953125, 0.3037147521972656, 0.312255859375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 3.0, 7.0, 7.0, 16.0, 23.0, 24.0, 50.0, 97.0, 253.0, 905.0, 1973.0, 444.0, 132.0, 62.0, 25.0, 15.0, 8.0, 11.0, 10.0, 4.0, 5.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11285400390625, -0.10912609100341797, -0.10539817810058594, -0.1016702651977539, -0.09794235229492188, -0.09421443939208984, -0.09048652648925781, -0.08675861358642578, -0.08303070068359375, -0.07930278778076172, -0.07557487487792969, -0.07184696197509766, -0.06811904907226562, -0.0643911361694336, -0.06066322326660156, -0.05693531036376953, -0.0532073974609375, -0.04947948455810547, -0.04575157165527344, -0.042023658752441406, -0.038295745849609375, -0.034567832946777344, -0.030839920043945312, -0.02711200714111328, -0.02338409423828125, -0.01965618133544922, -0.015928268432617188, -0.012200355529785156, -0.008472442626953125, -0.004744529724121094, -0.0010166168212890625, 0.0027112960815429688, 0.006439208984375, 0.010167121887207031, 0.013895034790039062, 0.017622947692871094, 0.021350860595703125, 0.025078773498535156, 0.028806686401367188, 0.03253459930419922, 0.03626251220703125, 0.03999042510986328, 0.04371833801269531, 0.047446250915527344, 0.051174163818359375, 0.054902076721191406, 0.05862998962402344, 0.06235790252685547, 0.0660858154296875, 0.06981372833251953, 0.07354164123535156, 0.0772695541381836, 0.08099746704101562, 0.08472537994384766, 0.08845329284667969, 0.09218120574951172, 0.09590911865234375, 0.09963703155517578, 0.10336494445800781, 0.10709285736083984, 0.11082077026367188, 0.1145486831665039, 0.11827659606933594, 0.12200450897216797, 0.125732421875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 9.0, 61.0, 253.0, 390.0, 220.0, 60.0, 16.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.628408432006836, -1.5903983116149902, -1.5523881912231445, -1.5143780708312988, -1.4763679504394531, -1.4383577108383179, -1.4003475904464722, -1.3623374700546265, -1.3243273496627808, -1.286317229270935, -1.2483071088790894, -1.2102969884872437, -1.1722867488861084, -1.1342766284942627, -1.096266508102417, -1.0582563877105713, -1.0202462673187256, -0.9822361469268799, -0.9442260265350342, -0.9062158465385437, -0.868205726146698, -0.8301956057548523, -0.7921854257583618, -0.7541753053665161, -0.7161651849746704, -0.6781550645828247, -0.640144944190979, -0.6021347641944885, -0.5641246438026428, -0.5261145234107971, -0.48810437321662903, -0.45009422302246094, -0.41208410263061523, -0.37407398223876953, -0.33606383204460144, -0.29805368185043335, -0.26004356145858765, -0.22203342616558075, -0.18402329087257385, -0.14601314067840576, -0.10800302028656006, -0.06999288499355316, -0.031982749700546265, 0.006027385592460632, 0.04403752088546753, 0.08204765617847443, 0.12005779147148132, 0.15806794166564941, 0.19607806205749512, 0.23408819735050201, 0.2720983326435089, 0.310108482837677, 0.3481186032295227, 0.3861287236213684, 0.4241388738155365, 0.4621490240097046, 0.5001591444015503, 0.538169264793396, 0.5761793851852417, 0.6141895651817322, 0.6521996855735779, 0.6902098059654236, 0.7282199859619141, 0.7662301063537598, 0.8042402267456055]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 9.0, 3.0, 10.0, 2.0, 6.0, 6.0, 12.0, 9.0, 14.0, 12.0, 18.0, 16.0, 25.0, 27.0, 25.0, 24.0, 28.0, 36.0, 35.0, 45.0, 41.0, 41.0, 37.0, 51.0, 39.0, 41.0, 41.0, 48.0, 34.0, 35.0, 30.0, 28.0, 19.0, 18.0, 14.0, 22.0, 12.0, 22.0, 17.0, 7.0, 14.0, 9.0, 10.0, 4.0, 3.0, 4.0, 1.0, 6.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.24504172801971436, -0.2374468445777893, -0.22985196113586426, -0.22225706279277802, -0.21466217935085297, -0.20706729590892792, -0.19947239756584167, -0.19187751412391663, -0.18428263068199158, -0.17668774724006653, -0.16909286379814148, -0.16149796545505524, -0.1539030820131302, -0.14630819857120514, -0.1387133002281189, -0.13111841678619385, -0.1235235333442688, -0.11592864990234375, -0.1083337590098381, -0.10073886811733246, -0.09314398467540741, -0.08554910123348236, -0.07795421034097672, -0.07035931944847107, -0.06276443600654602, -0.05516954883933067, -0.047574661672115326, -0.03997977450489998, -0.03238488733768463, -0.024790000170469284, -0.017195113003253937, -0.00960022583603859, -0.002005338668823242, 0.005589548498392105, 0.013184435665607452, 0.0207793228328228, 0.028374210000038147, 0.035969097167253494, 0.04356398433446884, 0.05115887150168419, 0.058753758668899536, 0.06634864211082458, 0.07394353300333023, 0.08153842389583588, 0.08913330733776093, 0.09672819077968597, 0.10432308167219162, 0.11191797256469727, 0.11951285600662231, 0.12710773944854736, 0.1347026228904724, 0.14229752123355865, 0.1498924046754837, 0.15748728811740875, 0.165082186460495, 0.17267706990242004, 0.1802719533443451, 0.18786683678627014, 0.1954617202281952, 0.20305661857128143, 0.21065150201320648, 0.21824638545513153, 0.22584128379821777, 0.23343616724014282, 0.24103105068206787]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 6.0, 4.0, 6.0, 17.0, 20.0, 26.0, 42.0, 64.0, 117.0, 201.0, 396.0, 813.0, 2214.0, 7504.0, 35840.0, 242770.0, 626100.0, 107117.0, 18207.0, 4266.0, 1445.0, 617.0, 297.0, 182.0, 88.0, 59.0, 45.0, 27.0, 18.0, 15.0, 6.0, 5.0, 2.0, 6.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.39892578125, -0.3887748718261719, -0.37862396240234375, -0.3684730529785156, -0.3583221435546875, -0.3481712341308594, -0.33802032470703125, -0.3278694152832031, -0.317718505859375, -0.3075675964355469, -0.29741668701171875, -0.2872657775878906, -0.2771148681640625, -0.2669639587402344, -0.25681304931640625, -0.24666213989257812, -0.23651123046875, -0.22636032104492188, -0.21620941162109375, -0.20605850219726562, -0.1959075927734375, -0.18575668334960938, -0.17560577392578125, -0.16545486450195312, -0.155303955078125, -0.14515304565429688, -0.13500213623046875, -0.12485122680664062, -0.1147003173828125, -0.10454940795898438, -0.09439849853515625, -0.08424758911132812, -0.0740966796875, -0.06394577026367188, -0.05379486083984375, -0.043643951416015625, -0.0334930419921875, -0.023342132568359375, -0.01319122314453125, -0.003040313720703125, 0.007110595703125, 0.017261505126953125, 0.02741241455078125, 0.037563323974609375, 0.0477142333984375, 0.057865142822265625, 0.06801605224609375, 0.07816696166992188, 0.08831787109375, 0.09846878051757812, 0.10861968994140625, 0.11877059936523438, 0.1289215087890625, 0.13907241821289062, 0.14922332763671875, 0.15937423706054688, 0.169525146484375, 0.17967605590820312, 0.18982696533203125, 0.19997787475585938, 0.2101287841796875, 0.22027969360351562, 0.23043060302734375, 0.24058151245117188, 0.250732421875]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 1.0, 7.0, 7.0, 8.0, 19.0, 17.0, 27.0, 29.0, 26.0, 53.0, 53.0, 52.0, 70.0, 68.0, 64.0, 74.0, 51.0, 71.0, 62.0, 53.0, 42.0, 43.0, 37.0, 16.0, 22.0, 7.0, 8.0, 3.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1064453125, -0.103546142578125, -0.10064697265625, -0.097747802734375, -0.0948486328125, -0.091949462890625, -0.08905029296875, -0.086151123046875, -0.083251953125, -0.080352783203125, -0.07745361328125, -0.074554443359375, -0.0716552734375, -0.068756103515625, -0.06585693359375, -0.062957763671875, -0.06005859375, -0.057159423828125, -0.05426025390625, -0.051361083984375, -0.0484619140625, -0.045562744140625, -0.04266357421875, -0.039764404296875, -0.036865234375, -0.033966064453125, -0.03106689453125, -0.028167724609375, -0.0252685546875, -0.022369384765625, -0.01947021484375, -0.016571044921875, -0.013671875, -0.010772705078125, -0.00787353515625, -0.004974365234375, -0.0020751953125, 0.000823974609375, 0.00372314453125, 0.006622314453125, 0.009521484375, 0.012420654296875, 0.01531982421875, 0.018218994140625, 0.0211181640625, 0.024017333984375, 0.02691650390625, 0.029815673828125, 0.03271484375, 0.035614013671875, 0.03851318359375, 0.041412353515625, 0.0443115234375, 0.047210693359375, 0.05010986328125, 0.053009033203125, 0.055908203125, 0.058807373046875, 0.06170654296875, 0.064605712890625, 0.0675048828125, 0.070404052734375, 0.07330322265625, 0.076202392578125, 0.0791015625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 1.0, 1.0, 2.0, 6.0, 7.0, 8.0, 12.0, 15.0, 31.0, 33.0, 43.0, 77.0, 109.0, 192.0, 343.0, 692.0, 1774.0, 5332.0, 18847.0, 75990.0, 337740.0, 460527.0, 108629.0, 26656.0, 7317.0, 2293.0, 870.0, 388.0, 225.0, 111.0, 89.0, 63.0, 44.0, 15.0, 24.0, 11.0, 9.0, 6.0, 10.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1990966796875, -0.1924877166748047, -0.18587875366210938, -0.17926979064941406, -0.17266082763671875, -0.16605186462402344, -0.15944290161132812, -0.1528339385986328, -0.1462249755859375, -0.1396160125732422, -0.13300704956054688, -0.12639808654785156, -0.11978912353515625, -0.11318016052246094, -0.10657119750976562, -0.09996223449707031, -0.093353271484375, -0.08674430847167969, -0.08013534545898438, -0.07352638244628906, -0.06691741943359375, -0.06030845642089844, -0.053699493408203125, -0.04709053039550781, -0.0404815673828125, -0.03387260437011719, -0.027263641357421875, -0.020654678344726562, -0.01404571533203125, -0.0074367523193359375, -0.000827789306640625, 0.0057811737060546875, 0.01239013671875, 0.018999099731445312, 0.025608062744140625, 0.03221702575683594, 0.03882598876953125, 0.04543495178222656, 0.052043914794921875, 0.05865287780761719, 0.0652618408203125, 0.07187080383300781, 0.07847976684570312, 0.08508872985839844, 0.09169769287109375, 0.09830665588378906, 0.10491561889648438, 0.11152458190917969, 0.118133544921875, 0.12474250793457031, 0.13135147094726562, 0.13796043395996094, 0.14456939697265625, 0.15117835998535156, 0.15778732299804688, 0.1643962860107422, 0.1710052490234375, 0.1776142120361328, 0.18422317504882812, 0.19083213806152344, 0.19744110107421875, 0.20405006408691406, 0.21065902709960938, 0.2172679901123047, 0.223876953125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 2.0, 3.0, 6.0, 8.0, 6.0, 11.0, 12.0, 11.0, 11.0, 19.0, 12.0, 29.0, 25.0, 36.0, 29.0, 35.0, 29.0, 28.0, 40.0, 39.0, 44.0, 41.0, 53.0, 37.0, 39.0, 43.0, 40.0, 41.0, 33.0, 27.0, 35.0, 24.0, 28.0, 19.0, 17.0, 16.0, 11.0, 14.0, 13.0, 11.0, 4.0, 4.0, 2.0, 6.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2291259765625, -0.22152137756347656, -0.21391677856445312, -0.2063121795654297, -0.19870758056640625, -0.1911029815673828, -0.18349838256835938, -0.17589378356933594, -0.1682891845703125, -0.16068458557128906, -0.15307998657226562, -0.1454753875732422, -0.13787078857421875, -0.1302661895751953, -0.12266159057617188, -0.11505699157714844, -0.107452392578125, -0.09984779357910156, -0.09224319458007812, -0.08463859558105469, -0.07703399658203125, -0.06942939758300781, -0.061824798583984375, -0.05422019958496094, -0.0466156005859375, -0.03901100158691406, -0.031406402587890625, -0.023801803588867188, -0.01619720458984375, -0.008592605590820312, -0.000988006591796875, 0.0066165924072265625, 0.01422119140625, 0.021825790405273438, 0.029430389404296875, 0.03703498840332031, 0.04463958740234375, 0.05224418640136719, 0.059848785400390625, 0.06745338439941406, 0.0750579833984375, 0.08266258239746094, 0.09026718139648438, 0.09787178039550781, 0.10547637939453125, 0.11308097839355469, 0.12068557739257812, 0.12829017639160156, 0.135894775390625, 0.14349937438964844, 0.15110397338867188, 0.1587085723876953, 0.16631317138671875, 0.1739177703857422, 0.18152236938476562, 0.18912696838378906, 0.1967315673828125, 0.20433616638183594, 0.21194076538085938, 0.2195453643798828, 0.22714996337890625, 0.2347545623779297, 0.24235916137695312, 0.24996376037597656, 0.257568359375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 9.0, 15.0, 30.0, 102.0, 189.0, 542.0, 1255.0, 3471.0, 15023.0, 189174.0, 787009.0, 42283.0, 6275.0, 1870.0, 732.0, 309.0, 143.0, 56.0, 27.0, 8.0, 7.0, 11.0, 2.0, 6.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.150390625, -0.14572525024414062, -0.14105987548828125, -0.13639450073242188, -0.1317291259765625, -0.12706375122070312, -0.12239837646484375, -0.11773300170898438, -0.113067626953125, -0.10840225219726562, -0.10373687744140625, -0.09907150268554688, -0.0944061279296875, -0.08974075317382812, -0.08507537841796875, -0.08041000366210938, -0.07574462890625, -0.07107925415039062, -0.06641387939453125, -0.061748504638671875, -0.0570831298828125, -0.052417755126953125, -0.04775238037109375, -0.043087005615234375, -0.038421630859375, -0.033756256103515625, -0.02909088134765625, -0.024425506591796875, -0.0197601318359375, -0.015094757080078125, -0.01042938232421875, -0.005764007568359375, -0.0010986328125, 0.003566741943359375, 0.00823211669921875, 0.012897491455078125, 0.0175628662109375, 0.022228240966796875, 0.02689361572265625, 0.031558990478515625, 0.036224365234375, 0.040889739990234375, 0.04555511474609375, 0.050220489501953125, 0.0548858642578125, 0.059551239013671875, 0.06421661376953125, 0.06888198852539062, 0.07354736328125, 0.07821273803710938, 0.08287811279296875, 0.08754348754882812, 0.0922088623046875, 0.09687423706054688, 0.10153961181640625, 0.10620498657226562, 0.110870361328125, 0.11553573608398438, 0.12020111083984375, 0.12486648559570312, 0.1295318603515625, 0.13419723510742188, 0.13886260986328125, 0.14352798461914062, 0.148193359375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 5.0, 1.0, 4.0, 0.0, 3.0, 2.0, 4.0, 9.0, 5.0, 13.0, 13.0, 19.0, 22.0, 26.0, 21.0, 38.0, 59.0, 73.0, 88.0, 101.0, 111.0, 78.0, 59.0, 71.0, 51.0, 28.0, 20.0, 20.0, 10.0, 15.0, 10.0, 8.0, 4.0, 3.0, 4.0, 2.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.282329559326172e-05, -6.0916878283023834e-05, -5.901046097278595e-05, -5.7104043662548065e-05, -5.519762635231018e-05, -5.3291209042072296e-05, -5.138479173183441e-05, -4.947837442159653e-05, -4.757195711135864e-05, -4.566553980112076e-05, -4.3759122490882874e-05, -4.185270518064499e-05, -3.9946287870407104e-05, -3.803987056016922e-05, -3.6133453249931335e-05, -3.422703593969345e-05, -3.2320618629455566e-05, -3.0414201319217682e-05, -2.8507784008979797e-05, -2.6601366698741913e-05, -2.469494938850403e-05, -2.2788532078266144e-05, -2.088211476802826e-05, -1.8975697457790375e-05, -1.706928014755249e-05, -1.5162862837314606e-05, -1.3256445527076721e-05, -1.1350028216838837e-05, -9.443610906600952e-06, -7.537193596363068e-06, -5.630776286125183e-06, -3.7243589758872986e-06, -1.817941665649414e-06, 8.847564458847046e-08, 1.994892954826355e-06, 3.9013102650642395e-06, 5.807727575302124e-06, 7.714144885540009e-06, 9.620562195777893e-06, 1.1526979506015778e-05, 1.3433396816253662e-05, 1.5339814126491547e-05, 1.724623143672943e-05, 1.9152648746967316e-05, 2.10590660572052e-05, 2.2965483367443085e-05, 2.487190067768097e-05, 2.6778317987918854e-05, 2.8684735298156738e-05, 3.059115260839462e-05, 3.249756991863251e-05, 3.440398722887039e-05, 3.6310404539108276e-05, 3.821682184934616e-05, 4.0123239159584045e-05, 4.202965646982193e-05, 4.3936073780059814e-05, 4.58424910902977e-05, 4.7748908400535583e-05, 4.965532571077347e-05, 5.156174302101135e-05, 5.346816033124924e-05, 5.537457764148712e-05, 5.7280994951725006e-05, 5.918741226196289e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 6.0, 2.0, 6.0, 2.0, 7.0, 9.0, 20.0, 26.0, 52.0, 64.0, 112.0, 165.0, 370.0, 686.0, 1361.0, 2853.0, 7410.0, 29048.0, 225060.0, 689726.0, 69537.0, 13706.0, 4387.0, 1913.0, 880.0, 490.0, 255.0, 152.0, 87.0, 50.0, 29.0, 24.0, 11.0, 14.0, 8.0, 5.0, 7.0, 2.0, 3.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.103515625, -0.10020256042480469, -0.09688949584960938, -0.09357643127441406, -0.09026336669921875, -0.08695030212402344, -0.08363723754882812, -0.08032417297363281, -0.0770111083984375, -0.07369804382324219, -0.07038497924804688, -0.06707191467285156, -0.06375885009765625, -0.06044578552246094, -0.057132720947265625, -0.05381965637207031, -0.050506591796875, -0.04719352722167969, -0.043880462646484375, -0.04056739807128906, -0.03725433349609375, -0.03394126892089844, -0.030628204345703125, -0.027315139770507812, -0.0240020751953125, -0.020689010620117188, -0.017375946044921875, -0.014062881469726562, -0.01074981689453125, -0.0074367523193359375, -0.004123687744140625, -0.0008106231689453125, 0.00250244140625, 0.0058155059814453125, 0.009128570556640625, 0.012441635131835938, 0.01575469970703125, 0.019067764282226562, 0.022380828857421875, 0.025693893432617188, 0.0290069580078125, 0.03232002258300781, 0.035633087158203125, 0.03894615173339844, 0.04225921630859375, 0.04557228088378906, 0.048885345458984375, 0.05219841003417969, 0.055511474609375, 0.05882453918457031, 0.062137603759765625, 0.06545066833496094, 0.06876373291015625, 0.07207679748535156, 0.07538986206054688, 0.07870292663574219, 0.0820159912109375, 0.08532905578613281, 0.08864212036132812, 0.09195518493652344, 0.09526824951171875, 0.09858131408691406, 0.10189437866210938, 0.10520744323730469, 0.1085205078125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0, 4.0, 7.0, 5.0, 18.0, 16.0, 20.0, 23.0, 47.0, 45.0, 76.0, 143.0, 121.0, 133.0, 98.0, 64.0, 50.0, 35.0, 27.0, 18.0, 14.0, 12.0, 7.0, 7.0, 3.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08892822265625, -0.085845947265625, -0.082763671875, -0.079681396484375, -0.07659912109375, -0.073516845703125, -0.0704345703125, -0.067352294921875, -0.06427001953125, -0.061187744140625, -0.05810546875, -0.055023193359375, -0.05194091796875, -0.048858642578125, -0.0457763671875, -0.042694091796875, -0.03961181640625, -0.036529541015625, -0.033447265625, -0.030364990234375, -0.02728271484375, -0.024200439453125, -0.0211181640625, -0.018035888671875, -0.01495361328125, -0.011871337890625, -0.0087890625, -0.005706787109375, -0.00262451171875, 0.000457763671875, 0.0035400390625, 0.006622314453125, 0.00970458984375, 0.012786865234375, 0.015869140625, 0.018951416015625, 0.02203369140625, 0.025115966796875, 0.0281982421875, 0.031280517578125, 0.03436279296875, 0.037445068359375, 0.04052734375, 0.043609619140625, 0.04669189453125, 0.049774169921875, 0.0528564453125, 0.055938720703125, 0.05902099609375, 0.062103271484375, 0.065185546875, 0.068267822265625, 0.07135009765625, 0.074432373046875, 0.0775146484375, 0.080596923828125, 0.08367919921875, 0.086761474609375, 0.08984375, 0.092926025390625, 0.09600830078125, 0.099090576171875, 0.1021728515625, 0.105255126953125, 0.10833740234375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 8.0, 15.0, 60.0, 114.0, 232.0, 245.0, 185.0, 98.0, 32.0, 16.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8235732316970825, -1.7516988515853882, -1.6798243522644043, -1.60794997215271, -1.5360755920410156, -1.4642012119293213, -1.3923267126083374, -1.320452332496643, -1.2485778331756592, -1.1767034530639648, -1.104828953742981, -1.0329545736312866, -0.9610801935195923, -0.8892057538032532, -0.8173313140869141, -0.7454569339752197, -0.6735825538635254, -0.6017081141471863, -0.5298337340354919, -0.45795929431915283, -0.3860848844051361, -0.3142104744911194, -0.24233603477478027, -0.17046165466308594, -0.09858721494674683, -0.026712797582149506, 0.045161619782447815, 0.11703604459762573, 0.18891045451164246, 0.2607848644256592, 0.3326593041419983, 0.4045336842536926, 0.4764082431793213, 0.5482826828956604, 0.6201570630073547, 0.6920315027236938, 0.7639058828353882, 0.8357803225517273, 0.9076547622680664, 0.9795291423797607, 1.051403522491455, 1.1232779026031494, 1.1951524019241333, 1.2670267820358276, 1.338901162147522, 1.4107756614685059, 1.4826500415802002, 1.5545244216918945, 1.6263989210128784, 1.6982733011245728, 1.7701478004455566, 1.842022180557251, 1.9138965606689453, 1.9857709407806396, 2.057645320892334, 2.1295199394226074, 2.2013943195343018, 2.273268699645996, 2.3451430797576904, 2.4170174598693848, 2.488892078399658, 2.5607664585113525, 2.632640838623047, 2.704515218734741, 2.7763895988464355]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 3.0, 7.0, 5.0, 4.0, 11.0, 8.0, 8.0, 11.0, 11.0, 20.0, 16.0, 16.0, 14.0, 21.0, 22.0, 34.0, 29.0, 34.0, 36.0, 46.0, 35.0, 36.0, 53.0, 39.0, 42.0, 52.0, 37.0, 45.0, 29.0, 32.0, 36.0, 32.0, 26.0, 28.0, 17.0, 26.0, 16.0, 12.0, 12.0, 6.0, 8.0, 9.0, 6.0, 6.0, 8.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.0415022373199463, -1.007263422012329, -0.9730246663093567, -0.9387859106063843, -0.9045470952987671, -0.8703083395957947, -0.8360695838928223, -0.8018307685852051, -0.7675919532775879, -0.7333531975746155, -0.6991143822669983, -0.6648756265640259, -0.6306368112564087, -0.5963980555534363, -0.5621592998504639, -0.5279204845428467, -0.49368172883987427, -0.45944294333457947, -0.42520415782928467, -0.39096540212631226, -0.35672658681869507, -0.32248783111572266, -0.28824904561042786, -0.25401026010513306, -0.21977147459983826, -0.18553268909454346, -0.15129390358924866, -0.11705513298511505, -0.08281634747982025, -0.04857756197452545, -0.014338791370391846, 0.019899994134902954, 0.054138779640197754, 0.08837756514549255, 0.12261634320020676, 0.15685512125492096, 0.19109390676021576, 0.22533269226551056, 0.25957146286964417, 0.29381024837493896, 0.32804903388023376, 0.36228781938552856, 0.39652660489082336, 0.43076539039611816, 0.4650041460990906, 0.49924296140670776, 0.5334817171096802, 0.5677205324172974, 0.6019592881202698, 0.6361980438232422, 0.6704368591308594, 0.7046756148338318, 0.738914430141449, 0.7731531858444214, 0.8073920011520386, 0.841630756855011, 0.8758695125579834, 0.9101082682609558, 0.944347083568573, 0.9785858392715454, 1.0128246545791626, 1.0470634698867798, 1.0813021659851074, 1.1155409812927246, 1.1497797966003418]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 5.0, 5.0, 4.0, 8.0, 8.0, 10.0, 10.0, 23.0, 38.0, 50.0, 65.0, 111.0, 180.0, 265.0, 455.0, 911.0, 1744.0, 4205.0, 11601.0, 44051.0, 423144.0, 3569093.0, 106386.0, 20529.0, 6392.0, 2535.0, 1125.0, 585.0, 301.0, 179.0, 95.0, 55.0, 42.0, 23.0, 21.0, 10.0, 8.0, 5.0, 5.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34130859375, -0.3318901062011719, -0.32247161865234375, -0.3130531311035156, -0.3036346435546875, -0.2942161560058594, -0.28479766845703125, -0.2753791809082031, -0.265960693359375, -0.2565422058105469, -0.24712371826171875, -0.23770523071289062, -0.2282867431640625, -0.21886825561523438, -0.20944976806640625, -0.20003128051757812, -0.19061279296875, -0.18119430541992188, -0.17177581787109375, -0.16235733032226562, -0.1529388427734375, -0.14352035522460938, -0.13410186767578125, -0.12468338012695312, -0.115264892578125, -0.10584640502929688, -0.09642791748046875, -0.08700942993164062, -0.0775909423828125, -0.06817245483398438, -0.05875396728515625, -0.049335479736328125, -0.0399169921875, -0.030498504638671875, -0.02108001708984375, -0.011661529541015625, -0.0022430419921875, 0.007175445556640625, 0.01659393310546875, 0.026012420654296875, 0.035430908203125, 0.044849395751953125, 0.05426788330078125, 0.06368637084960938, 0.0731048583984375, 0.08252334594726562, 0.09194183349609375, 0.10136032104492188, 0.11077880859375, 0.12019729614257812, 0.12961578369140625, 0.13903427124023438, 0.1484527587890625, 0.15787124633789062, 0.16728973388671875, 0.17670822143554688, 0.186126708984375, 0.19554519653320312, 0.20496368408203125, 0.21438217163085938, 0.2238006591796875, 0.23321914672851562, 0.24263763427734375, 0.2520561218261719, 0.261474609375]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 4.0, 4.0, 7.0, 9.0, 16.0, 21.0, 17.0, 33.0, 34.0, 41.0, 54.0, 65.0, 76.0, 71.0, 80.0, 66.0, 67.0, 49.0, 58.0, 54.0, 45.0, 30.0, 37.0, 22.0, 11.0, 15.0, 5.0, 6.0, 0.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.110107421875, -0.10701370239257812, -0.10391998291015625, -0.10082626342773438, -0.0977325439453125, -0.09463882446289062, -0.09154510498046875, -0.08845138549804688, -0.085357666015625, -0.08226394653320312, -0.07917022705078125, -0.07607650756835938, -0.0729827880859375, -0.06988906860351562, -0.06679534912109375, -0.06370162963867188, -0.06060791015625, -0.057514190673828125, -0.05442047119140625, -0.051326751708984375, -0.0482330322265625, -0.045139312744140625, -0.04204559326171875, -0.038951873779296875, -0.035858154296875, -0.032764434814453125, -0.02967071533203125, -0.026576995849609375, -0.0234832763671875, -0.020389556884765625, -0.01729583740234375, -0.014202117919921875, -0.0111083984375, -0.008014678955078125, -0.00492095947265625, -0.001827239990234375, 0.0012664794921875, 0.004360198974609375, 0.00745391845703125, 0.010547637939453125, 0.013641357421875, 0.016735076904296875, 0.01982879638671875, 0.022922515869140625, 0.0260162353515625, 0.029109954833984375, 0.03220367431640625, 0.035297393798828125, 0.03839111328125, 0.041484832763671875, 0.04457855224609375, 0.047672271728515625, 0.0507659912109375, 0.053859710693359375, 0.05695343017578125, 0.060047149658203125, 0.063140869140625, 0.06623458862304688, 0.06932830810546875, 0.07242202758789062, 0.0755157470703125, 0.07860946655273438, 0.08170318603515625, 0.08479690551757812, 0.087890625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 9.0, 22.0, 60.0, 111.0, 218.0, 487.0, 1037.0, 2590.0, 7368.0, 25929.0, 159213.0, 3554763.0, 381803.0, 43286.0, 10902.0, 3702.0, 1555.0, 664.0, 296.0, 129.0, 76.0, 40.0, 12.0, 10.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20166015625, -0.1938018798828125, -0.185943603515625, -0.1780853271484375, -0.17022705078125, -0.1623687744140625, -0.154510498046875, -0.1466522216796875, -0.1387939453125, -0.1309356689453125, -0.123077392578125, -0.1152191162109375, -0.10736083984375, -0.0995025634765625, -0.091644287109375, -0.0837860107421875, -0.075927734375, -0.0680694580078125, -0.060211181640625, -0.0523529052734375, -0.04449462890625, -0.0366363525390625, -0.028778076171875, -0.0209197998046875, -0.0130615234375, -0.0052032470703125, 0.002655029296875, 0.0105133056640625, 0.01837158203125, 0.0262298583984375, 0.034088134765625, 0.0419464111328125, 0.0498046875, 0.0576629638671875, 0.065521240234375, 0.0733795166015625, 0.08123779296875, 0.0890960693359375, 0.096954345703125, 0.1048126220703125, 0.1126708984375, 0.1205291748046875, 0.128387451171875, 0.1362457275390625, 0.14410400390625, 0.1519622802734375, 0.159820556640625, 0.1676788330078125, 0.175537109375, 0.1833953857421875, 0.191253662109375, 0.1991119384765625, 0.20697021484375, 0.2148284912109375, 0.222686767578125, 0.2305450439453125, 0.2384033203125, 0.2462615966796875, 0.254119873046875, 0.2619781494140625, 0.26983642578125, 0.2776947021484375, 0.285552978515625, 0.2934112548828125, 0.30126953125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 3.0, 9.0, 8.0, 8.0, 19.0, 27.0, 40.0, 52.0, 91.0, 143.0, 353.0, 1329.0, 1231.0, 354.0, 135.0, 86.0, 43.0, 47.0, 19.0, 13.0, 7.0, 9.0, 12.0, 10.0, 6.0, 3.0, 2.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08038330078125, -0.07761001586914062, -0.07483673095703125, -0.07206344604492188, -0.0692901611328125, -0.06651687622070312, -0.06374359130859375, -0.060970306396484375, -0.058197021484375, -0.055423736572265625, -0.05265045166015625, -0.049877166748046875, -0.0471038818359375, -0.044330596923828125, -0.04155731201171875, -0.038784027099609375, -0.0360107421875, -0.033237457275390625, -0.03046417236328125, -0.027690887451171875, -0.0249176025390625, -0.022144317626953125, -0.01937103271484375, -0.016597747802734375, -0.013824462890625, -0.011051177978515625, -0.00827789306640625, -0.005504608154296875, -0.0027313232421875, 4.1961669921875e-05, 0.00281524658203125, 0.005588531494140625, 0.00836181640625, 0.011135101318359375, 0.01390838623046875, 0.016681671142578125, 0.0194549560546875, 0.022228240966796875, 0.02500152587890625, 0.027774810791015625, 0.030548095703125, 0.033321380615234375, 0.03609466552734375, 0.038867950439453125, 0.0416412353515625, 0.044414520263671875, 0.04718780517578125, 0.049961090087890625, 0.052734375, 0.055507659912109375, 0.05828094482421875, 0.061054229736328125, 0.0638275146484375, 0.06660079956054688, 0.06937408447265625, 0.07214736938476562, 0.074920654296875, 0.07769393920898438, 0.08046722412109375, 0.08324050903320312, 0.0860137939453125, 0.08878707885742188, 0.09156036376953125, 0.09433364868164062, 0.09710693359375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 7.0, 5.0, 27.0, 49.0, 105.0, 133.0, 171.0, 164.0, 137.0, 94.0, 61.0, 21.0, 9.0, 10.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.36987996101379395, -0.35131651163101196, -0.33275306224823, -0.314189612865448, -0.295626163482666, -0.27706271409988403, -0.25849923491477966, -0.23993578553199768, -0.2213723361492157, -0.20280888676643372, -0.18424543738365173, -0.16568197309970856, -0.14711852371692657, -0.1285550743341446, -0.10999161750078201, -0.09142816066741943, -0.07286471128463745, -0.05430125817656517, -0.03573780506849289, -0.01717435196042061, 0.0013891011476516724, 0.019952550530433655, 0.038516007363796234, 0.057079464197158813, 0.0756429135799408, 0.09420636296272278, 0.11276981979608536, 0.13133327662944794, 0.14989672601222992, 0.1684601753950119, 0.18702363967895508, 0.20558708906173706, 0.22415059804916382, 0.2427140474319458, 0.2612774968147278, 0.27984094619750977, 0.29840439558029175, 0.31696784496307373, 0.3355313241481781, 0.3540947735309601, 0.37265822291374207, 0.39122167229652405, 0.40978512167930603, 0.428348571062088, 0.4469120502471924, 0.46547549962997437, 0.48403894901275635, 0.5026023983955383, 0.5211658477783203, 0.5397292971611023, 0.5582927465438843, 0.5768561959266663, 0.5954196453094482, 0.6139830946922302, 0.6325465440750122, 0.651110053062439, 0.6696734428405762, 0.6882368922233582, 0.7068003416061401, 0.7253637909889221, 0.7439272403717041, 0.7624906897544861, 0.7810541391372681, 0.7996176481246948, 0.8181810975074768]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 3.0, 11.0, 13.0, 12.0, 7.0, 20.0, 21.0, 21.0, 24.0, 23.0, 35.0, 44.0, 41.0, 61.0, 57.0, 38.0, 52.0, 47.0, 41.0, 53.0, 51.0, 46.0, 53.0, 27.0, 27.0, 26.0, 27.0, 29.0, 22.0, 22.0, 10.0, 10.0, 6.0, 9.0, 4.0, 3.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26835745573043823, -0.2592984139919281, -0.25023937225341797, -0.24118031561374664, -0.23212125897407532, -0.22306221723556519, -0.21400317549705505, -0.20494411885738373, -0.1958850622177124, -0.18682602047920227, -0.17776696383953094, -0.1687079221010208, -0.1596488654613495, -0.15058982372283936, -0.14153078198432922, -0.1324717253446579, -0.12341268360614777, -0.11435363441705704, -0.10529458522796631, -0.09623554348945618, -0.08717648684978485, -0.07811744511127472, -0.06905839592218399, -0.05999934673309326, -0.05094029754400253, -0.041881248354911804, -0.032822199165821075, -0.023763153702020645, -0.014704104512929916, -0.005645055323839188, 0.0034139901399612427, 0.012473039329051971, 0.0215320885181427, 0.03059113770723343, 0.03965018689632416, 0.04870923236012459, 0.05776828154921532, 0.06682732701301575, 0.07588637620210648, 0.0849454253911972, 0.09400447458028793, 0.10306352376937866, 0.11212257295846939, 0.12118162214756012, 0.13024066388607025, 0.13929972052574158, 0.1483587622642517, 0.15741780400276184, 0.16647686064243317, 0.1755359023809433, 0.18459495902061462, 0.19365400075912476, 0.20271305739879608, 0.2117720991373062, 0.22083115577697754, 0.22989019751548767, 0.2389492392539978, 0.24800828099250793, 0.25706732273101807, 0.2661263942718506, 0.2751854360103607, 0.28424447774887085, 0.293303519487381, 0.3023625612258911, 0.31142163276672363]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 7.0, 7.0, 8.0, 13.0, 22.0, 45.0, 73.0, 110.0, 171.0, 292.0, 598.0, 1257.0, 3072.0, 8976.0, 35228.0, 163981.0, 523255.0, 240149.0, 51698.0, 12485.0, 4003.0, 1564.0, 730.0, 357.0, 163.0, 106.0, 71.0, 33.0, 27.0, 20.0, 12.0, 9.0, 6.0, 2.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.298583984375, -0.28850555419921875, -0.2784271240234375, -0.26834869384765625, -0.258270263671875, -0.24819183349609375, -0.2381134033203125, -0.22803497314453125, -0.21795654296875, -0.20787811279296875, -0.1977996826171875, -0.18772125244140625, -0.177642822265625, -0.16756439208984375, -0.1574859619140625, -0.14740753173828125, -0.1373291015625, -0.12725067138671875, -0.1171722412109375, -0.10709381103515625, -0.097015380859375, -0.08693695068359375, -0.0768585205078125, -0.06678009033203125, -0.05670166015625, -0.04662322998046875, -0.0365447998046875, -0.02646636962890625, -0.016387939453125, -0.00630950927734375, 0.0037689208984375, 0.01384735107421875, 0.02392578125, 0.03400421142578125, 0.0440826416015625, 0.05416107177734375, 0.064239501953125, 0.07431793212890625, 0.0843963623046875, 0.09447479248046875, 0.10455322265625, 0.11463165283203125, 0.1247100830078125, 0.13478851318359375, 0.144866943359375, 0.15494537353515625, 0.1650238037109375, 0.17510223388671875, 0.1851806640625, 0.19525909423828125, 0.2053375244140625, 0.21541595458984375, 0.225494384765625, 0.23557281494140625, 0.2456512451171875, 0.25572967529296875, 0.26580810546875, 0.27588653564453125, 0.2859649658203125, 0.29604339599609375, 0.306121826171875, 0.31620025634765625, 0.3262786865234375, 0.33635711669921875, 0.346435546875]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 7.0, 8.0, 15.0, 12.0, 15.0, 21.0, 27.0, 44.0, 45.0, 70.0, 71.0, 77.0, 67.0, 80.0, 72.0, 59.0, 58.0, 54.0, 44.0, 39.0, 39.0, 29.0, 18.0, 11.0, 9.0, 5.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10919189453125, -0.1060028076171875, -0.102813720703125, -0.0996246337890625, -0.096435546875, -0.0932464599609375, -0.090057373046875, -0.0868682861328125, -0.08367919921875, -0.0804901123046875, -0.077301025390625, -0.0741119384765625, -0.0709228515625, -0.0677337646484375, -0.064544677734375, -0.0613555908203125, -0.05816650390625, -0.0549774169921875, -0.051788330078125, -0.0485992431640625, -0.04541015625, -0.0422210693359375, -0.039031982421875, -0.0358428955078125, -0.03265380859375, -0.0294647216796875, -0.026275634765625, -0.0230865478515625, -0.0198974609375, -0.0167083740234375, -0.013519287109375, -0.0103302001953125, -0.00714111328125, -0.0039520263671875, -0.000762939453125, 0.0024261474609375, 0.005615234375, 0.0088043212890625, 0.011993408203125, 0.0151824951171875, 0.01837158203125, 0.0215606689453125, 0.024749755859375, 0.0279388427734375, 0.0311279296875, 0.0343170166015625, 0.037506103515625, 0.0406951904296875, 0.04388427734375, 0.0470733642578125, 0.050262451171875, 0.0534515380859375, 0.056640625, 0.0598297119140625, 0.063018798828125, 0.0662078857421875, 0.06939697265625, 0.0725860595703125, 0.075775146484375, 0.0789642333984375, 0.0821533203125, 0.0853424072265625, 0.088531494140625, 0.0917205810546875, 0.09490966796875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 5.0, 2.0, 9.0, 10.0, 12.0, 14.0, 26.0, 37.0, 63.0, 91.0, 181.0, 316.0, 571.0, 1206.0, 3024.0, 10419.0, 53849.0, 324805.0, 524000.0, 104163.0, 17969.0, 4498.0, 1667.0, 732.0, 370.0, 189.0, 118.0, 71.0, 55.0, 23.0, 19.0, 11.0, 10.0, 9.0, 3.0, 5.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28125, -0.2719306945800781, -0.26261138916015625, -0.2532920837402344, -0.2439727783203125, -0.23465347290039062, -0.22533416748046875, -0.21601486206054688, -0.206695556640625, -0.19737625122070312, -0.18805694580078125, -0.17873764038085938, -0.1694183349609375, -0.16009902954101562, -0.15077972412109375, -0.14146041870117188, -0.13214111328125, -0.12282180786132812, -0.11350250244140625, -0.10418319702148438, -0.0948638916015625, -0.08554458618164062, -0.07622528076171875, -0.06690597534179688, -0.057586669921875, -0.048267364501953125, -0.03894805908203125, -0.029628753662109375, -0.0203094482421875, -0.010990142822265625, -0.00167083740234375, 0.007648468017578125, 0.0169677734375, 0.026287078857421875, 0.03560638427734375, 0.044925689697265625, 0.0542449951171875, 0.06356430053710938, 0.07288360595703125, 0.08220291137695312, 0.091522216796875, 0.10084152221679688, 0.11016082763671875, 0.11948013305664062, 0.1287994384765625, 0.13811874389648438, 0.14743804931640625, 0.15675735473632812, 0.16607666015625, 0.17539596557617188, 0.18471527099609375, 0.19403457641601562, 0.2033538818359375, 0.21267318725585938, 0.22199249267578125, 0.23131179809570312, 0.240631103515625, 0.24995040893554688, 0.25926971435546875, 0.2685890197753906, 0.2779083251953125, 0.2872276306152344, 0.29654693603515625, 0.3058662414550781, 0.315185546875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 6.0, 5.0, 1.0, 6.0, 12.0, 16.0, 22.0, 21.0, 30.0, 40.0, 38.0, 42.0, 60.0, 48.0, 58.0, 66.0, 74.0, 73.0, 51.0, 68.0, 52.0, 47.0, 37.0, 38.0, 22.0, 22.0, 13.0, 10.0, 8.0, 5.0, 5.0, 2.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.44970703125, -0.4364585876464844, -0.42321014404296875, -0.4099617004394531, -0.3967132568359375, -0.3834648132324219, -0.37021636962890625, -0.3569679260253906, -0.343719482421875, -0.3304710388183594, -0.31722259521484375, -0.3039741516113281, -0.2907257080078125, -0.2774772644042969, -0.26422882080078125, -0.2509803771972656, -0.23773193359375, -0.22448348999023438, -0.21123504638671875, -0.19798660278320312, -0.1847381591796875, -0.17148971557617188, -0.15824127197265625, -0.14499282836914062, -0.131744384765625, -0.11849594116210938, -0.10524749755859375, -0.09199905395507812, -0.0787506103515625, -0.06550216674804688, -0.05225372314453125, -0.039005279541015625, -0.0257568359375, -0.012508392333984375, 0.00074005126953125, 0.013988494873046875, 0.0272369384765625, 0.040485382080078125, 0.05373382568359375, 0.06698226928710938, 0.080230712890625, 0.09347915649414062, 0.10672760009765625, 0.11997604370117188, 0.1332244873046875, 0.14647293090820312, 0.15972137451171875, 0.17296981811523438, 0.18621826171875, 0.19946670532226562, 0.21271514892578125, 0.22596359252929688, 0.2392120361328125, 0.2524604797363281, 0.26570892333984375, 0.2789573669433594, 0.292205810546875, 0.3054542541503906, 0.31870269775390625, 0.3319511413574219, 0.3451995849609375, 0.3584480285644531, 0.37169647216796875, 0.3849449157714844, 0.398193359375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 10.0, 21.0, 30.0, 41.0, 98.0, 164.0, 498.0, 2123.0, 30909.0, 941883.0, 68446.0, 3279.0, 611.0, 226.0, 116.0, 44.0, 24.0, 17.0, 13.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47119140625, -0.45757293701171875, -0.4439544677734375, -0.43033599853515625, -0.416717529296875, -0.40309906005859375, -0.3894805908203125, -0.37586212158203125, -0.36224365234375, -0.34862518310546875, -0.3350067138671875, -0.32138824462890625, -0.307769775390625, -0.29415130615234375, -0.2805328369140625, -0.26691436767578125, -0.2532958984375, -0.23967742919921875, -0.2260589599609375, -0.21244049072265625, -0.198822021484375, -0.18520355224609375, -0.1715850830078125, -0.15796661376953125, -0.14434814453125, -0.13072967529296875, -0.1171112060546875, -0.10349273681640625, -0.089874267578125, -0.07625579833984375, -0.0626373291015625, -0.04901885986328125, -0.035400390625, -0.02178192138671875, -0.0081634521484375, 0.00545501708984375, 0.019073486328125, 0.03269195556640625, 0.0463104248046875, 0.05992889404296875, 0.07354736328125, 0.08716583251953125, 0.1007843017578125, 0.11440277099609375, 0.128021240234375, 0.14163970947265625, 0.1552581787109375, 0.16887664794921875, 0.1824951171875, 0.19611358642578125, 0.2097320556640625, 0.22335052490234375, 0.236968994140625, 0.25058746337890625, 0.2642059326171875, 0.27782440185546875, 0.29144287109375, 0.30506134033203125, 0.3186798095703125, 0.33229827880859375, 0.345916748046875, 0.35953521728515625, 0.3731536865234375, 0.38677215576171875, 0.400390625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 3.0, 2.0, 6.0, 6.0, 11.0, 19.0, 12.0, 22.0, 22.0, 35.0, 43.0, 43.0, 58.0, 81.0, 130.0, 132.0, 89.0, 62.0, 51.0, 36.0, 30.0, 35.0, 11.0, 16.0, 15.0, 12.0, 4.0, 6.0, 4.0, 1.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.43865966796875e-05, -7.129088044166565e-05, -6.81951642036438e-05, -6.509944796562195e-05, -6.20037317276001e-05, -5.890801548957825e-05, -5.5812299251556396e-05, -5.2716583013534546e-05, -4.9620866775512695e-05, -4.6525150537490845e-05, -4.3429434299468994e-05, -4.0333718061447144e-05, -3.723800182342529e-05, -3.414228558540344e-05, -3.104656934738159e-05, -2.795085310935974e-05, -2.485513687133789e-05, -2.175942063331604e-05, -1.866370439529419e-05, -1.556798815727234e-05, -1.2472271919250488e-05, -9.376555681228638e-06, -6.280839443206787e-06, -3.1851232051849365e-06, -8.940696716308594e-08, 3.0063092708587646e-06, 6.102025508880615e-06, 9.197741746902466e-06, 1.2293457984924316e-05, 1.5389174222946167e-05, 1.8484890460968018e-05, 2.1580606698989868e-05, 2.467632293701172e-05, 2.777203917503357e-05, 3.086775541305542e-05, 3.396347165107727e-05, 3.705918788909912e-05, 4.015490412712097e-05, 4.325062036514282e-05, 4.634633660316467e-05, 4.9442052841186523e-05, 5.2537769079208374e-05, 5.5633485317230225e-05, 5.8729201555252075e-05, 6.182491779327393e-05, 6.492063403129578e-05, 6.801635026931763e-05, 7.111206650733948e-05, 7.420778274536133e-05, 7.730349898338318e-05, 8.039921522140503e-05, 8.349493145942688e-05, 8.659064769744873e-05, 8.968636393547058e-05, 9.278208017349243e-05, 9.587779641151428e-05, 9.897351264953613e-05, 0.00010206922888755798, 0.00010516494512557983, 0.00010826066136360168, 0.00011135637760162354, 0.00011445209383964539, 0.00011754781007766724, 0.00012064352631568909, 0.00012373924255371094]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 3.0, 8.0, 17.0, 17.0, 22.0, 41.0, 73.0, 136.0, 247.0, 626.0, 1936.0, 13528.0, 371340.0, 636580.0, 20335.0, 2369.0, 678.0, 297.0, 136.0, 75.0, 37.0, 20.0, 14.0, 6.0, 9.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20849609375, -0.19810867309570312, -0.18772125244140625, -0.17733383178710938, -0.1669464111328125, -0.15655899047851562, -0.14617156982421875, -0.13578414916992188, -0.125396728515625, -0.11500930786132812, -0.10462188720703125, -0.09423446655273438, -0.0838470458984375, -0.07345962524414062, -0.06307220458984375, -0.052684783935546875, -0.04229736328125, -0.031909942626953125, -0.02152252197265625, -0.011135101318359375, -0.0007476806640625, 0.009639739990234375, 0.02002716064453125, 0.030414581298828125, 0.040802001953125, 0.051189422607421875, 0.06157684326171875, 0.07196426391601562, 0.0823516845703125, 0.09273910522460938, 0.10312652587890625, 0.11351394653320312, 0.1239013671875, 0.13428878784179688, 0.14467620849609375, 0.15506362915039062, 0.1654510498046875, 0.17583847045898438, 0.18622589111328125, 0.19661331176757812, 0.207000732421875, 0.21738815307617188, 0.22777557373046875, 0.23816299438476562, 0.2485504150390625, 0.2589378356933594, 0.26932525634765625, 0.2797126770019531, 0.29010009765625, 0.3004875183105469, 0.31087493896484375, 0.3212623596191406, 0.3316497802734375, 0.3420372009277344, 0.35242462158203125, 0.3628120422363281, 0.373199462890625, 0.3835868835449219, 0.39397430419921875, 0.4043617248535156, 0.4147491455078125, 0.4251365661621094, 0.43552398681640625, 0.4459114074707031, 0.456298828125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 5.0, 13.0, 8.0, 22.0, 45.0, 76.0, 147.0, 216.0, 207.0, 115.0, 66.0, 38.0, 26.0, 9.0, 6.0, 5.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.458251953125, -0.4477958679199219, -0.43733978271484375, -0.4268836975097656, -0.4164276123046875, -0.4059715270996094, -0.39551544189453125, -0.3850593566894531, -0.374603271484375, -0.3641471862792969, -0.35369110107421875, -0.3432350158691406, -0.3327789306640625, -0.3223228454589844, -0.31186676025390625, -0.3014106750488281, -0.29095458984375, -0.2804985046386719, -0.27004241943359375, -0.2595863342285156, -0.2491302490234375, -0.23867416381835938, -0.22821807861328125, -0.21776199340820312, -0.207305908203125, -0.19684982299804688, -0.18639373779296875, -0.17593765258789062, -0.1654815673828125, -0.15502548217773438, -0.14456939697265625, -0.13411331176757812, -0.1236572265625, -0.11320114135742188, -0.10274505615234375, -0.09228897094726562, -0.0818328857421875, -0.07137680053710938, -0.06092071533203125, -0.050464630126953125, -0.040008544921875, -0.029552459716796875, -0.01909637451171875, -0.008640289306640625, 0.0018157958984375, 0.012271881103515625, 0.02272796630859375, 0.033184051513671875, 0.04364013671875, 0.054096221923828125, 0.06455230712890625, 0.07500839233398438, 0.0854644775390625, 0.09592056274414062, 0.10637664794921875, 0.11683273315429688, 0.127288818359375, 0.13774490356445312, 0.14820098876953125, 0.15865707397460938, 0.1691131591796875, 0.17956924438476562, 0.19002532958984375, 0.20048141479492188, 0.2109375]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 16.0, 14.0, 29.0, 43.0, 74.0, 87.0, 149.0, 163.0, 131.0, 100.0, 71.0, 40.0, 34.0, 26.0, 10.0, 8.0, 6.0, 4.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-2.7389912605285645, -2.6697049140930176, -2.6004185676574707, -2.5311319828033447, -2.461845636367798, -2.392559289932251, -2.323272943496704, -2.2539865970611572, -2.1847000122070312, -2.1154136657714844, -2.0461273193359375, -1.976840853691101, -1.9075543880462646, -1.8382680416107178, -1.768981695175171, -1.699695348739624, -1.6304090023040771, -1.5611226558685303, -1.4918361902236938, -1.422549843788147, -1.3532633781433105, -1.2839770317077637, -1.2146906852722168, -1.14540433883667, -1.0761178731918335, -1.0068315267562866, -0.9375450611114502, -0.8682587146759033, -0.7989723086357117, -0.72968590259552, -0.6603995561599731, -0.5911131501197815, -0.5218267440795898, -0.4525403380393982, -0.38325396180152893, -0.31396758556365967, -0.24468117952346802, -0.17539477348327637, -0.1061083972454071, -0.03682202100753784, 0.03246438503265381, 0.10175077617168427, 0.17103716731071472, 0.24032355844974518, 0.30960994958877563, 0.3788963556289673, 0.44818273186683655, 0.5174691081047058, 0.5867555141448975, 0.6560419201850891, 0.7253283262252808, 0.7946146726608276, 0.8639010787010193, 0.9331874847412109, 1.0024738311767578, 1.0717601776123047, 1.1410466432571411, 1.210332989692688, 1.2796194553375244, 1.3489058017730713, 1.4181921482086182, 1.4874786138534546, 1.5567649602890015, 1.626051425933838, 1.6953377723693848]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 5.0, 5.0, 3.0, 7.0, 8.0, 15.0, 14.0, 17.0, 13.0, 17.0, 22.0, 18.0, 31.0, 36.0, 38.0, 35.0, 35.0, 44.0, 40.0, 44.0, 51.0, 41.0, 40.0, 46.0, 34.0, 39.0, 33.0, 35.0, 38.0, 33.0, 22.0, 25.0, 27.0, 20.0, 14.0, 13.0, 12.0, 7.0, 10.0, 6.0, 2.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.6305263042449951, -1.5753449201583862, -1.5201635360717773, -1.464982271194458, -1.4098008871078491, -1.3546195030212402, -1.299438238143921, -1.244256854057312, -1.1890754699707031, -1.1338940858840942, -1.0787127017974854, -1.023531436920166, -0.9683500528335571, -0.9131686687469482, -0.8579873442649841, -0.80280601978302, -0.7476246356964111, -0.6924432516098022, -0.6372619271278381, -0.582080602645874, -0.5268992185592651, -0.47171786427497864, -0.41653650999069214, -0.36135515570640564, -0.30617380142211914, -0.25099244713783264, -0.19581109285354614, -0.14062973856925964, -0.08544838428497314, -0.030267030000686646, 0.024914324283599854, 0.08009567856788635, 0.1352771520614624, 0.1904585063457489, 0.2456398606300354, 0.3008212149143219, 0.3560025691986084, 0.4111839234828949, 0.4663652777671814, 0.5215466022491455, 0.5767279863357544, 0.6319093704223633, 0.6870906949043274, 0.7422720193862915, 0.7974534034729004, 0.8526347875595093, 0.9078161120414734, 0.9629974365234375, 1.0181788206100464, 1.0733602046966553, 1.1285414695739746, 1.1837228536605835, 1.2389042377471924, 1.2940856218338013, 1.3492670059204102, 1.4044482707977295, 1.4596296548843384, 1.5148110389709473, 1.5699923038482666, 1.6251736879348755, 1.6803550720214844, 1.7355364561080933, 1.7907178401947021, 1.8458991050720215, 1.9010804891586304]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 6.0, 7.0, 16.0, 16.0, 33.0, 31.0, 59.0, 80.0, 159.0, 367.0, 791.0, 2644.0, 12916.0, 161491.0, 3892981.0, 109178.0, 10213.0, 2030.0, 657.0, 257.0, 102.0, 81.0, 47.0, 35.0, 24.0, 21.0, 13.0, 6.0, 9.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.49853515625, -0.4836273193359375, -0.468719482421875, -0.4538116455078125, -0.43890380859375, -0.4239959716796875, -0.409088134765625, -0.3941802978515625, -0.3792724609375, -0.3643646240234375, -0.349456787109375, -0.3345489501953125, -0.31964111328125, -0.3047332763671875, -0.289825439453125, -0.2749176025390625, -0.260009765625, -0.2451019287109375, -0.230194091796875, -0.2152862548828125, -0.20037841796875, -0.1854705810546875, -0.170562744140625, -0.1556549072265625, -0.1407470703125, -0.1258392333984375, -0.110931396484375, -0.0960235595703125, -0.08111572265625, -0.0662078857421875, -0.051300048828125, -0.0363922119140625, -0.021484375, -0.0065765380859375, 0.008331298828125, 0.0232391357421875, 0.03814697265625, 0.0530548095703125, 0.067962646484375, 0.0828704833984375, 0.0977783203125, 0.1126861572265625, 0.127593994140625, 0.1425018310546875, 0.15740966796875, 0.1723175048828125, 0.187225341796875, 0.2021331787109375, 0.217041015625, 0.2319488525390625, 0.246856689453125, 0.2617645263671875, 0.27667236328125, 0.2915802001953125, 0.306488037109375, 0.3213958740234375, 0.3363037109375, 0.3512115478515625, 0.366119384765625, 0.3810272216796875, 0.39593505859375, 0.4108428955078125, 0.425750732421875, 0.4406585693359375, 0.45556640625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 6.0, 4.0, 7.0, 11.0, 22.0, 19.0, 18.0, 35.0, 41.0, 47.0, 43.0, 57.0, 70.0, 69.0, 62.0, 86.0, 67.0, 61.0, 42.0, 42.0, 40.0, 44.0, 30.0, 21.0, 25.0, 9.0, 5.0, 8.0, 6.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11517333984375, -0.111846923828125, -0.1085205078125, -0.105194091796875, -0.10186767578125, -0.098541259765625, -0.09521484375, -0.091888427734375, -0.08856201171875, -0.085235595703125, -0.0819091796875, -0.078582763671875, -0.07525634765625, -0.071929931640625, -0.068603515625, -0.065277099609375, -0.06195068359375, -0.058624267578125, -0.0552978515625, -0.051971435546875, -0.04864501953125, -0.045318603515625, -0.0419921875, -0.038665771484375, -0.03533935546875, -0.032012939453125, -0.0286865234375, -0.025360107421875, -0.02203369140625, -0.018707275390625, -0.015380859375, -0.012054443359375, -0.00872802734375, -0.005401611328125, -0.0020751953125, 0.001251220703125, 0.00457763671875, 0.007904052734375, 0.01123046875, 0.014556884765625, 0.01788330078125, 0.021209716796875, 0.0245361328125, 0.027862548828125, 0.03118896484375, 0.034515380859375, 0.037841796875, 0.041168212890625, 0.04449462890625, 0.047821044921875, 0.0511474609375, 0.054473876953125, 0.05780029296875, 0.061126708984375, 0.064453125, 0.067779541015625, 0.07110595703125, 0.074432373046875, 0.0777587890625, 0.081085205078125, 0.08441162109375, 0.087738037109375, 0.091064453125, 0.094390869140625, 0.09771728515625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 8.0, 2.0, 5.0, 7.0, 22.0, 21.0, 31.0, 65.0, 83.0, 134.0, 210.0, 419.0, 726.0, 1416.0, 2842.0, 6403.0, 17119.0, 55403.0, 280771.0, 3053429.0, 640532.0, 92599.0, 25299.0, 9037.0, 3794.0, 1776.0, 889.0, 498.0, 254.0, 178.0, 112.0, 72.0, 41.0, 22.0, 17.0, 19.0, 16.0, 8.0, 7.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1591796875, -0.1534290313720703, -0.14767837524414062, -0.14192771911621094, -0.13617706298828125, -0.13042640686035156, -0.12467575073242188, -0.11892509460449219, -0.1131744384765625, -0.10742378234863281, -0.10167312622070312, -0.09592247009277344, -0.09017181396484375, -0.08442115783691406, -0.07867050170898438, -0.07291984558105469, -0.067169189453125, -0.06141853332519531, -0.055667877197265625, -0.04991722106933594, -0.04416656494140625, -0.03841590881347656, -0.032665252685546875, -0.026914596557617188, -0.0211639404296875, -0.015413284301757812, -0.009662628173828125, -0.0039119720458984375, 0.00183868408203125, 0.0075893402099609375, 0.013339996337890625, 0.019090652465820312, 0.02484130859375, 0.030591964721679688, 0.036342620849609375, 0.04209327697753906, 0.04784393310546875, 0.05359458923339844, 0.059345245361328125, 0.06509590148925781, 0.0708465576171875, 0.07659721374511719, 0.08234786987304688, 0.08809852600097656, 0.09384918212890625, 0.09959983825683594, 0.10535049438476562, 0.11110115051269531, 0.116851806640625, 0.12260246276855469, 0.12835311889648438, 0.13410377502441406, 0.13985443115234375, 0.14560508728027344, 0.15135574340820312, 0.1571063995361328, 0.1628570556640625, 0.1686077117919922, 0.17435836791992188, 0.18010902404785156, 0.18585968017578125, 0.19161033630371094, 0.19736099243164062, 0.2031116485595703, 0.2088623046875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 6.0, 2.0, 5.0, 7.0, 10.0, 9.0, 17.0, 37.0, 41.0, 101.0, 187.0, 478.0, 1628.0, 886.0, 292.0, 139.0, 83.0, 45.0, 30.0, 20.0, 17.0, 14.0, 7.0, 8.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1412353515625, -0.1366443634033203, -0.13205337524414062, -0.12746238708496094, -0.12287139892578125, -0.11828041076660156, -0.11368942260742188, -0.10909843444824219, -0.1045074462890625, -0.09991645812988281, -0.09532546997070312, -0.09073448181152344, -0.08614349365234375, -0.08155250549316406, -0.07696151733398438, -0.07237052917480469, -0.067779541015625, -0.06318855285644531, -0.058597564697265625, -0.05400657653808594, -0.04941558837890625, -0.04482460021972656, -0.040233612060546875, -0.03564262390136719, -0.0310516357421875, -0.026460647583007812, -0.021869659423828125, -0.017278671264648438, -0.01268768310546875, -0.008096694946289062, -0.003505706787109375, 0.0010852813720703125, 0.00567626953125, 0.010267257690429688, 0.014858245849609375, 0.019449234008789062, 0.02404022216796875, 0.028631210327148438, 0.033222198486328125, 0.03781318664550781, 0.0424041748046875, 0.04699516296386719, 0.051586151123046875, 0.05617713928222656, 0.06076812744140625, 0.06535911560058594, 0.06995010375976562, 0.07454109191894531, 0.079132080078125, 0.08372306823730469, 0.08831405639648438, 0.09290504455566406, 0.09749603271484375, 0.10208702087402344, 0.10667800903320312, 0.11126899719238281, 0.1158599853515625, 0.12045097351074219, 0.12504196166992188, 0.12963294982910156, 0.13422393798828125, 0.13881492614746094, 0.14340591430664062, 0.1479969024658203, 0.152587890625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 5.0, 13.0, 35.0, 39.0, 54.0, 104.0, 140.0, 126.0, 127.0, 128.0, 82.0, 60.0, 37.0, 30.0, 14.0, 7.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4504780173301697, -0.4290088713169098, -0.4075397551059723, -0.3860706090927124, -0.3646014928817749, -0.343132346868515, -0.3216632008552551, -0.3001940846443176, -0.27872493863105774, -0.25725579261779785, -0.23578667640686035, -0.21431753039360046, -0.19284839928150177, -0.17137926816940308, -0.1499101221561432, -0.1284409910440445, -0.1069718599319458, -0.0855027288198471, -0.06403359025716782, -0.042564451694488525, -0.02109532058238983, 0.0003738105297088623, 0.02184295654296875, 0.043312087655067444, 0.06478121876716614, 0.08625034987926483, 0.10771948844194412, 0.1291886270046234, 0.1506577581167221, 0.1721268892288208, 0.1935960352420807, 0.21506516635417938, 0.23653429746627808, 0.25800344347953796, 0.27947255969047546, 0.30094170570373535, 0.32241082191467285, 0.34387996792793274, 0.3653491139411926, 0.3868182301521301, 0.40828737616539, 0.4297565221786499, 0.4512256383895874, 0.4726947844028473, 0.4941639304161072, 0.5156330466270447, 0.537102222442627, 0.5585713386535645, 0.580040454864502, 0.6015095710754395, 0.6229787468910217, 0.6444478631019592, 0.6659169793128967, 0.687386155128479, 0.7088552713394165, 0.730324387550354, 0.7517935037612915, 0.773262619972229, 0.7947317957878113, 0.8162009119987488, 0.8376700282096863, 0.8591392040252686, 0.880608320236206, 0.9020774364471436, 0.9235466122627258]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 5.0, 10.0, 3.0, 13.0, 13.0, 12.0, 22.0, 22.0, 18.0, 25.0, 37.0, 28.0, 27.0, 34.0, 35.0, 34.0, 51.0, 36.0, 53.0, 41.0, 38.0, 28.0, 41.0, 49.0, 49.0, 21.0, 32.0, 21.0, 27.0, 19.0, 24.0, 25.0, 13.0, 10.0, 15.0, 10.0, 14.0, 9.0, 11.0, 10.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.33872050046920776, -0.32775643467903137, -0.31679239869117737, -0.305828332901001, -0.294864296913147, -0.2839002311229706, -0.2729361653327942, -0.2619721293449402, -0.2510080933570862, -0.24004404246807098, -0.2290799915790558, -0.2181159257888794, -0.2071518898010254, -0.196187824010849, -0.1852237731218338, -0.1742597222328186, -0.1632956564426422, -0.15233160555362701, -0.14136755466461182, -0.13040348887443542, -0.11943944543600082, -0.10847539454698563, -0.09751133620738983, -0.08654728531837463, -0.07558323442935944, -0.06461918354034424, -0.05365512892603874, -0.042691074311733246, -0.03172702342271805, -0.02076297253370285, -0.009798914194107056, 0.001165136694908142, 0.01212918758392334, 0.023093240335583687, 0.034057293087244034, 0.04502134770154953, 0.05598539859056473, 0.06694944947957993, 0.07791350781917572, 0.08887755870819092, 0.09984160959720612, 0.11080566048622131, 0.12176971137523651, 0.1327337622642517, 0.1436978280544281, 0.1546618640422821, 0.1656259298324585, 0.1765899807214737, 0.1875540316104889, 0.1985180824995041, 0.2094821333885193, 0.22044619917869568, 0.23141023516654968, 0.24237430095672607, 0.2533383369445801, 0.26430240273475647, 0.27526646852493286, 0.28623053431510925, 0.29719457030296326, 0.30815863609313965, 0.31912267208099365, 0.33008673787117004, 0.34105080366134644, 0.35201483964920044, 0.36297887563705444]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 6.0, 9.0, 16.0, 25.0, 49.0, 66.0, 94.0, 195.0, 377.0, 727.0, 1615.0, 4173.0, 14413.0, 70004.0, 328533.0, 459177.0, 132789.0, 25661.0, 6392.0, 2281.0, 935.0, 454.0, 236.0, 126.0, 69.0, 40.0, 28.0, 17.0, 14.0, 10.0, 10.0, 5.0, 3.0, 6.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3525390625, -0.3422279357910156, -0.33191680908203125, -0.3216056823730469, -0.3112945556640625, -0.3009834289550781, -0.29067230224609375, -0.2803611755371094, -0.270050048828125, -0.2597389221191406, -0.24942779541015625, -0.23911666870117188, -0.2288055419921875, -0.21849441528320312, -0.20818328857421875, -0.19787216186523438, -0.18756103515625, -0.17724990844726562, -0.16693878173828125, -0.15662765502929688, -0.1463165283203125, -0.13600540161132812, -0.12569427490234375, -0.11538314819335938, -0.105072021484375, -0.09476089477539062, -0.08444976806640625, -0.07413864135742188, -0.0638275146484375, -0.053516387939453125, -0.04320526123046875, -0.032894134521484375, -0.0225830078125, -0.012271881103515625, -0.00196075439453125, 0.008350372314453125, 0.0186614990234375, 0.028972625732421875, 0.03928375244140625, 0.049594879150390625, 0.059906005859375, 0.07021713256835938, 0.08052825927734375, 0.09083938598632812, 0.1011505126953125, 0.11146163940429688, 0.12177276611328125, 0.13208389282226562, 0.14239501953125, 0.15270614624023438, 0.16301727294921875, 0.17332839965820312, 0.1836395263671875, 0.19395065307617188, 0.20426177978515625, 0.21457290649414062, 0.224884033203125, 0.23519515991210938, 0.24550628662109375, 0.2558174133300781, 0.2661285400390625, 0.2764396667480469, 0.28675079345703125, 0.2970619201660156, 0.307373046875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 7.0, 13.0, 16.0, 16.0, 21.0, 31.0, 40.0, 42.0, 45.0, 45.0, 68.0, 81.0, 86.0, 67.0, 61.0, 62.0, 56.0, 48.0, 43.0, 37.0, 31.0, 30.0, 10.0, 15.0, 8.0, 11.0, 3.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1170654296875, -0.11361026763916016, -0.11015510559082031, -0.10669994354248047, -0.10324478149414062, -0.09978961944580078, -0.09633445739746094, -0.0928792953491211, -0.08942413330078125, -0.0859689712524414, -0.08251380920410156, -0.07905864715576172, -0.07560348510742188, -0.07214832305908203, -0.06869316101074219, -0.06523799896240234, -0.0617828369140625, -0.058327674865722656, -0.05487251281738281, -0.05141735076904297, -0.047962188720703125, -0.04450702667236328, -0.04105186462402344, -0.037596702575683594, -0.03414154052734375, -0.030686378479003906, -0.027231216430664062, -0.02377605438232422, -0.020320892333984375, -0.01686573028564453, -0.013410568237304688, -0.009955406188964844, -0.006500244140625, -0.0030450820922851562, 0.0004100799560546875, 0.0038652420043945312, 0.007320404052734375, 0.010775566101074219, 0.014230728149414062, 0.017685890197753906, 0.02114105224609375, 0.024596214294433594, 0.028051376342773438, 0.03150653839111328, 0.034961700439453125, 0.03841686248779297, 0.04187202453613281, 0.045327186584472656, 0.0487823486328125, 0.052237510681152344, 0.05569267272949219, 0.05914783477783203, 0.06260299682617188, 0.06605815887451172, 0.06951332092285156, 0.0729684829711914, 0.07642364501953125, 0.0798788070678711, 0.08333396911621094, 0.08678913116455078, 0.09024429321289062, 0.09369945526123047, 0.09715461730957031, 0.10060977935791016, 0.10406494140625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 7.0, 11.0, 11.0, 19.0, 27.0, 24.0, 49.0, 86.0, 139.0, 234.0, 442.0, 936.0, 2271.0, 7800.0, 41968.0, 300403.0, 558811.0, 112053.0, 16436.0, 4003.0, 1395.0, 621.0, 335.0, 181.0, 113.0, 55.0, 48.0, 21.0, 14.0, 12.0, 10.0, 7.0, 3.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.338134765625, -0.3265724182128906, -0.31501007080078125, -0.3034477233886719, -0.2918853759765625, -0.2803230285644531, -0.26876068115234375, -0.2571983337402344, -0.245635986328125, -0.23407363891601562, -0.22251129150390625, -0.21094894409179688, -0.1993865966796875, -0.18782424926757812, -0.17626190185546875, -0.16469955444335938, -0.15313720703125, -0.14157485961914062, -0.13001251220703125, -0.11845016479492188, -0.1068878173828125, -0.09532546997070312, -0.08376312255859375, -0.07220077514648438, -0.060638427734375, -0.049076080322265625, -0.03751373291015625, -0.025951385498046875, -0.0143890380859375, -0.002826690673828125, 0.00873565673828125, 0.020298004150390625, 0.0318603515625, 0.043422698974609375, 0.05498504638671875, 0.06654739379882812, 0.0781097412109375, 0.08967208862304688, 0.10123443603515625, 0.11279678344726562, 0.124359130859375, 0.13592147827148438, 0.14748382568359375, 0.15904617309570312, 0.1706085205078125, 0.18217086791992188, 0.19373321533203125, 0.20529556274414062, 0.21685791015625, 0.22842025756835938, 0.23998260498046875, 0.2515449523925781, 0.2631072998046875, 0.2746696472167969, 0.28623199462890625, 0.2977943420410156, 0.309356689453125, 0.3209190368652344, 0.33248138427734375, 0.3440437316894531, 0.3556060791015625, 0.3671684265136719, 0.37873077392578125, 0.3902931213378906, 0.40185546875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 4.0, 8.0, 8.0, 17.0, 9.0, 17.0, 20.0, 22.0, 15.0, 19.0, 30.0, 31.0, 34.0, 27.0, 31.0, 42.0, 43.0, 49.0, 51.0, 62.0, 45.0, 43.0, 43.0, 41.0, 35.0, 40.0, 38.0, 28.0, 20.0, 25.0, 18.0, 17.0, 18.0, 15.0, 7.0, 7.0, 5.0, 3.0, 3.0, 5.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.396240234375, -0.38466644287109375, -0.3730926513671875, -0.36151885986328125, -0.349945068359375, -0.33837127685546875, -0.3267974853515625, -0.31522369384765625, -0.30364990234375, -0.29207611083984375, -0.2805023193359375, -0.26892852783203125, -0.257354736328125, -0.24578094482421875, -0.2342071533203125, -0.22263336181640625, -0.2110595703125, -0.19948577880859375, -0.1879119873046875, -0.17633819580078125, -0.164764404296875, -0.15319061279296875, -0.1416168212890625, -0.13004302978515625, -0.11846923828125, -0.10689544677734375, -0.0953216552734375, -0.08374786376953125, -0.072174072265625, -0.06060028076171875, -0.0490264892578125, -0.03745269775390625, -0.02587890625, -0.01430511474609375, -0.0027313232421875, 0.00884246826171875, 0.020416259765625, 0.03199005126953125, 0.0435638427734375, 0.05513763427734375, 0.06671142578125, 0.07828521728515625, 0.0898590087890625, 0.10143280029296875, 0.113006591796875, 0.12458038330078125, 0.1361541748046875, 0.14772796630859375, 0.1593017578125, 0.17087554931640625, 0.1824493408203125, 0.19402313232421875, 0.205596923828125, 0.21717071533203125, 0.2287445068359375, 0.24031829833984375, 0.25189208984375, 0.26346588134765625, 0.2750396728515625, 0.28661346435546875, 0.298187255859375, 0.30976104736328125, 0.3213348388671875, 0.33290863037109375, 0.344482421875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 0.0, 2.0, 2.0, 0.0, 4.0, 13.0, 8.0, 17.0, 20.0, 33.0, 63.0, 104.0, 212.0, 453.0, 1315.0, 6240.0, 67839.0, 750189.0, 205555.0, 13050.0, 2154.0, 670.0, 283.0, 133.0, 77.0, 37.0, 29.0, 13.0, 11.0, 8.0, 13.0, 7.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0], "bins": [-0.373779296875, -0.3652229309082031, -0.35666656494140625, -0.3481101989746094, -0.3395538330078125, -0.3309974670410156, -0.32244110107421875, -0.3138847351074219, -0.305328369140625, -0.2967720031738281, -0.28821563720703125, -0.2796592712402344, -0.2711029052734375, -0.2625465393066406, -0.25399017333984375, -0.24543380737304688, -0.23687744140625, -0.22832107543945312, -0.21976470947265625, -0.21120834350585938, -0.2026519775390625, -0.19409561157226562, -0.18553924560546875, -0.17698287963867188, -0.168426513671875, -0.15987014770507812, -0.15131378173828125, -0.14275741577148438, -0.1342010498046875, -0.12564468383789062, -0.11708831787109375, -0.10853195190429688, -0.0999755859375, -0.09141921997070312, -0.08286285400390625, -0.07430648803710938, -0.0657501220703125, -0.057193756103515625, -0.04863739013671875, -0.040081024169921875, -0.031524658203125, -0.022968292236328125, -0.01441192626953125, -0.005855560302734375, 0.0027008056640625, 0.011257171630859375, 0.01981353759765625, 0.028369903564453125, 0.03692626953125, 0.045482635498046875, 0.05403900146484375, 0.06259536743164062, 0.0711517333984375, 0.07970809936523438, 0.08826446533203125, 0.09682083129882812, 0.105377197265625, 0.11393356323242188, 0.12248992919921875, 0.13104629516601562, 0.1396026611328125, 0.14815902709960938, 0.15671539306640625, 0.16527175903320312, 0.173828125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 4.0, 6.0, 10.0, 15.0, 16.0, 31.0, 36.0, 32.0, 62.0, 72.0, 58.0, 83.0, 95.0, 80.0, 62.0, 69.0, 52.0, 55.0, 41.0, 26.0, 22.0, 17.0, 16.0, 7.0, 10.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-9.071826934814453e-05, -8.79308208823204e-05, -8.514337241649628e-05, -8.235592395067215e-05, -7.956847548484802e-05, -7.67810270190239e-05, -7.399357855319977e-05, -7.120613008737564e-05, -6.841868162155151e-05, -6.563123315572739e-05, -6.284378468990326e-05, -6.005633622407913e-05, -5.7268887758255005e-05, -5.448143929243088e-05, -5.169399082660675e-05, -4.890654236078262e-05, -4.6119093894958496e-05, -4.333164542913437e-05, -4.054419696331024e-05, -3.7756748497486115e-05, -3.496930003166199e-05, -3.218185156583786e-05, -2.9394403100013733e-05, -2.6606954634189606e-05, -2.381950616836548e-05, -2.103205770254135e-05, -1.8244609236717224e-05, -1.5457160770893097e-05, -1.266971230506897e-05, -9.882263839244843e-06, -7.094815373420715e-06, -4.307366907596588e-06, -1.519918441772461e-06, 1.2675300240516663e-06, 4.0549784898757935e-06, 6.842426955699921e-06, 9.629875421524048e-06, 1.2417323887348175e-05, 1.5204772353172302e-05, 1.799222081899643e-05, 2.0779669284820557e-05, 2.3567117750644684e-05, 2.635456621646881e-05, 2.9142014682292938e-05, 3.1929463148117065e-05, 3.471691161394119e-05, 3.750436007976532e-05, 4.029180854558945e-05, 4.3079257011413574e-05, 4.58667054772377e-05, 4.865415394306183e-05, 5.1441602408885956e-05, 5.422905087471008e-05, 5.701649934053421e-05, 5.980394780635834e-05, 6.259139627218246e-05, 6.537884473800659e-05, 6.816629320383072e-05, 7.095374166965485e-05, 7.374119013547897e-05, 7.65286386013031e-05, 7.931608706712723e-05, 8.210353553295135e-05, 8.489098399877548e-05, 8.767843246459961e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 6.0, 4.0, 5.0, 6.0, 10.0, 13.0, 36.0, 35.0, 55.0, 94.0, 123.0, 184.0, 305.0, 580.0, 1040.0, 2280.0, 6029.0, 20240.0, 86001.0, 325236.0, 429309.0, 131866.0, 30540.0, 8570.0, 2999.0, 1283.0, 704.0, 365.0, 225.0, 143.0, 85.0, 50.0, 44.0, 26.0, 21.0, 11.0, 6.0, 7.0, 8.0, 3.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.1124267578125, -0.10843276977539062, -0.10443878173828125, -0.10044479370117188, -0.0964508056640625, -0.09245681762695312, -0.08846282958984375, -0.08446884155273438, -0.080474853515625, -0.07648086547851562, -0.07248687744140625, -0.06849288940429688, -0.0644989013671875, -0.060504913330078125, -0.05651092529296875, -0.052516937255859375, -0.04852294921875, -0.044528961181640625, -0.04053497314453125, -0.036540985107421875, -0.0325469970703125, -0.028553009033203125, -0.02455902099609375, -0.020565032958984375, -0.016571044921875, -0.012577056884765625, -0.00858306884765625, -0.004589080810546875, -0.0005950927734375, 0.003398895263671875, 0.00739288330078125, 0.011386871337890625, 0.015380859375, 0.019374847412109375, 0.02336883544921875, 0.027362823486328125, 0.0313568115234375, 0.035350799560546875, 0.03934478759765625, 0.043338775634765625, 0.047332763671875, 0.051326751708984375, 0.05532073974609375, 0.059314727783203125, 0.0633087158203125, 0.06730270385742188, 0.07129669189453125, 0.07529067993164062, 0.07928466796875, 0.08327865600585938, 0.08727264404296875, 0.09126663208007812, 0.0952606201171875, 0.09925460815429688, 0.10324859619140625, 0.10724258422851562, 0.111236572265625, 0.11523056030273438, 0.11922454833984375, 0.12321853637695312, 0.1272125244140625, 0.13120651245117188, 0.13520050048828125, 0.13919448852539062, 0.1431884765625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 6.0, 2.0, 1.0, 2.0, 7.0, 2.0, 11.0, 26.0, 24.0, 25.0, 39.0, 56.0, 75.0, 84.0, 99.0, 110.0, 101.0, 83.0, 55.0, 58.0, 40.0, 26.0, 25.0, 16.0, 14.0, 8.0, 2.0, 5.0, 6.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18115234375, -0.17539024353027344, -0.16962814331054688, -0.1638660430908203, -0.15810394287109375, -0.1523418426513672, -0.14657974243164062, -0.14081764221191406, -0.1350555419921875, -0.12929344177246094, -0.12353134155273438, -0.11776924133300781, -0.11200714111328125, -0.10624504089355469, -0.10048294067382812, -0.09472084045410156, -0.088958740234375, -0.08319664001464844, -0.07743453979492188, -0.07167243957519531, -0.06591033935546875, -0.06014823913574219, -0.054386138916015625, -0.04862403869628906, -0.0428619384765625, -0.03709983825683594, -0.031337738037109375, -0.025575637817382812, -0.01981353759765625, -0.014051437377929688, -0.008289337158203125, -0.0025272369384765625, 0.00323486328125, 0.008996963500976562, 0.014759063720703125, 0.020521163940429688, 0.02628326416015625, 0.03204536437988281, 0.037807464599609375, 0.04356956481933594, 0.0493316650390625, 0.05509376525878906, 0.060855865478515625, 0.06661796569824219, 0.07238006591796875, 0.07814216613769531, 0.08390426635742188, 0.08966636657714844, 0.095428466796875, 0.10119056701660156, 0.10695266723632812, 0.11271476745605469, 0.11847686767578125, 0.12423896789550781, 0.13000106811523438, 0.13576316833496094, 0.1415252685546875, 0.14728736877441406, 0.15304946899414062, 0.1588115692138672, 0.16457366943359375, 0.1703357696533203, 0.17609786987304688, 0.18185997009277344, 0.1876220703125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 20.0, 59.0, 93.0, 159.0, 208.0, 178.0, 145.0, 69.0, 39.0, 13.0, 5.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.966043710708618, -2.8552286624908447, -2.7444136142730713, -2.633598804473877, -2.5227837562561035, -2.41196870803833, -2.3011536598205566, -2.190338611602783, -2.0795235633850098, -1.9687085151672363, -1.8578935861587524, -1.747078537940979, -1.6362636089324951, -1.5254485607147217, -1.4146335124969482, -1.3038184642791748, -1.1930036544799805, -1.082188606262207, -0.9713736772537231, -0.8605586290359497, -0.749743640422821, -0.6389286518096924, -0.528113603591919, -0.4172986149787903, -0.3064836263656616, -0.19566862285137177, -0.08485361933708191, 0.02596139907836914, 0.1367763876914978, 0.24759137630462646, 0.3584064245223999, 0.46922141313552856, 0.5800361633300781, 0.6908511519432068, 0.8016661405563354, 0.9124811887741089, 1.0232961177825928, 1.1341111660003662, 1.2449262142181396, 1.355741262435913, 1.466556191444397, 1.5773712396621704, 1.6881861686706543, 1.7990012168884277, 1.9098162651062012, 2.0206313133239746, 2.131446361541748, 2.2422611713409424, 2.353076219558716, 2.4638912677764893, 2.5747063159942627, 2.685521125793457, 2.7963361740112305, 2.907151222229004, 3.0179662704467773, 3.128781318664551, 3.239596366882324, 3.3504114151000977, 3.461226463317871, 3.5720415115356445, 3.682856321334839, 3.7936713695526123, 3.9044864177703857, 4.01530122756958, 4.1261162757873535]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 1.0, 0.0, 5.0, 2.0, 0.0, 3.0, 6.0, 9.0, 8.0, 12.0, 24.0, 19.0, 27.0, 31.0, 35.0, 38.0, 39.0, 45.0, 57.0, 50.0, 46.0, 56.0, 53.0, 40.0, 46.0, 45.0, 43.0, 41.0, 31.0, 49.0, 35.0, 32.0, 8.0, 20.0, 14.0, 7.0, 11.0, 8.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.801408052444458, -1.7303305864334106, -1.6592532396316528, -1.5881757736206055, -1.5170984268188477, -1.4460209608078003, -1.374943494796753, -1.3038661479949951, -1.2327886819839478, -1.1617112159729004, -1.0906338691711426, -1.0195564031600952, -0.9484789967536926, -0.87740159034729, -0.8063241243362427, -0.7352467179298401, -0.6641693115234375, -0.5930919051170349, -0.5220144987106323, -0.45093703269958496, -0.3798596262931824, -0.3087822198867798, -0.2377047836780548, -0.16662734746932983, -0.09554994106292725, -0.024472519755363464, 0.04660490155220032, 0.1176823228597641, 0.18875974416732788, 0.25983715057373047, 0.33091458678245544, 0.4019920229911804, 0.473069429397583, 0.5441468358039856, 0.6152242422103882, 0.6863017082214355, 0.7573791146278381, 0.8284565210342407, 0.8995339870452881, 0.9706113934516907, 1.0416887998580933, 1.1127662658691406, 1.1838436126708984, 1.2549210786819458, 1.3259985446929932, 1.397075891494751, 1.4681533575057983, 1.5392308235168457, 1.6103081703186035, 1.6813856363296509, 1.7524629831314087, 1.823540449142456, 1.8946177959442139, 1.9656952619552612, 2.0367727279663086, 2.1078500747680664, 2.178927421569824, 2.250004768371582, 2.321082353591919, 2.3921597003936768, 2.4632370471954346, 2.5343146324157715, 2.6053919792175293, 2.676469326019287, 2.747546911239624]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 7.0, 8.0, 12.0, 20.0, 33.0, 50.0, 89.0, 213.0, 435.0, 1173.0, 4216.0, 21015.0, 334693.0, 3786081.0, 37439.0, 6162.0, 1605.0, 540.0, 230.0, 105.0, 57.0, 42.0, 17.0, 18.0, 11.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.391357421875, -0.3763847351074219, -0.36141204833984375, -0.3464393615722656, -0.3314666748046875, -0.3164939880371094, -0.30152130126953125, -0.2865486145019531, -0.271575927734375, -0.2566032409667969, -0.24163055419921875, -0.22665786743164062, -0.2116851806640625, -0.19671249389648438, -0.18173980712890625, -0.16676712036132812, -0.15179443359375, -0.13682174682617188, -0.12184906005859375, -0.10687637329101562, -0.0919036865234375, -0.07693099975585938, -0.06195831298828125, -0.046985626220703125, -0.032012939453125, -0.017040252685546875, -0.00206756591796875, 0.012905120849609375, 0.0278778076171875, 0.042850494384765625, 0.05782318115234375, 0.07279586791992188, 0.0877685546875, 0.10274124145507812, 0.11771392822265625, 0.13268661499023438, 0.1476593017578125, 0.16263198852539062, 0.17760467529296875, 0.19257736206054688, 0.207550048828125, 0.22252273559570312, 0.23749542236328125, 0.2524681091308594, 0.2674407958984375, 0.2824134826660156, 0.29738616943359375, 0.3123588562011719, 0.32733154296875, 0.3423042297363281, 0.35727691650390625, 0.3722496032714844, 0.3872222900390625, 0.4021949768066406, 0.41716766357421875, 0.4321403503417969, 0.447113037109375, 0.4620857238769531, 0.47705841064453125, 0.4920310974121094, 0.5070037841796875, 0.5219764709472656, 0.5369491577148438, 0.5519218444824219, 0.56689453125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 7.0, 5.0, 2.0, 7.0, 10.0, 13.0, 7.0, 24.0, 25.0, 24.0, 46.0, 46.0, 48.0, 59.0, 56.0, 72.0, 59.0, 63.0, 68.0, 63.0, 46.0, 40.0, 40.0, 37.0, 24.0, 27.0, 31.0, 20.0, 9.0, 12.0, 5.0, 5.0, 4.0, 3.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.123291015625, -0.11966419219970703, -0.11603736877441406, -0.1124105453491211, -0.10878372192382812, -0.10515689849853516, -0.10153007507324219, -0.09790325164794922, -0.09427642822265625, -0.09064960479736328, -0.08702278137207031, -0.08339595794677734, -0.07976913452148438, -0.0761423110961914, -0.07251548767089844, -0.06888866424560547, -0.0652618408203125, -0.06163501739501953, -0.05800819396972656, -0.054381370544433594, -0.050754547119140625, -0.047127723693847656, -0.04350090026855469, -0.03987407684326172, -0.03624725341796875, -0.03262042999267578, -0.028993606567382812, -0.025366783142089844, -0.021739959716796875, -0.018113136291503906, -0.014486312866210938, -0.010859489440917969, -0.007232666015625, -0.0036058425903320312, 2.09808349609375e-05, 0.0036478042602539062, 0.007274627685546875, 0.010901451110839844, 0.014528274536132812, 0.01815509796142578, 0.02178192138671875, 0.02540874481201172, 0.029035568237304688, 0.032662391662597656, 0.036289215087890625, 0.039916038513183594, 0.04354286193847656, 0.04716968536376953, 0.0507965087890625, 0.05442333221435547, 0.05805015563964844, 0.061676979064941406, 0.06530380249023438, 0.06893062591552734, 0.07255744934082031, 0.07618427276611328, 0.07981109619140625, 0.08343791961669922, 0.08706474304199219, 0.09069156646728516, 0.09431838989257812, 0.0979452133178711, 0.10157203674316406, 0.10519886016845703, 0.10882568359375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 1.0, 0.0, 3.0, 10.0, 7.0, 11.0, 9.0, 16.0, 22.0, 35.0, 43.0, 75.0, 90.0, 143.0, 234.0, 351.0, 654.0, 1100.0, 1973.0, 3999.0, 8882.0, 25094.0, 106423.0, 3414723.0, 537367.0, 62136.0, 17260.0, 6690.0, 3059.0, 1582.0, 902.0, 461.0, 301.0, 185.0, 125.0, 82.0, 68.0, 48.0, 34.0, 21.0, 18.0, 8.0, 16.0, 7.0, 4.0, 6.0, 2.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.234619140625, -0.2272491455078125, -0.219879150390625, -0.2125091552734375, -0.20513916015625, -0.1977691650390625, -0.190399169921875, -0.1830291748046875, -0.1756591796875, -0.1682891845703125, -0.160919189453125, -0.1535491943359375, -0.14617919921875, -0.1388092041015625, -0.131439208984375, -0.1240692138671875, -0.11669921875, -0.1093292236328125, -0.101959228515625, -0.0945892333984375, -0.08721923828125, -0.0798492431640625, -0.072479248046875, -0.0651092529296875, -0.0577392578125, -0.0503692626953125, -0.042999267578125, -0.0356292724609375, -0.02825927734375, -0.0208892822265625, -0.013519287109375, -0.0061492919921875, 0.001220703125, 0.0085906982421875, 0.015960693359375, 0.0233306884765625, 0.03070068359375, 0.0380706787109375, 0.045440673828125, 0.0528106689453125, 0.0601806640625, 0.0675506591796875, 0.074920654296875, 0.0822906494140625, 0.08966064453125, 0.0970306396484375, 0.104400634765625, 0.1117706298828125, 0.119140625, 0.1265106201171875, 0.133880615234375, 0.1412506103515625, 0.14862060546875, 0.1559906005859375, 0.163360595703125, 0.1707305908203125, 0.1781005859375, 0.1854705810546875, 0.192840576171875, 0.2002105712890625, 0.20758056640625, 0.2149505615234375, 0.222320556640625, 0.2296905517578125, 0.237060546875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 9.0, 9.0, 14.0, 33.0, 51.0, 131.0, 639.0, 2799.0, 221.0, 83.0, 39.0, 21.0, 10.0, 7.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11627197265625, -0.11305904388427734, -0.10984611511230469, -0.10663318634033203, -0.10342025756835938, -0.10020732879638672, -0.09699440002441406, -0.0937814712524414, -0.09056854248046875, -0.0873556137084961, -0.08414268493652344, -0.08092975616455078, -0.07771682739257812, -0.07450389862060547, -0.07129096984863281, -0.06807804107666016, -0.0648651123046875, -0.061652183532714844, -0.05843925476074219, -0.05522632598876953, -0.052013397216796875, -0.04880046844482422, -0.04558753967285156, -0.042374610900878906, -0.03916168212890625, -0.035948753356933594, -0.03273582458496094, -0.02952289581298828, -0.026309967041015625, -0.02309703826904297, -0.019884109497070312, -0.016671180725097656, -0.013458251953125, -0.010245323181152344, -0.0070323944091796875, -0.0038194656372070312, -0.000606536865234375, 0.0026063919067382812, 0.0058193206787109375, 0.009032249450683594, 0.01224517822265625, 0.015458106994628906, 0.018671035766601562, 0.02188396453857422, 0.025096893310546875, 0.02830982208251953, 0.03152275085449219, 0.034735679626464844, 0.0379486083984375, 0.041161537170410156, 0.04437446594238281, 0.04758739471435547, 0.050800323486328125, 0.05401325225830078, 0.05722618103027344, 0.060439109802246094, 0.06365203857421875, 0.0668649673461914, 0.07007789611816406, 0.07329082489013672, 0.07650375366210938, 0.07971668243408203, 0.08292961120605469, 0.08614253997802734, 0.08935546875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 5.0, 10.0, 18.0, 18.0, 35.0, 54.0, 69.0, 96.0, 130.0, 121.0, 130.0, 122.0, 80.0, 54.0, 28.0, 11.0, 12.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31168490648269653, -0.3032430410385132, -0.29480117559432983, -0.28635933995246887, -0.2779174745082855, -0.2694756090641022, -0.2610337734222412, -0.25259190797805786, -0.2441500425338745, -0.23570817708969116, -0.227266326546669, -0.21882447600364685, -0.2103826105594635, -0.20194074511528015, -0.193498894572258, -0.18505704402923584, -0.1766151785850525, -0.16817331314086914, -0.15973146259784698, -0.15128961205482483, -0.14284774661064148, -0.13440588116645813, -0.12596403062343597, -0.11752217262983322, -0.10908031463623047, -0.10063845664262772, -0.09219659864902496, -0.08375474065542221, -0.07531288266181946, -0.0668710246682167, -0.05842916667461395, -0.0499873086810112, -0.04154545068740845, -0.033103592693805695, -0.024661734700202942, -0.01621987670660019, -0.0077780187129974365, 0.0006638392806053162, 0.009105697274208069, 0.01754755526781082, 0.025989413261413574, 0.03443127125501633, 0.04287312924861908, 0.05131498724222183, 0.059756845235824585, 0.06819870322942734, 0.07664056122303009, 0.08508241921663284, 0.0935242772102356, 0.10196613520383835, 0.1104079931974411, 0.11884985119104385, 0.1272917091846466, 0.13573357462882996, 0.1441754251718521, 0.15261727571487427, 0.16105914115905762, 0.16950100660324097, 0.17794285714626312, 0.18638470768928528, 0.19482657313346863, 0.20326843857765198, 0.21171028912067413, 0.2201521396636963, 0.22859400510787964]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 3.0, 5.0, 7.0, 8.0, 11.0, 17.0, 11.0, 11.0, 22.0, 19.0, 23.0, 31.0, 37.0, 41.0, 41.0, 36.0, 40.0, 47.0, 46.0, 49.0, 45.0, 46.0, 49.0, 40.0, 34.0, 35.0, 31.0, 37.0, 32.0, 24.0, 24.0, 21.0, 21.0, 19.0, 9.0, 7.0, 6.0, 11.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0], "bins": [-0.16033828258514404, -0.15594208240509033, -0.15154588222503662, -0.1471496969461441, -0.1427534967660904, -0.13835729658603668, -0.13396109640598297, -0.12956489622592926, -0.12516871094703674, -0.12077251076698303, -0.11637631803750992, -0.11198011785745621, -0.1075839251279831, -0.10318772494792938, -0.09879152476787567, -0.09439532458782196, -0.08999912440776825, -0.08560292422771454, -0.08120673149824142, -0.07681053131818771, -0.0724143385887146, -0.06801813840866089, -0.06362193822860718, -0.059225741773843765, -0.05482954531908035, -0.05043334886431694, -0.04603715240955353, -0.04164095222949982, -0.037244755774736404, -0.03284855931997299, -0.02845236100256443, -0.02405616268515587, -0.019659966230392456, -0.015263768844306469, -0.010867571458220482, -0.006471374072134495, -0.0020751766860485077, 0.002321019768714905, 0.0067172180861234665, 0.011113416403532028, 0.01550961285829544, 0.019905809313058853, 0.024302007630467415, 0.028698205947875977, 0.03309440240263939, 0.0374905988574028, 0.04188679903745651, 0.046282995492219925, 0.05067919194698334, 0.05507538840174675, 0.05947158485651016, 0.06386778503656387, 0.06826397776603699, 0.0726601779460907, 0.07705637812614441, 0.08145257830619812, 0.08584877103567123, 0.09024497121572495, 0.09464116394519806, 0.09903736412525177, 0.10343356430530548, 0.1078297570347786, 0.1122259572148323, 0.11662214994430542, 0.12101835012435913]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 6.0, 6.0, 2.0, 10.0, 14.0, 24.0, 22.0, 52.0, 82.0, 152.0, 337.0, 799.0, 2335.0, 7439.0, 29894.0, 139224.0, 431527.0, 327915.0, 82948.0, 18250.0, 4723.0, 1607.0, 600.0, 266.0, 111.0, 81.0, 58.0, 30.0, 20.0, 11.0, 7.0, 7.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.318603515625, -0.30859375, -0.298583984375, -0.28857421875, -0.278564453125, -0.2685546875, -0.258544921875, -0.24853515625, -0.238525390625, -0.228515625, -0.218505859375, -0.20849609375, -0.198486328125, -0.1884765625, -0.178466796875, -0.16845703125, -0.158447265625, -0.1484375, -0.138427734375, -0.12841796875, -0.118408203125, -0.1083984375, -0.098388671875, -0.08837890625, -0.078369140625, -0.068359375, -0.058349609375, -0.04833984375, -0.038330078125, -0.0283203125, -0.018310546875, -0.00830078125, 0.001708984375, 0.01171875, 0.021728515625, 0.03173828125, 0.041748046875, 0.0517578125, 0.061767578125, 0.07177734375, 0.081787109375, 0.091796875, 0.101806640625, 0.11181640625, 0.121826171875, 0.1318359375, 0.141845703125, 0.15185546875, 0.161865234375, 0.171875, 0.181884765625, 0.19189453125, 0.201904296875, 0.2119140625, 0.221923828125, 0.23193359375, 0.241943359375, 0.251953125, 0.261962890625, 0.27197265625, 0.281982421875, 0.2919921875, 0.302001953125, 0.31201171875, 0.322021484375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 8.0, 4.0, 9.0, 13.0, 17.0, 24.0, 21.0, 26.0, 44.0, 52.0, 64.0, 69.0, 68.0, 52.0, 77.0, 68.0, 66.0, 52.0, 52.0, 46.0, 29.0, 25.0, 36.0, 23.0, 16.0, 20.0, 7.0, 8.0, 6.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1275634765625, -0.12363147735595703, -0.11969947814941406, -0.1157674789428711, -0.11183547973632812, -0.10790348052978516, -0.10397148132324219, -0.10003948211669922, -0.09610748291015625, -0.09217548370361328, -0.08824348449707031, -0.08431148529052734, -0.08037948608398438, -0.0764474868774414, -0.07251548767089844, -0.06858348846435547, -0.0646514892578125, -0.06071949005126953, -0.05678749084472656, -0.052855491638183594, -0.048923492431640625, -0.044991493225097656, -0.04105949401855469, -0.03712749481201172, -0.03319549560546875, -0.02926349639892578, -0.025331497192382812, -0.021399497985839844, -0.017467498779296875, -0.013535499572753906, -0.009603500366210938, -0.005671501159667969, -0.001739501953125, 0.0021924972534179688, 0.0061244964599609375, 0.010056495666503906, 0.013988494873046875, 0.017920494079589844, 0.021852493286132812, 0.02578449249267578, 0.02971649169921875, 0.03364849090576172, 0.03758049011230469, 0.041512489318847656, 0.045444488525390625, 0.049376487731933594, 0.05330848693847656, 0.05724048614501953, 0.0611724853515625, 0.06510448455810547, 0.06903648376464844, 0.0729684829711914, 0.07690048217773438, 0.08083248138427734, 0.08476448059082031, 0.08869647979736328, 0.09262847900390625, 0.09656047821044922, 0.10049247741699219, 0.10442447662353516, 0.10835647583007812, 0.1122884750366211, 0.11622047424316406, 0.12015247344970703, 0.12408447265625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 6.0, 8.0, 11.0, 15.0, 17.0, 28.0, 38.0, 69.0, 117.0, 218.0, 352.0, 656.0, 1392.0, 3760.0, 14057.0, 88506.0, 553851.0, 327574.0, 44475.0, 8481.0, 2609.0, 1105.0, 498.0, 291.0, 137.0, 82.0, 59.0, 47.0, 25.0, 16.0, 10.0, 6.0, 7.0, 3.0, 3.0, 7.0, 5.0, 4.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.35009765625, -0.3383598327636719, -0.32662200927734375, -0.3148841857910156, -0.3031463623046875, -0.2914085388183594, -0.27967071533203125, -0.2679328918457031, -0.256195068359375, -0.24445724487304688, -0.23271942138671875, -0.22098159790039062, -0.2092437744140625, -0.19750595092773438, -0.18576812744140625, -0.17403030395507812, -0.16229248046875, -0.15055465698242188, -0.13881683349609375, -0.12707901000976562, -0.1153411865234375, -0.10360336303710938, -0.09186553955078125, -0.08012771606445312, -0.068389892578125, -0.056652069091796875, -0.04491424560546875, -0.033176422119140625, -0.0214385986328125, -0.009700775146484375, 0.00203704833984375, 0.013774871826171875, 0.0255126953125, 0.037250518798828125, 0.04898834228515625, 0.060726165771484375, 0.0724639892578125, 0.08420181274414062, 0.09593963623046875, 0.10767745971679688, 0.119415283203125, 0.13115310668945312, 0.14289093017578125, 0.15462875366210938, 0.1663665771484375, 0.17810440063476562, 0.18984222412109375, 0.20158004760742188, 0.21331787109375, 0.22505569458007812, 0.23679351806640625, 0.24853134155273438, 0.2602691650390625, 0.2720069885253906, 0.28374481201171875, 0.2954826354980469, 0.307220458984375, 0.3189582824707031, 0.33069610595703125, 0.3424339294433594, 0.3541717529296875, 0.3659095764160156, 0.37764739990234375, 0.3893852233886719, 0.401123046875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 7.0, 3.0, 12.0, 15.0, 16.0, 17.0, 16.0, 20.0, 29.0, 40.0, 42.0, 42.0, 45.0, 41.0, 44.0, 61.0, 53.0, 44.0, 57.0, 49.0, 53.0, 39.0, 42.0, 24.0, 40.0, 27.0, 20.0, 14.0, 17.0, 21.0, 9.0, 9.0, 7.0, 6.0, 2.0, 5.0, 0.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.46630859375, -0.45105743408203125, -0.4358062744140625, -0.42055511474609375, -0.405303955078125, -0.39005279541015625, -0.3748016357421875, -0.35955047607421875, -0.34429931640625, -0.32904815673828125, -0.3137969970703125, -0.29854583740234375, -0.283294677734375, -0.26804351806640625, -0.2527923583984375, -0.23754119873046875, -0.2222900390625, -0.20703887939453125, -0.1917877197265625, -0.17653656005859375, -0.161285400390625, -0.14603424072265625, -0.1307830810546875, -0.11553192138671875, -0.10028076171875, -0.08502960205078125, -0.0697784423828125, -0.05452728271484375, -0.039276123046875, -0.02402496337890625, -0.0087738037109375, 0.00647735595703125, 0.021728515625, 0.03697967529296875, 0.0522308349609375, 0.06748199462890625, 0.082733154296875, 0.09798431396484375, 0.1132354736328125, 0.12848663330078125, 0.14373779296875, 0.15898895263671875, 0.1742401123046875, 0.18949127197265625, 0.204742431640625, 0.21999359130859375, 0.2352447509765625, 0.25049591064453125, 0.2657470703125, 0.28099822998046875, 0.2962493896484375, 0.31150054931640625, 0.326751708984375, 0.34200286865234375, 0.3572540283203125, 0.37250518798828125, 0.38775634765625, 0.40300750732421875, 0.4182586669921875, 0.43350982666015625, 0.448760986328125, 0.46401214599609375, 0.4792633056640625, 0.49451446533203125, 0.509765625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 4.0, 3.0, 6.0, 8.0, 14.0, 14.0, 11.0, 22.0, 28.0, 56.0, 71.0, 129.0, 219.0, 388.0, 1022.0, 3518.0, 33294.0, 866228.0, 133544.0, 7227.0, 1513.0, 545.0, 249.0, 132.0, 100.0, 61.0, 34.0, 30.0, 26.0, 9.0, 11.0, 8.0, 8.0, 2.0, 6.0, 6.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.36376953125, -0.3519172668457031, -0.34006500244140625, -0.3282127380371094, -0.3163604736328125, -0.3045082092285156, -0.29265594482421875, -0.2808036804199219, -0.268951416015625, -0.2570991516113281, -0.24524688720703125, -0.23339462280273438, -0.2215423583984375, -0.20969009399414062, -0.19783782958984375, -0.18598556518554688, -0.17413330078125, -0.16228103637695312, -0.15042877197265625, -0.13857650756835938, -0.1267242431640625, -0.11487197875976562, -0.10301971435546875, -0.09116744995117188, -0.079315185546875, -0.06746292114257812, -0.05561065673828125, -0.043758392333984375, -0.0319061279296875, -0.020053863525390625, -0.00820159912109375, 0.003650665283203125, 0.0155029296875, 0.027355194091796875, 0.03920745849609375, 0.051059722900390625, 0.0629119873046875, 0.07476425170898438, 0.08661651611328125, 0.09846878051757812, 0.110321044921875, 0.12217330932617188, 0.13402557373046875, 0.14587783813476562, 0.1577301025390625, 0.16958236694335938, 0.18143463134765625, 0.19328689575195312, 0.20513916015625, 0.21699142456054688, 0.22884368896484375, 0.24069595336914062, 0.2525482177734375, 0.2644004821777344, 0.27625274658203125, 0.2881050109863281, 0.299957275390625, 0.3118095397949219, 0.32366180419921875, 0.3355140686035156, 0.3473663330078125, 0.3592185974121094, 0.37107086181640625, 0.3829231262207031, 0.394775390625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 4.0, 7.0, 28.0, 43.0, 92.0, 147.0, 236.0, 206.0, 126.0, 64.0, 26.0, 11.0, 7.0, 9.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.85860824584961e-05, -9.193085134029388e-05, -8.527562022209167e-05, -7.862038910388947e-05, -7.196515798568726e-05, -6.530992686748505e-05, -5.865469574928284e-05, -5.199946463108063e-05, -4.534423351287842e-05, -3.868900239467621e-05, -3.2033771276474e-05, -2.537854015827179e-05, -1.872330904006958e-05, -1.206807792186737e-05, -5.412846803665161e-06, 1.2423843145370483e-06, 7.897615432739258e-06, 1.4552846550941467e-05, 2.1208077669143677e-05, 2.7863308787345886e-05, 3.4518539905548096e-05, 4.1173771023750305e-05, 4.7829002141952515e-05, 5.4484233260154724e-05, 6.113946437835693e-05, 6.779469549655914e-05, 7.444992661476135e-05, 8.110515773296356e-05, 8.776038885116577e-05, 9.441561996936798e-05, 0.00010107085108757019, 0.0001077260822057724, 0.00011438131332397461, 0.00012103654444217682, 0.00012769177556037903, 0.00013434700667858124, 0.00014100223779678345, 0.00014765746891498566, 0.00015431270003318787, 0.00016096793115139008, 0.00016762316226959229, 0.0001742783933877945, 0.0001809336245059967, 0.00018758885562419891, 0.00019424408674240112, 0.00020089931786060333, 0.00020755454897880554, 0.00021420978009700775, 0.00022086501121520996, 0.00022752024233341217, 0.00023417547345161438, 0.0002408307045698166, 0.0002474859356880188, 0.000254141166806221, 0.0002607963979244232, 0.00026745162904262543, 0.00027410686016082764, 0.00028076209127902985, 0.00028741732239723206, 0.00029407255351543427, 0.0003007277846336365, 0.0003073830157518387, 0.0003140382468700409, 0.0003206934779882431, 0.0003273487091064453]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 7.0, 10.0, 5.0, 21.0, 19.0, 24.0, 52.0, 81.0, 122.0, 285.0, 638.0, 1471.0, 5035.0, 27751.0, 344875.0, 607786.0, 49581.0, 7312.0, 1965.0, 752.0, 324.0, 174.0, 98.0, 62.0, 31.0, 24.0, 12.0, 10.0, 10.0, 7.0, 4.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2783203125, -0.2712078094482422, -0.2640953063964844, -0.25698280334472656, -0.24987030029296875, -0.24275779724121094, -0.23564529418945312, -0.2285327911376953, -0.2214202880859375, -0.2143077850341797, -0.20719528198242188, -0.20008277893066406, -0.19297027587890625, -0.18585777282714844, -0.17874526977539062, -0.1716327667236328, -0.164520263671875, -0.1574077606201172, -0.15029525756835938, -0.14318275451660156, -0.13607025146484375, -0.12895774841308594, -0.12184524536132812, -0.11473274230957031, -0.1076202392578125, -0.10050773620605469, -0.09339523315429688, -0.08628273010253906, -0.07917022705078125, -0.07205772399902344, -0.06494522094726562, -0.05783271789550781, -0.05072021484375, -0.04360771179199219, -0.036495208740234375, -0.029382705688476562, -0.02227020263671875, -0.015157699584960938, -0.008045196533203125, -0.0009326934814453125, 0.0061798095703125, 0.013292312622070312, 0.020404815673828125, 0.027517318725585938, 0.03462982177734375, 0.04174232482910156, 0.048854827880859375, 0.05596733093261719, 0.063079833984375, 0.07019233703613281, 0.07730484008789062, 0.08441734313964844, 0.09152984619140625, 0.09864234924316406, 0.10575485229492188, 0.11286735534667969, 0.1199798583984375, 0.1270923614501953, 0.13420486450195312, 0.14131736755371094, 0.14842987060546875, 0.15554237365722656, 0.16265487670898438, 0.1697673797607422, 0.1768798828125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 5.0, 1.0, 7.0, 6.0, 5.0, 6.0, 7.0, 21.0, 14.0, 31.0, 43.0, 83.0, 85.0, 124.0, 126.0, 125.0, 101.0, 68.0, 50.0, 23.0, 17.0, 17.0, 7.0, 7.0, 7.0, 5.0, 2.0, 4.0, 4.0, 1.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.156005859375, -0.147491455078125, -0.13897705078125, -0.130462646484375, -0.1219482421875, -0.113433837890625, -0.10491943359375, -0.096405029296875, -0.087890625, -0.079376220703125, -0.07086181640625, -0.062347412109375, -0.0538330078125, -0.045318603515625, -0.03680419921875, -0.028289794921875, -0.019775390625, -0.011260986328125, -0.00274658203125, 0.005767822265625, 0.0142822265625, 0.022796630859375, 0.03131103515625, 0.039825439453125, 0.04833984375, 0.056854248046875, 0.06536865234375, 0.073883056640625, 0.0823974609375, 0.090911865234375, 0.09942626953125, 0.107940673828125, 0.116455078125, 0.124969482421875, 0.13348388671875, 0.141998291015625, 0.1505126953125, 0.159027099609375, 0.16754150390625, 0.176055908203125, 0.1845703125, 0.193084716796875, 0.20159912109375, 0.210113525390625, 0.2186279296875, 0.227142333984375, 0.23565673828125, 0.244171142578125, 0.252685546875, 0.261199951171875, 0.26971435546875, 0.278228759765625, 0.2867431640625, 0.295257568359375, 0.30377197265625, 0.312286376953125, 0.32080078125, 0.329315185546875, 0.33782958984375, 0.346343994140625, 0.3548583984375, 0.363372802734375, 0.37188720703125, 0.380401611328125, 0.388916015625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 7.0, 1.0, 7.0, 4.0, 21.0, 53.0, 139.0, 197.0, 238.0, 184.0, 94.0, 44.0, 14.0, 7.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.593186616897583, -3.4267771244049072, -3.2603676319122314, -3.0939581394195557, -2.92754864692688, -2.761139154434204, -2.5947296619415283, -2.4283201694488525, -2.2619106769561768, -2.095501184463501, -1.9290916919708252, -1.7626821994781494, -1.5962727069854736, -1.4298632144927979, -1.263453722000122, -1.0970442295074463, -0.9306347370147705, -0.7642252445220947, -0.597815752029419, -0.43140625953674316, -0.2649967670440674, -0.0985872745513916, 0.06782221794128418, 0.23423171043395996, 0.40064120292663574, 0.5670506954193115, 0.7334601879119873, 0.8998696804046631, 1.0662791728973389, 1.2326886653900146, 1.3990981578826904, 1.5655076503753662, 1.731917381286621, 1.8983268737792969, 2.0647363662719727, 2.2311458587646484, 2.397555351257324, 2.56396484375, 2.730374336242676, 2.8967838287353516, 3.0631933212280273, 3.229602813720703, 3.396012306213379, 3.5624217987060547, 3.7288312911987305, 3.8952407836914062, 4.061650276184082, 4.228059768676758, 4.394469261169434, 4.560878753662109, 4.727288246154785, 4.893697738647461, 5.060107231140137, 5.2265167236328125, 5.392926216125488, 5.559335708618164, 5.72574520111084, 5.892154693603516, 6.058564186096191, 6.224973678588867, 6.391383171081543, 6.557792663574219, 6.7242021560668945, 6.89061164855957, 7.057021141052246]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 7.0, 4.0, 3.0, 5.0, 9.0, 9.0, 10.0, 8.0, 21.0, 25.0, 22.0, 27.0, 31.0, 34.0, 27.0, 41.0, 52.0, 63.0, 60.0, 68.0, 66.0, 54.0, 56.0, 53.0, 31.0, 36.0, 37.0, 21.0, 23.0, 24.0, 18.0, 13.0, 8.0, 15.0, 3.0, 7.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-3.0950942039489746, -3.002689838409424, -2.910285472869873, -2.8178813457489014, -2.7254769802093506, -2.6330726146698, -2.540668487548828, -2.4482641220092773, -2.3558597564697266, -2.263455390930176, -2.171051025390625, -2.0786468982696533, -1.9862425327301025, -1.8938381671905518, -1.8014339208602905, -1.7090296745300293, -1.6166253089904785, -1.5242209434509277, -1.4318166971206665, -1.3394124507904053, -1.2470080852508545, -1.1546037197113037, -1.0621994733810425, -0.9697951674461365, -0.8773908615112305, -0.7849865555763245, -0.6925822496414185, -0.6001779437065125, -0.5077736377716064, -0.41536933183670044, -0.32296502590179443, -0.23056071996688843, -0.13815641403198242, -0.045752108097076416, 0.04665219783782959, 0.1390565037727356, 0.2314608097076416, 0.3238651156425476, 0.4162694215774536, 0.5086737275123596, 0.6010780334472656, 0.6934823393821716, 0.7858866453170776, 0.8782909512519836, 0.9706952571868896, 1.0630996227264404, 1.1555038690567017, 1.247908115386963, 1.3403124809265137, 1.4327168464660645, 1.5251210927963257, 1.617525339126587, 1.7099297046661377, 1.8023340702056885, 1.8947383165359497, 1.987142562866211, 2.0795469284057617, 2.1719512939453125, 2.2643556594848633, 2.356759786605835, 2.4491641521453857, 2.5415685176849365, 2.633972644805908, 2.726377010345459, 2.8187813758850098]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 11.0, 6.0, 9.0, 16.0, 29.0, 38.0, 78.0, 111.0, 200.0, 362.0, 767.0, 1612.0, 4343.0, 15440.0, 94755.0, 3836837.0, 204416.0, 24747.0, 6272.0, 2166.0, 942.0, 469.0, 271.0, 145.0, 94.0, 42.0, 31.0, 17.0, 14.0, 10.0, 11.0, 8.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2391357421875, -0.22902488708496094, -0.21891403198242188, -0.2088031768798828, -0.19869232177734375, -0.1885814666748047, -0.17847061157226562, -0.16835975646972656, -0.1582489013671875, -0.14813804626464844, -0.13802719116210938, -0.1279163360595703, -0.11780548095703125, -0.10769462585449219, -0.09758377075195312, -0.08747291564941406, -0.077362060546875, -0.06725120544433594, -0.057140350341796875, -0.04702949523925781, -0.03691864013671875, -0.026807785034179688, -0.016696929931640625, -0.0065860748291015625, 0.0035247802734375, 0.013635635375976562, 0.023746490478515625, 0.03385734558105469, 0.04396820068359375, 0.05407905578613281, 0.06418991088867188, 0.07430076599121094, 0.08441162109375, 0.09452247619628906, 0.10463333129882812, 0.11474418640136719, 0.12485504150390625, 0.1349658966064453, 0.14507675170898438, 0.15518760681152344, 0.1652984619140625, 0.17540931701660156, 0.18552017211914062, 0.1956310272216797, 0.20574188232421875, 0.2158527374267578, 0.22596359252929688, 0.23607444763183594, 0.246185302734375, 0.25629615783691406, 0.2664070129394531, 0.2765178680419922, 0.28662872314453125, 0.2967395782470703, 0.3068504333496094, 0.31696128845214844, 0.3270721435546875, 0.33718299865722656, 0.3472938537597656, 0.3574047088623047, 0.36751556396484375, 0.3776264190673828, 0.3877372741699219, 0.39784812927246094, 0.407958984375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 7.0, 8.0, 3.0, 8.0, 15.0, 20.0, 30.0, 26.0, 37.0, 54.0, 44.0, 40.0, 62.0, 67.0, 69.0, 69.0, 67.0, 46.0, 61.0, 52.0, 40.0, 33.0, 30.0, 21.0, 11.0, 19.0, 12.0, 13.0, 8.0, 4.0, 7.0, 3.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1285400390625, -0.1246480941772461, -0.12075614929199219, -0.11686420440673828, -0.11297225952148438, -0.10908031463623047, -0.10518836975097656, -0.10129642486572266, -0.09740447998046875, -0.09351253509521484, -0.08962059020996094, -0.08572864532470703, -0.08183670043945312, -0.07794475555419922, -0.07405281066894531, -0.0701608657836914, -0.0662689208984375, -0.062376976013183594, -0.05848503112792969, -0.05459308624267578, -0.050701141357421875, -0.04680919647216797, -0.04291725158691406, -0.039025306701660156, -0.03513336181640625, -0.031241416931152344, -0.027349472045898438, -0.02345752716064453, -0.019565582275390625, -0.01567363739013672, -0.011781692504882812, -0.007889747619628906, -0.003997802734375, -0.00010585784912109375, 0.0037860870361328125, 0.007678031921386719, 0.011569976806640625, 0.015461921691894531, 0.019353866577148438, 0.023245811462402344, 0.02713775634765625, 0.031029701232910156, 0.03492164611816406, 0.03881359100341797, 0.042705535888671875, 0.04659748077392578, 0.05048942565917969, 0.054381370544433594, 0.0582733154296875, 0.062165260314941406, 0.06605720520019531, 0.06994915008544922, 0.07384109497070312, 0.07773303985595703, 0.08162498474121094, 0.08551692962646484, 0.08940887451171875, 0.09330081939697266, 0.09719276428222656, 0.10108470916748047, 0.10497665405273438, 0.10886859893798828, 0.11276054382324219, 0.1166524887084961, 0.12054443359375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 8.0, 8.0, 10.0, 10.0, 14.0, 29.0, 36.0, 34.0, 58.0, 90.0, 122.0, 186.0, 302.0, 537.0, 942.0, 1979.0, 4353.0, 10732.0, 34759.0, 177456.0, 3546202.0, 339642.0, 51547.0, 14550.0, 5517.0, 2377.0, 1160.0, 610.0, 330.0, 221.0, 147.0, 87.0, 74.0, 32.0, 39.0, 27.0, 13.0, 12.0, 14.0, 6.0, 8.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.251708984375, -0.24422645568847656, -0.23674392700195312, -0.2292613983154297, -0.22177886962890625, -0.2142963409423828, -0.20681381225585938, -0.19933128356933594, -0.1918487548828125, -0.18436622619628906, -0.17688369750976562, -0.1694011688232422, -0.16191864013671875, -0.1544361114501953, -0.14695358276367188, -0.13947105407714844, -0.131988525390625, -0.12450599670410156, -0.11702346801757812, -0.10954093933105469, -0.10205841064453125, -0.09457588195800781, -0.08709335327148438, -0.07961082458496094, -0.0721282958984375, -0.06464576721191406, -0.057163238525390625, -0.04968070983886719, -0.04219818115234375, -0.03471565246582031, -0.027233123779296875, -0.019750595092773438, -0.01226806640625, -0.0047855377197265625, 0.002696990966796875, 0.010179519653320312, 0.01766204833984375, 0.025144577026367188, 0.032627105712890625, 0.04010963439941406, 0.0475921630859375, 0.05507469177246094, 0.06255722045898438, 0.07003974914550781, 0.07752227783203125, 0.08500480651855469, 0.09248733520507812, 0.09996986389160156, 0.107452392578125, 0.11493492126464844, 0.12241744995117188, 0.1298999786376953, 0.13738250732421875, 0.1448650360107422, 0.15234756469726562, 0.15983009338378906, 0.1673126220703125, 0.17479515075683594, 0.18227767944335938, 0.1897602081298828, 0.19724273681640625, 0.2047252655029297, 0.21220779418945312, 0.21969032287597656, 0.2271728515625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 4.0, 3.0, 6.0, 9.0, 19.0, 16.0, 25.0, 56.0, 90.0, 179.0, 385.0, 2362.0, 497.0, 190.0, 97.0, 45.0, 20.0, 19.0, 12.0, 15.0, 9.0, 5.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0634765625, -0.06109428405761719, -0.058712005615234375, -0.05632972717285156, -0.05394744873046875, -0.05156517028808594, -0.049182891845703125, -0.04680061340332031, -0.0444183349609375, -0.04203605651855469, -0.039653778076171875, -0.03727149963378906, -0.03488922119140625, -0.03250694274902344, -0.030124664306640625, -0.027742385864257812, -0.025360107421875, -0.022977828979492188, -0.020595550537109375, -0.018213272094726562, -0.01583099365234375, -0.013448715209960938, -0.011066436767578125, -0.008684158325195312, -0.0063018798828125, -0.0039196014404296875, -0.001537322998046875, 0.0008449554443359375, 0.00322723388671875, 0.0056095123291015625, 0.007991790771484375, 0.010374069213867188, 0.01275634765625, 0.015138626098632812, 0.017520904541015625, 0.019903182983398438, 0.02228546142578125, 0.024667739868164062, 0.027050018310546875, 0.029432296752929688, 0.0318145751953125, 0.03419685363769531, 0.036579132080078125, 0.03896141052246094, 0.04134368896484375, 0.04372596740722656, 0.046108245849609375, 0.04849052429199219, 0.050872802734375, 0.05325508117675781, 0.055637359619140625, 0.05801963806152344, 0.06040191650390625, 0.06278419494628906, 0.06516647338867188, 0.06754875183105469, 0.0699310302734375, 0.07231330871582031, 0.07469558715820312, 0.07707786560058594, 0.07946014404296875, 0.08184242248535156, 0.08422470092773438, 0.08660697937011719, 0.0889892578125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 5.0, 7.0, 19.0, 28.0, 37.0, 32.0, 58.0, 67.0, 95.0, 97.0, 96.0, 106.0, 74.0, 71.0, 56.0, 47.0, 23.0, 23.0, 14.0, 11.0, 10.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32781243324279785, -0.3197641670703888, -0.31171587109565735, -0.3036676049232483, -0.29561933875083923, -0.2875710427761078, -0.27952277660369873, -0.2714745104312897, -0.2634262144565582, -0.25537794828414917, -0.24732966721057892, -0.23928138613700867, -0.23123310506343842, -0.22318482398986816, -0.2151365578174591, -0.20708827674388885, -0.1990400105714798, -0.19099172949790955, -0.1829434633255005, -0.17489518225193024, -0.16684690117835999, -0.15879863500595093, -0.15075035393238068, -0.14270207285881042, -0.13465380668640137, -0.12660552561283112, -0.11855725198984146, -0.1105089783668518, -0.10246069729328156, -0.0944124236702919, -0.08636415004730225, -0.078315868973732, -0.07026758790016174, -0.06221931055188179, -0.05417103320360184, -0.04612275958061218, -0.03807448223233223, -0.030026204884052277, -0.021977931261062622, -0.013929653912782669, -0.005881376564502716, 0.0021668998524546623, 0.01021517626941204, 0.018263451755046844, 0.026311729103326797, 0.03436000645160675, 0.042408280074596405, 0.05045655742287636, 0.05850483477115631, 0.06655310839414597, 0.07460138946771622, 0.08264966309070587, 0.09069794416427612, 0.09874621778726578, 0.10679449141025543, 0.11484277248382568, 0.12289104610681534, 0.130939319729805, 0.13898760080337524, 0.1470358669757843, 0.15508414804935455, 0.1631324291229248, 0.17118069529533386, 0.1792289763689041, 0.18727725744247437]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 8.0, 11.0, 5.0, 8.0, 8.0, 18.0, 16.0, 9.0, 18.0, 33.0, 25.0, 26.0, 33.0, 36.0, 47.0, 47.0, 34.0, 41.0, 34.0, 34.0, 48.0, 47.0, 45.0, 35.0, 39.0, 40.0, 36.0, 29.0, 31.0, 19.0, 29.0, 16.0, 14.0, 13.0, 16.0, 13.0, 6.0, 8.0, 2.0, 7.0, 2.0, 6.0, 5.0, 6.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.209530770778656, -0.20335735380649567, -0.19718393683433533, -0.19101053476333618, -0.18483711779117584, -0.1786637008190155, -0.17249029874801636, -0.16631688177585602, -0.16014346480369568, -0.15397004783153534, -0.147796630859375, -0.14162322878837585, -0.13544981181621552, -0.12927639484405518, -0.12310298532247543, -0.11692957580089569, -0.11075615882873535, -0.10458274185657501, -0.09840933233499527, -0.09223592281341553, -0.08606250584125519, -0.07988908886909485, -0.0737156793475151, -0.06754226982593536, -0.061368852853775024, -0.055195439606904984, -0.04902202636003494, -0.0428486131131649, -0.03667519986629486, -0.03050178661942482, -0.02432837337255478, -0.018154960125684738, -0.011981546878814697, -0.005808133631944656, 0.0003652796149253845, 0.006538692861795425, 0.012712106108665466, 0.018885519355535507, 0.025058932602405548, 0.03123234584927559, 0.03740575909614563, 0.04357917234301567, 0.04975258558988571, 0.05592599883675575, 0.06209941208362579, 0.06827282905578613, 0.07444623857736588, 0.08061964809894562, 0.08679306507110596, 0.0929664820432663, 0.09913989156484604, 0.10531330108642578, 0.11148671805858612, 0.11766013503074646, 0.1238335445523262, 0.13000695407390594, 0.13618037104606628, 0.14235378801822662, 0.14852720499038696, 0.1547006070613861, 0.16087402403354645, 0.1670474410057068, 0.17322084307670593, 0.17939426004886627, 0.1855676770210266]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 9.0, 8.0, 13.0, 21.0, 23.0, 47.0, 65.0, 129.0, 264.0, 494.0, 1185.0, 3064.0, 9838.0, 36682.0, 149234.0, 404492.0, 317176.0, 92687.0, 22877.0, 6299.0, 2178.0, 899.0, 398.0, 198.0, 100.0, 61.0, 39.0, 22.0, 14.0, 11.0, 8.0, 3.0, 8.0, 6.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.269775390625, -0.26224517822265625, -0.2547149658203125, -0.24718475341796875, -0.239654541015625, -0.23212432861328125, -0.2245941162109375, -0.21706390380859375, -0.20953369140625, -0.20200347900390625, -0.1944732666015625, -0.18694305419921875, -0.179412841796875, -0.17188262939453125, -0.1643524169921875, -0.15682220458984375, -0.1492919921875, -0.14176177978515625, -0.1342315673828125, -0.12670135498046875, -0.119171142578125, -0.11164093017578125, -0.1041107177734375, -0.09658050537109375, -0.08905029296875, -0.08152008056640625, -0.0739898681640625, -0.06645965576171875, -0.058929443359375, -0.05139923095703125, -0.0438690185546875, -0.03633880615234375, -0.02880859375, -0.02127838134765625, -0.0137481689453125, -0.00621795654296875, 0.001312255859375, 0.00884246826171875, 0.0163726806640625, 0.02390289306640625, 0.03143310546875, 0.03896331787109375, 0.0464935302734375, 0.05402374267578125, 0.061553955078125, 0.06908416748046875, 0.0766143798828125, 0.08414459228515625, 0.0916748046875, 0.09920501708984375, 0.1067352294921875, 0.11426544189453125, 0.121795654296875, 0.12932586669921875, 0.1368560791015625, 0.14438629150390625, 0.15191650390625, 0.15944671630859375, 0.1669769287109375, 0.17450714111328125, 0.182037353515625, 0.18956756591796875, 0.1970977783203125, 0.20462799072265625, 0.212158203125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 2.0, 1.0, 1.0, 3.0, 5.0, 3.0, 8.0, 5.0, 10.0, 17.0, 14.0, 28.0, 35.0, 40.0, 44.0, 49.0, 53.0, 63.0, 67.0, 51.0, 73.0, 60.0, 71.0, 45.0, 43.0, 47.0, 25.0, 33.0, 23.0, 23.0, 19.0, 13.0, 11.0, 6.0, 4.0, 3.0, 6.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1295166015625, -0.12546157836914062, -0.12140655517578125, -0.11735153198242188, -0.1132965087890625, -0.10924148559570312, -0.10518646240234375, -0.10113143920898438, -0.097076416015625, -0.09302139282226562, -0.08896636962890625, -0.08491134643554688, -0.0808563232421875, -0.07680130004882812, -0.07274627685546875, -0.06869125366210938, -0.06463623046875, -0.060581207275390625, -0.05652618408203125, -0.052471160888671875, -0.0484161376953125, -0.044361114501953125, -0.04030609130859375, -0.036251068115234375, -0.032196044921875, -0.028141021728515625, -0.02408599853515625, -0.020030975341796875, -0.0159759521484375, -0.011920928955078125, -0.00786590576171875, -0.003810882568359375, 0.000244140625, 0.004299163818359375, 0.00835418701171875, 0.012409210205078125, 0.0164642333984375, 0.020519256591796875, 0.02457427978515625, 0.028629302978515625, 0.032684326171875, 0.036739349365234375, 0.04079437255859375, 0.044849395751953125, 0.0489044189453125, 0.052959442138671875, 0.05701446533203125, 0.061069488525390625, 0.06512451171875, 0.06917953491210938, 0.07323455810546875, 0.07728958129882812, 0.0813446044921875, 0.08539962768554688, 0.08945465087890625, 0.09350967407226562, 0.097564697265625, 0.10161972045898438, 0.10567474365234375, 0.10972976684570312, 0.1137847900390625, 0.11783981323242188, 0.12189483642578125, 0.12594985961914062, 0.1300048828125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0, 5.0, 9.0, 6.0, 8.0, 17.0, 31.0, 44.0, 89.0, 154.0, 350.0, 868.0, 3074.0, 36944.0, 860635.0, 138122.0, 6038.0, 1247.0, 454.0, 217.0, 95.0, 49.0, 31.0, 15.0, 24.0, 7.0, 8.0, 5.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.66015625, -0.639312744140625, -0.61846923828125, -0.597625732421875, -0.5767822265625, -0.555938720703125, -0.53509521484375, -0.514251708984375, -0.493408203125, -0.472564697265625, -0.45172119140625, -0.430877685546875, -0.4100341796875, -0.389190673828125, -0.36834716796875, -0.347503662109375, -0.32666015625, -0.305816650390625, -0.28497314453125, -0.264129638671875, -0.2432861328125, -0.222442626953125, -0.20159912109375, -0.180755615234375, -0.159912109375, -0.139068603515625, -0.11822509765625, -0.097381591796875, -0.0765380859375, -0.055694580078125, -0.03485107421875, -0.014007568359375, 0.0068359375, 0.027679443359375, 0.04852294921875, 0.069366455078125, 0.0902099609375, 0.111053466796875, 0.13189697265625, 0.152740478515625, 0.173583984375, 0.194427490234375, 0.21527099609375, 0.236114501953125, 0.2569580078125, 0.277801513671875, 0.29864501953125, 0.319488525390625, 0.34033203125, 0.361175537109375, 0.38201904296875, 0.402862548828125, 0.4237060546875, 0.444549560546875, 0.46539306640625, 0.486236572265625, 0.507080078125, 0.527923583984375, 0.54876708984375, 0.569610595703125, 0.5904541015625, 0.611297607421875, 0.63214111328125, 0.652984619140625, 0.673828125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 3.0, 7.0, 8.0, 8.0, 12.0, 8.0, 16.0, 19.0, 22.0, 15.0, 24.0, 36.0, 37.0, 38.0, 44.0, 57.0, 57.0, 56.0, 54.0, 61.0, 55.0, 53.0, 45.0, 50.0, 41.0, 38.0, 23.0, 16.0, 20.0, 16.0, 14.0, 22.0, 9.0, 5.0, 2.0, 3.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.58056640625, -0.563720703125, -0.546875, -0.530029296875, -0.51318359375, -0.496337890625, -0.4794921875, -0.462646484375, -0.44580078125, -0.428955078125, -0.412109375, -0.395263671875, -0.37841796875, -0.361572265625, -0.3447265625, -0.327880859375, -0.31103515625, -0.294189453125, -0.27734375, -0.260498046875, -0.24365234375, -0.226806640625, -0.2099609375, -0.193115234375, -0.17626953125, -0.159423828125, -0.142578125, -0.125732421875, -0.10888671875, -0.092041015625, -0.0751953125, -0.058349609375, -0.04150390625, -0.024658203125, -0.0078125, 0.009033203125, 0.02587890625, 0.042724609375, 0.0595703125, 0.076416015625, 0.09326171875, 0.110107421875, 0.126953125, 0.143798828125, 0.16064453125, 0.177490234375, 0.1943359375, 0.211181640625, 0.22802734375, 0.244873046875, 0.26171875, 0.278564453125, 0.29541015625, 0.312255859375, 0.3291015625, 0.345947265625, 0.36279296875, 0.379638671875, 0.396484375, 0.413330078125, 0.43017578125, 0.447021484375, 0.4638671875, 0.480712890625, 0.49755859375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 7.0, 19.0, 6.0, 23.0, 35.0, 56.0, 72.0, 135.0, 235.0, 488.0, 1324.0, 5566.0, 75424.0, 887632.0, 69759.0, 5390.0, 1327.0, 469.0, 219.0, 122.0, 66.0, 41.0, 32.0, 26.0, 17.0, 13.0, 14.0, 8.0, 9.0, 2.0, 3.0, 5.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.37109375, -0.36092376708984375, -0.3507537841796875, -0.34058380126953125, -0.330413818359375, -0.32024383544921875, -0.3100738525390625, -0.29990386962890625, -0.28973388671875, -0.27956390380859375, -0.2693939208984375, -0.25922393798828125, -0.249053955078125, -0.23888397216796875, -0.2287139892578125, -0.21854400634765625, -0.2083740234375, -0.19820404052734375, -0.1880340576171875, -0.17786407470703125, -0.167694091796875, -0.15752410888671875, -0.1473541259765625, -0.13718414306640625, -0.12701416015625, -0.11684417724609375, -0.1066741943359375, -0.09650421142578125, -0.086334228515625, -0.07616424560546875, -0.0659942626953125, -0.05582427978515625, -0.045654296875, -0.03548431396484375, -0.0253143310546875, -0.01514434814453125, -0.004974365234375, 0.00519561767578125, 0.0153656005859375, 0.02553558349609375, 0.03570556640625, 0.04587554931640625, 0.0560455322265625, 0.06621551513671875, 0.076385498046875, 0.08655548095703125, 0.0967254638671875, 0.10689544677734375, 0.1170654296875, 0.12723541259765625, 0.1374053955078125, 0.14757537841796875, 0.157745361328125, 0.16791534423828125, 0.1780853271484375, 0.18825531005859375, 0.19842529296875, 0.20859527587890625, 0.2187652587890625, 0.22893524169921875, 0.239105224609375, 0.24927520751953125, 0.2594451904296875, 0.26961517333984375, 0.27978515625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 3.0, 1.0, 4.0, 7.0, 11.0, 13.0, 17.0, 32.0, 39.0, 65.0, 92.0, 117.0, 139.0, 113.0, 99.0, 93.0, 65.0, 32.0, 32.0, 15.0, 12.0, 2.0, 3.0, 2.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.933906555175781e-05, -3.6840327084064484e-05, -3.4341588616371155e-05, -3.1842850148677826e-05, -2.9344111680984497e-05, -2.6845373213291168e-05, -2.434663474559784e-05, -2.184789627790451e-05, -1.934915781021118e-05, -1.6850419342517853e-05, -1.4351680874824524e-05, -1.1852942407131195e-05, -9.354203939437866e-06, -6.855465471744537e-06, -4.3567270040512085e-06, -1.8579885363578796e-06, 6.407499313354492e-07, 3.139488399028778e-06, 5.638226866722107e-06, 8.136965334415436e-06, 1.0635703802108765e-05, 1.3134442269802094e-05, 1.5633180737495422e-05, 1.813191920518875e-05, 2.063065767288208e-05, 2.312939614057541e-05, 2.5628134608268738e-05, 2.8126873075962067e-05, 3.0625611543655396e-05, 3.3124350011348724e-05, 3.562308847904205e-05, 3.812182694673538e-05, 4.062056541442871e-05, 4.311930388212204e-05, 4.561804234981537e-05, 4.81167808175087e-05, 5.0615519285202026e-05, 5.3114257752895355e-05, 5.5612996220588684e-05, 5.811173468828201e-05, 6.061047315597534e-05, 6.310921162366867e-05, 6.5607950091362e-05, 6.810668855905533e-05, 7.060542702674866e-05, 7.310416549444199e-05, 7.560290396213531e-05, 7.810164242982864e-05, 8.060038089752197e-05, 8.30991193652153e-05, 8.559785783290863e-05, 8.809659630060196e-05, 9.059533476829529e-05, 9.309407323598862e-05, 9.559281170368195e-05, 9.809155017137527e-05, 0.0001005902886390686, 0.00010308902710676193, 0.00010558776557445526, 0.00010808650404214859, 0.00011058524250984192, 0.00011308398097753525, 0.00011558271944522858, 0.0001180814579129219, 0.00012058019638061523]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 7.0, 6.0, 17.0, 27.0, 48.0, 75.0, 144.0, 243.0, 547.0, 1447.0, 6331.0, 85197.0, 866357.0, 79594.0, 6016.0, 1389.0, 542.0, 221.0, 135.0, 76.0, 48.0, 27.0, 20.0, 13.0, 9.0, 3.0, 3.0, 2.0, 5.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.26416015625, -0.2545509338378906, -0.24494171142578125, -0.23533248901367188, -0.2257232666015625, -0.21611404418945312, -0.20650482177734375, -0.19689559936523438, -0.187286376953125, -0.17767715454101562, -0.16806793212890625, -0.15845870971679688, -0.1488494873046875, -0.13924026489257812, -0.12963104248046875, -0.12002182006835938, -0.11041259765625, -0.10080337524414062, -0.09119415283203125, -0.08158493041992188, -0.0719757080078125, -0.062366485595703125, -0.05275726318359375, -0.043148040771484375, -0.033538818359375, -0.023929595947265625, -0.01432037353515625, -0.004711151123046875, 0.0048980712890625, 0.014507293701171875, 0.02411651611328125, 0.033725738525390625, 0.0433349609375, 0.052944183349609375, 0.06255340576171875, 0.07216262817382812, 0.0817718505859375, 0.09138107299804688, 0.10099029541015625, 0.11059951782226562, 0.120208740234375, 0.12981796264648438, 0.13942718505859375, 0.14903640747070312, 0.1586456298828125, 0.16825485229492188, 0.17786407470703125, 0.18747329711914062, 0.19708251953125, 0.20669174194335938, 0.21630096435546875, 0.22591018676757812, 0.2355194091796875, 0.24512863159179688, 0.25473785400390625, 0.2643470764160156, 0.273956298828125, 0.2835655212402344, 0.29317474365234375, 0.3027839660644531, 0.3123931884765625, 0.3220024108886719, 0.33161163330078125, 0.3412208557128906, 0.350830078125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 3.0, 5.0, 3.0, 14.0, 9.0, 11.0, 26.0, 32.0, 44.0, 70.0, 94.0, 118.0, 109.0, 114.0, 96.0, 61.0, 65.0, 48.0, 28.0, 23.0, 13.0, 9.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2388916015625, -0.2315826416015625, -0.224273681640625, -0.2169647216796875, -0.20965576171875, -0.2023468017578125, -0.195037841796875, -0.1877288818359375, -0.180419921875, -0.1731109619140625, -0.165802001953125, -0.1584930419921875, -0.15118408203125, -0.1438751220703125, -0.136566162109375, -0.1292572021484375, -0.1219482421875, -0.1146392822265625, -0.107330322265625, -0.1000213623046875, -0.09271240234375, -0.0854034423828125, -0.078094482421875, -0.0707855224609375, -0.0634765625, -0.0561676025390625, -0.048858642578125, -0.0415496826171875, -0.03424072265625, -0.0269317626953125, -0.019622802734375, -0.0123138427734375, -0.0050048828125, 0.0023040771484375, 0.009613037109375, 0.0169219970703125, 0.02423095703125, 0.0315399169921875, 0.038848876953125, 0.0461578369140625, 0.053466796875, 0.0607757568359375, 0.068084716796875, 0.0753936767578125, 0.08270263671875, 0.0900115966796875, 0.097320556640625, 0.1046295166015625, 0.1119384765625, 0.1192474365234375, 0.126556396484375, 0.1338653564453125, 0.14117431640625, 0.1484832763671875, 0.155792236328125, 0.1631011962890625, 0.17041015625, 0.1777191162109375, 0.185028076171875, 0.1923370361328125, 0.19964599609375, 0.2069549560546875, 0.214263916015625, 0.2215728759765625, 0.2288818359375]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 5.0, 14.0, 52.0, 140.0, 276.0, 273.0, 154.0, 62.0, 22.0, 4.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-9.45622444152832, -9.274282455444336, -9.092340469360352, -8.910398483276367, -8.728456497192383, -8.546514511108398, -8.364572525024414, -8.18263053894043, -8.000688552856445, -7.818746566772461, -7.636804580688477, -7.454862594604492, -7.272920608520508, -7.090978622436523, -6.909036636352539, -6.727094650268555, -6.545152187347412, -6.363210201263428, -6.181268215179443, -5.999326229095459, -5.817384243011475, -5.63544225692749, -5.453499794006348, -5.271557807922363, -5.089615821838379, -4.9076738357543945, -4.72573184967041, -4.543789863586426, -4.361847877502441, -4.179905891418457, -3.9979636669158936, -3.816021680831909, -3.634079933166504, -3.4521379470825195, -3.270195960998535, -3.088253974914551, -2.9063119888305664, -2.724370002746582, -2.5424277782440186, -2.360485792160034, -2.17854380607605, -1.9966018199920654, -1.814659833908081, -1.6327177286148071, -1.4507757425308228, -1.2688337564468384, -1.0868916511535645, -0.9049496650695801, -0.7230076789855957, -0.5410656929016113, -0.3591236472129822, -0.17718160152435303, 0.004760384559631348, 0.18670237064361572, 0.36864447593688965, 0.550586462020874, 0.7325284481048584, 0.9144704341888428, 1.0964124202728271, 1.278354525566101, 1.4602965116500854, 1.6422384977340698, 1.8241806030273438, 2.006122589111328, 2.1880645751953125]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 6.0, 2.0, 2.0, 1.0, 10.0, 3.0, 4.0, 11.0, 13.0, 17.0, 17.0, 20.0, 28.0, 36.0, 30.0, 35.0, 46.0, 46.0, 51.0, 56.0, 66.0, 65.0, 56.0, 54.0, 46.0, 52.0, 46.0, 27.0, 25.0, 22.0, 17.0, 24.0, 21.0, 13.0, 8.0, 9.0, 4.0, 6.0, 3.0, 8.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7098795175552368, -1.6386661529541016, -1.5674527883529663, -1.496239423751831, -1.4250260591506958, -1.3538126945495605, -1.2825993299484253, -1.21138596534729, -1.1401726007461548, -1.0689592361450195, -0.9977458715438843, -0.926532506942749, -0.8553191423416138, -0.7841057777404785, -0.7128924131393433, -0.641679048538208, -0.5704656839370728, -0.4992523193359375, -0.42803895473480225, -0.356825590133667, -0.28561222553253174, -0.21439886093139648, -0.14318549633026123, -0.07197213172912598, -0.0007587671279907227, 0.07045459747314453, 0.14166796207427979, 0.21288132667541504, 0.2840946912765503, 0.35530805587768555, 0.4265214204788208, 0.49773478507995605, 0.5689482688903809, 0.6401616334915161, 0.7113749980926514, 0.7825883626937866, 0.8538017272949219, 0.9250150918960571, 0.9962284564971924, 1.0674418210983276, 1.138655185699463, 1.2098685503005981, 1.2810819149017334, 1.3522952795028687, 1.423508644104004, 1.4947220087051392, 1.5659353733062744, 1.6371487379074097, 1.708362102508545, 1.7795754671096802, 1.8507888317108154, 1.9220021963119507, 1.993215560913086, 2.0644288063049316, 2.1356422901153564, 2.2068557739257812, 2.278069019317627, 2.3492822647094727, 2.4204957485198975, 2.4917092323303223, 2.562922477722168, 2.6341357231140137, 2.7053492069244385, 2.7765626907348633, 2.847775936126709]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 2.0, 7.0, 8.0, 19.0, 45.0, 62.0, 109.0, 200.0, 419.0, 1066.0, 3698.0, 22712.0, 3944382.0, 205414.0, 11972.0, 2554.0, 833.0, 374.0, 166.0, 105.0, 50.0, 29.0, 21.0, 8.0, 13.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.59765625, -0.5800018310546875, -0.562347412109375, -0.5446929931640625, -0.52703857421875, -0.5093841552734375, -0.491729736328125, -0.4740753173828125, -0.4564208984375, -0.4387664794921875, -0.421112060546875, -0.4034576416015625, -0.38580322265625, -0.3681488037109375, -0.350494384765625, -0.3328399658203125, -0.315185546875, -0.2975311279296875, -0.279876708984375, -0.2622222900390625, -0.24456787109375, -0.2269134521484375, -0.209259033203125, -0.1916046142578125, -0.1739501953125, -0.1562957763671875, -0.138641357421875, -0.1209869384765625, -0.10333251953125, -0.0856781005859375, -0.068023681640625, -0.0503692626953125, -0.03271484375, -0.0150604248046875, 0.002593994140625, 0.0202484130859375, 0.03790283203125, 0.0555572509765625, 0.073211669921875, 0.0908660888671875, 0.1085205078125, 0.1261749267578125, 0.143829345703125, 0.1614837646484375, 0.17913818359375, 0.1967926025390625, 0.214447021484375, 0.2321014404296875, 0.249755859375, 0.2674102783203125, 0.285064697265625, 0.3027191162109375, 0.32037353515625, 0.3380279541015625, 0.355682373046875, 0.3733367919921875, 0.3909912109375, 0.4086456298828125, 0.426300048828125, 0.4439544677734375, 0.46160888671875, 0.4792633056640625, 0.496917724609375, 0.5145721435546875, 0.5322265625]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 6.0, 5.0, 8.0, 6.0, 15.0, 14.0, 16.0, 31.0, 41.0, 40.0, 52.0, 68.0, 77.0, 69.0, 78.0, 82.0, 71.0, 62.0, 45.0, 42.0, 41.0, 45.0, 20.0, 16.0, 14.0, 11.0, 7.0, 6.0, 4.0, 4.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1376953125, -0.1325531005859375, -0.127410888671875, -0.1222686767578125, -0.11712646484375, -0.1119842529296875, -0.106842041015625, -0.1016998291015625, -0.0965576171875, -0.0914154052734375, -0.086273193359375, -0.0811309814453125, -0.07598876953125, -0.0708465576171875, -0.065704345703125, -0.0605621337890625, -0.055419921875, -0.0502777099609375, -0.045135498046875, -0.0399932861328125, -0.03485107421875, -0.0297088623046875, -0.024566650390625, -0.0194244384765625, -0.0142822265625, -0.0091400146484375, -0.003997802734375, 0.0011444091796875, 0.00628662109375, 0.0114288330078125, 0.016571044921875, 0.0217132568359375, 0.02685546875, 0.0319976806640625, 0.037139892578125, 0.0422821044921875, 0.04742431640625, 0.0525665283203125, 0.057708740234375, 0.0628509521484375, 0.0679931640625, 0.0731353759765625, 0.078277587890625, 0.0834197998046875, 0.08856201171875, 0.0937042236328125, 0.098846435546875, 0.1039886474609375, 0.109130859375, 0.1142730712890625, 0.119415283203125, 0.1245574951171875, 0.12969970703125, 0.1348419189453125, 0.139984130859375, 0.1451263427734375, 0.1502685546875, 0.1554107666015625, 0.160552978515625, 0.1656951904296875, 0.17083740234375, 0.1759796142578125, 0.181121826171875, 0.1862640380859375, 0.19140625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 3.0, 11.0, 16.0, 18.0, 30.0, 33.0, 62.0, 87.0, 122.0, 187.0, 328.0, 517.0, 973.0, 1843.0, 3672.0, 8527.0, 23566.0, 89257.0, 3416170.0, 549729.0, 66122.0, 18900.0, 7099.0, 3339.0, 1581.0, 864.0, 437.0, 305.0, 179.0, 97.0, 76.0, 50.0, 31.0, 16.0, 9.0, 9.0, 4.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.2340087890625, -0.22710609436035156, -0.22020339965820312, -0.2133007049560547, -0.20639801025390625, -0.1994953155517578, -0.19259262084960938, -0.18568992614746094, -0.1787872314453125, -0.17188453674316406, -0.16498184204101562, -0.1580791473388672, -0.15117645263671875, -0.1442737579345703, -0.13737106323242188, -0.13046836853027344, -0.123565673828125, -0.11666297912597656, -0.10976028442382812, -0.10285758972167969, -0.09595489501953125, -0.08905220031738281, -0.08214950561523438, -0.07524681091308594, -0.0683441162109375, -0.06144142150878906, -0.054538726806640625, -0.04763603210449219, -0.04073333740234375, -0.03383064270019531, -0.026927947998046875, -0.020025253295898438, -0.01312255859375, -0.0062198638916015625, 0.000682830810546875, 0.0075855255126953125, 0.01448822021484375, 0.021390914916992188, 0.028293609619140625, 0.03519630432128906, 0.0420989990234375, 0.04900169372558594, 0.055904388427734375, 0.06280708312988281, 0.06970977783203125, 0.07661247253417969, 0.08351516723632812, 0.09041786193847656, 0.097320556640625, 0.10422325134277344, 0.11112594604492188, 0.11802864074707031, 0.12493133544921875, 0.1318340301513672, 0.13873672485351562, 0.14563941955566406, 0.1525421142578125, 0.15944480895996094, 0.16634750366210938, 0.1732501983642578, 0.18015289306640625, 0.1870555877685547, 0.19395828247070312, 0.20086097717285156, 0.207763671875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 1.0, 4.0, 11.0, 12.0, 21.0, 24.0, 33.0, 58.0, 124.0, 252.0, 2854.0, 352.0, 124.0, 87.0, 37.0, 26.0, 17.0, 11.0, 9.0, 5.0, 9.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.09454345703125, -0.09227180480957031, -0.09000015258789062, -0.08772850036621094, -0.08545684814453125, -0.08318519592285156, -0.08091354370117188, -0.07864189147949219, -0.0763702392578125, -0.07409858703613281, -0.07182693481445312, -0.06955528259277344, -0.06728363037109375, -0.06501197814941406, -0.06274032592773438, -0.06046867370605469, -0.058197021484375, -0.05592536926269531, -0.053653717041015625, -0.05138206481933594, -0.04911041259765625, -0.04683876037597656, -0.044567108154296875, -0.04229545593261719, -0.0400238037109375, -0.03775215148925781, -0.035480499267578125, -0.03320884704589844, -0.03093719482421875, -0.028665542602539062, -0.026393890380859375, -0.024122238159179688, -0.0218505859375, -0.019578933715820312, -0.017307281494140625, -0.015035629272460938, -0.01276397705078125, -0.010492324829101562, -0.008220672607421875, -0.0059490203857421875, -0.0036773681640625, -0.0014057159423828125, 0.000865936279296875, 0.0031375885009765625, 0.00540924072265625, 0.0076808929443359375, 0.009952545166015625, 0.012224197387695312, 0.014495849609375, 0.016767501831054688, 0.019039154052734375, 0.021310806274414062, 0.02358245849609375, 0.025854110717773438, 0.028125762939453125, 0.030397415161132812, 0.0326690673828125, 0.03494071960449219, 0.037212371826171875, 0.03948402404785156, 0.04175567626953125, 0.04402732849121094, 0.046298980712890625, 0.04857063293457031, 0.05084228515625]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 5.0, 15.0, 19.0, 24.0, 32.0, 57.0, 86.0, 91.0, 130.0, 109.0, 103.0, 91.0, 81.0, 64.0, 29.0, 31.0, 11.0, 7.0, 3.0, 1.0, 1.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.23041397333145142, -0.22208306193351746, -0.2137521505355835, -0.20542123913764954, -0.19709032773971558, -0.18875941634178162, -0.18042851984500885, -0.1720976084470749, -0.16376669704914093, -0.15543578565120697, -0.147104874253273, -0.13877396285533905, -0.13044306635856628, -0.12211214751005173, -0.11378124356269836, -0.1054503321647644, -0.09711942076683044, -0.08878850936889648, -0.08045759797096252, -0.07212669402360916, -0.0637957826256752, -0.05546487122774124, -0.04713396355509758, -0.03880305588245392, -0.03047214448451996, -0.022141234949231148, -0.013810325413942337, -0.005479415878653526, 0.0028514936566352844, 0.011182405054569244, 0.019513312727212906, 0.027844220399856567, 0.036175161600112915, 0.044506072998046875, 0.052836980670690536, 0.0611678883433342, 0.06949879974126816, 0.07782971113920212, 0.08616061508655548, 0.09449152648448944, 0.1028224378824234, 0.11115334928035736, 0.11948426067829132, 0.12781517207622528, 0.13614606857299805, 0.144476979970932, 0.15280789136886597, 0.16113880276679993, 0.1694697141647339, 0.17780062556266785, 0.1861315369606018, 0.19446244835853577, 0.20279335975646973, 0.2111242711544037, 0.21945516765117645, 0.2277860790491104, 0.23611699044704437, 0.24444790184497833, 0.2527787983417511, 0.26110970973968506, 0.269440621137619, 0.277771532535553, 0.28610244393348694, 0.2944333553314209, 0.30276426672935486]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 4.0, 8.0, 12.0, 7.0, 9.0, 22.0, 20.0, 14.0, 28.0, 27.0, 29.0, 36.0, 34.0, 36.0, 32.0, 42.0, 42.0, 43.0, 39.0, 47.0, 39.0, 33.0, 47.0, 37.0, 38.0, 26.0, 37.0, 27.0, 18.0, 28.0, 22.0, 20.0, 13.0, 13.0, 10.0, 7.0, 11.0, 5.0, 11.0, 10.0, 2.0, 3.0, 3.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1151648759841919, -0.11126790195703506, -0.10737093538045883, -0.103473961353302, -0.09957699477672577, -0.09568002074956894, -0.09178304672241211, -0.08788608014583588, -0.08398910611867905, -0.08009213209152222, -0.07619516551494598, -0.07229819148778915, -0.06840121746063232, -0.06450425088405609, -0.06060727685689926, -0.05671030655503273, -0.0528133362531662, -0.04891636595129967, -0.045019395649433136, -0.041122421622276306, -0.037225451320409775, -0.03332848101854324, -0.029431508854031563, -0.025534536689519882, -0.02163756638765335, -0.01774059608578682, -0.013843623921275139, -0.009946652688086033, -0.006049681454896927, -0.0021527111530303955, 0.001744261011481285, 0.005641233175992966, 0.009538203477859497, 0.013435174711048603, 0.01733214594423771, 0.02122911810874939, 0.02512608841061592, 0.029023058712482452, 0.03292003273963928, 0.036817003041505814, 0.040713973343372345, 0.044610943645238876, 0.04850791394710541, 0.05240488797426224, 0.05630185827612877, 0.0601988285779953, 0.06409580260515213, 0.06799277663230896, 0.07188974320888519, 0.07578671723604202, 0.07968368381261826, 0.08358065783977509, 0.08747762441635132, 0.09137459844350815, 0.09527157247066498, 0.09916853904724121, 0.10306551307439804, 0.10696248710155487, 0.1108594536781311, 0.11475642770528793, 0.11865340173244476, 0.122550368309021, 0.12644733488559723, 0.13034431636333466, 0.1342412829399109]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 6.0, 7.0, 8.0, 13.0, 35.0, 45.0, 73.0, 84.0, 144.0, 256.0, 476.0, 1096.0, 2508.0, 7595.0, 31130.0, 170640.0, 544946.0, 232152.0, 42187.0, 9501.0, 3067.0, 1243.0, 582.0, 287.0, 173.0, 84.0, 71.0, 43.0, 29.0, 22.0, 14.0, 10.0, 5.0, 4.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2271728515625, -0.2186298370361328, -0.21008682250976562, -0.20154380798339844, -0.19300079345703125, -0.18445777893066406, -0.17591476440429688, -0.1673717498779297, -0.1588287353515625, -0.1502857208251953, -0.14174270629882812, -0.13319969177246094, -0.12465667724609375, -0.11611366271972656, -0.10757064819335938, -0.09902763366699219, -0.090484619140625, -0.08194160461425781, -0.07339859008789062, -0.06485557556152344, -0.05631256103515625, -0.04776954650878906, -0.039226531982421875, -0.030683517456054688, -0.0221405029296875, -0.013597488403320312, -0.005054473876953125, 0.0034885406494140625, 0.01203155517578125, 0.020574569702148438, 0.029117584228515625, 0.03766059875488281, 0.04620361328125, 0.05474662780761719, 0.06328964233398438, 0.07183265686035156, 0.08037567138671875, 0.08891868591308594, 0.09746170043945312, 0.10600471496582031, 0.1145477294921875, 0.12309074401855469, 0.13163375854492188, 0.14017677307128906, 0.14871978759765625, 0.15726280212402344, 0.16580581665039062, 0.1743488311767578, 0.182891845703125, 0.1914348602294922, 0.19997787475585938, 0.20852088928222656, 0.21706390380859375, 0.22560691833496094, 0.23414993286132812, 0.2426929473876953, 0.2512359619140625, 0.2597789764404297, 0.2683219909667969, 0.27686500549316406, 0.28540802001953125, 0.29395103454589844, 0.3024940490722656, 0.3110370635986328, 0.319580078125]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 2.0, 10.0, 7.0, 7.0, 7.0, 10.0, 13.0, 25.0, 28.0, 43.0, 36.0, 62.0, 65.0, 69.0, 75.0, 60.0, 80.0, 73.0, 59.0, 42.0, 46.0, 39.0, 39.0, 26.0, 22.0, 17.0, 7.0, 9.0, 4.0, 6.0, 4.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1307373046875, -0.1258392333984375, -0.120941162109375, -0.1160430908203125, -0.11114501953125, -0.1062469482421875, -0.101348876953125, -0.0964508056640625, -0.091552734375, -0.0866546630859375, -0.081756591796875, -0.0768585205078125, -0.07196044921875, -0.0670623779296875, -0.062164306640625, -0.0572662353515625, -0.0523681640625, -0.0474700927734375, -0.042572021484375, -0.0376739501953125, -0.03277587890625, -0.0278778076171875, -0.022979736328125, -0.0180816650390625, -0.01318359375, -0.0082855224609375, -0.003387451171875, 0.0015106201171875, 0.00640869140625, 0.0113067626953125, 0.016204833984375, 0.0211029052734375, 0.0260009765625, 0.0308990478515625, 0.035797119140625, 0.0406951904296875, 0.04559326171875, 0.0504913330078125, 0.055389404296875, 0.0602874755859375, 0.065185546875, 0.0700836181640625, 0.074981689453125, 0.0798797607421875, 0.08477783203125, 0.0896759033203125, 0.094573974609375, 0.0994720458984375, 0.1043701171875, 0.1092681884765625, 0.114166259765625, 0.1190643310546875, 0.12396240234375, 0.1288604736328125, 0.133758544921875, 0.1386566162109375, 0.1435546875, 0.1484527587890625, 0.153350830078125, 0.1582489013671875, 0.16314697265625, 0.1680450439453125, 0.172943115234375, 0.1778411865234375, 0.1827392578125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 7.0, 7.0, 10.0, 16.0, 11.0, 24.0, 22.0, 42.0, 69.0, 130.0, 242.0, 404.0, 833.0, 2429.0, 15780.0, 504129.0, 504781.0, 15519.0, 2309.0, 814.0, 401.0, 201.0, 121.0, 83.0, 54.0, 36.0, 35.0, 13.0, 10.0, 5.0, 7.0, 5.0, 5.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.50439453125, -0.4886322021484375, -0.472869873046875, -0.4571075439453125, -0.44134521484375, -0.4255828857421875, -0.409820556640625, -0.3940582275390625, -0.3782958984375, -0.3625335693359375, -0.346771240234375, -0.3310089111328125, -0.31524658203125, -0.2994842529296875, -0.283721923828125, -0.2679595947265625, -0.252197265625, -0.2364349365234375, -0.220672607421875, -0.2049102783203125, -0.18914794921875, -0.1733856201171875, -0.157623291015625, -0.1418609619140625, -0.1260986328125, -0.1103363037109375, -0.094573974609375, -0.0788116455078125, -0.06304931640625, -0.0472869873046875, -0.031524658203125, -0.0157623291015625, 0.0, 0.0157623291015625, 0.031524658203125, 0.0472869873046875, 0.06304931640625, 0.0788116455078125, 0.094573974609375, 0.1103363037109375, 0.1260986328125, 0.1418609619140625, 0.157623291015625, 0.1733856201171875, 0.18914794921875, 0.2049102783203125, 0.220672607421875, 0.2364349365234375, 0.252197265625, 0.2679595947265625, 0.283721923828125, 0.2994842529296875, 0.31524658203125, 0.3310089111328125, 0.346771240234375, 0.3625335693359375, 0.3782958984375, 0.3940582275390625, 0.409820556640625, 0.4255828857421875, 0.44134521484375, 0.4571075439453125, 0.472869873046875, 0.4886322021484375, 0.50439453125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 5.0, 14.0, 15.0, 11.0, 16.0, 16.0, 31.0, 30.0, 36.0, 36.0, 41.0, 43.0, 47.0, 48.0, 42.0, 58.0, 68.0, 55.0, 57.0, 53.0, 46.0, 39.0, 41.0, 35.0, 24.0, 17.0, 16.0, 20.0, 11.0, 11.0, 8.0, 2.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.423583984375, -0.4073448181152344, -0.39110565185546875, -0.3748664855957031, -0.3586273193359375, -0.3423881530761719, -0.32614898681640625, -0.3099098205566406, -0.293670654296875, -0.2774314880371094, -0.26119232177734375, -0.24495315551757812, -0.2287139892578125, -0.21247482299804688, -0.19623565673828125, -0.17999649047851562, -0.16375732421875, -0.14751815795898438, -0.13127899169921875, -0.11503982543945312, -0.0988006591796875, -0.08256149291992188, -0.06632232666015625, -0.050083160400390625, -0.033843994140625, -0.017604827880859375, -0.00136566162109375, 0.014873504638671875, 0.0311126708984375, 0.047351837158203125, 0.06359100341796875, 0.07983016967773438, 0.0960693359375, 0.11230850219726562, 0.12854766845703125, 0.14478683471679688, 0.1610260009765625, 0.17726516723632812, 0.19350433349609375, 0.20974349975585938, 0.225982666015625, 0.24222183227539062, 0.25846099853515625, 0.2747001647949219, 0.2909393310546875, 0.3071784973144531, 0.32341766357421875, 0.3396568298339844, 0.35589599609375, 0.3721351623535156, 0.38837432861328125, 0.4046134948730469, 0.4208526611328125, 0.4370918273925781, 0.45333099365234375, 0.4695701599121094, 0.485809326171875, 0.5020484924316406, 0.5182876586914062, 0.5345268249511719, 0.5507659912109375, 0.5670051574707031, 0.5832443237304688, 0.5994834899902344, 0.61572265625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 3.0, 2.0, 8.0, 21.0, 23.0, 34.0, 47.0, 65.0, 122.0, 210.0, 467.0, 1272.0, 5610.0, 89865.0, 890815.0, 53547.0, 4308.0, 1112.0, 467.0, 210.0, 131.0, 71.0, 56.0, 22.0, 23.0, 14.0, 7.0, 5.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.213134765625, -0.20507049560546875, -0.1970062255859375, -0.18894195556640625, -0.180877685546875, -0.17281341552734375, -0.1647491455078125, -0.15668487548828125, -0.14862060546875, -0.14055633544921875, -0.1324920654296875, -0.12442779541015625, -0.116363525390625, -0.10829925537109375, -0.1002349853515625, -0.09217071533203125, -0.0841064453125, -0.07604217529296875, -0.0679779052734375, -0.05991363525390625, -0.051849365234375, -0.04378509521484375, -0.0357208251953125, -0.02765655517578125, -0.01959228515625, -0.01152801513671875, -0.0034637451171875, 0.00460052490234375, 0.012664794921875, 0.02072906494140625, 0.0287933349609375, 0.03685760498046875, 0.044921875, 0.05298614501953125, 0.0610504150390625, 0.06911468505859375, 0.077178955078125, 0.08524322509765625, 0.0933074951171875, 0.10137176513671875, 0.10943603515625, 0.11750030517578125, 0.1255645751953125, 0.13362884521484375, 0.141693115234375, 0.14975738525390625, 0.1578216552734375, 0.16588592529296875, 0.1739501953125, 0.18201446533203125, 0.1900787353515625, 0.19814300537109375, 0.206207275390625, 0.21427154541015625, 0.2223358154296875, 0.23040008544921875, 0.23846435546875, 0.24652862548828125, 0.2545928955078125, 0.26265716552734375, 0.270721435546875, 0.27878570556640625, 0.2868499755859375, 0.29491424560546875, 0.302978515625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 4.0, 12.0, 13.0, 11.0, 21.0, 25.0, 34.0, 44.0, 56.0, 81.0, 89.0, 88.0, 86.0, 85.0, 72.0, 70.0, 53.0, 41.0, 34.0, 26.0, 17.0, 12.0, 5.0, 10.0, 4.0, 2.0, 1.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2438507080078125e-05, -4.0940940380096436e-05, -3.9443373680114746e-05, -3.794580698013306e-05, -3.644824028015137e-05, -3.495067358016968e-05, -3.345310688018799e-05, -3.19555401802063e-05, -3.045797348022461e-05, -2.896040678024292e-05, -2.746284008026123e-05, -2.596527338027954e-05, -2.446770668029785e-05, -2.2970139980316162e-05, -2.1472573280334473e-05, -1.9975006580352783e-05, -1.8477439880371094e-05, -1.6979873180389404e-05, -1.5482306480407715e-05, -1.3984739780426025e-05, -1.2487173080444336e-05, -1.0989606380462646e-05, -9.492039680480957e-06, -7.994472980499268e-06, -6.496906280517578e-06, -4.999339580535889e-06, -3.5017728805541992e-06, -2.0042061805725098e-06, -5.066394805908203e-07, 9.909272193908691e-07, 2.4884939193725586e-06, 3.986060619354248e-06, 5.4836273193359375e-06, 6.981194019317627e-06, 8.478760719299316e-06, 9.976327419281006e-06, 1.1473894119262695e-05, 1.2971460819244385e-05, 1.4469027519226074e-05, 1.5966594219207764e-05, 1.7464160919189453e-05, 1.8961727619171143e-05, 2.0459294319152832e-05, 2.195686101913452e-05, 2.345442771911621e-05, 2.49519944190979e-05, 2.644956111907959e-05, 2.794712781906128e-05, 2.944469451904297e-05, 3.094226121902466e-05, 3.243982791900635e-05, 3.393739461898804e-05, 3.5434961318969727e-05, 3.6932528018951416e-05, 3.8430094718933105e-05, 3.9927661418914795e-05, 4.1425228118896484e-05, 4.2922794818878174e-05, 4.442036151885986e-05, 4.591792821884155e-05, 4.741549491882324e-05, 4.891306161880493e-05, 5.041062831878662e-05, 5.190819501876831e-05, 5.340576171875e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 5.0, 11.0, 14.0, 34.0, 45.0, 82.0, 141.0, 296.0, 689.0, 1821.0, 8085.0, 117706.0, 845522.0, 65383.0, 5954.0, 1552.0, 621.0, 273.0, 139.0, 66.0, 39.0, 20.0, 17.0, 11.0, 9.0, 5.0, 8.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.26123046875, -0.25363922119140625, -0.2460479736328125, -0.23845672607421875, -0.230865478515625, -0.22327423095703125, -0.2156829833984375, -0.20809173583984375, -0.20050048828125, -0.19290924072265625, -0.1853179931640625, -0.17772674560546875, -0.170135498046875, -0.16254425048828125, -0.1549530029296875, -0.14736175537109375, -0.1397705078125, -0.13217926025390625, -0.1245880126953125, -0.11699676513671875, -0.109405517578125, -0.10181427001953125, -0.0942230224609375, -0.08663177490234375, -0.07904052734375, -0.07144927978515625, -0.0638580322265625, -0.05626678466796875, -0.048675537109375, -0.04108428955078125, -0.0334930419921875, -0.02590179443359375, -0.018310546875, -0.01071929931640625, -0.0031280517578125, 0.00446319580078125, 0.012054443359375, 0.01964569091796875, 0.0272369384765625, 0.03482818603515625, 0.04241943359375, 0.05001068115234375, 0.0576019287109375, 0.06519317626953125, 0.072784423828125, 0.08037567138671875, 0.0879669189453125, 0.09555816650390625, 0.1031494140625, 0.11074066162109375, 0.1183319091796875, 0.12592315673828125, 0.133514404296875, 0.14110565185546875, 0.1486968994140625, 0.15628814697265625, 0.16387939453125, 0.17147064208984375, 0.1790618896484375, 0.18665313720703125, 0.194244384765625, 0.20183563232421875, 0.2094268798828125, 0.21701812744140625, 0.224609375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 8.0, 10.0, 16.0, 39.0, 36.0, 57.0, 93.0, 80.0, 123.0, 132.0, 106.0, 89.0, 77.0, 38.0, 32.0, 24.0, 16.0, 9.0, 3.0, 9.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2061767578125, -0.19938278198242188, -0.19258880615234375, -0.18579483032226562, -0.1790008544921875, -0.17220687866210938, -0.16541290283203125, -0.15861892700195312, -0.151824951171875, -0.14503097534179688, -0.13823699951171875, -0.13144302368164062, -0.1246490478515625, -0.11785507202148438, -0.11106109619140625, -0.10426712036132812, -0.09747314453125, -0.09067916870117188, -0.08388519287109375, -0.07709121704101562, -0.0702972412109375, -0.06350326538085938, -0.05670928955078125, -0.049915313720703125, -0.043121337890625, -0.036327362060546875, -0.02953338623046875, -0.022739410400390625, -0.0159454345703125, -0.009151458740234375, -0.00235748291015625, 0.004436492919921875, 0.01123046875, 0.018024444580078125, 0.02481842041015625, 0.031612396240234375, 0.0384063720703125, 0.045200347900390625, 0.05199432373046875, 0.058788299560546875, 0.065582275390625, 0.07237625122070312, 0.07917022705078125, 0.08596420288085938, 0.0927581787109375, 0.09955215454101562, 0.10634613037109375, 0.11314010620117188, 0.11993408203125, 0.12672805786132812, 0.13352203369140625, 0.14031600952148438, 0.1471099853515625, 0.15390396118164062, 0.16069793701171875, 0.16749191284179688, 0.174285888671875, 0.18107986450195312, 0.18787384033203125, 0.19466781616210938, 0.2014617919921875, 0.20825576782226562, 0.21504974365234375, 0.22184371948242188, 0.2286376953125]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 8.0, 4.0, 9.0, 20.0, 64.0, 124.0, 208.0, 228.0, 183.0, 87.0, 41.0, 18.0, 9.0, 3.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.8693244457244873, -3.755748748779297, -3.6421730518341064, -3.528597354888916, -3.4150216579437256, -3.301445960998535, -3.187870502471924, -3.0742945671081543, -2.960719108581543, -2.8471434116363525, -2.733567714691162, -2.6199920177459717, -2.5064163208007812, -2.392840623855591, -2.2792649269104004, -2.165689468383789, -2.0521135330200195, -1.938537836074829, -1.8249621391296387, -1.7113864421844482, -1.5978107452392578, -1.4842350482940674, -1.3706594705581665, -1.257083773612976, -1.1435080766677856, -1.0299323797225952, -0.9163566827774048, -0.8027810454368591, -0.6892053484916687, -0.5756296515464783, -0.4620540142059326, -0.3484783172607422, -0.23490262031555176, -0.12132693827152252, -0.007751256227493286, 0.10582441091537476, 0.21940010786056519, 0.3329758048057556, 0.44655144214630127, 0.5601271390914917, 0.6737028360366821, 0.7872785329818726, 0.900854229927063, 1.0144298076629639, 1.1280055046081543, 1.2415812015533447, 1.3551568984985352, 1.4687325954437256, 1.582308292388916, 1.6958839893341064, 1.8094596862792969, 1.9230353832244873, 2.0366110801696777, 2.150186777114868, 2.2637624740600586, 2.37733793258667, 2.4909138679504395, 2.60448956489563, 2.7180652618408203, 2.8316409587860107, 2.945216655731201, 3.0587923526763916, 3.172368049621582, 3.2859435081481934, 3.399519205093384]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 6.0, 8.0, 12.0, 6.0, 13.0, 15.0, 23.0, 23.0, 31.0, 22.0, 38.0, 38.0, 47.0, 44.0, 45.0, 56.0, 48.0, 58.0, 58.0, 57.0, 51.0, 40.0, 40.0, 43.0, 34.0, 28.0, 20.0, 26.0, 20.0, 19.0, 10.0, 8.0, 4.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.0460784435272217, -1.9790561199188232, -1.9120337963104248, -1.845011591911316, -1.7779892683029175, -1.710966944694519, -1.6439447402954102, -1.5769224166870117, -1.5099000930786133, -1.4428777694702148, -1.3758554458618164, -1.3088332414627075, -1.241810917854309, -1.1747885942459106, -1.1077663898468018, -1.0407440662384033, -0.9737217426300049, -0.9066994190216064, -0.8396771550178528, -0.7726548910140991, -0.7056325674057007, -0.6386102437973022, -0.5715879797935486, -0.5045657157897949, -0.4375433921813965, -0.37052109837532043, -0.3034988045692444, -0.23647651076316833, -0.16945421695709229, -0.10243192315101624, -0.035409629344940186, 0.031612664461135864, 0.09863471984863281, 0.16565701365470886, 0.2326793074607849, 0.29970160126686096, 0.366723895072937, 0.43374618887901306, 0.5007684826850891, 0.5677907466888428, 0.6348130702972412, 0.7018353939056396, 0.7688576579093933, 0.835879921913147, 0.9029022455215454, 0.9699245691299438, 1.0369467735290527, 1.1039690971374512, 1.1709914207458496, 1.238013744354248, 1.3050360679626465, 1.3720582723617554, 1.4390805959701538, 1.5061029195785522, 1.5731251239776611, 1.6401474475860596, 1.707169771194458, 1.7741920948028564, 1.8412144184112549, 1.9082366228103638, 1.9752589464187622, 2.042281150817871, 2.1093034744262695, 2.176325798034668, 2.2433481216430664]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 5.0, 6.0, 12.0, 10.0, 9.0, 16.0, 24.0, 38.0, 45.0, 72.0, 133.0, 195.0, 479.0, 996.0, 2569.0, 8085.0, 38062.0, 603813.0, 3470764.0, 53146.0, 10246.0, 3132.0, 1189.0, 571.0, 268.0, 136.0, 95.0, 47.0, 27.0, 26.0, 15.0, 13.0, 7.0, 6.0, 3.0, 8.0, 3.0, 8.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2073974609375, -0.19800758361816406, -0.18861770629882812, -0.1792278289794922, -0.16983795166015625, -0.1604480743408203, -0.15105819702148438, -0.14166831970214844, -0.1322784423828125, -0.12288856506347656, -0.11349868774414062, -0.10410881042480469, -0.09471893310546875, -0.08532905578613281, -0.07593917846679688, -0.06654930114746094, -0.057159423828125, -0.04776954650878906, -0.038379669189453125, -0.028989791870117188, -0.01959991455078125, -0.010210037231445312, -0.000820159912109375, 0.008569717407226562, 0.0179595947265625, 0.027349472045898438, 0.036739349365234375, 0.04612922668457031, 0.05551910400390625, 0.06490898132324219, 0.07429885864257812, 0.08368873596191406, 0.09307861328125, 0.10246849060058594, 0.11185836791992188, 0.12124824523925781, 0.13063812255859375, 0.1400279998779297, 0.14941787719726562, 0.15880775451660156, 0.1681976318359375, 0.17758750915527344, 0.18697738647460938, 0.1963672637939453, 0.20575714111328125, 0.2151470184326172, 0.22453689575195312, 0.23392677307128906, 0.243316650390625, 0.25270652770996094, 0.2620964050292969, 0.2714862823486328, 0.28087615966796875, 0.2902660369873047, 0.2996559143066406, 0.30904579162597656, 0.3184356689453125, 0.32782554626464844, 0.3372154235839844, 0.3466053009033203, 0.35599517822265625, 0.3653850555419922, 0.3747749328613281, 0.38416481018066406, 0.3935546875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 4.0, 3.0, 9.0, 7.0, 8.0, 15.0, 18.0, 27.0, 34.0, 41.0, 55.0, 70.0, 60.0, 70.0, 65.0, 64.0, 57.0, 75.0, 66.0, 39.0, 41.0, 34.0, 48.0, 17.0, 17.0, 14.0, 10.0, 9.0, 7.0, 5.0, 3.0, 5.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.154296875, -0.1498088836669922, -0.14532089233398438, -0.14083290100097656, -0.13634490966796875, -0.13185691833496094, -0.12736892700195312, -0.12288093566894531, -0.1183929443359375, -0.11390495300292969, -0.10941696166992188, -0.10492897033691406, -0.10044097900390625, -0.09595298767089844, -0.09146499633789062, -0.08697700500488281, -0.082489013671875, -0.07800102233886719, -0.07351303100585938, -0.06902503967285156, -0.06453704833984375, -0.06004905700683594, -0.055561065673828125, -0.05107307434082031, -0.0465850830078125, -0.04209709167480469, -0.037609100341796875, -0.03312110900878906, -0.02863311767578125, -0.024145126342773438, -0.019657135009765625, -0.015169143676757812, -0.01068115234375, -0.0061931610107421875, -0.001705169677734375, 0.0027828216552734375, 0.00727081298828125, 0.011758804321289062, 0.016246795654296875, 0.020734786987304688, 0.0252227783203125, 0.029710769653320312, 0.034198760986328125, 0.03868675231933594, 0.04317474365234375, 0.04766273498535156, 0.052150726318359375, 0.05663871765136719, 0.061126708984375, 0.06561470031738281, 0.07010269165039062, 0.07459068298339844, 0.07907867431640625, 0.08356666564941406, 0.08805465698242188, 0.09254264831542969, 0.0970306396484375, 0.10151863098144531, 0.10600662231445312, 0.11049461364746094, 0.11498260498046875, 0.11947059631347656, 0.12395858764648438, 0.1284465789794922, 0.1329345703125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 10.0, 10.0, 14.0, 22.0, 26.0, 30.0, 45.0, 56.0, 96.0, 153.0, 233.0, 409.0, 585.0, 1012.0, 1710.0, 3198.0, 5990.0, 12294.0, 28938.0, 83848.0, 397545.0, 3253454.0, 287270.0, 69228.0, 24811.0, 10856.0, 5340.0, 2869.0, 1649.0, 900.0, 576.0, 354.0, 257.0, 145.0, 105.0, 65.0, 57.0, 39.0, 25.0, 18.0, 12.0, 11.0, 6.0, 4.0, 3.0, 1.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1317138671875, -0.12752151489257812, -0.12332916259765625, -0.11913681030273438, -0.1149444580078125, -0.11075210571289062, -0.10655975341796875, -0.10236740112304688, -0.098175048828125, -0.09398269653320312, -0.08979034423828125, -0.08559799194335938, -0.0814056396484375, -0.07721328735351562, -0.07302093505859375, -0.06882858276367188, -0.06463623046875, -0.060443878173828125, -0.05625152587890625, -0.052059173583984375, -0.0478668212890625, -0.043674468994140625, -0.03948211669921875, -0.035289764404296875, -0.031097412109375, -0.026905059814453125, -0.02271270751953125, -0.018520355224609375, -0.0143280029296875, -0.010135650634765625, -0.00594329833984375, -0.001750946044921875, 0.00244140625, 0.006633758544921875, 0.01082611083984375, 0.015018463134765625, 0.0192108154296875, 0.023403167724609375, 0.02759552001953125, 0.031787872314453125, 0.035980224609375, 0.040172576904296875, 0.04436492919921875, 0.048557281494140625, 0.0527496337890625, 0.056941986083984375, 0.06113433837890625, 0.06532669067382812, 0.06951904296875, 0.07371139526367188, 0.07790374755859375, 0.08209609985351562, 0.0862884521484375, 0.09048080444335938, 0.09467315673828125, 0.09886550903320312, 0.103057861328125, 0.10725021362304688, 0.11144256591796875, 0.11563491821289062, 0.1198272705078125, 0.12401962280273438, 0.12821197509765625, 0.13240432739257812, 0.1365966796875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 2.0, 6.0, 2.0, 9.0, 7.0, 12.0, 9.0, 16.0, 19.0, 24.0, 32.0, 45.0, 74.0, 104.0, 157.0, 331.0, 1500.0, 922.0, 311.0, 154.0, 87.0, 74.0, 42.0, 35.0, 19.0, 15.0, 10.0, 11.0, 13.0, 6.0, 3.0, 5.0, 5.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05926513671875, -0.05697822570800781, -0.054691314697265625, -0.05240440368652344, -0.05011749267578125, -0.04783058166503906, -0.045543670654296875, -0.04325675964355469, -0.0409698486328125, -0.03868293762207031, -0.036396026611328125, -0.03410911560058594, -0.03182220458984375, -0.029535293579101562, -0.027248382568359375, -0.024961471557617188, -0.022674560546875, -0.020387649536132812, -0.018100738525390625, -0.015813827514648438, -0.01352691650390625, -0.011240005493164062, -0.008953094482421875, -0.0066661834716796875, -0.0043792724609375, -0.0020923614501953125, 0.000194549560546875, 0.0024814605712890625, 0.00476837158203125, 0.0070552825927734375, 0.009342193603515625, 0.011629104614257812, 0.013916015625, 0.016202926635742188, 0.018489837646484375, 0.020776748657226562, 0.02306365966796875, 0.025350570678710938, 0.027637481689453125, 0.029924392700195312, 0.0322113037109375, 0.03449821472167969, 0.036785125732421875, 0.03907203674316406, 0.04135894775390625, 0.04364585876464844, 0.045932769775390625, 0.04821968078613281, 0.050506591796875, 0.05279350280761719, 0.055080413818359375, 0.05736732482910156, 0.05965423583984375, 0.06194114685058594, 0.06422805786132812, 0.06651496887207031, 0.0688018798828125, 0.07108879089355469, 0.07337570190429688, 0.07566261291503906, 0.07794952392578125, 0.08023643493652344, 0.08252334594726562, 0.08481025695800781, 0.08709716796875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 6.0, 2.0, 2.0, 8.0, 14.0, 36.0, 50.0, 101.0, 151.0, 164.0, 138.0, 122.0, 89.0, 44.0, 26.0, 19.0, 10.0, 8.0, 6.0, 3.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3507859706878662, -0.33178627490997314, -0.3127865791320801, -0.293786883354187, -0.27478715777397156, -0.2557874619960785, -0.23678776621818542, -0.21778805553913116, -0.1987883597612381, -0.17978866398334503, -0.16078895330429077, -0.1417892575263977, -0.12278955429792404, -0.10378985106945038, -0.08479015529155731, -0.06579044461250305, -0.046790748834609985, -0.02779104746878147, -0.008791346102952957, 0.010208353400230408, 0.02920805662870407, 0.048207759857177734, 0.0672074556350708, 0.08620716631412506, 0.10520686209201813, 0.12420656532049179, 0.14320626854896545, 0.16220596432685852, 0.1812056601047516, 0.20020537078380585, 0.2192050665616989, 0.23820477724075317, 0.25720447301864624, 0.2762041687965393, 0.2952038645744324, 0.31420356035232544, 0.3332032859325409, 0.35220298171043396, 0.371202677488327, 0.3902024030685425, 0.40920209884643555, 0.4282017946243286, 0.4472014904022217, 0.46620118618011475, 0.4852009117603302, 0.5042005777359009, 0.523200273513794, 0.5422000288963318, 0.5611996650695801, 0.5801993608474731, 0.5991990566253662, 0.6181987524032593, 0.6371984481811523, 0.6561981439590454, 0.6751978397369385, 0.6941975951194763, 0.7131972908973694, 0.7321969866752625, 0.7511966824531555, 0.7701963782310486, 0.7891960740089417, 0.8081958293914795, 0.8271955251693726, 0.8461952209472656, 0.8651949167251587]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 9.0, 4.0, 2.0, 5.0, 8.0, 5.0, 10.0, 14.0, 14.0, 12.0, 10.0, 16.0, 19.0, 24.0, 25.0, 26.0, 31.0, 32.0, 25.0, 34.0, 30.0, 50.0, 34.0, 35.0, 37.0, 39.0, 35.0, 40.0, 41.0, 33.0, 37.0, 40.0, 38.0, 28.0, 23.0, 16.0, 27.0, 14.0, 15.0, 8.0, 12.0, 10.0, 9.0, 9.0, 5.0, 2.0, 3.0, 5.0, 2.0, 2.0, 1.0, 4.0, 5.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.25023192167282104, -0.24231058359146118, -0.23438923060894012, -0.22646789252758026, -0.2185465395450592, -0.21062520146369934, -0.20270386338233948, -0.19478252530097961, -0.18686117231845856, -0.1789398342370987, -0.17101848125457764, -0.16309714317321777, -0.1551758050918579, -0.14725445210933685, -0.139333114027977, -0.13141176104545593, -0.12349042296409607, -0.11556907743215561, -0.10764773190021515, -0.09972639381885529, -0.09180504828691483, -0.08388370275497437, -0.0759623646736145, -0.06804101914167404, -0.06011967360973358, -0.05219832807779312, -0.04427698627114296, -0.0363556444644928, -0.028434298932552338, -0.020512953400611877, -0.012591611593961716, -0.004670269787311554, 0.0032510757446289062, 0.011172419413924217, 0.019093763083219528, 0.02701510675251484, 0.03493645042181015, 0.04285779595375061, 0.05077913776040077, 0.058700479567050934, 0.0666218250989914, 0.07454317063093185, 0.08246451616287231, 0.09038585424423218, 0.09830719977617264, 0.1062285453081131, 0.11414988338947296, 0.12207122892141342, 0.12999257445335388, 0.13791391253471375, 0.1458352655172348, 0.15375660359859467, 0.16167795658111572, 0.16959929466247559, 0.17752063274383545, 0.1854419708251953, 0.19336332380771637, 0.20128466188907623, 0.2092060148715973, 0.21712735295295715, 0.22504869103431702, 0.23297004401683807, 0.24089138209819794, 0.248812735080719, 0.25673407316207886]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 4.0, 6.0, 6.0, 7.0, 10.0, 13.0, 29.0, 34.0, 51.0, 58.0, 135.0, 254.0, 572.0, 1595.0, 5480.0, 28910.0, 215964.0, 628011.0, 141176.0, 19775.0, 4195.0, 1272.0, 451.0, 220.0, 133.0, 62.0, 27.0, 25.0, 18.0, 15.0, 11.0, 9.0, 7.0, 7.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.41357421875, -0.4018898010253906, -0.39020538330078125, -0.3785209655761719, -0.3668365478515625, -0.3551521301269531, -0.34346771240234375, -0.3317832946777344, -0.320098876953125, -0.3084144592285156, -0.29673004150390625, -0.2850456237792969, -0.2733612060546875, -0.2616767883300781, -0.24999237060546875, -0.23830795288085938, -0.22662353515625, -0.21493911743164062, -0.20325469970703125, -0.19157028198242188, -0.1798858642578125, -0.16820144653320312, -0.15651702880859375, -0.14483261108398438, -0.133148193359375, -0.12146377563476562, -0.10977935791015625, -0.09809494018554688, -0.0864105224609375, -0.07472610473632812, -0.06304168701171875, -0.051357269287109375, -0.0396728515625, -0.027988433837890625, -0.01630401611328125, -0.004619598388671875, 0.0070648193359375, 0.018749237060546875, 0.03043365478515625, 0.042118072509765625, 0.053802490234375, 0.06548690795898438, 0.07717132568359375, 0.08885574340820312, 0.1005401611328125, 0.11222457885742188, 0.12390899658203125, 0.13559341430664062, 0.14727783203125, 0.15896224975585938, 0.17064666748046875, 0.18233108520507812, 0.1940155029296875, 0.20569992065429688, 0.21738433837890625, 0.22906875610351562, 0.240753173828125, 0.2524375915527344, 0.26412200927734375, 0.2758064270019531, 0.2874908447265625, 0.2991752624511719, 0.31085968017578125, 0.3225440979003906, 0.334228515625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 3.0, 9.0, 10.0, 9.0, 22.0, 20.0, 27.0, 35.0, 39.0, 51.0, 52.0, 69.0, 65.0, 58.0, 69.0, 65.0, 57.0, 62.0, 45.0, 48.0, 45.0, 28.0, 33.0, 17.0, 12.0, 19.0, 3.0, 11.0, 4.0, 2.0, 6.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1434326171875, -0.1389923095703125, -0.134552001953125, -0.1301116943359375, -0.12567138671875, -0.1212310791015625, -0.116790771484375, -0.1123504638671875, -0.10791015625, -0.1034698486328125, -0.099029541015625, -0.0945892333984375, -0.09014892578125, -0.0857086181640625, -0.081268310546875, -0.0768280029296875, -0.0723876953125, -0.0679473876953125, -0.063507080078125, -0.0590667724609375, -0.05462646484375, -0.0501861572265625, -0.045745849609375, -0.0413055419921875, -0.036865234375, -0.0324249267578125, -0.027984619140625, -0.0235443115234375, -0.01910400390625, -0.0146636962890625, -0.010223388671875, -0.0057830810546875, -0.0013427734375, 0.0030975341796875, 0.007537841796875, 0.0119781494140625, 0.01641845703125, 0.0208587646484375, 0.025299072265625, 0.0297393798828125, 0.0341796875, 0.0386199951171875, 0.043060302734375, 0.0475006103515625, 0.05194091796875, 0.0563812255859375, 0.060821533203125, 0.0652618408203125, 0.0697021484375, 0.0741424560546875, 0.078582763671875, 0.0830230712890625, 0.08746337890625, 0.0919036865234375, 0.096343994140625, 0.1007843017578125, 0.105224609375, 0.1096649169921875, 0.114105224609375, 0.1185455322265625, 0.12298583984375, 0.1274261474609375, 0.131866455078125, 0.1363067626953125, 0.1407470703125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 5.0, 2.0, 6.0, 8.0, 4.0, 16.0, 12.0, 30.0, 48.0, 62.0, 128.0, 267.0, 497.0, 1362.0, 5365.0, 83482.0, 896562.0, 54146.0, 4340.0, 1161.0, 490.0, 234.0, 113.0, 63.0, 50.0, 31.0, 20.0, 14.0, 12.0, 6.0, 5.0, 6.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.6611328125, -0.641937255859375, -0.62274169921875, -0.603546142578125, -0.5843505859375, -0.565155029296875, -0.54595947265625, -0.526763916015625, -0.507568359375, -0.488372802734375, -0.46917724609375, -0.449981689453125, -0.4307861328125, -0.411590576171875, -0.39239501953125, -0.373199462890625, -0.35400390625, -0.334808349609375, -0.31561279296875, -0.296417236328125, -0.2772216796875, -0.258026123046875, -0.23883056640625, -0.219635009765625, -0.200439453125, -0.181243896484375, -0.16204833984375, -0.142852783203125, -0.1236572265625, -0.104461669921875, -0.08526611328125, -0.066070556640625, -0.046875, -0.027679443359375, -0.00848388671875, 0.010711669921875, 0.0299072265625, 0.049102783203125, 0.06829833984375, 0.087493896484375, 0.106689453125, 0.125885009765625, 0.14508056640625, 0.164276123046875, 0.1834716796875, 0.202667236328125, 0.22186279296875, 0.241058349609375, 0.26025390625, 0.279449462890625, 0.29864501953125, 0.317840576171875, 0.3370361328125, 0.356231689453125, 0.37542724609375, 0.394622802734375, 0.413818359375, 0.433013916015625, 0.45220947265625, 0.471405029296875, 0.4906005859375, 0.509796142578125, 0.52899169921875, 0.548187255859375, 0.5673828125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 5.0, 3.0, 6.0, 3.0, 5.0, 11.0, 20.0, 11.0, 16.0, 15.0, 19.0, 27.0, 33.0, 30.0, 47.0, 31.0, 50.0, 50.0, 40.0, 55.0, 54.0, 57.0, 43.0, 45.0, 42.0, 33.0, 39.0, 36.0, 36.0, 25.0, 21.0, 23.0, 15.0, 12.0, 13.0, 9.0, 5.0, 7.0, 8.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.41357421875, -0.40007781982421875, -0.3865814208984375, -0.37308502197265625, -0.359588623046875, -0.34609222412109375, -0.3325958251953125, -0.31909942626953125, -0.30560302734375, -0.29210662841796875, -0.2786102294921875, -0.26511383056640625, -0.251617431640625, -0.23812103271484375, -0.2246246337890625, -0.21112823486328125, -0.1976318359375, -0.18413543701171875, -0.1706390380859375, -0.15714263916015625, -0.143646240234375, -0.13014984130859375, -0.1166534423828125, -0.10315704345703125, -0.08966064453125, -0.07616424560546875, -0.0626678466796875, -0.04917144775390625, -0.035675048828125, -0.02217864990234375, -0.0086822509765625, 0.00481414794921875, 0.018310546875, 0.03180694580078125, 0.0453033447265625, 0.05879974365234375, 0.072296142578125, 0.08579254150390625, 0.0992889404296875, 0.11278533935546875, 0.12628173828125, 0.13977813720703125, 0.1532745361328125, 0.16677093505859375, 0.180267333984375, 0.19376373291015625, 0.2072601318359375, 0.22075653076171875, 0.2342529296875, 0.24774932861328125, 0.2612457275390625, 0.27474212646484375, 0.288238525390625, 0.30173492431640625, 0.3152313232421875, 0.32872772216796875, 0.34222412109375, 0.35572052001953125, 0.3692169189453125, 0.38271331787109375, 0.396209716796875, 0.40970611572265625, 0.4232025146484375, 0.43669891357421875, 0.4501953125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 3.0, 7.0, 4.0, 13.0, 21.0, 27.0, 37.0, 47.0, 89.0, 115.0, 207.0, 419.0, 931.0, 2198.0, 7099.0, 31334.0, 214864.0, 661620.0, 104127.0, 17734.0, 4550.0, 1579.0, 686.0, 357.0, 174.0, 97.0, 75.0, 39.0, 23.0, 24.0, 10.0, 17.0, 5.0, 6.0, 8.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11004638671875, -0.1060190200805664, -0.10199165344238281, -0.09796428680419922, -0.09393692016601562, -0.08990955352783203, -0.08588218688964844, -0.08185482025146484, -0.07782745361328125, -0.07380008697509766, -0.06977272033691406, -0.06574535369873047, -0.061717987060546875, -0.05769062042236328, -0.05366325378417969, -0.049635887145996094, -0.0456085205078125, -0.041581153869628906, -0.03755378723144531, -0.03352642059326172, -0.029499053955078125, -0.02547168731689453, -0.021444320678710938, -0.017416954040527344, -0.01338958740234375, -0.009362220764160156, -0.0053348541259765625, -0.0013074874877929688, 0.002719879150390625, 0.006747245788574219, 0.010774612426757812, 0.014801979064941406, 0.018829345703125, 0.022856712341308594, 0.026884078979492188, 0.03091144561767578, 0.034938812255859375, 0.03896617889404297, 0.04299354553222656, 0.047020912170410156, 0.05104827880859375, 0.055075645446777344, 0.05910301208496094, 0.06313037872314453, 0.06715774536132812, 0.07118511199951172, 0.07521247863769531, 0.0792398452758789, 0.0832672119140625, 0.0872945785522461, 0.09132194519042969, 0.09534931182861328, 0.09937667846679688, 0.10340404510498047, 0.10743141174316406, 0.11145877838134766, 0.11548614501953125, 0.11951351165771484, 0.12354087829589844, 0.12756824493408203, 0.13159561157226562, 0.13562297821044922, 0.1396503448486328, 0.1436777114868164, 0.147705078125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 4.0, 4.0, 8.0, 7.0, 5.0, 5.0, 11.0, 15.0, 10.0, 19.0, 20.0, 28.0, 27.0, 35.0, 38.0, 56.0, 62.0, 78.0, 90.0, 87.0, 69.0, 53.0, 52.0, 28.0, 34.0, 30.0, 15.0, 20.0, 12.0, 17.0, 17.0, 16.0, 8.0, 7.0, 4.0, 5.0, 5.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.26173210144043e-05, -4.1268765926361084e-05, -3.992021083831787e-05, -3.857165575027466e-05, -3.7223100662231445e-05, -3.587454557418823e-05, -3.452599048614502e-05, -3.317743539810181e-05, -3.1828880310058594e-05, -3.048032522201538e-05, -2.9131770133972168e-05, -2.7783215045928955e-05, -2.6434659957885742e-05, -2.508610486984253e-05, -2.3737549781799316e-05, -2.2388994693756104e-05, -2.104043960571289e-05, -1.9691884517669678e-05, -1.8343329429626465e-05, -1.6994774341583252e-05, -1.564621925354004e-05, -1.4297664165496826e-05, -1.2949109077453613e-05, -1.16005539894104e-05, -1.0251998901367188e-05, -8.903443813323975e-06, -7.554888725280762e-06, -6.206333637237549e-06, -4.857778549194336e-06, -3.509223461151123e-06, -2.16066837310791e-06, -8.121132850646973e-07, 5.364418029785156e-07, 1.8849968910217285e-06, 3.2335519790649414e-06, 4.582107067108154e-06, 5.930662155151367e-06, 7.27921724319458e-06, 8.627772331237793e-06, 9.976327419281006e-06, 1.1324882507324219e-05, 1.2673437595367432e-05, 1.4021992683410645e-05, 1.5370547771453857e-05, 1.671910285949707e-05, 1.8067657947540283e-05, 1.9416213035583496e-05, 2.076476812362671e-05, 2.2113323211669922e-05, 2.3461878299713135e-05, 2.4810433387756348e-05, 2.615898847579956e-05, 2.7507543563842773e-05, 2.8856098651885986e-05, 3.02046537399292e-05, 3.155320882797241e-05, 3.2901763916015625e-05, 3.425031900405884e-05, 3.559887409210205e-05, 3.6947429180145264e-05, 3.8295984268188477e-05, 3.964453935623169e-05, 4.09930944442749e-05, 4.2341649532318115e-05, 4.369020462036133e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 9.0, 6.0, 17.0, 22.0, 32.0, 35.0, 41.0, 85.0, 151.0, 239.0, 483.0, 1014.0, 2593.0, 9716.0, 73469.0, 731006.0, 202840.0, 19648.0, 4232.0, 1464.0, 622.0, 338.0, 173.0, 110.0, 79.0, 48.0, 26.0, 20.0, 10.0, 7.0, 1.0, 5.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.130859375, -0.12556076049804688, -0.12026214599609375, -0.11496353149414062, -0.1096649169921875, -0.10436630249023438, -0.09906768798828125, -0.09376907348632812, -0.088470458984375, -0.08317184448242188, -0.07787322998046875, -0.07257461547851562, -0.0672760009765625, -0.061977386474609375, -0.05667877197265625, -0.051380157470703125, -0.04608154296875, -0.040782928466796875, -0.03548431396484375, -0.030185699462890625, -0.0248870849609375, -0.019588470458984375, -0.01428985595703125, -0.008991241455078125, -0.003692626953125, 0.001605987548828125, 0.00690460205078125, 0.012203216552734375, 0.0175018310546875, 0.022800445556640625, 0.02809906005859375, 0.033397674560546875, 0.0386962890625, 0.043994903564453125, 0.04929351806640625, 0.054592132568359375, 0.0598907470703125, 0.06518936157226562, 0.07048797607421875, 0.07578659057617188, 0.081085205078125, 0.08638381958007812, 0.09168243408203125, 0.09698104858398438, 0.1022796630859375, 0.10757827758789062, 0.11287689208984375, 0.11817550659179688, 0.12347412109375, 0.12877273559570312, 0.13407135009765625, 0.13936996459960938, 0.1446685791015625, 0.14996719360351562, 0.15526580810546875, 0.16056442260742188, 0.165863037109375, 0.17116165161132812, 0.17646026611328125, 0.18175888061523438, 0.1870574951171875, 0.19235610961914062, 0.19765472412109375, 0.20295333862304688, 0.208251953125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 8.0, 4.0, 10.0, 8.0, 9.0, 11.0, 8.0, 8.0, 10.0, 18.0, 21.0, 35.0, 39.0, 61.0, 54.0, 71.0, 76.0, 83.0, 66.0, 75.0, 38.0, 54.0, 47.0, 42.0, 23.0, 19.0, 15.0, 20.0, 16.0, 13.0, 9.0, 6.0, 5.0, 4.0, 6.0, 6.0, 2.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09130859375, -0.0880289077758789, -0.08474922180175781, -0.08146953582763672, -0.07818984985351562, -0.07491016387939453, -0.07163047790527344, -0.06835079193115234, -0.06507110595703125, -0.061791419982910156, -0.05851173400878906, -0.05523204803466797, -0.051952362060546875, -0.04867267608642578, -0.04539299011230469, -0.042113304138183594, -0.0388336181640625, -0.035553932189941406, -0.03227424621582031, -0.02899456024169922, -0.025714874267578125, -0.02243518829345703, -0.019155502319335938, -0.015875816345214844, -0.01259613037109375, -0.009316444396972656, -0.0060367584228515625, -0.0027570724487304688, 0.000522613525390625, 0.0038022994995117188, 0.0070819854736328125, 0.010361671447753906, 0.013641357421875, 0.016921043395996094, 0.020200729370117188, 0.02348041534423828, 0.026760101318359375, 0.03003978729248047, 0.03331947326660156, 0.036599159240722656, 0.03987884521484375, 0.043158531188964844, 0.04643821716308594, 0.04971790313720703, 0.052997589111328125, 0.05627727508544922, 0.05955696105957031, 0.0628366470336914, 0.0661163330078125, 0.0693960189819336, 0.07267570495605469, 0.07595539093017578, 0.07923507690429688, 0.08251476287841797, 0.08579444885253906, 0.08907413482666016, 0.09235382080078125, 0.09563350677490234, 0.09891319274902344, 0.10219287872314453, 0.10547256469726562, 0.10875225067138672, 0.11203193664550781, 0.1153116226196289, 0.11859130859375]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 3.0, 7.0, 6.0, 9.0, 17.0, 44.0, 96.0, 144.0, 211.0, 199.0, 133.0, 80.0, 27.0, 15.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9341628551483154, -2.8327794075012207, -2.731395959854126, -2.6300125122070312, -2.5286288261413574, -2.4272453784942627, -2.325861930847168, -2.2244784832000732, -2.1230950355529785, -2.021711587905884, -1.9203280210494995, -1.8189445734024048, -1.7175610065460205, -1.6161775588989258, -1.514794111251831, -1.4134106636047363, -1.3120269775390625, -1.2106435298919678, -1.1092599630355835, -1.0078765153884888, -0.9064930081367493, -0.8051095008850098, -0.703726053237915, -0.6023425459861755, -0.500959038734436, -0.39957553148269653, -0.2981920540332794, -0.1968085765838623, -0.0954250693321228, 0.005958437919616699, 0.10734188556671143, 0.20872539281845093, 0.31010913848876953, 0.41149264574050903, 0.5128761529922485, 0.6142596006393433, 0.7156431078910828, 0.8170266151428223, 0.918410062789917, 1.0197935104370117, 1.121177077293396, 1.2225605249404907, 1.323944091796875, 1.4253275394439697, 1.5267109870910645, 1.6280945539474487, 1.7294780015945435, 1.8308615684509277, 1.9322450160980225, 2.033628463745117, 2.135011911392212, 2.2363953590393066, 2.3377790451049805, 2.439162492752075, 2.54054594039917, 2.6419293880462646, 2.7433128356933594, 2.844696283340454, 2.946079730987549, 3.0474634170532227, 3.1488468647003174, 3.250230312347412, 3.351613759994507, 3.4529972076416016, 3.5543808937072754]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 3.0, 6.0, 9.0, 5.0, 14.0, 12.0, 16.0, 20.0, 22.0, 20.0, 27.0, 33.0, 22.0, 28.0, 48.0, 48.0, 48.0, 52.0, 56.0, 50.0, 60.0, 41.0, 43.0, 47.0, 33.0, 51.0, 33.0, 25.0, 21.0, 19.0, 17.0, 16.0, 9.0, 9.0, 5.0, 12.0, 3.0, 5.0, 2.0, 3.0, 4.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9295673370361328, -1.8716405630111694, -1.813713788986206, -1.7557870149612427, -1.6978602409362793, -1.639933466911316, -1.5820066928863525, -1.5240797996520996, -1.4661531448364258, -1.4082263708114624, -1.350299596786499, -1.2923728227615356, -1.2344460487365723, -1.1765192747116089, -1.1185925006866455, -1.0606656074523926, -1.0027388334274292, -0.9448120594024658, -0.8868852853775024, -0.8289585113525391, -0.7710317373275757, -0.7131049633026123, -0.6551781296730042, -0.5972513556480408, -0.5393245816230774, -0.481397807598114, -0.42347103357315063, -0.36554422974586487, -0.3076174557209015, -0.2496906816959381, -0.19176387786865234, -0.13383710384368896, -0.07591032981872559, -0.01798354834318161, 0.039943233132362366, 0.09787002205848694, 0.15579679608345032, 0.2137235701084137, 0.27165037393569946, 0.32957714796066284, 0.3875039219856262, 0.4454306960105896, 0.503357470035553, 0.5612843036651611, 0.6192110776901245, 0.6771378517150879, 0.7350646257400513, 0.7929913997650146, 0.850918173789978, 0.9088449478149414, 0.9667717218399048, 1.0246984958648682, 1.0826252698898315, 1.140552043914795, 1.1984789371490479, 1.2564055919647217, 1.3143324851989746, 1.372259259223938, 1.4301860332489014, 1.4881128072738647, 1.5460395812988281, 1.6039663553237915, 1.6618931293487549, 1.7198200225830078, 1.7777466773986816]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 4.0, 5.0, 2.0, 6.0, 5.0, 10.0, 12.0, 26.0, 27.0, 44.0, 64.0, 101.0, 204.0, 451.0, 1436.0, 6231.0, 51583.0, 1801543.0, 2260067.0, 62900.0, 7049.0, 1518.0, 464.0, 203.0, 116.0, 71.0, 42.0, 23.0, 23.0, 12.0, 10.0, 5.0, 9.0, 7.0, 5.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.240234375, -0.23196029663085938, -0.22368621826171875, -0.21541213989257812, -0.2071380615234375, -0.19886398315429688, -0.19058990478515625, -0.18231582641601562, -0.174041748046875, -0.16576766967773438, -0.15749359130859375, -0.14921951293945312, -0.1409454345703125, -0.13267135620117188, -0.12439727783203125, -0.11612319946289062, -0.10784912109375, -0.09957504272460938, -0.09130096435546875, -0.08302688598632812, -0.0747528076171875, -0.06647872924804688, -0.05820465087890625, -0.049930572509765625, -0.041656494140625, -0.033382415771484375, -0.02510833740234375, -0.016834259033203125, -0.0085601806640625, -0.000286102294921875, 0.00798797607421875, 0.016262054443359375, 0.0245361328125, 0.032810211181640625, 0.04108428955078125, 0.049358367919921875, 0.0576324462890625, 0.06590652465820312, 0.07418060302734375, 0.08245468139648438, 0.090728759765625, 0.09900283813476562, 0.10727691650390625, 0.11555099487304688, 0.1238250732421875, 0.13209915161132812, 0.14037322998046875, 0.14864730834960938, 0.15692138671875, 0.16519546508789062, 0.17346954345703125, 0.18174362182617188, 0.1900177001953125, 0.19829177856445312, 0.20656585693359375, 0.21483993530273438, 0.223114013671875, 0.23138809204101562, 0.23966217041015625, 0.24793624877929688, 0.2562103271484375, 0.2644844055175781, 0.27275848388671875, 0.2810325622558594, 0.289306640625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 6.0, 8.0, 9.0, 12.0, 20.0, 26.0, 47.0, 59.0, 64.0, 73.0, 73.0, 91.0, 103.0, 68.0, 78.0, 69.0, 53.0, 43.0, 32.0, 29.0, 17.0, 12.0, 7.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1463623046875, -0.1411590576171875, -0.135955810546875, -0.1307525634765625, -0.12554931640625, -0.1203460693359375, -0.115142822265625, -0.1099395751953125, -0.104736328125, -0.0995330810546875, -0.094329833984375, -0.0891265869140625, -0.08392333984375, -0.0787200927734375, -0.073516845703125, -0.0683135986328125, -0.0631103515625, -0.0579071044921875, -0.052703857421875, -0.0475006103515625, -0.04229736328125, -0.0370941162109375, -0.031890869140625, -0.0266876220703125, -0.021484375, -0.0162811279296875, -0.011077880859375, -0.0058746337890625, -0.00067138671875, 0.0045318603515625, 0.009735107421875, 0.0149383544921875, 0.0201416015625, 0.0253448486328125, 0.030548095703125, 0.0357513427734375, 0.04095458984375, 0.0461578369140625, 0.051361083984375, 0.0565643310546875, 0.061767578125, 0.0669708251953125, 0.072174072265625, 0.0773773193359375, 0.08258056640625, 0.0877838134765625, 0.092987060546875, 0.0981903076171875, 0.1033935546875, 0.1085968017578125, 0.113800048828125, 0.1190032958984375, 0.12420654296875, 0.1294097900390625, 0.134613037109375, 0.1398162841796875, 0.14501953125, 0.1502227783203125, 0.155426025390625, 0.1606292724609375, 0.16583251953125, 0.1710357666015625, 0.176239013671875, 0.1814422607421875, 0.1866455078125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 4.0, 7.0, 10.0, 12.0, 22.0, 42.0, 51.0, 116.0, 244.0, 691.0, 2316.0, 11559.0, 102990.0, 3042637.0, 982803.0, 42337.0, 6151.0, 1410.0, 499.0, 166.0, 81.0, 49.0, 19.0, 16.0, 11.0, 13.0, 10.0, 7.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.3447265625, -0.33628273010253906, -0.3278388977050781, -0.3193950653076172, -0.31095123291015625, -0.3025074005126953, -0.2940635681152344, -0.28561973571777344, -0.2771759033203125, -0.26873207092285156, -0.2602882385253906, -0.2518444061279297, -0.24340057373046875, -0.2349567413330078, -0.22651290893554688, -0.21806907653808594, -0.209625244140625, -0.20118141174316406, -0.19273757934570312, -0.1842937469482422, -0.17584991455078125, -0.1674060821533203, -0.15896224975585938, -0.15051841735839844, -0.1420745849609375, -0.13363075256347656, -0.12518692016601562, -0.11674308776855469, -0.10829925537109375, -0.09985542297363281, -0.09141159057617188, -0.08296775817871094, -0.07452392578125, -0.06608009338378906, -0.057636260986328125, -0.04919242858886719, -0.04074859619140625, -0.03230476379394531, -0.023860931396484375, -0.015417098999023438, -0.0069732666015625, 0.0014705657958984375, 0.009914398193359375, 0.018358230590820312, 0.02680206298828125, 0.03524589538574219, 0.043689727783203125, 0.05213356018066406, 0.060577392578125, 0.06902122497558594, 0.07746505737304688, 0.08590888977050781, 0.09435272216796875, 0.10279655456542969, 0.11124038696289062, 0.11968421936035156, 0.1281280517578125, 0.13657188415527344, 0.14501571655273438, 0.1534595489501953, 0.16190338134765625, 0.1703472137451172, 0.17879104614257812, 0.18723487854003906, 0.1956787109375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 7.0, 11.0, 10.0, 15.0, 23.0, 24.0, 54.0, 88.0, 130.0, 240.0, 419.0, 670.0, 805.0, 674.0, 397.0, 196.0, 122.0, 55.0, 45.0, 28.0, 17.0, 12.0, 6.0, 10.0, 5.0, 1.0, 6.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2489013671875, -0.2412395477294922, -0.23357772827148438, -0.22591590881347656, -0.21825408935546875, -0.21059226989746094, -0.20293045043945312, -0.1952686309814453, -0.1876068115234375, -0.1799449920654297, -0.17228317260742188, -0.16462135314941406, -0.15695953369140625, -0.14929771423339844, -0.14163589477539062, -0.1339740753173828, -0.126312255859375, -0.11865043640136719, -0.11098861694335938, -0.10332679748535156, -0.09566497802734375, -0.08800315856933594, -0.08034133911132812, -0.07267951965332031, -0.0650177001953125, -0.05735588073730469, -0.049694061279296875, -0.04203224182128906, -0.03437042236328125, -0.026708602905273438, -0.019046783447265625, -0.011384963989257812, -0.00372314453125, 0.0039386749267578125, 0.011600494384765625, 0.019262313842773438, 0.02692413330078125, 0.03458595275878906, 0.042247772216796875, 0.04990959167480469, 0.0575714111328125, 0.06523323059082031, 0.07289505004882812, 0.08055686950683594, 0.08821868896484375, 0.09588050842285156, 0.10354232788085938, 0.11120414733886719, 0.118865966796875, 0.1265277862548828, 0.13418960571289062, 0.14185142517089844, 0.14951324462890625, 0.15717506408691406, 0.16483688354492188, 0.1724987030029297, 0.1801605224609375, 0.1878223419189453, 0.19548416137695312, 0.20314598083496094, 0.21080780029296875, 0.21846961975097656, 0.22613143920898438, 0.2337932586669922, 0.241455078125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 8.0, 5.0, 5.0, 6.0, 8.0, 3.0, 20.0, 21.0, 35.0, 86.0, 108.0, 179.0, 199.0, 149.0, 92.0, 42.0, 18.0, 4.0, 7.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.0547385215759277, -2.9882168769836426, -2.9216954708099365, -2.8551738262176514, -2.788652181625366, -2.72213077545166, -2.655609130859375, -2.58908748626709, -2.522566080093384, -2.4560444355010986, -2.3895230293273926, -2.3230013847351074, -2.2564797401428223, -2.189958333969116, -2.123436689376831, -2.056915044784546, -1.9903935194015503, -1.9238719940185547, -1.8573503494262695, -1.790828824043274, -1.7243072986602783, -1.6577856540679932, -1.5912641286849976, -1.524742603302002, -1.4582209587097168, -1.3916994333267212, -1.325177788734436, -1.2586562633514404, -1.1921347379684448, -1.1256132125854492, -1.059091567993164, -0.9925700426101685, -0.9260485172271729, -0.8595269322395325, -0.7930054068565369, -0.7264838218688965, -0.6599622964859009, -0.5934407114982605, -0.5269191265106201, -0.4603975713253021, -0.39387601613998413, -0.32735446095466614, -0.26083290576934814, -0.19431132078170776, -0.12778976559638977, -0.06126821041107178, 0.0052533745765686035, 0.0717749297618866, 0.1382964849472046, 0.20481804013252258, 0.2713395953178406, 0.33786118030548096, 0.40438273549079895, 0.47090429067611694, 0.5374258756637573, 0.6039474010467529, 0.6704689860343933, 0.7369905710220337, 0.8035120964050293, 0.8700336813926697, 0.9365552663803101, 1.0030767917633057, 1.0695984363555908, 1.1361199617385864, 1.202641487121582]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 6.0, 8.0, 9.0, 15.0, 16.0, 20.0, 21.0, 34.0, 38.0, 44.0, 39.0, 53.0, 57.0, 62.0, 62.0, 56.0, 72.0, 54.0, 58.0, 49.0, 42.0, 37.0, 27.0, 23.0, 32.0, 14.0, 16.0, 10.0, 13.0, 7.0, 3.0, 2.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 3.0], "bins": [-1.5951663255691528, -1.5554850101470947, -1.5158038139343262, -1.476122498512268, -1.43644118309021, -1.3967599868774414, -1.3570786714553833, -1.3173973560333252, -1.2777161598205566, -1.2380348443984985, -1.19835364818573, -1.1586723327636719, -1.1189910173416138, -1.0793097019195557, -1.039628505706787, -0.999947190284729, -0.9602658748626709, -0.9205846190452576, -0.8809033036231995, -0.8412220478057861, -0.801540732383728, -0.7618594765663147, -0.7221782207489014, -0.6824969053268433, -0.6428156495094299, -0.6031343936920166, -0.5634530782699585, -0.5237718224525452, -0.48409053683280945, -0.44440925121307373, -0.4047279953956604, -0.3650467097759247, -0.3253653049468994, -0.2856840193271637, -0.24600274860858917, -0.20632147789001465, -0.16664019227027893, -0.1269589066505432, -0.08727763593196869, -0.047596365213394165, -0.007915079593658447, 0.031766198575496674, 0.0714474767446518, 0.11112875491380692, 0.15081003308296204, 0.19049131870269775, 0.23017258942127228, 0.2698538601398468, 0.3095351457595825, 0.34921643137931824, 0.38889771699905396, 0.4285789728164673, 0.468260258436203, 0.5079415440559387, 0.547622799873352, 0.5873041152954102, 0.6269853711128235, 0.6666666269302368, 0.7063479423522949, 0.7460291981697083, 0.7857104539871216, 0.8253917694091797, 0.865073025226593, 0.9047542810440063, 0.9444355964660645]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 11.0, 18.0, 20.0, 24.0, 46.0, 50.0, 91.0, 159.0, 278.0, 501.0, 860.0, 1655.0, 3266.0, 6505.0, 13787.0, 32123.0, 79313.0, 207159.0, 372106.0, 197888.0, 75827.0, 30669.0, 13319.0, 6112.0, 3060.0, 1602.0, 878.0, 483.0, 314.0, 173.0, 79.0, 69.0, 38.0, 26.0, 12.0, 8.0, 9.0, 8.0, 1.0, 6.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12469482421875, -0.12015628814697266, -0.11561775207519531, -0.11107921600341797, -0.10654067993164062, -0.10200214385986328, -0.09746360778808594, -0.0929250717163086, -0.08838653564453125, -0.0838479995727539, -0.07930946350097656, -0.07477092742919922, -0.07023239135742188, -0.06569385528564453, -0.06115531921386719, -0.056616783142089844, -0.0520782470703125, -0.047539710998535156, -0.04300117492675781, -0.03846263885498047, -0.033924102783203125, -0.02938556671142578, -0.024847030639648438, -0.020308494567871094, -0.01576995849609375, -0.011231422424316406, -0.0066928863525390625, -0.0021543502807617188, 0.002384185791015625, 0.006922721862792969, 0.011461257934570312, 0.015999794006347656, 0.020538330078125, 0.025076866149902344, 0.029615402221679688, 0.03415393829345703, 0.038692474365234375, 0.04323101043701172, 0.04776954650878906, 0.052308082580566406, 0.05684661865234375, 0.061385154724121094, 0.06592369079589844, 0.07046222686767578, 0.07500076293945312, 0.07953929901123047, 0.08407783508300781, 0.08861637115478516, 0.0931549072265625, 0.09769344329833984, 0.10223197937011719, 0.10677051544189453, 0.11130905151367188, 0.11584758758544922, 0.12038612365722656, 0.1249246597290039, 0.12946319580078125, 0.1340017318725586, 0.13854026794433594, 0.14307880401611328, 0.14761734008789062, 0.15215587615966797, 0.1566944122314453, 0.16123294830322266, 0.165771484375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 6.0, 1.0, 3.0, 5.0, 3.0, 15.0, 10.0, 12.0, 19.0, 20.0, 32.0, 37.0, 41.0, 44.0, 44.0, 48.0, 64.0, 48.0, 66.0, 70.0, 57.0, 40.0, 59.0, 46.0, 40.0, 31.0, 31.0, 20.0, 27.0, 18.0, 18.0, 9.0, 4.0, 6.0, 3.0, 2.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.13134765625, -0.12786006927490234, -0.12437248229980469, -0.12088489532470703, -0.11739730834960938, -0.11390972137451172, -0.11042213439941406, -0.1069345474243164, -0.10344696044921875, -0.0999593734741211, -0.09647178649902344, -0.09298419952392578, -0.08949661254882812, -0.08600902557373047, -0.08252143859863281, -0.07903385162353516, -0.0755462646484375, -0.07205867767333984, -0.06857109069824219, -0.06508350372314453, -0.061595916748046875, -0.05810832977294922, -0.05462074279785156, -0.051133155822753906, -0.04764556884765625, -0.044157981872558594, -0.04067039489746094, -0.03718280792236328, -0.033695220947265625, -0.03020763397216797, -0.026720046997070312, -0.023232460021972656, -0.019744873046875, -0.016257286071777344, -0.012769699096679688, -0.009282112121582031, -0.005794525146484375, -0.0023069381713867188, 0.0011806488037109375, 0.004668235778808594, 0.00815582275390625, 0.011643409729003906, 0.015130996704101562, 0.01861858367919922, 0.022106170654296875, 0.02559375762939453, 0.029081344604492188, 0.032568931579589844, 0.0360565185546875, 0.039544105529785156, 0.04303169250488281, 0.04651927947998047, 0.050006866455078125, 0.05349445343017578, 0.05698204040527344, 0.060469627380371094, 0.06395721435546875, 0.0674448013305664, 0.07093238830566406, 0.07441997528076172, 0.07790756225585938, 0.08139514923095703, 0.08488273620605469, 0.08837032318115234, 0.09185791015625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 3.0, 2.0, 6.0, 8.0, 11.0, 11.0, 16.0, 26.0, 38.0, 47.0, 65.0, 87.0, 137.0, 208.0, 330.0, 563.0, 1032.0, 2115.0, 6830.0, 39973.0, 559949.0, 394705.0, 31945.0, 6003.0, 1954.0, 975.0, 540.0, 337.0, 213.0, 126.0, 97.0, 61.0, 39.0, 31.0, 23.0, 16.0, 11.0, 5.0, 6.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.377685546875, -0.3668785095214844, -0.35607147216796875, -0.3452644348144531, -0.3344573974609375, -0.3236503601074219, -0.31284332275390625, -0.3020362854003906, -0.291229248046875, -0.2804222106933594, -0.26961517333984375, -0.2588081359863281, -0.2480010986328125, -0.23719406127929688, -0.22638702392578125, -0.21557998657226562, -0.20477294921875, -0.19396591186523438, -0.18315887451171875, -0.17235183715820312, -0.1615447998046875, -0.15073776245117188, -0.13993072509765625, -0.12912368774414062, -0.118316650390625, -0.10750961303710938, -0.09670257568359375, -0.08589553833007812, -0.0750885009765625, -0.06428146362304688, -0.05347442626953125, -0.042667388916015625, -0.0318603515625, -0.021053314208984375, -0.01024627685546875, 0.000560760498046875, 0.0113677978515625, 0.022174835205078125, 0.03298187255859375, 0.043788909912109375, 0.054595947265625, 0.06540298461914062, 0.07621002197265625, 0.08701705932617188, 0.0978240966796875, 0.10863113403320312, 0.11943817138671875, 0.13024520874023438, 0.14105224609375, 0.15185928344726562, 0.16266632080078125, 0.17347335815429688, 0.1842803955078125, 0.19508743286132812, 0.20589447021484375, 0.21670150756835938, 0.227508544921875, 0.23831558227539062, 0.24912261962890625, 0.2599296569824219, 0.2707366943359375, 0.2815437316894531, 0.29235076904296875, 0.3031578063964844, 0.31396484375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 7.0, 11.0, 6.0, 12.0, 12.0, 10.0, 17.0, 16.0, 19.0, 12.0, 12.0, 35.0, 41.0, 28.0, 29.0, 38.0, 35.0, 35.0, 45.0, 53.0, 46.0, 46.0, 48.0, 43.0, 42.0, 40.0, 39.0, 41.0, 24.0, 18.0, 26.0, 26.0, 19.0, 15.0, 8.0, 9.0, 11.0, 7.0, 8.0, 7.0, 2.0, 4.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.300537109375, -0.28987884521484375, -0.2792205810546875, -0.26856231689453125, -0.257904052734375, -0.24724578857421875, -0.2365875244140625, -0.22592926025390625, -0.21527099609375, -0.20461273193359375, -0.1939544677734375, -0.18329620361328125, -0.172637939453125, -0.16197967529296875, -0.1513214111328125, -0.14066314697265625, -0.1300048828125, -0.11934661865234375, -0.1086883544921875, -0.09803009033203125, -0.087371826171875, -0.07671356201171875, -0.0660552978515625, -0.05539703369140625, -0.04473876953125, -0.03408050537109375, -0.0234222412109375, -0.01276397705078125, -0.002105712890625, 0.00855255126953125, 0.0192108154296875, 0.02986907958984375, 0.04052734375, 0.05118560791015625, 0.0618438720703125, 0.07250213623046875, 0.083160400390625, 0.09381866455078125, 0.1044769287109375, 0.11513519287109375, 0.12579345703125, 0.13645172119140625, 0.1471099853515625, 0.15776824951171875, 0.168426513671875, 0.17908477783203125, 0.1897430419921875, 0.20040130615234375, 0.2110595703125, 0.22171783447265625, 0.2323760986328125, 0.24303436279296875, 0.253692626953125, 0.26435089111328125, 0.2750091552734375, 0.28566741943359375, 0.29632568359375, 0.30698394775390625, 0.3176422119140625, 0.32830047607421875, 0.338958740234375, 0.34961700439453125, 0.3602752685546875, 0.37093353271484375, 0.381591796875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 5.0, 6.0, 9.0, 10.0, 14.0, 32.0, 36.0, 48.0, 92.0, 148.0, 303.0, 550.0, 1312.0, 3616.0, 14653.0, 94680.0, 808089.0, 103258.0, 15268.0, 3852.0, 1318.0, 600.0, 270.0, 140.0, 101.0, 45.0, 38.0, 18.0, 12.0, 9.0, 7.0, 4.0, 6.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.158935546875, -0.1535511016845703, -0.14816665649414062, -0.14278221130371094, -0.13739776611328125, -0.13201332092285156, -0.12662887573242188, -0.12124443054199219, -0.1158599853515625, -0.11047554016113281, -0.10509109497070312, -0.09970664978027344, -0.09432220458984375, -0.08893775939941406, -0.08355331420898438, -0.07816886901855469, -0.072784423828125, -0.06739997863769531, -0.062015533447265625, -0.05663108825683594, -0.05124664306640625, -0.04586219787597656, -0.040477752685546875, -0.03509330749511719, -0.0297088623046875, -0.024324417114257812, -0.018939971923828125, -0.013555526733398438, -0.00817108154296875, -0.0027866363525390625, 0.002597808837890625, 0.007982254028320312, 0.01336669921875, 0.018751144409179688, 0.024135589599609375, 0.029520034790039062, 0.03490447998046875, 0.04028892517089844, 0.045673370361328125, 0.05105781555175781, 0.0564422607421875, 0.06182670593261719, 0.06721115112304688, 0.07259559631347656, 0.07798004150390625, 0.08336448669433594, 0.08874893188476562, 0.09413337707519531, 0.099517822265625, 0.10490226745605469, 0.11028671264648438, 0.11567115783691406, 0.12105560302734375, 0.12644004821777344, 0.13182449340820312, 0.1372089385986328, 0.1425933837890625, 0.1479778289794922, 0.15336227416992188, 0.15874671936035156, 0.16413116455078125, 0.16951560974121094, 0.17490005493164062, 0.1802845001220703, 0.1856689453125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 1.0, 2.0, 1.0, 4.0, 8.0, 9.0, 4.0, 4.0, 11.0, 6.0, 9.0, 13.0, 21.0, 22.0, 20.0, 36.0, 50.0, 65.0, 99.0, 112.0, 120.0, 93.0, 65.0, 47.0, 40.0, 27.0, 18.0, 19.0, 22.0, 9.0, 11.0, 12.0, 7.0, 4.0, 5.0, 3.0, 6.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9948692321777344e-05, -4.816707223653793e-05, -4.638545215129852e-05, -4.460383206605911e-05, -4.28222119808197e-05, -4.104059189558029e-05, -3.925897181034088e-05, -3.747735172510147e-05, -3.569573163986206e-05, -3.391411155462265e-05, -3.213249146938324e-05, -3.035087138414383e-05, -2.856925129890442e-05, -2.678763121366501e-05, -2.5006011128425598e-05, -2.3224391043186188e-05, -2.1442770957946777e-05, -1.9661150872707367e-05, -1.7879530787467957e-05, -1.6097910702228546e-05, -1.4316290616989136e-05, -1.2534670531749725e-05, -1.0753050446510315e-05, -8.971430361270905e-06, -7.189810276031494e-06, -5.408190190792084e-06, -3.6265701055526733e-06, -1.844950020313263e-06, -6.332993507385254e-08, 1.7182901501655579e-06, 3.4999102354049683e-06, 5.281530320644379e-06, 7.063150405883789e-06, 8.8447704911232e-06, 1.062639057636261e-05, 1.240801066160202e-05, 1.418963074684143e-05, 1.597125083208084e-05, 1.775287091732025e-05, 1.9534491002559662e-05, 2.1316111087799072e-05, 2.3097731173038483e-05, 2.4879351258277893e-05, 2.6660971343517303e-05, 2.8442591428756714e-05, 3.0224211513996124e-05, 3.2005831599235535e-05, 3.3787451684474945e-05, 3.5569071769714355e-05, 3.7350691854953766e-05, 3.9132311940193176e-05, 4.091393202543259e-05, 4.2695552110672e-05, 4.447717219591141e-05, 4.625879228115082e-05, 4.804041236639023e-05, 4.982203245162964e-05, 5.160365253686905e-05, 5.338527262210846e-05, 5.516689270734787e-05, 5.694851279258728e-05, 5.873013287782669e-05, 6.05117529630661e-05, 6.229337304830551e-05, 6.407499313354492e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 6.0, 6.0, 6.0, 12.0, 18.0, 23.0, 27.0, 40.0, 51.0, 45.0, 91.0, 107.0, 169.0, 210.0, 367.0, 553.0, 920.0, 1606.0, 3331.0, 8632.0, 26476.0, 112002.0, 679314.0, 161556.0, 33957.0, 10333.0, 4043.0, 1910.0, 913.0, 562.0, 383.0, 235.0, 168.0, 134.0, 85.0, 62.0, 55.0, 28.0, 23.0, 18.0, 26.0, 23.0, 8.0, 6.0, 4.0, 6.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.1300048828125, -0.12601661682128906, -0.12202835083007812, -0.11804008483886719, -0.11405181884765625, -0.11006355285644531, -0.10607528686523438, -0.10208702087402344, -0.0980987548828125, -0.09411048889160156, -0.09012222290039062, -0.08613395690917969, -0.08214569091796875, -0.07815742492675781, -0.07416915893554688, -0.07018089294433594, -0.066192626953125, -0.06220436096191406, -0.058216094970703125, -0.05422782897949219, -0.05023956298828125, -0.04625129699707031, -0.042263031005859375, -0.03827476501464844, -0.0342864990234375, -0.030298233032226562, -0.026309967041015625, -0.022321701049804688, -0.01833343505859375, -0.014345169067382812, -0.010356903076171875, -0.0063686370849609375, -0.00238037109375, 0.0016078948974609375, 0.005596160888671875, 0.009584426879882812, 0.01357269287109375, 0.017560958862304688, 0.021549224853515625, 0.025537490844726562, 0.0295257568359375, 0.03351402282714844, 0.037502288818359375, 0.04149055480957031, 0.04547882080078125, 0.04946708679199219, 0.053455352783203125, 0.05744361877441406, 0.061431884765625, 0.06542015075683594, 0.06940841674804688, 0.07339668273925781, 0.07738494873046875, 0.08137321472167969, 0.08536148071289062, 0.08934974670410156, 0.0933380126953125, 0.09732627868652344, 0.10131454467773438, 0.10530281066894531, 0.10929107666015625, 0.11327934265136719, 0.11726760864257812, 0.12125587463378906, 0.125244140625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 2.0, 3.0, 6.0, 1.0, 8.0, 5.0, 15.0, 9.0, 12.0, 19.0, 17.0, 13.0, 34.0, 30.0, 31.0, 60.0, 75.0, 81.0, 75.0, 76.0, 67.0, 56.0, 53.0, 33.0, 46.0, 28.0, 22.0, 21.0, 16.0, 13.0, 6.0, 11.0, 8.0, 9.0, 9.0, 4.0, 4.0, 3.0, 3.0, 2.0, 7.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.09539794921875, -0.09224319458007812, -0.08908843994140625, -0.08593368530273438, -0.0827789306640625, -0.07962417602539062, -0.07646942138671875, -0.07331466674804688, -0.070159912109375, -0.06700515747070312, -0.06385040283203125, -0.060695648193359375, -0.0575408935546875, -0.054386138916015625, -0.05123138427734375, -0.048076629638671875, -0.044921875, -0.041767120361328125, -0.03861236572265625, -0.035457611083984375, -0.0323028564453125, -0.029148101806640625, -0.02599334716796875, -0.022838592529296875, -0.019683837890625, -0.016529083251953125, -0.01337432861328125, -0.010219573974609375, -0.0070648193359375, -0.003910064697265625, -0.00075531005859375, 0.002399444580078125, 0.00555419921875, 0.008708953857421875, 0.01186370849609375, 0.015018463134765625, 0.0181732177734375, 0.021327972412109375, 0.02448272705078125, 0.027637481689453125, 0.030792236328125, 0.033946990966796875, 0.03710174560546875, 0.040256500244140625, 0.0434112548828125, 0.046566009521484375, 0.04972076416015625, 0.052875518798828125, 0.0560302734375, 0.059185028076171875, 0.06233978271484375, 0.06549453735351562, 0.0686492919921875, 0.07180404663085938, 0.07495880126953125, 0.07811355590820312, 0.081268310546875, 0.08442306518554688, 0.08757781982421875, 0.09073257446289062, 0.0938873291015625, 0.09704208374023438, 0.10019683837890625, 0.10335159301757812, 0.10650634765625]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 1.0, 1.0, 3.0, 6.0, 9.0, 9.0, 16.0, 46.0, 74.0, 125.0, 162.0, 200.0, 139.0, 100.0, 54.0, 24.0, 12.0, 7.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.766864061355591, -2.693016529083252, -2.619168996810913, -2.545321464538574, -2.4714739322662354, -2.3976263999938965, -2.3237788677215576, -2.2499313354492188, -2.17608380317688, -2.102236270904541, -2.028388738632202, -1.9545412063598633, -1.8806936740875244, -1.8068461418151855, -1.7329986095428467, -1.6591510772705078, -1.585303544998169, -1.51145601272583, -1.4376084804534912, -1.3637609481811523, -1.2899134159088135, -1.2160658836364746, -1.1422183513641357, -1.0683708190917969, -0.994523286819458, -0.9206757545471191, -0.8468282222747803, -0.7729806900024414, -0.6991331577301025, -0.6252856254577637, -0.5514380931854248, -0.47759056091308594, -0.40374279022216797, -0.3298952579498291, -0.25604772567749023, -0.18220019340515137, -0.1083526611328125, -0.03450512886047363, 0.039342403411865234, 0.1131899356842041, 0.18703746795654297, 0.26088500022888184, 0.3347325325012207, 0.40858006477355957, 0.48242759704589844, 0.5562751293182373, 0.6301226615905762, 0.703970193862915, 0.7778177261352539, 0.8516652584075928, 0.9255127906799316, 0.9993603229522705, 1.0732078552246094, 1.1470553874969482, 1.220902919769287, 1.294750452041626, 1.3685979843139648, 1.4424455165863037, 1.5162930488586426, 1.5901405811309814, 1.6639881134033203, 1.7378356456756592, 1.811683177947998, 1.885530710220337, 1.9593782424926758]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 4.0, 3.0, 9.0, 11.0, 7.0, 14.0, 16.0, 16.0, 17.0, 23.0, 25.0, 35.0, 37.0, 39.0, 35.0, 49.0, 56.0, 60.0, 52.0, 66.0, 57.0, 48.0, 45.0, 31.0, 30.0, 29.0, 34.0, 29.0, 22.0, 23.0, 14.0, 13.0, 11.0, 16.0, 8.0, 3.0, 5.0, 5.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.2354381084442139, -1.1894893646240234, -1.143540620803833, -1.097591757774353, -1.0516430139541626, -1.0056942701339722, -0.959745466709137, -0.9137966632843018, -0.8678479194641113, -0.8218991756439209, -0.7759503722190857, -0.7300015687942505, -0.6840528249740601, -0.6381040811538696, -0.5921552777290344, -0.5462064743041992, -0.5002577304840088, -0.45430895686149597, -0.40836018323898315, -0.36241140961647034, -0.3164626359939575, -0.2705138623714447, -0.22456508874893188, -0.17861631512641907, -0.13266754150390625, -0.08671876788139343, -0.040769994258880615, 0.005178779363632202, 0.05112755298614502, 0.09707632660865784, 0.14302510023117065, 0.18897387385368347, 0.2349226474761963, 0.2808714210987091, 0.3268201947212219, 0.37276896834373474, 0.41871774196624756, 0.4646665155887604, 0.5106152892112732, 0.5565640926361084, 0.6025128364562988, 0.6484615802764893, 0.6944103837013245, 0.7403591871261597, 0.7863079309463501, 0.8322566747665405, 0.8782054781913757, 0.9241542816162109, 0.9701030254364014, 1.0160517692565918, 1.0620005130767822, 1.1079493761062622, 1.1538981199264526, 1.199846863746643, 1.245795726776123, 1.2917444705963135, 1.337693214416504, 1.3836419582366943, 1.4295907020568848, 1.4755395650863647, 1.5214883089065552, 1.5674370527267456, 1.6133859157562256, 1.659334659576416, 1.7052834033966064]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 5.0, 5.0, 4.0, 5.0, 6.0, 5.0, 8.0, 14.0, 20.0, 21.0, 33.0, 45.0, 73.0, 77.0, 142.0, 153.0, 305.0, 1797.0, 4121819.0, 68403.0, 557.0, 236.0, 161.0, 102.0, 79.0, 60.0, 45.0, 29.0, 22.0, 13.0, 13.0, 11.0, 4.0, 6.0, 2.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.2275390625, -1.1932373046875, -1.158935546875, -1.1246337890625, -1.09033203125, -1.0560302734375, -1.021728515625, -0.9874267578125, -0.953125, -0.9188232421875, -0.884521484375, -0.8502197265625, -0.81591796875, -0.7816162109375, -0.747314453125, -0.7130126953125, -0.6787109375, -0.6444091796875, -0.610107421875, -0.5758056640625, -0.54150390625, -0.5072021484375, -0.472900390625, -0.4385986328125, -0.404296875, -0.3699951171875, -0.335693359375, -0.3013916015625, -0.26708984375, -0.2327880859375, -0.198486328125, -0.1641845703125, -0.1298828125, -0.0955810546875, -0.061279296875, -0.0269775390625, 0.00732421875, 0.0416259765625, 0.075927734375, 0.1102294921875, 0.14453125, 0.1788330078125, 0.213134765625, 0.2474365234375, 0.28173828125, 0.3160400390625, 0.350341796875, 0.3846435546875, 0.4189453125, 0.4532470703125, 0.487548828125, 0.5218505859375, 0.55615234375, 0.5904541015625, 0.624755859375, 0.6590576171875, 0.693359375, 0.7276611328125, 0.761962890625, 0.7962646484375, 0.83056640625, 0.8648681640625, 0.899169921875, 0.9334716796875, 0.9677734375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 3.0, 9.0, 6.0, 14.0, 30.0, 27.0, 32.0, 48.0, 60.0, 58.0, 57.0, 96.0, 71.0, 60.0, 82.0, 60.0, 56.0, 50.0, 44.0, 33.0, 28.0, 21.0, 17.0, 11.0, 6.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11785888671875, -0.11363697052001953, -0.10941505432128906, -0.1051931381225586, -0.10097122192382812, -0.09674930572509766, -0.09252738952636719, -0.08830547332763672, -0.08408355712890625, -0.07986164093017578, -0.07563972473144531, -0.07141780853271484, -0.06719589233398438, -0.0629739761352539, -0.05875205993652344, -0.05453014373779297, -0.0503082275390625, -0.04608631134033203, -0.04186439514160156, -0.037642478942871094, -0.033420562744140625, -0.029198646545410156, -0.024976730346679688, -0.02075481414794922, -0.01653289794921875, -0.012310981750488281, -0.008089065551757812, -0.0038671493530273438, 0.000354766845703125, 0.004576683044433594, 0.008798599243164062, 0.013020515441894531, 0.017242431640625, 0.02146434783935547, 0.025686264038085938, 0.029908180236816406, 0.034130096435546875, 0.038352012634277344, 0.04257392883300781, 0.04679584503173828, 0.05101776123046875, 0.05523967742919922, 0.05946159362792969, 0.06368350982666016, 0.06790542602539062, 0.0721273422241211, 0.07634925842285156, 0.08057117462158203, 0.0847930908203125, 0.08901500701904297, 0.09323692321777344, 0.0974588394165039, 0.10168075561523438, 0.10590267181396484, 0.11012458801269531, 0.11434650421142578, 0.11856842041015625, 0.12279033660888672, 0.1270122528076172, 0.13123416900634766, 0.13545608520507812, 0.1396780014038086, 0.14389991760253906, 0.14812183380126953, 0.15234375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 5.0, 6.0, 6.0, 4.0, 10.0, 25.0, 30.0, 27.0, 72.0, 119.0, 244.0, 555.0, 1195.0, 2764.0, 7052.0, 19437.0, 66526.0, 343802.0, 2165546.0, 1324593.0, 193160.0, 44469.0, 14321.0, 5551.0, 2384.0, 1196.0, 550.0, 277.0, 144.0, 87.0, 40.0, 27.0, 17.0, 13.0, 7.0, 12.0, 4.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1376953125, -0.13362598419189453, -0.12955665588378906, -0.1254873275756836, -0.12141799926757812, -0.11734867095947266, -0.11327934265136719, -0.10921001434326172, -0.10514068603515625, -0.10107135772705078, -0.09700202941894531, -0.09293270111083984, -0.08886337280273438, -0.0847940444946289, -0.08072471618652344, -0.07665538787841797, -0.0725860595703125, -0.06851673126220703, -0.06444740295410156, -0.060378074645996094, -0.056308746337890625, -0.052239418029785156, -0.04817008972167969, -0.04410076141357422, -0.04003143310546875, -0.03596210479736328, -0.03189277648925781, -0.027823448181152344, -0.023754119873046875, -0.019684791564941406, -0.015615463256835938, -0.011546134948730469, -0.007476806640625, -0.0034074783325195312, 0.0006618499755859375, 0.004731178283691406, 0.008800506591796875, 0.012869834899902344, 0.016939163208007812, 0.02100849151611328, 0.02507781982421875, 0.02914714813232422, 0.03321647644042969, 0.037285804748535156, 0.041355133056640625, 0.045424461364746094, 0.04949378967285156, 0.05356311798095703, 0.0576324462890625, 0.06170177459716797, 0.06577110290527344, 0.0698404312133789, 0.07390975952148438, 0.07797908782958984, 0.08204841613769531, 0.08611774444580078, 0.09018707275390625, 0.09425640106201172, 0.09832572937011719, 0.10239505767822266, 0.10646438598632812, 0.1105337142944336, 0.11460304260253906, 0.11867237091064453, 0.12274169921875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 6.0, 8.0, 4.0, 8.0, 9.0, 13.0, 13.0, 21.0, 22.0, 47.0, 45.0, 69.0, 86.0, 167.0, 224.0, 290.0, 372.0, 454.0, 495.0, 428.0, 330.0, 289.0, 182.0, 142.0, 101.0, 54.0, 41.0, 37.0, 31.0, 20.0, 17.0, 11.0, 9.0, 7.0, 4.0, 7.0, 3.0, 0.0, 4.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.11376953125, -0.10959625244140625, -0.1054229736328125, -0.10124969482421875, -0.097076416015625, -0.09290313720703125, -0.0887298583984375, -0.08455657958984375, -0.08038330078125, -0.07621002197265625, -0.0720367431640625, -0.06786346435546875, -0.063690185546875, -0.05951690673828125, -0.0553436279296875, -0.05117034912109375, -0.0469970703125, -0.04282379150390625, -0.0386505126953125, -0.03447723388671875, -0.030303955078125, -0.02613067626953125, -0.0219573974609375, -0.01778411865234375, -0.01361083984375, -0.00943756103515625, -0.0052642822265625, -0.00109100341796875, 0.003082275390625, 0.00725555419921875, 0.0114288330078125, 0.01560211181640625, 0.019775390625, 0.02394866943359375, 0.0281219482421875, 0.03229522705078125, 0.036468505859375, 0.04064178466796875, 0.0448150634765625, 0.04898834228515625, 0.05316162109375, 0.05733489990234375, 0.0615081787109375, 0.06568145751953125, 0.069854736328125, 0.07402801513671875, 0.0782012939453125, 0.08237457275390625, 0.0865478515625, 0.09072113037109375, 0.0948944091796875, 0.09906768798828125, 0.103240966796875, 0.10741424560546875, 0.1115875244140625, 0.11576080322265625, 0.11993408203125, 0.12410736083984375, 0.1282806396484375, 0.13245391845703125, 0.136627197265625, 0.14080047607421875, 0.1449737548828125, 0.14914703369140625, 0.1533203125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 5.0, 7.0, 9.0, 13.0, 42.0, 64.0, 134.0, 207.0, 208.0, 145.0, 97.0, 40.0, 9.0, 7.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.613504409790039, -2.549882650375366, -2.4862611293792725, -2.4226393699645996, -2.359017848968506, -2.295396089553833, -2.23177433013916, -2.1681528091430664, -2.1045310497283936, -2.0409092903137207, -1.977287769317627, -1.913666009902954, -1.8500443696975708, -1.7864227294921875, -1.7228009700775146, -1.6591793298721313, -1.595557689666748, -1.5319360494613647, -1.4683144092559814, -1.4046926498413086, -1.3410710096359253, -1.277449369430542, -1.2138276100158691, -1.1502059698104858, -1.0865843296051025, -1.0229626893997192, -0.9593409895896912, -0.8957192897796631, -0.8320976495742798, -0.7684760093688965, -0.7048543095588684, -0.6412326097488403, -0.5776112079620361, -0.5139895677566528, -0.45036786794662476, -0.38674619793891907, -0.3231245279312134, -0.2595028579235077, -0.195881187915802, -0.1322595179080963, -0.06863784790039062, -0.0050161778926849365, 0.05860549211502075, 0.12222716212272644, 0.18584883213043213, 0.24947050213813782, 0.3130921721458435, 0.3767138421535492, 0.4403355121612549, 0.5039571523666382, 0.5675788521766663, 0.6312005519866943, 0.6948221921920776, 0.7584438323974609, 0.822065532207489, 0.8856872320175171, 0.9493088722229004, 1.0129305124282837, 1.076552152633667, 1.1401739120483398, 1.2037955522537231, 1.2674171924591064, 1.3310389518737793, 1.3946605920791626, 1.458282232284546]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 4.0, 7.0, 9.0, 6.0, 7.0, 14.0, 18.0, 20.0, 24.0, 20.0, 28.0, 34.0, 28.0, 36.0, 29.0, 51.0, 50.0, 47.0, 48.0, 51.0, 46.0, 34.0, 47.0, 36.0, 40.0, 30.0, 37.0, 26.0, 25.0, 28.0, 20.0, 15.0, 13.0, 7.0, 8.0, 8.0, 13.0, 5.0, 11.0, 6.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.7177573442459106, -0.6952441334724426, -0.6727309226989746, -0.6502177119255066, -0.6277045011520386, -0.6051913499832153, -0.5826781392097473, -0.5601649284362793, -0.5376517176628113, -0.5151385068893433, -0.49262529611587524, -0.4701121151447296, -0.4475989043712616, -0.4250856935977936, -0.40257251262664795, -0.38005930185317993, -0.3575460910797119, -0.3350328803062439, -0.3125196695327759, -0.29000648856163025, -0.26749327778816223, -0.2449800670146942, -0.2224668711423874, -0.19995367527008057, -0.17744046449661255, -0.15492725372314453, -0.1324140578508377, -0.10990085452795029, -0.08738765120506287, -0.06487444788217545, -0.042361244559288025, -0.0198480486869812, 0.0026651620864868164, 0.025178365409374237, 0.04769156873226166, 0.07020477205514908, 0.0927179753780365, 0.11523117870092392, 0.13774438202381134, 0.16025757789611816, 0.18277078866958618, 0.2052839994430542, 0.22779719531536102, 0.25031039118766785, 0.27282360196113586, 0.2953368127346039, 0.3178499937057495, 0.34036320447921753, 0.36287641525268555, 0.38538962602615356, 0.4079028367996216, 0.4304160177707672, 0.45292922854423523, 0.47544243931770325, 0.4979556202888489, 0.5204688310623169, 0.5429820418357849, 0.5654952526092529, 0.588008463382721, 0.610521674156189, 0.6330348253250122, 0.6555480360984802, 0.6780612468719482, 0.7005744576454163, 0.7230876684188843]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 5.0, 2.0, 4.0, 4.0, 10.0, 7.0, 4.0, 17.0, 15.0, 27.0, 45.0, 56.0, 79.0, 136.0, 151.0, 279.0, 393.0, 669.0, 1089.0, 1976.0, 3579.0, 6751.0, 13780.0, 28169.0, 63055.0, 157015.0, 345626.0, 247458.0, 96519.0, 41372.0, 19308.0, 9534.0, 4945.0, 2748.0, 1383.0, 844.0, 499.0, 339.0, 221.0, 142.0, 104.0, 53.0, 36.0, 38.0, 23.0, 16.0, 10.0, 13.0, 4.0, 4.0, 6.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.130615234375, -0.12674427032470703, -0.12287330627441406, -0.1190023422241211, -0.11513137817382812, -0.11126041412353516, -0.10738945007324219, -0.10351848602294922, -0.09964752197265625, -0.09577655792236328, -0.09190559387207031, -0.08803462982177734, -0.08416366577148438, -0.0802927017211914, -0.07642173767089844, -0.07255077362060547, -0.0686798095703125, -0.06480884552001953, -0.06093788146972656, -0.057066917419433594, -0.053195953369140625, -0.049324989318847656, -0.04545402526855469, -0.04158306121826172, -0.03771209716796875, -0.03384113311767578, -0.029970169067382812, -0.026099205017089844, -0.022228240966796875, -0.018357276916503906, -0.014486312866210938, -0.010615348815917969, -0.006744384765625, -0.0028734207153320312, 0.0009975433349609375, 0.004868507385253906, 0.008739471435546875, 0.012610435485839844, 0.016481399536132812, 0.02035236358642578, 0.02422332763671875, 0.02809429168701172, 0.03196525573730469, 0.035836219787597656, 0.039707183837890625, 0.043578147888183594, 0.04744911193847656, 0.05132007598876953, 0.0551910400390625, 0.05906200408935547, 0.06293296813964844, 0.0668039321899414, 0.07067489624023438, 0.07454586029052734, 0.07841682434082031, 0.08228778839111328, 0.08615875244140625, 0.09002971649169922, 0.09390068054199219, 0.09777164459228516, 0.10164260864257812, 0.1055135726928711, 0.10938453674316406, 0.11325550079345703, 0.11712646484375]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 4.0, 8.0, 5.0, 8.0, 7.0, 15.0, 14.0, 35.0, 28.0, 23.0, 32.0, 39.0, 46.0, 49.0, 50.0, 31.0, 54.0, 64.0, 53.0, 72.0, 48.0, 58.0, 37.0, 39.0, 36.0, 31.0, 13.0, 23.0, 18.0, 13.0, 14.0, 16.0, 8.0, 3.0, 4.0, 2.0, 1.0, 1.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.11700439453125, -0.11380481719970703, -0.11060523986816406, -0.1074056625366211, -0.10420608520507812, -0.10100650787353516, -0.09780693054199219, -0.09460735321044922, -0.09140777587890625, -0.08820819854736328, -0.08500862121582031, -0.08180904388427734, -0.07860946655273438, -0.0754098892211914, -0.07221031188964844, -0.06901073455810547, -0.0658111572265625, -0.06261157989501953, -0.05941200256347656, -0.056212425231933594, -0.053012847900390625, -0.049813270568847656, -0.04661369323730469, -0.04341411590576172, -0.04021453857421875, -0.03701496124267578, -0.03381538391113281, -0.030615806579589844, -0.027416229248046875, -0.024216651916503906, -0.021017074584960938, -0.01781749725341797, -0.014617919921875, -0.011418342590332031, -0.008218765258789062, -0.005019187927246094, -0.001819610595703125, 0.0013799667358398438, 0.0045795440673828125, 0.007779121398925781, 0.01097869873046875, 0.014178276062011719, 0.017377853393554688, 0.020577430725097656, 0.023777008056640625, 0.026976585388183594, 0.030176162719726562, 0.03337574005126953, 0.0365753173828125, 0.03977489471435547, 0.04297447204589844, 0.046174049377441406, 0.049373626708984375, 0.052573204040527344, 0.05577278137207031, 0.05897235870361328, 0.06217193603515625, 0.06537151336669922, 0.06857109069824219, 0.07177066802978516, 0.07497024536132812, 0.0781698226928711, 0.08136940002441406, 0.08456897735595703, 0.0877685546875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 2.0, 3.0, 8.0, 5.0, 6.0, 14.0, 27.0, 43.0, 46.0, 66.0, 144.0, 231.0, 453.0, 882.0, 2547.0, 10080.0, 66635.0, 711132.0, 224392.0, 24197.0, 4825.0, 1498.0, 592.0, 301.0, 169.0, 76.0, 62.0, 31.0, 26.0, 15.0, 21.0, 8.0, 2.0, 4.0, 7.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3271484375, -0.3165092468261719, -0.30587005615234375, -0.2952308654785156, -0.2845916748046875, -0.2739524841308594, -0.26331329345703125, -0.2526741027832031, -0.242034912109375, -0.23139572143554688, -0.22075653076171875, -0.21011734008789062, -0.1994781494140625, -0.18883895874023438, -0.17819976806640625, -0.16756057739257812, -0.15692138671875, -0.14628219604492188, -0.13564300537109375, -0.12500381469726562, -0.1143646240234375, -0.10372543334960938, -0.09308624267578125, -0.08244705200195312, -0.071807861328125, -0.061168670654296875, -0.05052947998046875, -0.039890289306640625, -0.0292510986328125, -0.018611907958984375, -0.00797271728515625, 0.002666473388671875, 0.0133056640625, 0.023944854736328125, 0.03458404541015625, 0.045223236083984375, 0.0558624267578125, 0.06650161743164062, 0.07714080810546875, 0.08777999877929688, 0.098419189453125, 0.10905838012695312, 0.11969757080078125, 0.13033676147460938, 0.1409759521484375, 0.15161514282226562, 0.16225433349609375, 0.17289352416992188, 0.18353271484375, 0.19417190551757812, 0.20481109619140625, 0.21545028686523438, 0.2260894775390625, 0.23672866821289062, 0.24736785888671875, 0.2580070495605469, 0.268646240234375, 0.2792854309082031, 0.28992462158203125, 0.3005638122558594, 0.3112030029296875, 0.3218421936035156, 0.33248138427734375, 0.3431205749511719, 0.353759765625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 5.0, 12.0, 14.0, 13.0, 17.0, 18.0, 27.0, 29.0, 37.0, 37.0, 37.0, 49.0, 44.0, 60.0, 65.0, 54.0, 56.0, 36.0, 58.0, 48.0, 41.0, 30.0, 43.0, 29.0, 22.0, 27.0, 22.0, 21.0, 6.0, 10.0, 8.0, 8.0, 5.0, 6.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36962890625, -0.3577232360839844, -0.34581756591796875, -0.3339118957519531, -0.3220062255859375, -0.3101005554199219, -0.29819488525390625, -0.2862892150878906, -0.274383544921875, -0.2624778747558594, -0.25057220458984375, -0.23866653442382812, -0.2267608642578125, -0.21485519409179688, -0.20294952392578125, -0.19104385375976562, -0.17913818359375, -0.16723251342773438, -0.15532684326171875, -0.14342117309570312, -0.1315155029296875, -0.11960983276367188, -0.10770416259765625, -0.09579849243164062, -0.083892822265625, -0.07198715209960938, -0.06008148193359375, -0.048175811767578125, -0.0362701416015625, -0.024364471435546875, -0.01245880126953125, -0.000553131103515625, 0.0113525390625, 0.023258209228515625, 0.03516387939453125, 0.047069549560546875, 0.0589752197265625, 0.07088088989257812, 0.08278656005859375, 0.09469223022460938, 0.106597900390625, 0.11850357055664062, 0.13040924072265625, 0.14231491088867188, 0.1542205810546875, 0.16612625122070312, 0.17803192138671875, 0.18993759155273438, 0.20184326171875, 0.21374893188476562, 0.22565460205078125, 0.23756027221679688, 0.2494659423828125, 0.2613716125488281, 0.27327728271484375, 0.2851829528808594, 0.297088623046875, 0.3089942932128906, 0.32089996337890625, 0.3328056335449219, 0.3447113037109375, 0.3566169738769531, 0.36852264404296875, 0.3804283142089844, 0.392333984375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 4.0, 3.0, 3.0, 4.0, 4.0, 11.0, 10.0, 16.0, 29.0, 36.0, 57.0, 121.0, 242.0, 508.0, 1378.0, 5657.0, 43576.0, 768936.0, 207543.0, 16112.0, 2765.0, 823.0, 322.0, 157.0, 96.0, 44.0, 27.0, 14.0, 12.0, 16.0, 9.0, 4.0, 5.0, 1.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2080078125, -0.2014617919921875, -0.194915771484375, -0.1883697509765625, -0.18182373046875, -0.1752777099609375, -0.168731689453125, -0.1621856689453125, -0.1556396484375, -0.1490936279296875, -0.142547607421875, -0.1360015869140625, -0.12945556640625, -0.1229095458984375, -0.116363525390625, -0.1098175048828125, -0.103271484375, -0.0967254638671875, -0.090179443359375, -0.0836334228515625, -0.07708740234375, -0.0705413818359375, -0.063995361328125, -0.0574493408203125, -0.0509033203125, -0.0443572998046875, -0.037811279296875, -0.0312652587890625, -0.02471923828125, -0.0181732177734375, -0.011627197265625, -0.0050811767578125, 0.00146484375, 0.0080108642578125, 0.014556884765625, 0.0211029052734375, 0.02764892578125, 0.0341949462890625, 0.040740966796875, 0.0472869873046875, 0.0538330078125, 0.0603790283203125, 0.066925048828125, 0.0734710693359375, 0.08001708984375, 0.0865631103515625, 0.093109130859375, 0.0996551513671875, 0.106201171875, 0.1127471923828125, 0.119293212890625, 0.1258392333984375, 0.13238525390625, 0.1389312744140625, 0.145477294921875, 0.1520233154296875, 0.1585693359375, 0.1651153564453125, 0.171661376953125, 0.1782073974609375, 0.18475341796875, 0.1912994384765625, 0.197845458984375, 0.2043914794921875, 0.2109375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 1.0, 2.0, 7.0, 6.0, 10.0, 10.0, 9.0, 8.0, 21.0, 29.0, 40.0, 39.0, 57.0, 80.0, 94.0, 116.0, 89.0, 83.0, 79.0, 45.0, 30.0, 32.0, 26.0, 16.0, 17.0, 10.0, 5.0, 6.0, 6.0, 3.0, 3.0, 7.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-4.1604042053222656e-05, -4.024524241685867e-05, -3.888644278049469e-05, -3.752764314413071e-05, -3.6168843507766724e-05, -3.481004387140274e-05, -3.345124423503876e-05, -3.2092444598674774e-05, -3.073364496231079e-05, -2.9374845325946808e-05, -2.8016045689582825e-05, -2.665724605321884e-05, -2.529844641685486e-05, -2.3939646780490875e-05, -2.2580847144126892e-05, -2.122204750776291e-05, -1.9863247871398926e-05, -1.8504448235034943e-05, -1.714564859867096e-05, -1.5786848962306976e-05, -1.4428049325942993e-05, -1.306924968957901e-05, -1.1710450053215027e-05, -1.0351650416851044e-05, -8.99285078048706e-06, -7.634051144123077e-06, -6.275251507759094e-06, -4.916451871395111e-06, -3.557652235031128e-06, -2.1988525986671448e-06, -8.400529623031616e-07, 5.187466740608215e-07, 1.8775463104248047e-06, 3.236345946788788e-06, 4.595145583152771e-06, 5.953945219516754e-06, 7.312744855880737e-06, 8.67154449224472e-06, 1.0030344128608704e-05, 1.1389143764972687e-05, 1.274794340133667e-05, 1.4106743037700653e-05, 1.5465542674064636e-05, 1.682434231042862e-05, 1.8183141946792603e-05, 1.9541941583156586e-05, 2.090074121952057e-05, 2.2259540855884552e-05, 2.3618340492248535e-05, 2.497714012861252e-05, 2.63359397649765e-05, 2.7694739401340485e-05, 2.9053539037704468e-05, 3.041233867406845e-05, 3.1771138310432434e-05, 3.312993794679642e-05, 3.44887375831604e-05, 3.5847537219524384e-05, 3.720633685588837e-05, 3.856513649225235e-05, 3.992393612861633e-05, 4.1282735764980316e-05, 4.26415354013443e-05, 4.400033503770828e-05, 4.5359134674072266e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 3.0, 3.0, 4.0, 12.0, 9.0, 12.0, 26.0, 32.0, 37.0, 78.0, 122.0, 189.0, 291.0, 614.0, 1193.0, 3003.0, 8516.0, 31941.0, 221284.0, 674318.0, 81334.0, 16601.0, 4940.0, 1943.0, 905.0, 475.0, 258.0, 165.0, 63.0, 55.0, 50.0, 29.0, 16.0, 9.0, 3.0, 4.0, 5.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.136474609375, -0.13196563720703125, -0.1274566650390625, -0.12294769287109375, -0.118438720703125, -0.11392974853515625, -0.1094207763671875, -0.10491180419921875, -0.10040283203125, -0.09589385986328125, -0.0913848876953125, -0.08687591552734375, -0.082366943359375, -0.07785797119140625, -0.0733489990234375, -0.06884002685546875, -0.0643310546875, -0.05982208251953125, -0.0553131103515625, -0.05080413818359375, -0.046295166015625, -0.04178619384765625, -0.0372772216796875, -0.03276824951171875, -0.02825927734375, -0.02375030517578125, -0.0192413330078125, -0.01473236083984375, -0.010223388671875, -0.00571441650390625, -0.0012054443359375, 0.00330352783203125, 0.0078125, 0.01232147216796875, 0.0168304443359375, 0.02133941650390625, 0.025848388671875, 0.03035736083984375, 0.0348663330078125, 0.03937530517578125, 0.04388427734375, 0.04839324951171875, 0.0529022216796875, 0.05741119384765625, 0.061920166015625, 0.06642913818359375, 0.0709381103515625, 0.07544708251953125, 0.0799560546875, 0.08446502685546875, 0.0889739990234375, 0.09348297119140625, 0.097991943359375, 0.10250091552734375, 0.1070098876953125, 0.11151885986328125, 0.11602783203125, 0.12053680419921875, 0.1250457763671875, 0.12955474853515625, 0.134063720703125, 0.13857269287109375, 0.1430816650390625, 0.14759063720703125, 0.152099609375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 9.0, 1.0, 4.0, 3.0, 7.0, 4.0, 5.0, 8.0, 4.0, 11.0, 19.0, 22.0, 30.0, 36.0, 47.0, 66.0, 57.0, 61.0, 71.0, 62.0, 89.0, 57.0, 64.0, 48.0, 48.0, 28.0, 26.0, 20.0, 25.0, 12.0, 7.0, 10.0, 4.0, 8.0, 5.0, 5.0, 2.0, 1.0, 5.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.09112548828125, -0.08821392059326172, -0.08530235290527344, -0.08239078521728516, -0.07947921752929688, -0.0765676498413086, -0.07365608215332031, -0.07074451446533203, -0.06783294677734375, -0.06492137908935547, -0.06200981140136719, -0.059098243713378906, -0.056186676025390625, -0.053275108337402344, -0.05036354064941406, -0.04745197296142578, -0.0445404052734375, -0.04162883758544922, -0.03871726989746094, -0.035805702209472656, -0.032894134521484375, -0.029982566833496094, -0.027070999145507812, -0.02415943145751953, -0.02124786376953125, -0.01833629608154297, -0.015424728393554688, -0.012513160705566406, -0.009601593017578125, -0.006690025329589844, -0.0037784576416015625, -0.0008668899536132812, 0.002044677734375, 0.004956245422363281, 0.007867813110351562, 0.010779380798339844, 0.013690948486328125, 0.016602516174316406, 0.019514083862304688, 0.02242565155029297, 0.02533721923828125, 0.02824878692626953, 0.031160354614257812, 0.034071922302246094, 0.036983489990234375, 0.039895057678222656, 0.04280662536621094, 0.04571819305419922, 0.0486297607421875, 0.05154132843017578, 0.05445289611816406, 0.057364463806152344, 0.060276031494140625, 0.0631875991821289, 0.06609916687011719, 0.06901073455810547, 0.07192230224609375, 0.07483386993408203, 0.07774543762207031, 0.0806570053100586, 0.08356857299804688, 0.08648014068603516, 0.08939170837402344, 0.09230327606201172, 0.09521484375]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 6.0, 6.0, 23.0, 90.0, 148.0, 255.0, 231.0, 127.0, 59.0, 20.0, 12.0, 9.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.634068489074707, -3.545316457748413, -3.456564426422119, -3.3678126335144043, -3.2790606021881104, -3.1903085708618164, -3.1015565395355225, -3.0128045082092285, -2.9240527153015137, -2.8353006839752197, -2.746548652648926, -2.657796859741211, -2.569044828414917, -2.480292797088623, -2.391540765762329, -2.302788734436035, -2.2140369415283203, -2.1252849102020264, -2.0365328788757324, -1.947780966758728, -1.8590290546417236, -1.7702770233154297, -1.6815249919891357, -1.5927730798721313, -1.5040209293365479, -1.415268898010254, -1.3265169858932495, -1.2377649545669556, -1.1490130424499512, -1.0602610111236572, -0.9715090394020081, -0.8827570676803589, -0.7940051555633545, -0.7052531838417053, -0.6165012121200562, -0.5277491807937622, -0.4389972388744354, -0.35024526715278625, -0.2614932656288147, -0.17274129390716553, -0.08398932218551636, 0.004762656986713409, 0.09351463615894318, 0.18226662278175354, 0.2710185945034027, 0.3597705662250519, 0.44852256774902344, 0.5372745394706726, 0.6260265111923218, 0.714778482913971, 0.8035304546356201, 0.8922824859619141, 0.9810343980789185, 1.0697864294052124, 1.1585383415222168, 1.2472903728485107, 1.3360424041748047, 1.4247944355010986, 1.513546347618103, 1.602298378944397, 1.6910502910614014, 1.7798023223876953, 1.8685543537139893, 1.9573062658309937, 2.046058177947998]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 6.0, 3.0, 6.0, 9.0, 5.0, 7.0, 11.0, 6.0, 15.0, 10.0, 24.0, 19.0, 21.0, 21.0, 29.0, 27.0, 33.0, 34.0, 36.0, 43.0, 51.0, 47.0, 53.0, 62.0, 51.0, 46.0, 40.0, 35.0, 38.0, 31.0, 27.0, 27.0, 25.0, 21.0, 13.0, 13.0, 15.0, 11.0, 10.0, 6.0, 4.0, 7.0, 2.0, 4.0, 2.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2282485961914062, -1.1893563270568848, -1.1504640579223633, -1.1115717887878418, -1.0726795196533203, -1.0337872505187988, -0.9948949813842773, -0.9560027122497559, -0.9171104431152344, -0.8782181739807129, -0.8393259048461914, -0.8004336357116699, -0.7615413665771484, -0.722649097442627, -0.6837568283081055, -0.644864559173584, -0.6059723496437073, -0.5670800805091858, -0.5281878113746643, -0.4892955422401428, -0.45040327310562134, -0.41151100397109985, -0.37261876463890076, -0.3337264955043793, -0.2948342263698578, -0.2559419572353363, -0.21704968810081482, -0.17815743386745453, -0.13926516473293304, -0.10037289559841156, -0.06148064136505127, -0.022588372230529785, 0.0163038969039917, 0.055196162313222885, 0.09408842772245407, 0.13298068940639496, 0.17187295854091644, 0.21076522767543793, 0.24965748190879822, 0.2885497510433197, 0.3274420201778412, 0.36633428931236267, 0.40522655844688416, 0.44411879777908325, 0.48301106691360474, 0.5219033360481262, 0.5607956051826477, 0.5996878743171692, 0.6385801434516907, 0.6774724125862122, 0.7163646817207336, 0.7552569508552551, 0.7941492199897766, 0.8330414891242981, 0.8719336986541748, 0.9108259677886963, 0.9497182369232178, 0.9886105060577393, 1.0275027751922607, 1.0663950443267822, 1.1052873134613037, 1.1441795825958252, 1.1830718517303467, 1.2219641208648682, 1.2608563899993896]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 6.0, 6.0, 10.0, 11.0, 11.0, 23.0, 37.0, 54.0, 78.0, 128.0, 212.0, 312.0, 570.0, 1147.0, 2663.0, 6494.0, 22044.0, 104097.0, 841015.0, 2593734.0, 524577.0, 71769.0, 16198.0, 5080.0, 1962.0, 891.0, 424.0, 244.0, 145.0, 102.0, 63.0, 48.0, 32.0, 25.0, 10.0, 18.0, 12.0, 12.0, 3.0, 4.0, 6.0, 3.0, 2.0, 2.0, 4.0, 3.0, 0.0, 1.0, 4.0], "bins": [-0.1444091796875, -0.14021015167236328, -0.13601112365722656, -0.13181209564208984, -0.12761306762695312, -0.1234140396118164, -0.11921501159667969, -0.11501598358154297, -0.11081695556640625, -0.10661792755126953, -0.10241889953613281, -0.0982198715209961, -0.09402084350585938, -0.08982181549072266, -0.08562278747558594, -0.08142375946044922, -0.0772247314453125, -0.07302570343017578, -0.06882667541503906, -0.06462764739990234, -0.060428619384765625, -0.056229591369628906, -0.05203056335449219, -0.04783153533935547, -0.04363250732421875, -0.03943347930908203, -0.03523445129394531, -0.031035423278808594, -0.026836395263671875, -0.022637367248535156, -0.018438339233398438, -0.014239311218261719, -0.010040283203125, -0.005841255187988281, -0.0016422271728515625, 0.0025568008422851562, 0.006755828857421875, 0.010954856872558594, 0.015153884887695312, 0.01935291290283203, 0.02355194091796875, 0.02775096893310547, 0.03194999694824219, 0.036149024963378906, 0.040348052978515625, 0.044547080993652344, 0.04874610900878906, 0.05294513702392578, 0.0571441650390625, 0.06134319305419922, 0.06554222106933594, 0.06974124908447266, 0.07394027709960938, 0.0781393051147461, 0.08233833312988281, 0.08653736114501953, 0.09073638916015625, 0.09493541717529297, 0.09913444519042969, 0.1033334732055664, 0.10753250122070312, 0.11173152923583984, 0.11593055725097656, 0.12012958526611328, 0.12432861328125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 10.0, 7.0, 8.0, 5.0, 12.0, 18.0, 18.0, 23.0, 35.0, 39.0, 45.0, 48.0, 53.0, 50.0, 64.0, 56.0, 54.0, 61.0, 59.0, 61.0, 56.0, 36.0, 35.0, 35.0, 23.0, 17.0, 14.0, 22.0, 8.0, 11.0, 6.0, 5.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.11578369140625, -0.112579345703125, -0.109375, -0.106170654296875, -0.10296630859375, -0.099761962890625, -0.0965576171875, -0.093353271484375, -0.09014892578125, -0.086944580078125, -0.083740234375, -0.080535888671875, -0.07733154296875, -0.074127197265625, -0.0709228515625, -0.067718505859375, -0.06451416015625, -0.061309814453125, -0.05810546875, -0.054901123046875, -0.05169677734375, -0.048492431640625, -0.0452880859375, -0.042083740234375, -0.03887939453125, -0.035675048828125, -0.032470703125, -0.029266357421875, -0.02606201171875, -0.022857666015625, -0.0196533203125, -0.016448974609375, -0.01324462890625, -0.010040283203125, -0.0068359375, -0.003631591796875, -0.00042724609375, 0.002777099609375, 0.0059814453125, 0.009185791015625, 0.01239013671875, 0.015594482421875, 0.018798828125, 0.022003173828125, 0.02520751953125, 0.028411865234375, 0.0316162109375, 0.034820556640625, 0.03802490234375, 0.041229248046875, 0.04443359375, 0.047637939453125, 0.05084228515625, 0.054046630859375, 0.0572509765625, 0.060455322265625, 0.06365966796875, 0.066864013671875, 0.070068359375, 0.073272705078125, 0.07647705078125, 0.079681396484375, 0.0828857421875, 0.086090087890625, 0.08929443359375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 6.0, 8.0, 19.0, 15.0, 34.0, 33.0, 63.0, 105.0, 166.0, 320.0, 646.0, 1318.0, 2959.0, 7724.0, 23660.0, 88162.0, 520793.0, 2656185.0, 728538.0, 116259.0, 30151.0, 9977.0, 3833.0, 1607.0, 750.0, 391.0, 218.0, 121.0, 75.0, 46.0, 25.0, 20.0, 20.0, 9.0, 9.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1658935546875, -0.16123008728027344, -0.15656661987304688, -0.1519031524658203, -0.14723968505859375, -0.1425762176513672, -0.13791275024414062, -0.13324928283691406, -0.1285858154296875, -0.12392234802246094, -0.11925888061523438, -0.11459541320800781, -0.10993194580078125, -0.10526847839355469, -0.10060501098632812, -0.09594154357910156, -0.091278076171875, -0.08661460876464844, -0.08195114135742188, -0.07728767395019531, -0.07262420654296875, -0.06796073913574219, -0.06329727172851562, -0.05863380432128906, -0.0539703369140625, -0.04930686950683594, -0.044643402099609375, -0.03997993469238281, -0.03531646728515625, -0.030652999877929688, -0.025989532470703125, -0.021326065063476562, -0.01666259765625, -0.011999130249023438, -0.007335662841796875, -0.0026721954345703125, 0.00199127197265625, 0.0066547393798828125, 0.011318206787109375, 0.015981674194335938, 0.0206451416015625, 0.025308609008789062, 0.029972076416015625, 0.03463554382324219, 0.03929901123046875, 0.04396247863769531, 0.048625946044921875, 0.05328941345214844, 0.057952880859375, 0.06261634826660156, 0.06727981567382812, 0.07194328308105469, 0.07660675048828125, 0.08127021789550781, 0.08593368530273438, 0.09059715270996094, 0.0952606201171875, 0.09992408752441406, 0.10458755493164062, 0.10925102233886719, 0.11391448974609375, 0.11857795715332031, 0.12324142456054688, 0.12790489196777344, 0.132568359375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 5.0, 3.0, 4.0, 8.0, 12.0, 7.0, 16.0, 16.0, 23.0, 34.0, 44.0, 51.0, 68.0, 79.0, 149.0, 227.0, 285.0, 387.0, 475.0, 472.0, 446.0, 355.0, 265.0, 169.0, 98.0, 91.0, 67.0, 40.0, 46.0, 36.0, 17.0, 23.0, 14.0, 11.0, 8.0, 8.0, 5.0, 2.0, 3.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1693115234375, -0.16405105590820312, -0.15879058837890625, -0.15353012084960938, -0.1482696533203125, -0.14300918579101562, -0.13774871826171875, -0.13248825073242188, -0.127227783203125, -0.12196731567382812, -0.11670684814453125, -0.11144638061523438, -0.1061859130859375, -0.10092544555664062, -0.09566497802734375, -0.09040451049804688, -0.08514404296875, -0.07988357543945312, -0.07462310791015625, -0.06936264038085938, -0.0641021728515625, -0.058841705322265625, -0.05358123779296875, -0.048320770263671875, -0.043060302734375, -0.037799835205078125, -0.03253936767578125, -0.027278900146484375, -0.0220184326171875, -0.016757965087890625, -0.01149749755859375, -0.006237030029296875, -0.0009765625, 0.004283905029296875, 0.00954437255859375, 0.014804840087890625, 0.0200653076171875, 0.025325775146484375, 0.03058624267578125, 0.035846710205078125, 0.041107177734375, 0.046367645263671875, 0.05162811279296875, 0.056888580322265625, 0.0621490478515625, 0.06740951538085938, 0.07266998291015625, 0.07793045043945312, 0.08319091796875, 0.08845138549804688, 0.09371185302734375, 0.09897232055664062, 0.1042327880859375, 0.10949325561523438, 0.11475372314453125, 0.12001419067382812, 0.125274658203125, 0.13053512573242188, 0.13579559326171875, 0.14105606079101562, 0.1463165283203125, 0.15157699584960938, 0.15683746337890625, 0.16209793090820312, 0.1673583984375]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 13.0, 9.0, 28.0, 72.0, 129.0, 224.0, 231.0, 156.0, 80.0, 22.0, 14.0, 10.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.351358413696289, -2.2611982822418213, -2.1710381507873535, -2.0808780193328857, -1.9907177686691284, -1.9005576372146606, -1.8103973865509033, -1.7202372550964355, -1.6300771236419678, -1.5399169921875, -1.4497568607330322, -1.359596610069275, -1.2694364786148071, -1.1792763471603394, -1.089116096496582, -0.9989559650421143, -0.9087958335876465, -0.8186357021331787, -0.7284755110740662, -0.6383153200149536, -0.5481551885604858, -0.4579950273036957, -0.3678348660469055, -0.27767467498779297, -0.1875145435333252, -0.09735438227653503, -0.007194221019744873, 0.08296594023704529, 0.17312610149383545, 0.2632862627506256, 0.35344642400741577, 0.4436066150665283, 0.5337669849395752, 0.623927116394043, 0.7140873074531555, 0.8042474985122681, 0.8944076299667358, 0.9845677614212036, 1.074728012084961, 1.1648881435394287, 1.2550482749938965, 1.3452084064483643, 1.435368537902832, 1.5255287885665894, 1.6156889200210571, 1.705849051475525, 1.7960093021392822, 1.88616943359375, 1.9763295650482178, 2.0664896965026855, 2.1566498279571533, 2.246809959411621, 2.336970329284668, 2.4271304607391357, 2.5172905921936035, 2.6074507236480713, 2.697610855102539, 2.787770986557007, 2.8779311180114746, 2.9680912494659424, 3.05825138092041, 3.148411750793457, 3.238571882247925, 3.3287320137023926, 3.4188921451568604]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 2.0, 1.0, 5.0, 6.0, 10.0, 6.0, 12.0, 14.0, 19.0, 19.0, 21.0, 34.0, 34.0, 37.0, 36.0, 47.0, 45.0, 58.0, 58.0, 51.0, 51.0, 56.0, 41.0, 50.0, 38.0, 39.0, 42.0, 33.0, 28.0, 25.0, 19.0, 14.0, 10.0, 10.0, 8.0, 5.0, 5.0, 9.0, 4.0, 5.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.0525121688842773, -1.0177582502365112, -0.9830042123794556, -0.9482502937316895, -0.9134963154792786, -0.8787423372268677, -0.8439884185791016, -0.8092344403266907, -0.7744804620742798, -0.7397264838218689, -0.704972505569458, -0.6702185869216919, -0.635464608669281, -0.6007106304168701, -0.565956711769104, -0.5312027335166931, -0.4964487552642822, -0.46169477701187134, -0.42694082856178284, -0.39218688011169434, -0.35743290185928345, -0.32267892360687256, -0.28792497515678406, -0.25317102670669556, -0.21841704845428467, -0.18366308510303497, -0.14890912175178528, -0.11415515840053558, -0.07940119504928589, -0.044647231698036194, -0.009893268346786499, 0.024860695004463196, 0.05961453914642334, 0.09436850249767303, 0.12912246584892273, 0.16387642920017242, 0.19863039255142212, 0.23338435590267181, 0.2681383192539215, 0.30289226770401, 0.3376462459564209, 0.3724002242088318, 0.4071541726589203, 0.4419081211090088, 0.4766620993614197, 0.5114160776138306, 0.5461699962615967, 0.5809239745140076, 0.6156779527664185, 0.6504319310188293, 0.6851859092712402, 0.7199398279190063, 0.7546938061714172, 0.7894477844238281, 0.8242017030715942, 0.8589556813240051, 0.893709659576416, 0.9284636378288269, 0.9632176160812378, 0.9979715347290039, 1.0327255725860596, 1.0674794912338257, 1.1022334098815918, 1.1369874477386475, 1.1717413663864136]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 5.0, 6.0, 7.0, 8.0, 15.0, 13.0, 20.0, 41.0, 55.0, 75.0, 103.0, 176.0, 312.0, 472.0, 857.0, 1636.0, 3404.0, 7283.0, 16522.0, 38616.0, 95643.0, 234303.0, 349410.0, 175251.0, 70826.0, 29497.0, 12594.0, 5625.0, 2657.0, 1317.0, 715.0, 388.0, 230.0, 146.0, 81.0, 65.0, 51.0, 43.0, 29.0, 16.0, 13.0, 12.0, 4.0, 4.0, 5.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.14892578125, -0.14458847045898438, -0.14025115966796875, -0.13591384887695312, -0.1315765380859375, -0.12723922729492188, -0.12290191650390625, -0.11856460571289062, -0.114227294921875, -0.10988998413085938, -0.10555267333984375, -0.10121536254882812, -0.0968780517578125, -0.09254074096679688, -0.08820343017578125, -0.08386611938476562, -0.07952880859375, -0.07519149780273438, -0.07085418701171875, -0.06651687622070312, -0.0621795654296875, -0.057842254638671875, -0.05350494384765625, -0.049167633056640625, -0.044830322265625, -0.040493011474609375, -0.03615570068359375, -0.031818389892578125, -0.0274810791015625, -0.023143768310546875, -0.01880645751953125, -0.014469146728515625, -0.0101318359375, -0.005794525146484375, -0.00145721435546875, 0.002880096435546875, 0.0072174072265625, 0.011554718017578125, 0.01589202880859375, 0.020229339599609375, 0.024566650390625, 0.028903961181640625, 0.03324127197265625, 0.037578582763671875, 0.0419158935546875, 0.046253204345703125, 0.05059051513671875, 0.054927825927734375, 0.05926513671875, 0.06360244750976562, 0.06793975830078125, 0.07227706909179688, 0.0766143798828125, 0.08095169067382812, 0.08528900146484375, 0.08962631225585938, 0.093963623046875, 0.09830093383789062, 0.10263824462890625, 0.10697555541992188, 0.1113128662109375, 0.11565017700195312, 0.11998748779296875, 0.12432479858398438, 0.128662109375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 8.0, 3.0, 7.0, 5.0, 13.0, 15.0, 23.0, 19.0, 20.0, 32.0, 50.0, 51.0, 49.0, 50.0, 50.0, 55.0, 55.0, 75.0, 52.0, 57.0, 53.0, 43.0, 40.0, 38.0, 24.0, 27.0, 21.0, 17.0, 11.0, 10.0, 10.0, 8.0, 6.0, 4.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11474609375, -0.11144542694091797, -0.10814476013183594, -0.1048440933227539, -0.10154342651367188, -0.09824275970458984, -0.09494209289550781, -0.09164142608642578, -0.08834075927734375, -0.08504009246826172, -0.08173942565917969, -0.07843875885009766, -0.07513809204101562, -0.0718374252319336, -0.06853675842285156, -0.06523609161376953, -0.0619354248046875, -0.05863475799560547, -0.05533409118652344, -0.052033424377441406, -0.048732757568359375, -0.045432090759277344, -0.04213142395019531, -0.03883075714111328, -0.03553009033203125, -0.03222942352294922, -0.028928756713867188, -0.025628089904785156, -0.022327423095703125, -0.019026756286621094, -0.015726089477539062, -0.012425422668457031, -0.009124755859375, -0.005824089050292969, -0.0025234222412109375, 0.0007772445678710938, 0.004077911376953125, 0.007378578186035156, 0.010679244995117188, 0.013979911804199219, 0.01728057861328125, 0.02058124542236328, 0.023881912231445312, 0.027182579040527344, 0.030483245849609375, 0.033783912658691406, 0.03708457946777344, 0.04038524627685547, 0.0436859130859375, 0.04698657989501953, 0.05028724670410156, 0.053587913513183594, 0.056888580322265625, 0.060189247131347656, 0.06348991394042969, 0.06679058074951172, 0.07009124755859375, 0.07339191436767578, 0.07669258117675781, 0.07999324798583984, 0.08329391479492188, 0.0865945816040039, 0.08989524841308594, 0.09319591522216797, 0.09649658203125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 4.0, 3.0, 10.0, 13.0, 11.0, 18.0, 23.0, 23.0, 53.0, 61.0, 84.0, 113.0, 174.0, 241.0, 385.0, 564.0, 956.0, 1660.0, 3542.0, 10096.0, 49987.0, 432805.0, 478637.0, 50819.0, 10333.0, 3547.0, 1656.0, 924.0, 550.0, 378.0, 259.0, 179.0, 137.0, 92.0, 64.0, 36.0, 28.0, 24.0, 19.0, 17.0, 10.0, 7.0, 5.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.308349609375, -0.2984046936035156, -0.28845977783203125, -0.2785148620605469, -0.2685699462890625, -0.2586250305175781, -0.24868011474609375, -0.23873519897460938, -0.228790283203125, -0.21884536743164062, -0.20890045166015625, -0.19895553588867188, -0.1890106201171875, -0.17906570434570312, -0.16912078857421875, -0.15917587280273438, -0.14923095703125, -0.13928604125976562, -0.12934112548828125, -0.11939620971679688, -0.1094512939453125, -0.09950637817382812, -0.08956146240234375, -0.07961654663085938, -0.069671630859375, -0.059726715087890625, -0.04978179931640625, -0.039836883544921875, -0.0298919677734375, -0.019947052001953125, -0.01000213623046875, -5.7220458984375e-05, 0.0098876953125, 0.019832611083984375, 0.02977752685546875, 0.039722442626953125, 0.0496673583984375, 0.059612274169921875, 0.06955718994140625, 0.07950210571289062, 0.089447021484375, 0.09939193725585938, 0.10933685302734375, 0.11928176879882812, 0.1292266845703125, 0.13917160034179688, 0.14911651611328125, 0.15906143188476562, 0.16900634765625, 0.17895126342773438, 0.18889617919921875, 0.19884109497070312, 0.2087860107421875, 0.21873092651367188, 0.22867584228515625, 0.23862075805664062, 0.248565673828125, 0.2585105895996094, 0.26845550537109375, 0.2784004211425781, 0.2883453369140625, 0.2982902526855469, 0.30823516845703125, 0.3181800842285156, 0.328125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 5.0, 4.0, 2.0, 1.0, 4.0, 6.0, 4.0, 12.0, 9.0, 9.0, 11.0, 17.0, 21.0, 15.0, 15.0, 17.0, 23.0, 26.0, 26.0, 32.0, 41.0, 42.0, 33.0, 34.0, 39.0, 39.0, 56.0, 48.0, 54.0, 40.0, 43.0, 34.0, 24.0, 28.0, 28.0, 27.0, 29.0, 17.0, 15.0, 11.0, 13.0, 8.0, 6.0, 12.0, 6.0, 2.0, 7.0, 6.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0], "bins": [-0.342041015625, -0.33063507080078125, -0.3192291259765625, -0.30782318115234375, -0.296417236328125, -0.28501129150390625, -0.2736053466796875, -0.26219940185546875, -0.25079345703125, -0.23938751220703125, -0.2279815673828125, -0.21657562255859375, -0.205169677734375, -0.19376373291015625, -0.1823577880859375, -0.17095184326171875, -0.1595458984375, -0.14813995361328125, -0.1367340087890625, -0.12532806396484375, -0.113922119140625, -0.10251617431640625, -0.0911102294921875, -0.07970428466796875, -0.06829833984375, -0.05689239501953125, -0.0454864501953125, -0.03408050537109375, -0.022674560546875, -0.01126861572265625, 0.0001373291015625, 0.01154327392578125, 0.02294921875, 0.03435516357421875, 0.0457611083984375, 0.05716705322265625, 0.068572998046875, 0.07997894287109375, 0.0913848876953125, 0.10279083251953125, 0.11419677734375, 0.12560272216796875, 0.1370086669921875, 0.14841461181640625, 0.159820556640625, 0.17122650146484375, 0.1826324462890625, 0.19403839111328125, 0.2054443359375, 0.21685028076171875, 0.2282562255859375, 0.23966217041015625, 0.251068115234375, 0.26247406005859375, 0.2738800048828125, 0.28528594970703125, 0.29669189453125, 0.30809783935546875, 0.3195037841796875, 0.33090972900390625, 0.342315673828125, 0.35372161865234375, 0.3651275634765625, 0.37653350830078125, 0.387939453125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 8.0, 13.0, 14.0, 22.0, 41.0, 56.0, 98.0, 172.0, 238.0, 531.0, 1144.0, 3132.0, 12093.0, 75143.0, 765673.0, 160647.0, 21517.0, 4869.0, 1654.0, 665.0, 354.0, 185.0, 100.0, 62.0, 34.0, 28.0, 23.0, 16.0, 8.0, 7.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1427001953125, -0.1369171142578125, -0.131134033203125, -0.1253509521484375, -0.11956787109375, -0.1137847900390625, -0.108001708984375, -0.1022186279296875, -0.096435546875, -0.0906524658203125, -0.084869384765625, -0.0790863037109375, -0.07330322265625, -0.0675201416015625, -0.061737060546875, -0.0559539794921875, -0.0501708984375, -0.0443878173828125, -0.038604736328125, -0.0328216552734375, -0.02703857421875, -0.0212554931640625, -0.015472412109375, -0.0096893310546875, -0.00390625, 0.0018768310546875, 0.007659912109375, 0.0134429931640625, 0.01922607421875, 0.0250091552734375, 0.030792236328125, 0.0365753173828125, 0.0423583984375, 0.0481414794921875, 0.053924560546875, 0.0597076416015625, 0.06549072265625, 0.0712738037109375, 0.077056884765625, 0.0828399658203125, 0.088623046875, 0.0944061279296875, 0.100189208984375, 0.1059722900390625, 0.11175537109375, 0.1175384521484375, 0.123321533203125, 0.1291046142578125, 0.1348876953125, 0.1406707763671875, 0.146453857421875, 0.1522369384765625, 0.15802001953125, 0.1638031005859375, 0.169586181640625, 0.1753692626953125, 0.18115234375, 0.1869354248046875, 0.192718505859375, 0.1985015869140625, 0.20428466796875, 0.2100677490234375, 0.215850830078125, 0.2216339111328125, 0.2274169921875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 0.0, 4.0, 5.0, 4.0, 9.0, 10.0, 6.0, 13.0, 11.0, 20.0, 16.0, 13.0, 24.0, 30.0, 37.0, 30.0, 65.0, 74.0, 86.0, 96.0, 84.0, 65.0, 54.0, 35.0, 40.0, 26.0, 20.0, 15.0, 15.0, 14.0, 10.0, 13.0, 11.0, 12.0, 8.0, 6.0, 2.0, 7.0, 0.0, 2.0, 3.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.6253204345703125e-05, -4.467833787202835e-05, -4.310347139835358e-05, -4.15286049246788e-05, -3.995373845100403e-05, -3.8378871977329254e-05, -3.680400550365448e-05, -3.5229139029979706e-05, -3.365427255630493e-05, -3.207940608263016e-05, -3.0504539608955383e-05, -2.892967313528061e-05, -2.7354806661605835e-05, -2.577994018793106e-05, -2.4205073714256287e-05, -2.2630207240581512e-05, -2.1055340766906738e-05, -1.9480474293231964e-05, -1.790560781955719e-05, -1.6330741345882416e-05, -1.4755874872207642e-05, -1.3181008398532867e-05, -1.1606141924858093e-05, -1.0031275451183319e-05, -8.456408977508545e-06, -6.881542503833771e-06, -5.306676030158997e-06, -3.7318095564842224e-06, -2.1569430828094482e-06, -5.820766091346741e-07, 9.927898645401e-07, 2.5676563382148743e-06, 4.1425228118896484e-06, 5.717389285564423e-06, 7.292255759239197e-06, 8.867122232913971e-06, 1.0441988706588745e-05, 1.201685518026352e-05, 1.3591721653938293e-05, 1.5166588127613068e-05, 1.6741454601287842e-05, 1.8316321074962616e-05, 1.989118754863739e-05, 2.1466054022312164e-05, 2.304092049598694e-05, 2.4615786969661713e-05, 2.6190653443336487e-05, 2.776551991701126e-05, 2.9340386390686035e-05, 3.091525286436081e-05, 3.2490119338035583e-05, 3.406498581171036e-05, 3.563985228538513e-05, 3.7214718759059906e-05, 3.878958523273468e-05, 4.0364451706409454e-05, 4.193931818008423e-05, 4.3514184653759e-05, 4.508905112743378e-05, 4.666391760110855e-05, 4.8238784074783325e-05, 4.98136505484581e-05, 5.1388517022132874e-05, 5.296338349580765e-05, 5.453824996948242e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 8.0, 4.0, 9.0, 15.0, 22.0, 29.0, 42.0, 58.0, 71.0, 105.0, 145.0, 220.0, 361.0, 608.0, 1150.0, 1994.0, 4853.0, 13494.0, 49887.0, 337173.0, 554482.0, 58535.0, 14804.0, 5344.0, 2251.0, 1116.0, 614.0, 370.0, 237.0, 173.0, 111.0, 82.0, 52.0, 40.0, 34.0, 12.0, 13.0, 11.0, 7.0, 3.0, 1.0, 3.0, 7.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.1611328125, -0.1564006805419922, -0.15166854858398438, -0.14693641662597656, -0.14220428466796875, -0.13747215270996094, -0.13274002075195312, -0.1280078887939453, -0.1232757568359375, -0.11854362487792969, -0.11381149291992188, -0.10907936096191406, -0.10434722900390625, -0.09961509704589844, -0.09488296508789062, -0.09015083312988281, -0.085418701171875, -0.08068656921386719, -0.07595443725585938, -0.07122230529785156, -0.06649017333984375, -0.06175804138183594, -0.057025909423828125, -0.05229377746582031, -0.0475616455078125, -0.04282951354980469, -0.038097381591796875, -0.03336524963378906, -0.02863311767578125, -0.023900985717773438, -0.019168853759765625, -0.014436721801757812, -0.00970458984375, -0.0049724578857421875, -0.000240325927734375, 0.0044918060302734375, 0.00922393798828125, 0.013956069946289062, 0.018688201904296875, 0.023420333862304688, 0.0281524658203125, 0.03288459777832031, 0.037616729736328125, 0.04234886169433594, 0.04708099365234375, 0.05181312561035156, 0.056545257568359375, 0.06127738952636719, 0.066009521484375, 0.07074165344238281, 0.07547378540039062, 0.08020591735839844, 0.08493804931640625, 0.08967018127441406, 0.09440231323242188, 0.09913444519042969, 0.1038665771484375, 0.10859870910644531, 0.11333084106445312, 0.11806297302246094, 0.12279510498046875, 0.12752723693847656, 0.13225936889648438, 0.1369915008544922, 0.1417236328125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 3.0, 4.0, 5.0, 6.0, 7.0, 10.0, 17.0, 27.0, 34.0, 32.0, 32.0, 60.0, 115.0, 112.0, 123.0, 99.0, 64.0, 46.0, 57.0, 37.0, 23.0, 13.0, 20.0, 16.0, 10.0, 6.0, 9.0, 3.0, 3.0, 6.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1336669921875, -0.12853622436523438, -0.12340545654296875, -0.11827468872070312, -0.1131439208984375, -0.10801315307617188, -0.10288238525390625, -0.09775161743164062, -0.092620849609375, -0.08749008178710938, -0.08235931396484375, -0.07722854614257812, -0.0720977783203125, -0.06696701049804688, -0.06183624267578125, -0.056705474853515625, -0.05157470703125, -0.046443939208984375, -0.04131317138671875, -0.036182403564453125, -0.0310516357421875, -0.025920867919921875, -0.02079010009765625, -0.015659332275390625, -0.010528564453125, -0.005397796630859375, -0.00026702880859375, 0.004863739013671875, 0.0099945068359375, 0.015125274658203125, 0.02025604248046875, 0.025386810302734375, 0.030517578125, 0.035648345947265625, 0.04077911376953125, 0.045909881591796875, 0.0510406494140625, 0.056171417236328125, 0.06130218505859375, 0.06643295288085938, 0.071563720703125, 0.07669448852539062, 0.08182525634765625, 0.08695602416992188, 0.0920867919921875, 0.09721755981445312, 0.10234832763671875, 0.10747909545898438, 0.11260986328125, 0.11774063110351562, 0.12287139892578125, 0.12800216674804688, 0.1331329345703125, 0.13826370239257812, 0.14339447021484375, 0.14852523803710938, 0.153656005859375, 0.15878677368164062, 0.16391754150390625, 0.16904830932617188, 0.1741790771484375, 0.17930984497070312, 0.18444061279296875, 0.18957138061523438, 0.1947021484375]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 4.0, 8.0, 19.0, 52.0, 169.0, 413.0, 220.0, 76.0, 18.0, 5.0, 7.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.840893268585205, -2.6961872577667236, -2.551481008529663, -2.4067749977111816, -2.262068748474121, -2.1173627376556396, -1.9726567268371582, -1.8279505968093872, -1.6832444667816162, -1.5385383367538452, -1.3938322067260742, -1.2491261959075928, -1.1044200658798218, -0.9597139358520508, -0.8150078654289246, -0.6703017950057983, -0.5255956649780273, -0.38088956475257874, -0.23618346452713013, -0.09147736430168152, 0.05322873592376709, 0.19793486595153809, 0.3426409363746643, 0.4873470067977905, 0.6320531368255615, 0.7767592668533325, 0.9214653372764587, 1.066171407699585, 1.210877537727356, 1.355583667755127, 1.5002896785736084, 1.6449958086013794, 1.7897014617919922, 1.9344075918197632, 2.079113721847534, 2.2238197326660156, 2.368525981903076, 2.5132319927215576, 2.657938003540039, 2.8026442527770996, 2.947350263595581, 3.0920562744140625, 3.236762523651123, 3.3814685344696045, 3.526174545288086, 3.6708807945251465, 3.815586805343628, 3.9602928161621094, 4.10499906539917, 4.2497053146362305, 4.394411087036133, 4.539117336273193, 4.683823585510254, 4.828529357910156, 4.973235607147217, 5.117941856384277, 5.26264762878418, 5.40735387802124, 5.552059650421143, 5.696765899658203, 5.841472148895264, 5.986178398132324, 6.130884170532227, 6.275590419769287, 6.420296669006348]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 7.0, 5.0, 3.0, 3.0, 4.0, 11.0, 21.0, 10.0, 20.0, 19.0, 22.0, 26.0, 24.0, 37.0, 35.0, 28.0, 29.0, 41.0, 43.0, 70.0, 78.0, 74.0, 48.0, 37.0, 46.0, 27.0, 38.0, 30.0, 24.0, 21.0, 19.0, 11.0, 11.0, 11.0, 15.0, 11.0, 8.0, 5.0, 7.0, 4.0, 7.0, 5.0, 3.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.4916245937347412, -1.4426367282867432, -1.3936489820480347, -1.3446611166000366, -1.2956733703613281, -1.24668550491333, -1.197697639465332, -1.1487098932266235, -1.099722146987915, -1.050734281539917, -1.0017465353012085, -0.9527586698532104, -0.903770923614502, -0.8547830581665039, -0.8057952523231506, -0.7568074464797974, -0.7078195810317993, -0.658831775188446, -0.6098439693450928, -0.5608561038970947, -0.5118683576583862, -0.46288052201271057, -0.4138926863670349, -0.36490488052368164, -0.31591707468032837, -0.2669292688369751, -0.21794144809246063, -0.16895362734794617, -0.1199658215045929, -0.07097801566123962, -0.021990180015563965, 0.026997625827789307, 0.07598543167114258, 0.12497324496507645, 0.17396105825901031, 0.22294887900352478, 0.27193668484687805, 0.3209244906902313, 0.369912326335907, 0.41890013217926025, 0.4678879380226135, 0.5168757438659668, 0.5658635497093201, 0.6148513555526733, 0.6638392210006714, 0.7128269672393799, 0.7618148326873779, 0.8108026385307312, 0.8597904443740845, 0.9087782502174377, 0.957766056060791, 1.006753921508789, 1.0557416677474976, 1.1047295331954956, 1.153717279434204, 1.2027051448822021, 1.2516930103302002, 1.3006808757781982, 1.3496686220169067, 1.3986564874649048, 1.4476442337036133, 1.4966320991516113, 1.5456199645996094, 1.5946077108383179, 1.6435954570770264]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 6.0, 9.0, 10.0, 11.0, 26.0, 29.0, 41.0, 57.0, 100.0, 134.0, 217.0, 333.0, 601.0, 1181.0, 2630.0, 7385.0, 29440.0, 214711.0, 2266949.0, 1512942.0, 126368.0, 20720.0, 5857.0, 2195.0, 1059.0, 484.0, 286.0, 162.0, 110.0, 74.0, 53.0, 26.0, 20.0, 12.0, 12.0, 8.0, 5.0, 8.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1376953125, -0.13292884826660156, -0.12816238403320312, -0.12339591979980469, -0.11862945556640625, -0.11386299133300781, -0.10909652709960938, -0.10433006286621094, -0.0995635986328125, -0.09479713439941406, -0.09003067016601562, -0.08526420593261719, -0.08049774169921875, -0.07573127746582031, -0.07096481323242188, -0.06619834899902344, -0.061431884765625, -0.05666542053222656, -0.051898956298828125, -0.04713249206542969, -0.04236602783203125, -0.03759956359863281, -0.032833099365234375, -0.028066635131835938, -0.0233001708984375, -0.018533706665039062, -0.013767242431640625, -0.009000778198242188, -0.00423431396484375, 0.0005321502685546875, 0.005298614501953125, 0.010065078735351562, 0.01483154296875, 0.019598007202148438, 0.024364471435546875, 0.029130935668945312, 0.03389739990234375, 0.03866386413574219, 0.043430328369140625, 0.04819679260253906, 0.0529632568359375, 0.05772972106933594, 0.062496185302734375, 0.06726264953613281, 0.07202911376953125, 0.07679557800292969, 0.08156204223632812, 0.08632850646972656, 0.091094970703125, 0.09586143493652344, 0.10062789916992188, 0.10539436340332031, 0.11016082763671875, 0.11492729187011719, 0.11969375610351562, 0.12446022033691406, 0.1292266845703125, 0.13399314880371094, 0.13875961303710938, 0.1435260772705078, 0.14829254150390625, 0.1530590057373047, 0.15782546997070312, 0.16259193420410156, 0.1673583984375]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 4.0, 4.0, 10.0, 1.0, 9.0, 16.0, 18.0, 29.0, 25.0, 33.0, 45.0, 63.0, 47.0, 46.0, 53.0, 74.0, 59.0, 58.0, 55.0, 45.0, 48.0, 52.0, 27.0, 40.0, 27.0, 26.0, 22.0, 20.0, 10.0, 12.0, 6.0, 4.0, 11.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08721923828125, -0.0836782455444336, -0.08013725280761719, -0.07659626007080078, -0.07305526733398438, -0.06951427459716797, -0.06597328186035156, -0.062432289123535156, -0.05889129638671875, -0.055350303649902344, -0.05180931091308594, -0.04826831817626953, -0.044727325439453125, -0.04118633270263672, -0.03764533996582031, -0.034104347229003906, -0.0305633544921875, -0.027022361755371094, -0.023481369018554688, -0.01994037628173828, -0.016399383544921875, -0.012858390808105469, -0.009317398071289062, -0.005776405334472656, -0.00223541259765625, 0.0013055801391601562, 0.0048465728759765625, 0.008387565612792969, 0.011928558349609375, 0.015469551086425781, 0.019010543823242188, 0.022551536560058594, 0.026092529296875, 0.029633522033691406, 0.03317451477050781, 0.03671550750732422, 0.040256500244140625, 0.04379749298095703, 0.04733848571777344, 0.050879478454589844, 0.05442047119140625, 0.057961463928222656, 0.06150245666503906, 0.06504344940185547, 0.06858444213867188, 0.07212543487548828, 0.07566642761230469, 0.0792074203491211, 0.0827484130859375, 0.0862894058227539, 0.08983039855957031, 0.09337139129638672, 0.09691238403320312, 0.10045337677001953, 0.10399436950683594, 0.10753536224365234, 0.11107635498046875, 0.11461734771728516, 0.11815834045410156, 0.12169933319091797, 0.12524032592773438, 0.12878131866455078, 0.1323223114013672, 0.1358633041381836, 0.139404296875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 9.0, 16.0, 32.0, 38.0, 83.0, 200.0, 487.0, 1186.0, 3997.0, 24177.0, 504080.0, 3520922.0, 124241.0, 10932.0, 2335.0, 783.0, 321.0, 178.0, 99.0, 64.0, 37.0, 18.0, 16.0, 12.0, 5.0, 7.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.271484375, -0.26189422607421875, -0.2523040771484375, -0.24271392822265625, -0.233123779296875, -0.22353363037109375, -0.2139434814453125, -0.20435333251953125, -0.19476318359375, -0.18517303466796875, -0.1755828857421875, -0.16599273681640625, -0.156402587890625, -0.14681243896484375, -0.1372222900390625, -0.12763214111328125, -0.1180419921875, -0.10845184326171875, -0.0988616943359375, -0.08927154541015625, -0.079681396484375, -0.07009124755859375, -0.0605010986328125, -0.05091094970703125, -0.04132080078125, -0.03173065185546875, -0.0221405029296875, -0.01255035400390625, -0.002960205078125, 0.00662994384765625, 0.0162200927734375, 0.02581024169921875, 0.035400390625, 0.04499053955078125, 0.0545806884765625, 0.06417083740234375, 0.073760986328125, 0.08335113525390625, 0.0929412841796875, 0.10253143310546875, 0.11212158203125, 0.12171173095703125, 0.1313018798828125, 0.14089202880859375, 0.150482177734375, 0.16007232666015625, 0.1696624755859375, 0.17925262451171875, 0.1888427734375, 0.19843292236328125, 0.2080230712890625, 0.21761322021484375, 0.227203369140625, 0.23679351806640625, 0.2463836669921875, 0.25597381591796875, 0.26556396484375, 0.27515411376953125, 0.2847442626953125, 0.29433441162109375, 0.303924560546875, 0.31351470947265625, 0.3231048583984375, 0.33269500732421875, 0.34228515625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 6.0, 5.0, 10.0, 15.0, 15.0, 22.0, 44.0, 84.0, 124.0, 193.0, 323.0, 590.0, 804.0, 726.0, 455.0, 248.0, 148.0, 84.0, 62.0, 40.0, 18.0, 16.0, 11.0, 8.0, 5.0, 8.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2083740234375, -0.20058250427246094, -0.19279098510742188, -0.1849994659423828, -0.17720794677734375, -0.1694164276123047, -0.16162490844726562, -0.15383338928222656, -0.1460418701171875, -0.13825035095214844, -0.13045883178710938, -0.12266731262207031, -0.11487579345703125, -0.10708427429199219, -0.09929275512695312, -0.09150123596191406, -0.083709716796875, -0.07591819763183594, -0.06812667846679688, -0.06033515930175781, -0.05254364013671875, -0.04475212097167969, -0.036960601806640625, -0.029169082641601562, -0.0213775634765625, -0.013586044311523438, -0.005794525146484375, 0.0019969940185546875, 0.00978851318359375, 0.017580032348632812, 0.025371551513671875, 0.03316307067871094, 0.04095458984375, 0.04874610900878906, 0.056537628173828125, 0.06432914733886719, 0.07212066650390625, 0.07991218566894531, 0.08770370483398438, 0.09549522399902344, 0.1032867431640625, 0.11107826232910156, 0.11886978149414062, 0.1266613006591797, 0.13445281982421875, 0.1422443389892578, 0.15003585815429688, 0.15782737731933594, 0.165618896484375, 0.17341041564941406, 0.18120193481445312, 0.1889934539794922, 0.19678497314453125, 0.2045764923095703, 0.21236801147460938, 0.22015953063964844, 0.2279510498046875, 0.23574256896972656, 0.24353408813476562, 0.2513256072998047, 0.25911712646484375, 0.2669086456298828, 0.2747001647949219, 0.28249168395996094, 0.290283203125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 3.0, 0.0, 4.0, 5.0, 10.0, 13.0, 32.0, 131.0, 213.0, 291.0, 168.0, 83.0, 30.0, 9.0, 6.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.533990859985352, -4.431568622589111, -4.329146385192871, -4.226723670959473, -4.124301433563232, -4.021879196166992, -3.919456958770752, -3.8170347213745117, -3.7146122455596924, -3.612190008163452, -3.509767532348633, -3.4073452949523926, -3.3049230575561523, -3.202500581741333, -3.1000783443450928, -2.9976558685302734, -2.895233631134033, -2.792811393737793, -2.6903889179229736, -2.5879666805267334, -2.485544443130493, -2.383121967315674, -2.2806997299194336, -2.1782774925231934, -2.075855255126953, -1.9734328985214233, -1.871010661125183, -1.7685883045196533, -1.6661659479141235, -1.5637435913085938, -1.4613213539123535, -1.3588989973068237, -1.256476640701294, -1.1540542840957642, -1.051632046699524, -0.9492096900939941, -0.8467873334884644, -0.7443650364875793, -0.6419427394866943, -0.5395203828811646, -0.43709808588027954, -0.33467575907707214, -0.23225344717502594, -0.12983113527297974, -0.02740880846977234, 0.07501351833343506, 0.17743581533432007, 0.27985817193984985, 0.38228046894073486, 0.48470279574394226, 0.5871251225471497, 0.6895474195480347, 0.7919697761535645, 0.8943920731544495, 0.9968143701553345, 1.0992367267608643, 1.2016589641571045, 1.3040813207626343, 1.4065035581588745, 1.5089259147644043, 1.611348271369934, 1.7137706279754639, 1.816192865371704, 1.9186152219772339, 2.0210375785827637]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 5.0, 4.0, 6.0, 6.0, 7.0, 2.0, 5.0, 6.0, 23.0, 19.0, 30.0, 32.0, 52.0, 49.0, 48.0, 62.0, 58.0, 66.0, 76.0, 56.0, 67.0, 45.0, 47.0, 55.0, 33.0, 39.0, 19.0, 19.0, 17.0, 14.0, 7.0, 7.0, 12.0, 8.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0220189094543457, -0.9813469648361206, -0.9406750798225403, -0.9000031352043152, -0.8593312501907349, -0.8186593055725098, -0.7779873609542847, -0.7373154759407043, -0.696643590927124, -0.6559716463088989, -0.6152997612953186, -0.5746278166770935, -0.5339559316635132, -0.4932839870452881, -0.4526120722293854, -0.41194015741348267, -0.37126821279525757, -0.33059629797935486, -0.28992438316345215, -0.24925245344638824, -0.20858053863048553, -0.16790862381458282, -0.12723669409751892, -0.08656477928161621, -0.0458928644657135, -0.0052209459245204926, 0.035450972616672516, 0.07612289488315582, 0.11679480969905853, 0.15746672451496124, 0.19813865423202515, 0.23881056904792786, 0.27948248386383057, 0.3201543986797333, 0.360826313495636, 0.4014982581138611, 0.4421701431274414, 0.4828420877456665, 0.5235140323638916, 0.5641859173774719, 0.6048578023910522, 0.6455297470092773, 0.6862016320228577, 0.7268735766410828, 0.7675454616546631, 0.8082174062728882, 0.8488893508911133, 0.8895612359046936, 0.9302331805229187, 0.9709051251411438, 1.0115770101547241, 1.0522489547729492, 1.0929208993911743, 1.1335927248001099, 1.174264669418335, 1.21493661403656, 1.2556085586547852, 1.2962805032730103, 1.3369524478912354, 1.377624273300171, 1.418296217918396, 1.458968162536621, 1.4996401071548462, 1.5403120517730713, 1.5809838771820068]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 5.0, 7.0, 10.0, 18.0, 15.0, 17.0, 43.0, 64.0, 102.0, 154.0, 287.0, 506.0, 1089.0, 2501.0, 6664.0, 20055.0, 73360.0, 308557.0, 464328.0, 122482.0, 31865.0, 9749.0, 3510.0, 1562.0, 702.0, 340.0, 217.0, 118.0, 62.0, 51.0, 45.0, 15.0, 15.0, 8.0, 6.0, 5.0, 3.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.212158203125, -0.20556640625, -0.198974609375, -0.1923828125, -0.185791015625, -0.17919921875, -0.172607421875, -0.166015625, -0.159423828125, -0.15283203125, -0.146240234375, -0.1396484375, -0.133056640625, -0.12646484375, -0.119873046875, -0.11328125, -0.106689453125, -0.10009765625, -0.093505859375, -0.0869140625, -0.080322265625, -0.07373046875, -0.067138671875, -0.060546875, -0.053955078125, -0.04736328125, -0.040771484375, -0.0341796875, -0.027587890625, -0.02099609375, -0.014404296875, -0.0078125, -0.001220703125, 0.00537109375, 0.011962890625, 0.0185546875, 0.025146484375, 0.03173828125, 0.038330078125, 0.044921875, 0.051513671875, 0.05810546875, 0.064697265625, 0.0712890625, 0.077880859375, 0.08447265625, 0.091064453125, 0.09765625, 0.104248046875, 0.11083984375, 0.117431640625, 0.1240234375, 0.130615234375, 0.13720703125, 0.143798828125, 0.150390625, 0.156982421875, 0.16357421875, 0.170166015625, 0.1767578125, 0.183349609375, 0.18994140625, 0.196533203125, 0.203125, 0.209716796875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 7.0, 7.0, 7.0, 7.0, 14.0, 13.0, 22.0, 24.0, 17.0, 30.0, 28.0, 35.0, 45.0, 39.0, 46.0, 51.0, 43.0, 53.0, 53.0, 47.0, 37.0, 46.0, 43.0, 34.0, 42.0, 27.0, 28.0, 19.0, 21.0, 28.0, 22.0, 12.0, 18.0, 10.0, 4.0, 5.0, 5.0, 5.0, 3.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09765625, -0.0947275161743164, -0.09179878234863281, -0.08887004852294922, -0.08594131469726562, -0.08301258087158203, -0.08008384704589844, -0.07715511322021484, -0.07422637939453125, -0.07129764556884766, -0.06836891174316406, -0.06544017791748047, -0.06251144409179688, -0.05958271026611328, -0.05665397644042969, -0.053725242614746094, -0.0507965087890625, -0.047867774963378906, -0.04493904113769531, -0.04201030731201172, -0.039081573486328125, -0.03615283966064453, -0.03322410583496094, -0.030295372009277344, -0.02736663818359375, -0.024437904357910156, -0.021509170532226562, -0.01858043670654297, -0.015651702880859375, -0.012722969055175781, -0.009794235229492188, -0.006865501403808594, -0.003936767578125, -0.0010080337524414062, 0.0019207000732421875, 0.004849433898925781, 0.007778167724609375, 0.010706901550292969, 0.013635635375976562, 0.016564369201660156, 0.01949310302734375, 0.022421836853027344, 0.025350570678710938, 0.02827930450439453, 0.031208038330078125, 0.03413677215576172, 0.03706550598144531, 0.039994239807128906, 0.0429229736328125, 0.045851707458496094, 0.04878044128417969, 0.05170917510986328, 0.054637908935546875, 0.05756664276123047, 0.06049537658691406, 0.06342411041259766, 0.06635284423828125, 0.06928157806396484, 0.07221031188964844, 0.07513904571533203, 0.07806777954101562, 0.08099651336669922, 0.08392524719238281, 0.0868539810180664, 0.08978271484375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 8.0, 8.0, 12.0, 13.0, 24.0, 41.0, 103.0, 145.0, 330.0, 687.0, 1813.0, 7400.0, 97777.0, 890651.0, 42325.0, 4719.0, 1317.0, 595.0, 272.0, 132.0, 79.0, 38.0, 24.0, 25.0, 11.0, 4.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.79052734375, -0.7714195251464844, -0.7523117065429688, -0.7332038879394531, -0.7140960693359375, -0.6949882507324219, -0.6758804321289062, -0.6567726135253906, -0.637664794921875, -0.6185569763183594, -0.5994491577148438, -0.5803413391113281, -0.5612335205078125, -0.5421257019042969, -0.5230178833007812, -0.5039100646972656, -0.48480224609375, -0.4656944274902344, -0.44658660888671875, -0.4274787902832031, -0.4083709716796875, -0.3892631530761719, -0.37015533447265625, -0.3510475158691406, -0.331939697265625, -0.3128318786621094, -0.29372406005859375, -0.2746162414550781, -0.2555084228515625, -0.23640060424804688, -0.21729278564453125, -0.19818496704101562, -0.1790771484375, -0.15996932983398438, -0.14086151123046875, -0.12175369262695312, -0.1026458740234375, -0.08353805541992188, -0.06443023681640625, -0.045322418212890625, -0.026214599609375, -0.007106781005859375, 0.01200103759765625, 0.031108856201171875, 0.0502166748046875, 0.06932449340820312, 0.08843231201171875, 0.10754013061523438, 0.12664794921875, 0.14575576782226562, 0.16486358642578125, 0.18397140502929688, 0.2030792236328125, 0.22218704223632812, 0.24129486083984375, 0.2604026794433594, 0.279510498046875, 0.2986183166503906, 0.31772613525390625, 0.3368339538574219, 0.3559417724609375, 0.3750495910644531, 0.39415740966796875, 0.4132652282714844, 0.432373046875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 4.0, 3.0, 4.0, 3.0, 9.0, 7.0, 9.0, 14.0, 13.0, 20.0, 22.0, 17.0, 19.0, 21.0, 30.0, 31.0, 46.0, 42.0, 46.0, 40.0, 53.0, 43.0, 42.0, 44.0, 56.0, 43.0, 38.0, 28.0, 30.0, 33.0, 28.0, 24.0, 25.0, 21.0, 17.0, 15.0, 15.0, 7.0, 5.0, 9.0, 5.0, 9.0, 5.0, 7.0, 0.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.340087890625, -0.3293113708496094, -0.31853485107421875, -0.3077583312988281, -0.2969818115234375, -0.2862052917480469, -0.27542877197265625, -0.2646522521972656, -0.253875732421875, -0.24309921264648438, -0.23232269287109375, -0.22154617309570312, -0.2107696533203125, -0.19999313354492188, -0.18921661376953125, -0.17844009399414062, -0.16766357421875, -0.15688705444335938, -0.14611053466796875, -0.13533401489257812, -0.1245574951171875, -0.11378097534179688, -0.10300445556640625, -0.09222793579101562, -0.081451416015625, -0.07067489624023438, -0.05989837646484375, -0.049121856689453125, -0.0383453369140625, -0.027568817138671875, -0.01679229736328125, -0.006015777587890625, 0.0047607421875, 0.015537261962890625, 0.02631378173828125, 0.037090301513671875, 0.0478668212890625, 0.058643341064453125, 0.06941986083984375, 0.08019638061523438, 0.090972900390625, 0.10174942016601562, 0.11252593994140625, 0.12330245971679688, 0.1340789794921875, 0.14485549926757812, 0.15563201904296875, 0.16640853881835938, 0.17718505859375, 0.18796157836914062, 0.19873809814453125, 0.20951461791992188, 0.2202911376953125, 0.23106765747070312, 0.24184417724609375, 0.2526206970214844, 0.263397216796875, 0.2741737365722656, 0.28495025634765625, 0.2957267761230469, 0.3065032958984375, 0.3172798156738281, 0.32805633544921875, 0.3388328552246094, 0.349609375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 7.0, 2.0, 5.0, 9.0, 8.0, 12.0, 12.0, 21.0, 33.0, 41.0, 93.0, 124.0, 184.0, 319.0, 639.0, 1486.0, 4065.0, 15441.0, 81689.0, 811746.0, 106096.0, 18486.0, 4808.0, 1593.0, 705.0, 362.0, 196.0, 125.0, 85.0, 48.0, 26.0, 24.0, 15.0, 14.0, 13.0, 6.0, 3.0, 6.0, 3.0, 3.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.228271484375, -0.22146987915039062, -0.21466827392578125, -0.20786666870117188, -0.2010650634765625, -0.19426345825195312, -0.18746185302734375, -0.18066024780273438, -0.173858642578125, -0.16705703735351562, -0.16025543212890625, -0.15345382690429688, -0.1466522216796875, -0.13985061645507812, -0.13304901123046875, -0.12624740600585938, -0.11944580078125, -0.11264419555664062, -0.10584259033203125, -0.09904098510742188, -0.0922393798828125, -0.08543777465820312, -0.07863616943359375, -0.07183456420898438, -0.065032958984375, -0.058231353759765625, -0.05142974853515625, -0.044628143310546875, -0.0378265380859375, -0.031024932861328125, -0.02422332763671875, -0.017421722412109375, -0.0106201171875, -0.003818511962890625, 0.00298309326171875, 0.009784698486328125, 0.0165863037109375, 0.023387908935546875, 0.03018951416015625, 0.036991119384765625, 0.043792724609375, 0.050594329833984375, 0.05739593505859375, 0.06419754028320312, 0.0709991455078125, 0.07780075073242188, 0.08460235595703125, 0.09140396118164062, 0.09820556640625, 0.10500717163085938, 0.11180877685546875, 0.11861038208007812, 0.1254119873046875, 0.13221359252929688, 0.13901519775390625, 0.14581680297851562, 0.152618408203125, 0.15942001342773438, 0.16622161865234375, 0.17302322387695312, 0.1798248291015625, 0.18662643432617188, 0.19342803955078125, 0.20022964477539062, 0.20703125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 6.0, 7.0, 9.0, 6.0, 9.0, 6.0, 14.0, 8.0, 15.0, 22.0, 27.0, 34.0, 39.0, 66.0, 87.0, 107.0, 105.0, 99.0, 82.0, 63.0, 41.0, 30.0, 25.0, 18.0, 8.0, 12.0, 11.0, 6.0, 11.0, 6.0, 3.0, 5.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.0677528381347656e-05, -5.879346281290054e-05, -5.690939724445343e-05, -5.502533167600632e-05, -5.3141266107559204e-05, -5.125720053911209e-05, -4.937313497066498e-05, -4.7489069402217865e-05, -4.560500383377075e-05, -4.372093826532364e-05, -4.1836872696876526e-05, -3.995280712842941e-05, -3.80687415599823e-05, -3.618467599153519e-05, -3.4300610423088074e-05, -3.241654485464096e-05, -3.053247928619385e-05, -2.8648413717746735e-05, -2.676434814929962e-05, -2.488028258085251e-05, -2.2996217012405396e-05, -2.1112151443958282e-05, -1.922808587551117e-05, -1.7344020307064056e-05, -1.5459954738616943e-05, -1.357588917016983e-05, -1.1691823601722717e-05, -9.807758033275604e-06, -7.923692464828491e-06, -6.039626896381378e-06, -4.155561327934265e-06, -2.271495759487152e-06, -3.8743019104003906e-07, 1.496635377407074e-06, 3.380700945854187e-06, 5.2647665143013e-06, 7.148832082748413e-06, 9.032897651195526e-06, 1.091696321964264e-05, 1.2801028788089752e-05, 1.4685094356536865e-05, 1.6569159924983978e-05, 1.845322549343109e-05, 2.0337291061878204e-05, 2.2221356630325317e-05, 2.410542219877243e-05, 2.5989487767219543e-05, 2.7873553335666656e-05, 2.975761890411377e-05, 3.164168447256088e-05, 3.3525750041007996e-05, 3.540981560945511e-05, 3.729388117790222e-05, 3.9177946746349335e-05, 4.106201231479645e-05, 4.294607788324356e-05, 4.4830143451690674e-05, 4.671420902013779e-05, 4.85982745885849e-05, 5.048234015703201e-05, 5.2366405725479126e-05, 5.425047129392624e-05, 5.613453686237335e-05, 5.8018602430820465e-05, 5.990266799926758e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 7.0, 5.0, 5.0, 5.0, 5.0, 4.0, 13.0, 16.0, 22.0, 29.0, 29.0, 45.0, 79.0, 96.0, 130.0, 214.0, 326.0, 498.0, 910.0, 1807.0, 3885.0, 10291.0, 33712.0, 169403.0, 713610.0, 79435.0, 20973.0, 6896.0, 2760.0, 1278.0, 744.0, 449.0, 260.0, 161.0, 136.0, 86.0, 62.0, 55.0, 29.0, 23.0, 18.0, 10.0, 10.0, 8.0, 2.0, 6.0, 2.0, 4.0, 4.0, 0.0, 1.0, 5.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.161865234375, -0.15685462951660156, -0.15184402465820312, -0.1468334197998047, -0.14182281494140625, -0.1368122100830078, -0.13180160522460938, -0.12679100036621094, -0.1217803955078125, -0.11676979064941406, -0.11175918579101562, -0.10674858093261719, -0.10173797607421875, -0.09672737121582031, -0.09171676635742188, -0.08670616149902344, -0.081695556640625, -0.07668495178222656, -0.07167434692382812, -0.06666374206542969, -0.06165313720703125, -0.05664253234863281, -0.051631927490234375, -0.04662132263183594, -0.0416107177734375, -0.03660011291503906, -0.031589508056640625, -0.026578903198242188, -0.02156829833984375, -0.016557693481445312, -0.011547088623046875, -0.0065364837646484375, -0.00152587890625, 0.0034847259521484375, 0.008495330810546875, 0.013505935668945312, 0.01851654052734375, 0.023527145385742188, 0.028537750244140625, 0.03354835510253906, 0.0385589599609375, 0.04356956481933594, 0.048580169677734375, 0.05359077453613281, 0.05860137939453125, 0.06361198425292969, 0.06862258911132812, 0.07363319396972656, 0.078643798828125, 0.08365440368652344, 0.08866500854492188, 0.09367561340332031, 0.09868621826171875, 0.10369682312011719, 0.10870742797851562, 0.11371803283691406, 0.1187286376953125, 0.12373924255371094, 0.12874984741210938, 0.1337604522705078, 0.13877105712890625, 0.1437816619873047, 0.14879226684570312, 0.15380287170410156, 0.1588134765625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 5.0, 6.0, 0.0, 4.0, 8.0, 11.0, 7.0, 15.0, 14.0, 9.0, 12.0, 12.0, 23.0, 33.0, 37.0, 56.0, 69.0, 100.0, 106.0, 98.0, 88.0, 58.0, 45.0, 34.0, 28.0, 16.0, 15.0, 13.0, 11.0, 10.0, 11.0, 7.0, 9.0, 1.0, 1.0, 8.0, 4.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.11822509765625, -0.11449337005615234, -0.11076164245605469, -0.10702991485595703, -0.10329818725585938, -0.09956645965576172, -0.09583473205566406, -0.0921030044555664, -0.08837127685546875, -0.0846395492553711, -0.08090782165527344, -0.07717609405517578, -0.07344436645507812, -0.06971263885498047, -0.06598091125488281, -0.062249183654785156, -0.0585174560546875, -0.054785728454589844, -0.05105400085449219, -0.04732227325439453, -0.043590545654296875, -0.03985881805419922, -0.03612709045410156, -0.032395362854003906, -0.02866363525390625, -0.024931907653808594, -0.021200180053710938, -0.01746845245361328, -0.013736724853515625, -0.010004997253417969, -0.0062732696533203125, -0.0025415420532226562, 0.001190185546875, 0.004921913146972656, 0.008653640747070312, 0.012385368347167969, 0.016117095947265625, 0.01984882354736328, 0.023580551147460938, 0.027312278747558594, 0.03104400634765625, 0.034775733947753906, 0.03850746154785156, 0.04223918914794922, 0.045970916748046875, 0.04970264434814453, 0.05343437194824219, 0.057166099548339844, 0.0608978271484375, 0.06462955474853516, 0.06836128234863281, 0.07209300994873047, 0.07582473754882812, 0.07955646514892578, 0.08328819274902344, 0.0870199203491211, 0.09075164794921875, 0.0944833755493164, 0.09821510314941406, 0.10194683074951172, 0.10567855834960938, 0.10941028594970703, 0.11314201354980469, 0.11687374114990234, 0.12060546875]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 6.0, 11.0, 9.0, 27.0, 66.0, 121.0, 255.0, 250.0, 136.0, 49.0, 29.0, 9.0, 5.0, 7.0, 5.0, 3.0, 4.0, 3.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3943662643432617, -3.294478178024292, -3.194589853286743, -3.0947017669677734, -2.9948136806488037, -2.894925355911255, -2.795037269592285, -2.6951489448547363, -2.5952608585357666, -2.495372772216797, -2.395484447479248, -2.2955963611602783, -2.1957082748413086, -2.0958199501037598, -1.99593186378479, -1.8960436582565308, -1.796155571937561, -1.6962673664093018, -1.596379280090332, -1.4964910745620728, -1.3966028690338135, -1.2967147827148438, -1.1968265771865845, -1.0969383716583252, -0.9970502257347107, -0.8971620798110962, -0.7972738742828369, -0.6973857283592224, -0.5974975824356079, -0.49760937690734863, -0.39772123098373413, -0.29783302545547485, -0.19794487953186035, -0.09805671125650406, 0.0018314570188522339, 0.10171961784362793, 0.20160779356956482, 0.3014959692955017, 0.4013841152191162, 0.5012723207473755, 0.60116046667099, 0.7010486125946045, 0.8009368181228638, 0.9008249640464783, 1.0007131099700928, 1.100601315498352, 1.2004895210266113, 1.300377607345581, 1.4002658128738403, 1.5001540184020996, 1.6000421047210693, 1.6999303102493286, 1.799818515777588, 1.8997066020965576, 1.999594807624817, 2.099483013153076, 2.199371099472046, 2.2992591857910156, 2.3991475105285645, 2.499035596847534, 2.598923683166504, 2.6988120079040527, 2.7987000942230225, 2.898588180541992, 2.998476505279541]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 8.0, 10.0, 7.0, 10.0, 13.0, 9.0, 11.0, 17.0, 24.0, 20.0, 22.0, 22.0, 23.0, 34.0, 39.0, 43.0, 30.0, 63.0, 63.0, 81.0, 59.0, 53.0, 40.0, 36.0, 36.0, 28.0, 28.0, 32.0, 18.0, 24.0, 12.0, 17.0, 9.0, 11.0, 9.0, 11.0, 7.0, 7.0, 3.0, 6.0, 8.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3342461585998535, -1.2885558605194092, -1.2428655624389648, -1.1971752643585205, -1.1514849662780762, -1.1057946681976318, -1.0601043701171875, -1.0144140720367432, -0.9687238335609436, -0.9230335354804993, -0.8773432374000549, -0.8316529989242554, -0.785962700843811, -0.7402724027633667, -0.6945821046829224, -0.648891806602478, -0.6032015085220337, -0.5575112104415894, -0.511820912361145, -0.46613064408302307, -0.42044034600257874, -0.3747500479221344, -0.32905977964401245, -0.2833694815635681, -0.23767918348312378, -0.19198888540267944, -0.1462986022233963, -0.10060831904411316, -0.05491802096366882, -0.009227722883224487, 0.03646254539489746, 0.0821528434753418, 0.12784326076507568, 0.17353355884552002, 0.21922384202480316, 0.2649141252040863, 0.31060442328453064, 0.356294721364975, 0.4019849896430969, 0.44767528772354126, 0.4933655858039856, 0.5390558838844299, 0.5847461819648743, 0.6304364204406738, 0.6761267185211182, 0.7218170166015625, 0.7675073146820068, 0.8131976127624512, 0.8588879108428955, 0.9045782089233398, 0.9502685070037842, 0.9959588050842285, 1.0416491031646729, 1.0873394012451172, 1.1330296993255615, 1.1787199974060059, 1.2244102954864502, 1.2701005935668945, 1.3157908916473389, 1.3614811897277832, 1.4071714878082275, 1.4528617858886719, 1.4985520839691162, 1.5442423820495605, 1.5899325609207153]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 9.0, 6.0, 14.0, 12.0, 30.0, 29.0, 49.0, 105.0, 177.0, 351.0, 793.0, 2236.0, 11430.0, 282400.0, 3811292.0, 76453.0, 6439.0, 1486.0, 499.0, 234.0, 95.0, 52.0, 32.0, 15.0, 13.0, 8.0, 8.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.258544921875, -0.24792861938476562, -0.23731231689453125, -0.22669601440429688, -0.2160797119140625, -0.20546340942382812, -0.19484710693359375, -0.18423080444335938, -0.173614501953125, -0.16299819946289062, -0.15238189697265625, -0.14176559448242188, -0.1311492919921875, -0.12053298950195312, -0.10991668701171875, -0.09930038452148438, -0.08868408203125, -0.07806777954101562, -0.06745147705078125, -0.056835174560546875, -0.0462188720703125, -0.035602569580078125, -0.02498626708984375, -0.014369964599609375, -0.003753662109375, 0.006862640380859375, 0.01747894287109375, 0.028095245361328125, 0.0387115478515625, 0.049327850341796875, 0.05994415283203125, 0.07056045532226562, 0.0811767578125, 0.09179306030273438, 0.10240936279296875, 0.11302566528320312, 0.1236419677734375, 0.13425827026367188, 0.14487457275390625, 0.15549087524414062, 0.166107177734375, 0.17672348022460938, 0.18733978271484375, 0.19795608520507812, 0.2085723876953125, 0.21918869018554688, 0.22980499267578125, 0.24042129516601562, 0.25103759765625, 0.2616539001464844, 0.27227020263671875, 0.2828865051269531, 0.2935028076171875, 0.3041191101074219, 0.31473541259765625, 0.3253517150878906, 0.335968017578125, 0.3465843200683594, 0.35720062255859375, 0.3678169250488281, 0.3784332275390625, 0.3890495300292969, 0.39966583251953125, 0.4102821350097656, 0.4208984375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 6.0, 8.0, 12.0, 11.0, 24.0, 20.0, 18.0, 21.0, 25.0, 24.0, 45.0, 41.0, 38.0, 45.0, 48.0, 53.0, 46.0, 50.0, 62.0, 47.0, 36.0, 36.0, 35.0, 32.0, 50.0, 34.0, 28.0, 22.0, 19.0, 8.0, 10.0, 8.0, 13.0, 5.0, 6.0, 3.0, 1.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0843505859375, -0.08154010772705078, -0.07872962951660156, -0.07591915130615234, -0.07310867309570312, -0.0702981948852539, -0.06748771667480469, -0.06467723846435547, -0.06186676025390625, -0.05905628204345703, -0.05624580383300781, -0.053435325622558594, -0.050624847412109375, -0.047814369201660156, -0.04500389099121094, -0.04219341278076172, -0.0393829345703125, -0.03657245635986328, -0.03376197814941406, -0.030951499938964844, -0.028141021728515625, -0.025330543518066406, -0.022520065307617188, -0.01970958709716797, -0.01689910888671875, -0.014088630676269531, -0.011278152465820312, -0.008467674255371094, -0.005657196044921875, -0.0028467178344726562, -3.62396240234375e-05, 0.0027742385864257812, 0.005584716796875, 0.008395195007324219, 0.011205673217773438, 0.014016151428222656, 0.016826629638671875, 0.019637107849121094, 0.022447586059570312, 0.02525806427001953, 0.02806854248046875, 0.03087902069091797, 0.03368949890136719, 0.036499977111816406, 0.039310455322265625, 0.042120933532714844, 0.04493141174316406, 0.04774188995361328, 0.0505523681640625, 0.05336284637451172, 0.05617332458496094, 0.058983802795410156, 0.061794281005859375, 0.0646047592163086, 0.06741523742675781, 0.07022571563720703, 0.07303619384765625, 0.07584667205810547, 0.07865715026855469, 0.0814676284790039, 0.08427810668945312, 0.08708858489990234, 0.08989906311035156, 0.09270954132080078, 0.09552001953125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 4.0, 3.0, 3.0, 4.0, 11.0, 21.0, 26.0, 30.0, 51.0, 94.0, 152.0, 260.0, 515.0, 812.0, 1741.0, 3692.0, 10770.0, 93109.0, 3670113.0, 382404.0, 20198.0, 5350.0, 2249.0, 1157.0, 618.0, 374.0, 195.0, 128.0, 73.0, 34.0, 31.0, 17.0, 14.0, 12.0, 5.0, 3.0, 5.0, 2.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26318359375, -0.2529335021972656, -0.24268341064453125, -0.23243331909179688, -0.2221832275390625, -0.21193313598632812, -0.20168304443359375, -0.19143295288085938, -0.181182861328125, -0.17093276977539062, -0.16068267822265625, -0.15043258666992188, -0.1401824951171875, -0.12993240356445312, -0.11968231201171875, -0.10943222045898438, -0.09918212890625, -0.08893203735351562, -0.07868194580078125, -0.06843185424804688, -0.0581817626953125, -0.047931671142578125, -0.03768157958984375, -0.027431488037109375, -0.017181396484375, -0.006931304931640625, 0.00331878662109375, 0.013568878173828125, 0.0238189697265625, 0.034069061279296875, 0.04431915283203125, 0.054569244384765625, 0.0648193359375, 0.07506942749023438, 0.08531951904296875, 0.09556961059570312, 0.1058197021484375, 0.11606979370117188, 0.12631988525390625, 0.13656997680664062, 0.146820068359375, 0.15707015991210938, 0.16732025146484375, 0.17757034301757812, 0.1878204345703125, 0.19807052612304688, 0.20832061767578125, 0.21857070922851562, 0.22882080078125, 0.23907089233398438, 0.24932098388671875, 0.2595710754394531, 0.2698211669921875, 0.2800712585449219, 0.29032135009765625, 0.3005714416503906, 0.310821533203125, 0.3210716247558594, 0.33132171630859375, 0.3415718078613281, 0.3518218994140625, 0.3620719909667969, 0.37232208251953125, 0.3825721740722656, 0.392822265625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 5.0, 3.0, 7.0, 7.0, 10.0, 24.0, 42.0, 93.0, 183.0, 422.0, 866.0, 1094.0, 729.0, 282.0, 127.0, 76.0, 40.0, 18.0, 20.0, 7.0, 7.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.276123046875, -0.2663421630859375, -0.256561279296875, -0.2467803955078125, -0.23699951171875, -0.2272186279296875, -0.217437744140625, -0.2076568603515625, -0.1978759765625, -0.1880950927734375, -0.178314208984375, -0.1685333251953125, -0.15875244140625, -0.1489715576171875, -0.139190673828125, -0.1294097900390625, -0.11962890625, -0.1098480224609375, -0.100067138671875, -0.0902862548828125, -0.08050537109375, -0.0707244873046875, -0.060943603515625, -0.0511627197265625, -0.0413818359375, -0.0316009521484375, -0.021820068359375, -0.0120391845703125, -0.00225830078125, 0.0075225830078125, 0.017303466796875, 0.0270843505859375, 0.036865234375, 0.0466461181640625, 0.056427001953125, 0.0662078857421875, 0.07598876953125, 0.0857696533203125, 0.095550537109375, 0.1053314208984375, 0.1151123046875, 0.1248931884765625, 0.134674072265625, 0.1444549560546875, 0.15423583984375, 0.1640167236328125, 0.173797607421875, 0.1835784912109375, 0.193359375, 0.2031402587890625, 0.212921142578125, 0.2227020263671875, 0.23248291015625, 0.2422637939453125, 0.252044677734375, 0.2618255615234375, 0.2716064453125, 0.2813873291015625, 0.291168212890625, 0.3009490966796875, 0.31072998046875, 0.3205108642578125, 0.330291748046875, 0.3400726318359375, 0.349853515625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 3.0, 7.0, 12.0, 24.0, 45.0, 104.0, 191.0, 275.0, 172.0, 95.0, 29.0, 21.0, 1.0, 3.0, 5.0, 3.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9455642700195312, -1.8582165241241455, -1.7708687782287598, -1.683521032333374, -1.5961732864379883, -1.5088255405426025, -1.4214777946472168, -1.334130048751831, -1.2467823028564453, -1.1594345569610596, -1.0720868110656738, -0.9847390651702881, -0.8973913192749023, -0.8100435733795166, -0.7226957678794861, -0.6353480219841003, -0.5480002164840698, -0.4606524705886841, -0.37330472469329834, -0.2859569489955902, -0.19860920310020447, -0.11126145720481873, -0.023913681507110596, 0.06343406438827515, 0.1507818102836609, 0.23812955617904663, 0.3254773020744324, 0.4128250777721405, 0.5001728534698486, 0.5875205993652344, 0.6748683452606201, 0.7622160911560059, 0.8495638370513916, 0.9369115829467773, 1.024259328842163, 1.1116070747375488, 1.1989548206329346, 1.2863025665283203, 1.373650312423706, 1.4609980583190918, 1.5483458042144775, 1.6356935501098633, 1.723041296005249, 1.8103890419006348, 1.8977367877960205, 1.9850845336914062, 2.072432279586792, 2.1597800254821777, 2.2471280097961426, 2.3344757556915283, 2.421823501586914, 2.5091712474823, 2.5965189933776855, 2.6838667392730713, 2.771214485168457, 2.8585622310638428, 2.9459099769592285, 3.0332577228546143, 3.12060546875, 3.2079532146453857, 3.2953009605407715, 3.3826487064361572, 3.469996452331543, 3.5573441982269287, 3.6446919441223145]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 6.0, 8.0, 10.0, 26.0, 34.0, 43.0, 49.0, 67.0, 66.0, 81.0, 81.0, 98.0, 76.0, 82.0, 68.0, 57.0, 51.0, 38.0, 22.0, 15.0, 14.0, 7.0, 5.0, 3.0, 0.0, 1.0, 1.0], "bins": [-2.4637389183044434, -2.413572072982788, -2.363405227661133, -2.3132386207580566, -2.2630717754364014, -2.212904930114746, -2.16273832321167, -2.1125714778900146, -2.0624046325683594, -2.012237787246704, -1.9620710611343384, -1.9119043350219727, -1.8617374897003174, -1.811570644378662, -1.7614039182662964, -1.7112371921539307, -1.6610703468322754, -1.6109035015106201, -1.5607367753982544, -1.5105700492858887, -1.4604032039642334, -1.4102363586425781, -1.3600696325302124, -1.3099029064178467, -1.2597360610961914, -1.2095692157745361, -1.1594024896621704, -1.1092357635498047, -1.0590689182281494, -1.0089020729064941, -0.9587353467941284, -0.9085685610771179, -0.8584018349647522, -0.8082350492477417, -0.7580682635307312, -0.7079014778137207, -0.6577346920967102, -0.6075679063796997, -0.5574011206626892, -0.5072343349456787, -0.4570675492286682, -0.4069007635116577, -0.3567339777946472, -0.3065671920776367, -0.2564004063606262, -0.20623362064361572, -0.15606683492660522, -0.10590004920959473, -0.05573326349258423, -0.0055664777755737305, 0.04460030794143677, 0.09476709365844727, 0.14493387937545776, 0.19510066509246826, 0.24526745080947876, 0.29543423652648926, 0.34560102224349976, 0.39576780796051025, 0.44593459367752075, 0.49610137939453125, 0.5462681651115417, 0.5964349508285522, 0.6466017365455627, 0.6967685222625732, 0.7469353079795837]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 2.0, 1.0, 3.0, 4.0, 13.0, 11.0, 22.0, 32.0, 65.0, 87.0, 186.0, 470.0, 1615.0, 8281.0, 94634.0, 788254.0, 141041.0, 10720.0, 2026.0, 610.0, 201.0, 111.0, 54.0, 47.0, 28.0, 16.0, 7.0, 6.0, 6.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.294921875, -0.28338623046875, -0.2718505859375, -0.26031494140625, -0.248779296875, -0.23724365234375, -0.2257080078125, -0.21417236328125, -0.20263671875, -0.19110107421875, -0.1795654296875, -0.16802978515625, -0.156494140625, -0.14495849609375, -0.1334228515625, -0.12188720703125, -0.1103515625, -0.09881591796875, -0.0872802734375, -0.07574462890625, -0.064208984375, -0.05267333984375, -0.0411376953125, -0.02960205078125, -0.01806640625, -0.00653076171875, 0.0050048828125, 0.01654052734375, 0.028076171875, 0.03961181640625, 0.0511474609375, 0.06268310546875, 0.07421875, 0.08575439453125, 0.0972900390625, 0.10882568359375, 0.120361328125, 0.13189697265625, 0.1434326171875, 0.15496826171875, 0.16650390625, 0.17803955078125, 0.1895751953125, 0.20111083984375, 0.212646484375, 0.22418212890625, 0.2357177734375, 0.24725341796875, 0.2587890625, 0.27032470703125, 0.2818603515625, 0.29339599609375, 0.304931640625, 0.31646728515625, 0.3280029296875, 0.33953857421875, 0.35107421875, 0.36260986328125, 0.3741455078125, 0.38568115234375, 0.397216796875, 0.40875244140625, 0.4202880859375, 0.43182373046875, 0.443359375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 6.0, 5.0, 10.0, 13.0, 15.0, 9.0, 17.0, 18.0, 32.0, 46.0, 49.0, 62.0, 65.0, 50.0, 52.0, 76.0, 57.0, 49.0, 58.0, 51.0, 43.0, 54.0, 27.0, 36.0, 28.0, 24.0, 16.0, 9.0, 12.0, 9.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.1597900390625, -0.15606021881103516, -0.1523303985595703, -0.14860057830810547, -0.14487075805664062, -0.14114093780517578, -0.13741111755371094, -0.1336812973022461, -0.12995147705078125, -0.1262216567993164, -0.12249183654785156, -0.11876201629638672, -0.11503219604492188, -0.11130237579345703, -0.10757255554199219, -0.10384273529052734, -0.1001129150390625, -0.09638309478759766, -0.09265327453613281, -0.08892345428466797, -0.08519363403320312, -0.08146381378173828, -0.07773399353027344, -0.0740041732788086, -0.07027435302734375, -0.0665445327758789, -0.06281471252441406, -0.05908489227294922, -0.055355072021484375, -0.05162525177001953, -0.04789543151855469, -0.044165611267089844, -0.040435791015625, -0.036705970764160156, -0.03297615051269531, -0.02924633026123047, -0.025516510009765625, -0.02178668975830078, -0.018056869506835938, -0.014327049255371094, -0.01059722900390625, -0.006867408752441406, -0.0031375885009765625, 0.0005922317504882812, 0.004322052001953125, 0.008051872253417969, 0.011781692504882812, 0.015511512756347656, 0.0192413330078125, 0.022971153259277344, 0.026700973510742188, 0.03043079376220703, 0.034160614013671875, 0.03789043426513672, 0.04162025451660156, 0.045350074768066406, 0.04907989501953125, 0.052809715270996094, 0.05653953552246094, 0.06026935577392578, 0.06399917602539062, 0.06772899627685547, 0.07145881652832031, 0.07518863677978516, 0.07891845703125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 5.0, 4.0, 3.0, 11.0, 14.0, 16.0, 30.0, 35.0, 66.0, 93.0, 153.0, 253.0, 456.0, 1142.0, 3221.0, 11831.0, 68412.0, 634255.0, 280606.0, 36612.0, 7340.0, 2223.0, 794.0, 392.0, 194.0, 132.0, 95.0, 42.0, 41.0, 22.0, 24.0, 14.0, 10.0, 5.0, 2.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2349853515625, -0.2271099090576172, -0.21923446655273438, -0.21135902404785156, -0.20348358154296875, -0.19560813903808594, -0.18773269653320312, -0.1798572540283203, -0.1719818115234375, -0.1641063690185547, -0.15623092651367188, -0.14835548400878906, -0.14048004150390625, -0.13260459899902344, -0.12472915649414062, -0.11685371398925781, -0.108978271484375, -0.10110282897949219, -0.09322738647460938, -0.08535194396972656, -0.07747650146484375, -0.06960105895996094, -0.061725616455078125, -0.05385017395019531, -0.0459747314453125, -0.03809928894042969, -0.030223846435546875, -0.022348403930664062, -0.01447296142578125, -0.0065975189208984375, 0.001277923583984375, 0.009153366088867188, 0.01702880859375, 0.024904251098632812, 0.032779693603515625, 0.04065513610839844, 0.04853057861328125, 0.05640602111816406, 0.06428146362304688, 0.07215690612792969, 0.0800323486328125, 0.08790779113769531, 0.09578323364257812, 0.10365867614746094, 0.11153411865234375, 0.11940956115722656, 0.12728500366210938, 0.1351604461669922, 0.143035888671875, 0.1509113311767578, 0.15878677368164062, 0.16666221618652344, 0.17453765869140625, 0.18241310119628906, 0.19028854370117188, 0.1981639862060547, 0.2060394287109375, 0.2139148712158203, 0.22179031372070312, 0.22966575622558594, 0.23754119873046875, 0.24541664123535156, 0.2532920837402344, 0.2611675262451172, 0.26904296875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 7.0, 8.0, 6.0, 10.0, 10.0, 13.0, 16.0, 17.0, 20.0, 25.0, 28.0, 30.0, 48.0, 35.0, 54.0, 41.0, 57.0, 56.0, 65.0, 62.0, 40.0, 51.0, 51.0, 40.0, 39.0, 34.0, 21.0, 26.0, 20.0, 17.0, 12.0, 10.0, 10.0, 4.0, 5.0, 3.0, 1.0, 5.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.367919921875, -0.3560981750488281, -0.34427642822265625, -0.3324546813964844, -0.3206329345703125, -0.3088111877441406, -0.29698944091796875, -0.2851676940917969, -0.273345947265625, -0.2615242004394531, -0.24970245361328125, -0.23788070678710938, -0.2260589599609375, -0.21423721313476562, -0.20241546630859375, -0.19059371948242188, -0.17877197265625, -0.16695022583007812, -0.15512847900390625, -0.14330673217773438, -0.1314849853515625, -0.11966323852539062, -0.10784149169921875, -0.09601974487304688, -0.084197998046875, -0.07237625122070312, -0.06055450439453125, -0.048732757568359375, -0.0369110107421875, -0.025089263916015625, -0.01326751708984375, -0.001445770263671875, 0.0103759765625, 0.022197723388671875, 0.03401947021484375, 0.045841217041015625, 0.0576629638671875, 0.06948471069335938, 0.08130645751953125, 0.09312820434570312, 0.104949951171875, 0.11677169799804688, 0.12859344482421875, 0.14041519165039062, 0.1522369384765625, 0.16405868530273438, 0.17588043212890625, 0.18770217895507812, 0.19952392578125, 0.21134567260742188, 0.22316741943359375, 0.23498916625976562, 0.2468109130859375, 0.2586326599121094, 0.27045440673828125, 0.2822761535644531, 0.294097900390625, 0.3059196472167969, 0.31774139404296875, 0.3295631408691406, 0.3413848876953125, 0.3532066345214844, 0.36502838134765625, 0.3768501281738281, 0.388671875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 2.0, 8.0, 7.0, 7.0, 7.0, 20.0, 26.0, 41.0, 69.0, 115.0, 245.0, 433.0, 970.0, 2297.0, 6391.0, 22950.0, 125836.0, 725951.0, 128760.0, 23352.0, 6696.0, 2351.0, 1015.0, 446.0, 241.0, 122.0, 62.0, 47.0, 39.0, 9.0, 13.0, 7.0, 7.0, 4.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10992431640625, -0.1066436767578125, -0.103363037109375, -0.1000823974609375, -0.0968017578125, -0.0935211181640625, -0.090240478515625, -0.0869598388671875, -0.08367919921875, -0.0803985595703125, -0.077117919921875, -0.0738372802734375, -0.070556640625, -0.0672760009765625, -0.063995361328125, -0.0607147216796875, -0.05743408203125, -0.0541534423828125, -0.050872802734375, -0.0475921630859375, -0.0443115234375, -0.0410308837890625, -0.037750244140625, -0.0344696044921875, -0.03118896484375, -0.0279083251953125, -0.024627685546875, -0.0213470458984375, -0.01806640625, -0.0147857666015625, -0.011505126953125, -0.0082244873046875, -0.00494384765625, -0.0016632080078125, 0.001617431640625, 0.0048980712890625, 0.0081787109375, 0.0114593505859375, 0.014739990234375, 0.0180206298828125, 0.02130126953125, 0.0245819091796875, 0.027862548828125, 0.0311431884765625, 0.034423828125, 0.0377044677734375, 0.040985107421875, 0.0442657470703125, 0.04754638671875, 0.0508270263671875, 0.054107666015625, 0.0573883056640625, 0.0606689453125, 0.0639495849609375, 0.067230224609375, 0.0705108642578125, 0.07379150390625, 0.0770721435546875, 0.080352783203125, 0.0836334228515625, 0.0869140625, 0.0901947021484375, 0.093475341796875, 0.0967559814453125, 0.10003662109375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 6.0, 20.0, 12.0, 25.0, 39.0, 66.0, 105.0, 129.0, 156.0, 136.0, 120.0, 57.0, 54.0, 24.0, 16.0, 10.0, 10.0, 2.0, 5.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.269050598144531e-05, -5.0838105380535126e-05, -4.898570477962494e-05, -4.713330417871475e-05, -4.5280903577804565e-05, -4.342850297689438e-05, -4.157610237598419e-05, -3.9723701775074005e-05, -3.787130117416382e-05, -3.601890057325363e-05, -3.4166499972343445e-05, -3.231409937143326e-05, -3.046169877052307e-05, -2.8609298169612885e-05, -2.6756897568702698e-05, -2.490449696779251e-05, -2.3052096366882324e-05, -2.1199695765972137e-05, -1.934729516506195e-05, -1.7494894564151764e-05, -1.5642493963241577e-05, -1.379009336233139e-05, -1.1937692761421204e-05, -1.0085292160511017e-05, -8.23289155960083e-06, -6.380490958690643e-06, -4.5280903577804565e-06, -2.6756897568702698e-06, -8.23289155960083e-07, 1.0291114449501038e-06, 2.8815120458602905e-06, 4.733912646770477e-06, 6.586313247680664e-06, 8.43871384859085e-06, 1.0291114449501038e-05, 1.2143515050411224e-05, 1.3995915651321411e-05, 1.5848316252231598e-05, 1.7700716853141785e-05, 1.955311745405197e-05, 2.1405518054962158e-05, 2.3257918655872345e-05, 2.5110319256782532e-05, 2.696271985769272e-05, 2.8815120458602905e-05, 3.066752105951309e-05, 3.251992166042328e-05, 3.4372322261333466e-05, 3.622472286224365e-05, 3.807712346315384e-05, 3.9929524064064026e-05, 4.178192466497421e-05, 4.36343252658844e-05, 4.5486725866794586e-05, 4.733912646770477e-05, 4.919152706861496e-05, 5.1043927669525146e-05, 5.289632827043533e-05, 5.474872887134552e-05, 5.660112947225571e-05, 5.8453530073165894e-05, 6.030593067407608e-05, 6.215833127498627e-05, 6.401073187589645e-05, 6.586313247680664e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 8.0, 7.0, 4.0, 6.0, 8.0, 18.0, 25.0, 29.0, 55.0, 79.0, 139.0, 230.0, 405.0, 784.0, 1538.0, 3454.0, 8135.0, 22376.0, 80776.0, 539000.0, 297651.0, 62281.0, 18505.0, 7097.0, 2972.0, 1349.0, 730.0, 367.0, 199.0, 105.0, 70.0, 38.0, 29.0, 19.0, 26.0, 8.0, 13.0, 3.0, 7.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0718994140625, -0.06932353973388672, -0.06674766540527344, -0.06417179107666016, -0.061595916748046875, -0.059020042419433594, -0.05644416809082031, -0.05386829376220703, -0.05129241943359375, -0.04871654510498047, -0.04614067077636719, -0.043564796447753906, -0.040988922119140625, -0.038413047790527344, -0.03583717346191406, -0.03326129913330078, -0.0306854248046875, -0.02810955047607422, -0.025533676147460938, -0.022957801818847656, -0.020381927490234375, -0.017806053161621094, -0.015230178833007812, -0.012654304504394531, -0.01007843017578125, -0.007502555847167969, -0.0049266815185546875, -0.0023508071899414062, 0.000225067138671875, 0.0028009414672851562, 0.0053768157958984375, 0.007952690124511719, 0.010528564453125, 0.013104438781738281, 0.015680313110351562, 0.018256187438964844, 0.020832061767578125, 0.023407936096191406, 0.025983810424804688, 0.02855968475341797, 0.03113555908203125, 0.03371143341064453, 0.03628730773925781, 0.038863182067871094, 0.041439056396484375, 0.044014930725097656, 0.04659080505371094, 0.04916667938232422, 0.0517425537109375, 0.05431842803955078, 0.05689430236816406, 0.059470176696777344, 0.062046051025390625, 0.0646219253540039, 0.06719779968261719, 0.06977367401123047, 0.07234954833984375, 0.07492542266845703, 0.07750129699707031, 0.0800771713256836, 0.08265304565429688, 0.08522891998291016, 0.08780479431152344, 0.09038066864013672, 0.09295654296875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 5.0, 7.0, 15.0, 11.0, 10.0, 23.0, 27.0, 34.0, 40.0, 63.0, 90.0, 81.0, 93.0, 88.0, 92.0, 69.0, 69.0, 44.0, 35.0, 23.0, 12.0, 20.0, 11.0, 9.0, 10.0, 3.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.10260009765625, -0.09984207153320312, -0.09708404541015625, -0.09432601928710938, -0.0915679931640625, -0.08880996704101562, -0.08605194091796875, -0.08329391479492188, -0.080535888671875, -0.07777786254882812, -0.07501983642578125, -0.07226181030273438, -0.0695037841796875, -0.06674575805664062, -0.06398773193359375, -0.061229705810546875, -0.0584716796875, -0.055713653564453125, -0.05295562744140625, -0.050197601318359375, -0.0474395751953125, -0.044681549072265625, -0.04192352294921875, -0.039165496826171875, -0.036407470703125, -0.033649444580078125, -0.03089141845703125, -0.028133392333984375, -0.0253753662109375, -0.022617340087890625, -0.01985931396484375, -0.017101287841796875, -0.01434326171875, -0.011585235595703125, -0.00882720947265625, -0.006069183349609375, -0.0033111572265625, -0.000553131103515625, 0.00220489501953125, 0.004962921142578125, 0.007720947265625, 0.010478973388671875, 0.01323699951171875, 0.015995025634765625, 0.0187530517578125, 0.021511077880859375, 0.02426910400390625, 0.027027130126953125, 0.02978515625, 0.032543182373046875, 0.03530120849609375, 0.038059234619140625, 0.0408172607421875, 0.043575286865234375, 0.04633331298828125, 0.049091339111328125, 0.051849365234375, 0.054607391357421875, 0.05736541748046875, 0.060123443603515625, 0.0628814697265625, 0.06563949584960938, 0.06839752197265625, 0.07115554809570312, 0.07391357421875]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 2.0, 3.0, 10.0, 9.0, 23.0, 38.0, 73.0, 114.0, 265.0, 270.0, 102.0, 53.0, 14.0, 6.0, 9.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.4403464794158936, -2.3665807247161865, -2.2928147315979004, -2.2190489768981934, -2.1452829837799072, -2.0715172290802, -1.9977513551712036, -1.923985481262207, -1.8502196073532104, -1.7764537334442139, -1.7026878595352173, -1.6289219856262207, -1.5551562309265137, -1.4813902378082275, -1.4076244831085205, -1.333858609199524, -1.2600927352905273, -1.1863268613815308, -1.1125609874725342, -1.0387951135635376, -0.9650292992591858, -0.8912634253501892, -0.8174976110458374, -0.7437317371368408, -0.6699658632278442, -0.5961999893188477, -0.5224341154098511, -0.44866830110549927, -0.3749024271965027, -0.3011365532875061, -0.2273707091808319, -0.15360486507415771, -0.07983922958374023, -0.006073370575904846, 0.06769248843193054, 0.14145834743976593, 0.21522420644760132, 0.2889900803565979, 0.3627559244632721, 0.4365217685699463, 0.5102876424789429, 0.5840535163879395, 0.657819390296936, 0.7315852046012878, 0.8053510785102844, 0.879116952419281, 0.9528827667236328, 1.0266486406326294, 1.100414514541626, 1.1741803884506226, 1.2479462623596191, 1.3217121362686157, 1.3954780101776123, 1.4692437648773193, 1.543009638786316, 1.6167755126953125, 1.690541386604309, 1.7643072605133057, 1.8380731344223022, 1.9118390083312988, 1.9856047630310059, 2.059370756149292, 2.133136510848999, 2.206902503967285, 2.280668258666992]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 4.0, 5.0, 7.0, 4.0, 15.0, 20.0, 16.0, 19.0, 16.0, 26.0, 33.0, 26.0, 47.0, 28.0, 41.0, 67.0, 92.0, 81.0, 86.0, 65.0, 51.0, 43.0, 41.0, 38.0, 23.0, 23.0, 17.0, 21.0, 11.0, 10.0, 8.0, 10.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2091469764709473, -1.1628299951553345, -1.1165128946304321, -1.0701959133148193, -1.0238789319992065, -0.977561891078949, -0.9312448501586914, -0.8849278688430786, -0.8386108875274658, -0.7922938466072083, -0.7459768652915955, -0.6996598243713379, -0.6533428430557251, -0.6070258021354675, -0.56070876121521, -0.5143917798995972, -0.4680747389793396, -0.4217577278614044, -0.37544071674346924, -0.32912367582321167, -0.2828066945075989, -0.2364896684885025, -0.19017264246940613, -0.14385563135147095, -0.09753862023353577, -0.05122160539031029, -0.004904590547084808, 0.04141242802143097, 0.08772943913936615, 0.13404645025730133, 0.1803634762763977, 0.22668048739433289, 0.27299749851226807, 0.31931450963020325, 0.3656315207481384, 0.411948561668396, 0.4582655429840088, 0.5045825839042664, 0.5508996248245239, 0.5972166061401367, 0.6435335874557495, 0.6898506283760071, 0.7361676096916199, 0.7824846506118774, 0.8288016319274902, 0.8751186728477478, 0.9214357137680054, 0.9677526950836182, 1.0140697956085205, 1.0603867769241333, 1.1067038774490356, 1.1530208587646484, 1.1993378400802612, 1.245654821395874, 1.2919719219207764, 1.3382889032363892, 1.384605884552002, 1.4309228658676147, 1.477239966392517, 1.5235569477081299, 1.5698739290237427, 1.6161909103393555, 1.6625080108642578, 1.7088249921798706, 1.7551419734954834]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 3.0, 3.0, 4.0, 4.0, 10.0, 6.0, 7.0, 15.0, 7.0, 17.0, 31.0, 51.0, 48.0, 77.0, 114.0, 220.0, 414.0, 775.0, 2008.0, 7420.0, 57410.0, 1864168.0, 2180270.0, 66696.0, 9591.0, 2803.0, 1091.0, 506.0, 212.0, 136.0, 70.0, 41.0, 21.0, 14.0, 8.0, 5.0, 5.0, 3.0, 0.0, 2.0, 2.0], "bins": [-0.32666015625, -0.31940460205078125, -0.3121490478515625, -0.30489349365234375, -0.297637939453125, -0.29038238525390625, -0.2831268310546875, -0.27587127685546875, -0.26861572265625, -0.26136016845703125, -0.2541046142578125, -0.24684906005859375, -0.239593505859375, -0.23233795166015625, -0.2250823974609375, -0.21782684326171875, -0.2105712890625, -0.20331573486328125, -0.1960601806640625, -0.18880462646484375, -0.181549072265625, -0.17429351806640625, -0.1670379638671875, -0.15978240966796875, -0.15252685546875, -0.14527130126953125, -0.1380157470703125, -0.13076019287109375, -0.123504638671875, -0.11624908447265625, -0.1089935302734375, -0.10173797607421875, -0.094482421875, -0.08722686767578125, -0.0799713134765625, -0.07271575927734375, -0.065460205078125, -0.05820465087890625, -0.0509490966796875, -0.04369354248046875, -0.03643798828125, -0.02918243408203125, -0.0219268798828125, -0.01467132568359375, -0.007415771484375, -0.00016021728515625, 0.0070953369140625, 0.01435089111328125, 0.0216064453125, 0.02886199951171875, 0.0361175537109375, 0.04337310791015625, 0.050628662109375, 0.05788421630859375, 0.0651397705078125, 0.07239532470703125, 0.07965087890625, 0.08690643310546875, 0.0941619873046875, 0.10141754150390625, 0.108673095703125, 0.11592864990234375, 0.1231842041015625, 0.13043975830078125, 0.1376953125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 7.0, 11.0, 16.0, 22.0, 32.0, 48.0, 68.0, 69.0, 91.0, 76.0, 78.0, 71.0, 86.0, 75.0, 63.0, 56.0, 38.0, 28.0, 19.0, 18.0, 14.0, 5.0, 5.0, 5.0, 3.0, 1.0, 1.0, 2.0], "bins": [-0.2362060546875, -0.23117351531982422, -0.22614097595214844, -0.22110843658447266, -0.21607589721679688, -0.2110433578491211, -0.2060108184814453, -0.20097827911376953, -0.19594573974609375, -0.19091320037841797, -0.1858806610107422, -0.1808481216430664, -0.17581558227539062, -0.17078304290771484, -0.16575050354003906, -0.16071796417236328, -0.1556854248046875, -0.15065288543701172, -0.14562034606933594, -0.14058780670166016, -0.13555526733398438, -0.1305227279663086, -0.1254901885986328, -0.12045764923095703, -0.11542510986328125, -0.11039257049560547, -0.10536003112792969, -0.1003274917602539, -0.09529495239257812, -0.09026241302490234, -0.08522987365722656, -0.08019733428955078, -0.075164794921875, -0.07013225555419922, -0.06509971618652344, -0.060067176818847656, -0.055034637451171875, -0.050002098083496094, -0.04496955871582031, -0.03993701934814453, -0.03490447998046875, -0.02987194061279297, -0.024839401245117188, -0.019806861877441406, -0.014774322509765625, -0.009741783142089844, -0.0047092437744140625, 0.00032329559326171875, 0.0053558349609375, 0.010388374328613281, 0.015420913696289062, 0.020453453063964844, 0.025485992431640625, 0.030518531799316406, 0.03555107116699219, 0.04058361053466797, 0.04561614990234375, 0.05064868927001953, 0.05568122863769531, 0.060713768005371094, 0.06574630737304688, 0.07077884674072266, 0.07581138610839844, 0.08084392547607422, 0.08587646484375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 10.0, 13.0, 20.0, 40.0, 113.0, 302.0, 1043.0, 7490.0, 1690503.0, 2484820.0, 8248.0, 1069.0, 381.0, 121.0, 59.0, 24.0, 16.0, 7.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5166015625, -0.49880218505859375, -0.4810028076171875, -0.46320343017578125, -0.445404052734375, -0.42760467529296875, -0.4098052978515625, -0.39200592041015625, -0.37420654296875, -0.35640716552734375, -0.3386077880859375, -0.32080841064453125, -0.303009033203125, -0.28520965576171875, -0.2674102783203125, -0.24961090087890625, -0.2318115234375, -0.21401214599609375, -0.1962127685546875, -0.17841339111328125, -0.160614013671875, -0.14281463623046875, -0.1250152587890625, -0.10721588134765625, -0.08941650390625, -0.07161712646484375, -0.0538177490234375, -0.03601837158203125, -0.018218994140625, -0.00041961669921875, 0.0173797607421875, 0.03517913818359375, 0.052978515625, 0.07077789306640625, 0.0885772705078125, 0.10637664794921875, 0.124176025390625, 0.14197540283203125, 0.1597747802734375, 0.17757415771484375, 0.19537353515625, 0.21317291259765625, 0.2309722900390625, 0.24877166748046875, 0.266571044921875, 0.28437042236328125, 0.3021697998046875, 0.31996917724609375, 0.3377685546875, 0.35556793212890625, 0.3733673095703125, 0.39116668701171875, 0.408966064453125, 0.42676544189453125, 0.4445648193359375, 0.46236419677734375, 0.48016357421875, 0.49796295166015625, 0.5157623291015625, 0.5335617065429688, 0.551361083984375, 0.5691604614257812, 0.5869598388671875, 0.6047592163085938, 0.62255859375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 4.0, 0.0, 1.0, 3.0, 7.0, 4.0, 10.0, 12.0, 24.0, 35.0, 66.0, 114.0, 195.0, 358.0, 636.0, 924.0, 727.0, 421.0, 221.0, 124.0, 81.0, 48.0, 28.0, 7.0, 8.0, 7.0, 7.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.216796875, -0.2092132568359375, -0.201629638671875, -0.1940460205078125, -0.18646240234375, -0.1788787841796875, -0.171295166015625, -0.1637115478515625, -0.1561279296875, -0.1485443115234375, -0.140960693359375, -0.1333770751953125, -0.12579345703125, -0.1182098388671875, -0.110626220703125, -0.1030426025390625, -0.095458984375, -0.0878753662109375, -0.080291748046875, -0.0727081298828125, -0.06512451171875, -0.0575408935546875, -0.049957275390625, -0.0423736572265625, -0.0347900390625, -0.0272064208984375, -0.019622802734375, -0.0120391845703125, -0.00445556640625, 0.0031280517578125, 0.010711669921875, 0.0182952880859375, 0.02587890625, 0.0334625244140625, 0.041046142578125, 0.0486297607421875, 0.05621337890625, 0.0637969970703125, 0.071380615234375, 0.0789642333984375, 0.0865478515625, 0.0941314697265625, 0.101715087890625, 0.1092987060546875, 0.11688232421875, 0.1244659423828125, 0.132049560546875, 0.1396331787109375, 0.147216796875, 0.1548004150390625, 0.162384033203125, 0.1699676513671875, 0.17755126953125, 0.1851348876953125, 0.192718505859375, 0.2003021240234375, 0.2078857421875, 0.2154693603515625, 0.223052978515625, 0.2306365966796875, 0.23822021484375, 0.2458038330078125, 0.253387451171875, 0.2609710693359375, 0.2685546875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 10.0, 15.0, 34.0, 77.0, 168.0, 204.0, 209.0, 131.0, 82.0, 38.0, 14.0, 8.0, 5.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6589196920394897, -1.5832395553588867, -1.5075592994689941, -1.4318791627883911, -1.356199026107788, -1.2805187702178955, -1.2048386335372925, -1.1291584968566895, -1.0534782409667969, -0.9777980446815491, -0.9021178483963013, -0.8264377117156982, -0.7507575154304504, -0.6750773191452026, -0.5993971824645996, -0.5237169861793518, -0.448036789894104, -0.3723565936088562, -0.2966764271259308, -0.22099624574184418, -0.14531606435775757, -0.06963586807250977, 0.006044298410415649, 0.08172446489334106, 0.15740466117858887, 0.23308484256267548, 0.3087650239467621, 0.3844451904296875, 0.4601253867149353, 0.5358055830001831, 0.6114857196807861, 0.6871659159660339, 0.7628459930419922, 0.83852618932724, 0.9142063856124878, 0.9898865222930908, 1.0655667781829834, 1.1412469148635864, 1.2169270515441895, 1.292607307434082, 1.368287444114685, 1.443967580795288, 1.5196478366851807, 1.5953279733657837, 1.6710081100463867, 1.7466883659362793, 1.8223685026168823, 1.8980486392974854, 1.973728895187378, 2.0494091510772705, 2.125089168548584, 2.2007694244384766, 2.276449680328369, 2.3521299362182617, 2.427809953689575, 2.5034902095794678, 2.5791702270507812, 2.654850482940674, 2.7305305004119873, 2.80621075630188, 2.8818910121917725, 2.957571029663086, 3.0332512855529785, 3.108931541442871, 3.1846117973327637]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 3.0, 2.0, 6.0, 8.0, 15.0, 14.0, 19.0, 19.0, 23.0, 29.0, 32.0, 45.0, 55.0, 58.0, 54.0, 59.0, 65.0, 62.0, 54.0, 51.0, 52.0, 49.0, 38.0, 31.0, 34.0, 25.0, 20.0, 15.0, 21.0, 13.0, 8.0, 7.0, 8.0, 1.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.320117712020874, -1.2880189418792725, -1.2559202909469604, -1.2238215208053589, -1.1917227506637573, -1.1596240997314453, -1.1275253295898438, -1.0954265594482422, -1.0633279085159302, -1.0312291383743286, -0.9991304278373718, -0.967031717300415, -0.9349330067634583, -0.9028342962265015, -0.8707355260848999, -0.8386368155479431, -0.8065380454063416, -0.7744393348693848, -0.7423405647277832, -0.7102418541908264, -0.6781431436538696, -0.6460443735122681, -0.6139456629753113, -0.5818469524383545, -0.5497481822967529, -0.5176494717597961, -0.48555073142051697, -0.4534519910812378, -0.421353280544281, -0.38925454020500183, -0.35715579986572266, -0.32505708932876587, -0.29295843839645386, -0.2608596980571747, -0.2287609875202179, -0.19666224718093872, -0.16456352174282074, -0.13246479630470276, -0.10036605596542358, -0.0682673305273056, -0.03616860508918762, -0.004069875925779343, 0.028028853237628937, 0.060127586126327515, 0.0922263115644455, 0.12432503700256348, 0.15642377734184265, 0.18852250277996063, 0.2206212282180786, 0.2527199685573578, 0.2848186790943146, 0.31691741943359375, 0.34901612997055054, 0.3811148703098297, 0.4132136106491089, 0.4453123211860657, 0.47741106152534485, 0.509509801864624, 0.5416085124015808, 0.5737072229385376, 0.6058059930801392, 0.637904703617096, 0.6700034141540527, 0.7021021842956543, 0.7342008948326111]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 9.0, 5.0, 4.0, 5.0, 12.0, 19.0, 40.0, 46.0, 131.0, 299.0, 1068.0, 6229.0, 75211.0, 850993.0, 104888.0, 7644.0, 1317.0, 363.0, 136.0, 63.0, 34.0, 9.0, 13.0, 7.0, 3.0, 6.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.49560546875, -0.48274993896484375, -0.4698944091796875, -0.45703887939453125, -0.444183349609375, -0.43132781982421875, -0.4184722900390625, -0.40561676025390625, -0.39276123046875, -0.37990570068359375, -0.3670501708984375, -0.35419464111328125, -0.341339111328125, -0.32848358154296875, -0.3156280517578125, -0.30277252197265625, -0.2899169921875, -0.27706146240234375, -0.2642059326171875, -0.25135040283203125, -0.238494873046875, -0.22563934326171875, -0.2127838134765625, -0.19992828369140625, -0.18707275390625, -0.17421722412109375, -0.1613616943359375, -0.14850616455078125, -0.135650634765625, -0.12279510498046875, -0.1099395751953125, -0.09708404541015625, -0.084228515625, -0.07137298583984375, -0.0585174560546875, -0.04566192626953125, -0.032806396484375, -0.01995086669921875, -0.0070953369140625, 0.00576019287109375, 0.01861572265625, 0.03147125244140625, 0.0443267822265625, 0.05718231201171875, 0.070037841796875, 0.08289337158203125, 0.0957489013671875, 0.10860443115234375, 0.1214599609375, 0.13431549072265625, 0.1471710205078125, 0.16002655029296875, 0.172882080078125, 0.18573760986328125, 0.1985931396484375, 0.21144866943359375, 0.22430419921875, 0.23715972900390625, 0.2500152587890625, 0.26287078857421875, 0.275726318359375, 0.28858184814453125, 0.3014373779296875, 0.31429290771484375, 0.3271484375]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 2.0, 6.0, 10.0, 7.0, 20.0, 14.0, 14.0, 19.0, 23.0, 39.0, 31.0, 27.0, 46.0, 48.0, 44.0, 59.0, 51.0, 51.0, 42.0, 55.0, 60.0, 45.0, 44.0, 38.0, 39.0, 27.0, 25.0, 19.0, 21.0, 16.0, 14.0, 8.0, 5.0, 9.0, 5.0, 7.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0933837890625, -0.09024906158447266, -0.08711433410644531, -0.08397960662841797, -0.08084487915039062, -0.07771015167236328, -0.07457542419433594, -0.0714406967163086, -0.06830596923828125, -0.0651712417602539, -0.06203651428222656, -0.05890178680419922, -0.055767059326171875, -0.05263233184814453, -0.04949760437011719, -0.046362876892089844, -0.0432281494140625, -0.040093421936035156, -0.03695869445800781, -0.03382396697998047, -0.030689239501953125, -0.02755451202392578, -0.024419784545898438, -0.021285057067871094, -0.01815032958984375, -0.015015602111816406, -0.011880874633789062, -0.008746147155761719, -0.005611419677734375, -0.0024766921997070312, 0.0006580352783203125, 0.0037927627563476562, 0.006927490234375, 0.010062217712402344, 0.013196945190429688, 0.01633167266845703, 0.019466400146484375, 0.02260112762451172, 0.025735855102539062, 0.028870582580566406, 0.03200531005859375, 0.035140037536621094, 0.03827476501464844, 0.04140949249267578, 0.044544219970703125, 0.04767894744873047, 0.05081367492675781, 0.053948402404785156, 0.0570831298828125, 0.060217857360839844, 0.06335258483886719, 0.06648731231689453, 0.06962203979492188, 0.07275676727294922, 0.07589149475097656, 0.0790262222290039, 0.08216094970703125, 0.0852956771850586, 0.08843040466308594, 0.09156513214111328, 0.09469985961914062, 0.09783458709716797, 0.10096931457519531, 0.10410404205322266, 0.10723876953125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 4.0, 2.0, 7.0, 5.0, 7.0, 7.0, 17.0, 16.0, 22.0, 19.0, 33.0, 56.0, 77.0, 110.0, 160.0, 284.0, 473.0, 926.0, 2067.0, 6125.0, 25215.0, 191789.0, 725978.0, 75005.0, 13197.0, 3770.0, 1430.0, 654.0, 375.0, 212.0, 167.0, 86.0, 92.0, 44.0, 38.0, 22.0, 16.0, 16.0, 10.0, 7.0, 2.0, 6.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.281494140625, -0.273284912109375, -0.26507568359375, -0.256866455078125, -0.2486572265625, -0.240447998046875, -0.23223876953125, -0.224029541015625, -0.2158203125, -0.207611083984375, -0.19940185546875, -0.191192626953125, -0.1829833984375, -0.174774169921875, -0.16656494140625, -0.158355712890625, -0.150146484375, -0.141937255859375, -0.13372802734375, -0.125518798828125, -0.1173095703125, -0.109100341796875, -0.10089111328125, -0.092681884765625, -0.08447265625, -0.076263427734375, -0.06805419921875, -0.059844970703125, -0.0516357421875, -0.043426513671875, -0.03521728515625, -0.027008056640625, -0.018798828125, -0.010589599609375, -0.00238037109375, 0.005828857421875, 0.0140380859375, 0.022247314453125, 0.03045654296875, 0.038665771484375, 0.046875, 0.055084228515625, 0.06329345703125, 0.071502685546875, 0.0797119140625, 0.087921142578125, 0.09613037109375, 0.104339599609375, 0.112548828125, 0.120758056640625, 0.12896728515625, 0.137176513671875, 0.1453857421875, 0.153594970703125, 0.16180419921875, 0.170013427734375, 0.17822265625, 0.186431884765625, 0.19464111328125, 0.202850341796875, 0.2110595703125, 0.219268798828125, 0.22747802734375, 0.235687255859375, 0.243896484375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 0.0, 4.0, 0.0, 8.0, 6.0, 2.0, 11.0, 9.0, 15.0, 16.0, 20.0, 22.0, 28.0, 39.0, 34.0, 35.0, 41.0, 46.0, 55.0, 62.0, 54.0, 60.0, 46.0, 53.0, 62.0, 39.0, 35.0, 38.0, 32.0, 24.0, 27.0, 22.0, 14.0, 11.0, 8.0, 7.0, 9.0, 3.0, 3.0, 6.0, 4.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.298828125, -0.2868461608886719, -0.27486419677734375, -0.2628822326660156, -0.2509002685546875, -0.23891830444335938, -0.22693634033203125, -0.21495437622070312, -0.202972412109375, -0.19099044799804688, -0.17900848388671875, -0.16702651977539062, -0.1550445556640625, -0.14306259155273438, -0.13108062744140625, -0.11909866333007812, -0.10711669921875, -0.09513473510742188, -0.08315277099609375, -0.07117080688476562, -0.0591888427734375, -0.047206878662109375, -0.03522491455078125, -0.023242950439453125, -0.011260986328125, 0.000720977783203125, 0.01270294189453125, 0.024684906005859375, 0.0366668701171875, 0.048648834228515625, 0.06063079833984375, 0.07261276245117188, 0.0845947265625, 0.09657669067382812, 0.10855865478515625, 0.12054061889648438, 0.1325225830078125, 0.14450454711914062, 0.15648651123046875, 0.16846847534179688, 0.180450439453125, 0.19243240356445312, 0.20441436767578125, 0.21639633178710938, 0.2283782958984375, 0.24036026000976562, 0.25234222412109375, 0.2643241882324219, 0.27630615234375, 0.2882881164550781, 0.30027008056640625, 0.3122520446777344, 0.3242340087890625, 0.3362159729003906, 0.34819793701171875, 0.3601799011230469, 0.372161865234375, 0.3841438293457031, 0.39612579345703125, 0.4081077575683594, 0.4200897216796875, 0.4320716857910156, 0.44405364990234375, 0.4560356140136719, 0.468017578125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 8.0, 1.0, 8.0, 5.0, 17.0, 17.0, 23.0, 32.0, 37.0, 64.0, 95.0, 146.0, 224.0, 395.0, 644.0, 1057.0, 2016.0, 4227.0, 8899.0, 21752.0, 64411.0, 525434.0, 319633.0, 61061.0, 20955.0, 8573.0, 4120.0, 2067.0, 1036.0, 554.0, 381.0, 205.0, 142.0, 104.0, 64.0, 35.0, 34.0, 17.0, 15.0, 8.0, 8.0, 7.0, 8.0, 6.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0], "bins": [-0.07098388671875, -0.0688314437866211, -0.06667900085449219, -0.06452655792236328, -0.062374114990234375, -0.06022167205810547, -0.05806922912597656, -0.055916786193847656, -0.05376434326171875, -0.051611900329589844, -0.04945945739746094, -0.04730701446533203, -0.045154571533203125, -0.04300212860107422, -0.04084968566894531, -0.038697242736816406, -0.0365447998046875, -0.034392356872558594, -0.03223991394042969, -0.03008747100830078, -0.027935028076171875, -0.02578258514404297, -0.023630142211914062, -0.021477699279785156, -0.01932525634765625, -0.017172813415527344, -0.015020370483398438, -0.012867927551269531, -0.010715484619140625, -0.008563041687011719, -0.0064105987548828125, -0.004258155822753906, -0.002105712890625, 4.673004150390625e-05, 0.0021991729736328125, 0.004351615905761719, 0.006504058837890625, 0.008656501770019531, 0.010808944702148438, 0.012961387634277344, 0.01511383056640625, 0.017266273498535156, 0.019418716430664062, 0.02157115936279297, 0.023723602294921875, 0.02587604522705078, 0.028028488159179688, 0.030180931091308594, 0.0323333740234375, 0.034485816955566406, 0.03663825988769531, 0.03879070281982422, 0.040943145751953125, 0.04309558868408203, 0.04524803161621094, 0.047400474548339844, 0.04955291748046875, 0.051705360412597656, 0.05385780334472656, 0.05601024627685547, 0.058162689208984375, 0.06031513214111328, 0.06246757507324219, 0.0646200180053711, 0.0667724609375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 4.0, 4.0, 10.0, 8.0, 8.0, 18.0, 16.0, 19.0, 21.0, 39.0, 72.0, 93.0, 112.0, 123.0, 128.0, 86.0, 71.0, 43.0, 35.0, 15.0, 14.0, 22.0, 9.0, 9.0, 3.0, 3.0, 4.0, 4.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.676248550415039e-05, -2.552475780248642e-05, -2.428703010082245e-05, -2.3049302399158478e-05, -2.1811574697494507e-05, -2.0573846995830536e-05, -1.9336119294166565e-05, -1.8098391592502594e-05, -1.6860663890838623e-05, -1.5622936189174652e-05, -1.4385208487510681e-05, -1.314748078584671e-05, -1.190975308418274e-05, -1.0672025382518768e-05, -9.434297680854797e-06, -8.196569979190826e-06, -6.9588422775268555e-06, -5.7211145758628845e-06, -4.4833868741989136e-06, -3.2456591725349426e-06, -2.0079314708709717e-06, -7.702037692070007e-07, 4.675239324569702e-07, 1.7052516341209412e-06, 2.942979335784912e-06, 4.180707037448883e-06, 5.418434739112854e-06, 6.656162440776825e-06, 7.893890142440796e-06, 9.131617844104767e-06, 1.0369345545768738e-05, 1.1607073247432709e-05, 1.284480094909668e-05, 1.408252865076065e-05, 1.532025635242462e-05, 1.6557984054088593e-05, 1.7795711755752563e-05, 1.9033439457416534e-05, 2.0271167159080505e-05, 2.1508894860744476e-05, 2.2746622562408447e-05, 2.3984350264072418e-05, 2.522207796573639e-05, 2.645980566740036e-05, 2.769753336906433e-05, 2.8935261070728302e-05, 3.0172988772392273e-05, 3.1410716474056244e-05, 3.2648444175720215e-05, 3.3886171877384186e-05, 3.512389957904816e-05, 3.636162728071213e-05, 3.75993549823761e-05, 3.883708268404007e-05, 4.007481038570404e-05, 4.131253808736801e-05, 4.255026578903198e-05, 4.378799349069595e-05, 4.5025721192359924e-05, 4.6263448894023895e-05, 4.7501176595687866e-05, 4.873890429735184e-05, 4.997663199901581e-05, 5.121435970067978e-05, 5.245208740234375e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 6.0, 7.0, 9.0, 16.0, 15.0, 14.0, 30.0, 35.0, 65.0, 76.0, 143.0, 193.0, 329.0, 558.0, 1085.0, 2109.0, 4849.0, 12477.0, 37230.0, 173778.0, 688083.0, 88275.0, 23494.0, 8364.0, 3569.0, 1680.0, 798.0, 474.0, 248.0, 180.0, 120.0, 88.0, 47.0, 37.0, 23.0, 19.0, 6.0, 6.0, 9.0, 6.0, 4.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0706787109375, -0.06809043884277344, -0.06550216674804688, -0.06291389465332031, -0.06032562255859375, -0.05773735046386719, -0.055149078369140625, -0.05256080627441406, -0.0499725341796875, -0.04738426208496094, -0.044795989990234375, -0.04220771789550781, -0.03961944580078125, -0.03703117370605469, -0.034442901611328125, -0.03185462951660156, -0.029266357421875, -0.026678085327148438, -0.024089813232421875, -0.021501541137695312, -0.01891326904296875, -0.016324996948242188, -0.013736724853515625, -0.011148452758789062, -0.0085601806640625, -0.0059719085693359375, -0.003383636474609375, -0.0007953643798828125, 0.00179290771484375, 0.0043811798095703125, 0.006969451904296875, 0.009557723999023438, 0.01214599609375, 0.014734268188476562, 0.017322540283203125, 0.019910812377929688, 0.02249908447265625, 0.025087356567382812, 0.027675628662109375, 0.030263900756835938, 0.0328521728515625, 0.03544044494628906, 0.038028717041015625, 0.04061698913574219, 0.04320526123046875, 0.04579353332519531, 0.048381805419921875, 0.05097007751464844, 0.053558349609375, 0.05614662170410156, 0.058734893798828125, 0.06132316589355469, 0.06391143798828125, 0.06649971008300781, 0.06908798217773438, 0.07167625427246094, 0.0742645263671875, 0.07685279846191406, 0.07944107055664062, 0.08202934265136719, 0.08461761474609375, 0.08720588684082031, 0.08979415893554688, 0.09238243103027344, 0.094970703125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 2.0, 9.0, 5.0, 6.0, 8.0, 12.0, 9.0, 11.0, 15.0, 33.0, 40.0, 56.0, 94.0, 117.0, 130.0, 109.0, 86.0, 68.0, 41.0, 35.0, 21.0, 21.0, 15.0, 10.0, 16.0, 7.0, 4.0, 8.0, 0.0, 4.0, 2.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0802001953125, -0.0773019790649414, -0.07440376281738281, -0.07150554656982422, -0.06860733032226562, -0.06570911407470703, -0.06281089782714844, -0.059912681579589844, -0.05701446533203125, -0.054116249084472656, -0.05121803283691406, -0.04831981658935547, -0.045421600341796875, -0.04252338409423828, -0.03962516784667969, -0.036726951599121094, -0.0338287353515625, -0.030930519104003906, -0.028032302856445312, -0.02513408660888672, -0.022235870361328125, -0.01933765411376953, -0.016439437866210938, -0.013541221618652344, -0.01064300537109375, -0.007744789123535156, -0.0048465728759765625, -0.0019483566284179688, 0.000949859619140625, 0.0038480758666992188, 0.0067462921142578125, 0.009644508361816406, 0.012542724609375, 0.015440940856933594, 0.018339157104492188, 0.02123737335205078, 0.024135589599609375, 0.02703380584716797, 0.029932022094726562, 0.032830238342285156, 0.03572845458984375, 0.038626670837402344, 0.04152488708496094, 0.04442310333251953, 0.047321319580078125, 0.05021953582763672, 0.05311775207519531, 0.056015968322753906, 0.0589141845703125, 0.061812400817871094, 0.06471061706542969, 0.06760883331298828, 0.07050704956054688, 0.07340526580810547, 0.07630348205566406, 0.07920169830322266, 0.08209991455078125, 0.08499813079833984, 0.08789634704589844, 0.09079456329345703, 0.09369277954101562, 0.09659099578857422, 0.09948921203613281, 0.1023874282836914, 0.10528564453125]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 7.0, 10.0, 15.0, 32.0, 41.0, 66.0, 94.0, 213.0, 187.0, 101.0, 72.0, 57.0, 40.0, 17.0, 8.0, 6.0, 6.0, 4.0, 4.0, 3.0, 0.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6782475709915161, -1.6288036108016968, -1.5793596506118774, -1.5299155712127686, -1.4804716110229492, -1.4310276508331299, -1.3815836906433105, -1.3321397304534912, -1.2826957702636719, -1.2332518100738525, -1.1838078498840332, -1.1343638896942139, -1.084919810295105, -1.0354758501052856, -0.9860318899154663, -0.936587929725647, -0.8871438503265381, -0.8376998901367188, -0.7882558703422546, -0.7388119101524353, -0.6893678903579712, -0.6399239301681519, -0.5904799699783325, -0.5410360097885132, -0.4915919899940491, -0.44214800000190735, -0.3927040100097656, -0.3432600498199463, -0.29381605982780457, -0.24437206983566284, -0.1949281096458435, -0.14548411965370178, -0.09604001045227051, -0.04659602791070938, 0.0028479546308517456, 0.052291929721832275, 0.101735919713974, 0.15117990970611572, 0.20062386989593506, 0.2500678598880768, 0.2995118498802185, 0.34895583987236023, 0.39839982986450195, 0.4478437900543213, 0.497287780046463, 0.5467317700386047, 0.5961757302284241, 0.6456197500228882, 0.6950637102127075, 0.7445076704025269, 0.793951690196991, 0.8433956503868103, 0.8928396701812744, 0.9422836303710938, 0.9917275905609131, 1.0411715507507324, 1.0906155109405518, 1.140059471130371, 1.1895034313201904, 1.2389473915100098, 1.2883914709091187, 1.337835431098938, 1.3872793912887573, 1.4367233514785767, 1.4861674308776855]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 3.0, 6.0, 15.0, 10.0, 12.0, 9.0, 10.0, 21.0, 18.0, 20.0, 26.0, 20.0, 27.0, 25.0, 45.0, 47.0, 70.0, 86.0, 100.0, 84.0, 65.0, 38.0, 26.0, 32.0, 34.0, 16.0, 20.0, 23.0, 17.0, 15.0, 9.0, 13.0, 10.0, 1.0, 14.0, 6.0, 7.0, 2.0, 1.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.564016580581665, -1.519797921180725, -1.4755792617797852, -1.4313606023788452, -1.3871419429779053, -1.3429231643676758, -1.2987046241760254, -1.254485845565796, -1.210267186164856, -1.166048526763916, -1.121829867362976, -1.0776112079620361, -1.0333925485610962, -0.9891738295555115, -0.9449551701545715, -0.9007364511489868, -0.8565178513526917, -0.8122991919517517, -0.7680805325508118, -0.723861813545227, -0.6796431541442871, -0.6354244947433472, -0.5912058353424072, -0.5469871759414673, -0.5027685165405273, -0.4585498571395874, -0.4143311679363251, -0.37011250853538513, -0.3258938193321228, -0.28167515993118286, -0.23745650053024292, -0.1932378113269806, -0.14901912212371826, -0.10480044782161713, -0.06058178097009659, -0.01636311411857605, 0.027855560183525085, 0.07207423448562622, 0.11629289388656616, 0.1605115830898285, 0.20473024249076843, 0.24894891679286957, 0.2931675910949707, 0.33738625049591064, 0.3816049098968506, 0.4258235991001129, 0.47004225850105286, 0.5142609477043152, 0.5584796071052551, 0.6026982665061951, 0.646916925907135, 0.6911356449127197, 0.7353543043136597, 0.7795729637145996, 0.8237916231155396, 0.8680102825164795, 0.9122289419174194, 0.9564476013183594, 1.0006662607192993, 1.0448849201202393, 1.0891035795211792, 1.1333222389221191, 1.1775410175323486, 1.2217596769332886, 1.2659783363342285]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 8.0, 11.0, 14.0, 22.0, 39.0, 92.0, 184.0, 449.0, 1273.0, 6011.0, 117420.0, 3826947.0, 231498.0, 8156.0, 1408.0, 429.0, 151.0, 64.0, 31.0, 19.0, 23.0, 9.0, 9.0, 6.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.255126953125, -0.24382400512695312, -0.23252105712890625, -0.22121810913085938, -0.2099151611328125, -0.19861221313476562, -0.18730926513671875, -0.17600631713867188, -0.164703369140625, -0.15340042114257812, -0.14209747314453125, -0.13079452514648438, -0.1194915771484375, -0.10818862915039062, -0.09688568115234375, -0.08558273315429688, -0.07427978515625, -0.06297683715820312, -0.05167388916015625, -0.040370941162109375, -0.0290679931640625, -0.017765045166015625, -0.00646209716796875, 0.004840850830078125, 0.016143798828125, 0.027446746826171875, 0.03874969482421875, 0.050052642822265625, 0.0613555908203125, 0.07265853881835938, 0.08396148681640625, 0.09526443481445312, 0.1065673828125, 0.11787033081054688, 0.12917327880859375, 0.14047622680664062, 0.1517791748046875, 0.16308212280273438, 0.17438507080078125, 0.18568801879882812, 0.196990966796875, 0.20829391479492188, 0.21959686279296875, 0.23089981079101562, 0.2422027587890625, 0.2535057067871094, 0.26480865478515625, 0.2761116027832031, 0.28741455078125, 0.2987174987792969, 0.31002044677734375, 0.3213233947753906, 0.3326263427734375, 0.3439292907714844, 0.35523223876953125, 0.3665351867675781, 0.377838134765625, 0.3891410827636719, 0.40044403076171875, 0.4117469787597656, 0.4230499267578125, 0.4343528747558594, 0.44565582275390625, 0.4569587707519531, 0.46826171875]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 4.0, 1.0, 5.0, 3.0, 7.0, 9.0, 9.0, 12.0, 17.0, 20.0, 21.0, 31.0, 25.0, 31.0, 32.0, 29.0, 40.0, 37.0, 56.0, 44.0, 51.0, 54.0, 50.0, 46.0, 47.0, 38.0, 37.0, 48.0, 35.0, 20.0, 20.0, 23.0, 23.0, 13.0, 12.0, 10.0, 13.0, 12.0, 7.0, 2.0, 2.0, 1.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.08782958984375, -0.08502006530761719, -0.08221054077148438, -0.07940101623535156, -0.07659149169921875, -0.07378196716308594, -0.07097244262695312, -0.06816291809082031, -0.0653533935546875, -0.06254386901855469, -0.059734344482421875, -0.05692481994628906, -0.05411529541015625, -0.05130577087402344, -0.048496246337890625, -0.04568672180175781, -0.042877197265625, -0.04006767272949219, -0.037258148193359375, -0.03444862365722656, -0.03163909912109375, -0.028829574584960938, -0.026020050048828125, -0.023210525512695312, -0.0204010009765625, -0.017591476440429688, -0.014781951904296875, -0.011972427368164062, -0.00916290283203125, -0.0063533782958984375, -0.003543853759765625, -0.0007343292236328125, 0.0020751953125, 0.0048847198486328125, 0.007694244384765625, 0.010503768920898438, 0.01331329345703125, 0.016122817993164062, 0.018932342529296875, 0.021741867065429688, 0.0245513916015625, 0.027360916137695312, 0.030170440673828125, 0.03297996520996094, 0.03578948974609375, 0.03859901428222656, 0.041408538818359375, 0.04421806335449219, 0.047027587890625, 0.04983711242675781, 0.052646636962890625, 0.05545616149902344, 0.05826568603515625, 0.06107521057128906, 0.06388473510742188, 0.06669425964355469, 0.0695037841796875, 0.07231330871582031, 0.07512283325195312, 0.07793235778808594, 0.08074188232421875, 0.08355140686035156, 0.08636093139648438, 0.08917045593261719, 0.09197998046875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 5.0, 4.0, 7.0, 9.0, 18.0, 37.0, 67.0, 138.0, 273.0, 663.0, 2253.0, 16449.0, 958523.0, 3176525.0, 34515.0, 3193.0, 871.0, 363.0, 176.0, 86.0, 34.0, 28.0, 19.0, 12.0, 6.0, 5.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5205078125, -0.5081520080566406, -0.49579620361328125, -0.4834403991699219, -0.4710845947265625, -0.4587287902832031, -0.44637298583984375, -0.4340171813964844, -0.421661376953125, -0.4093055725097656, -0.39694976806640625, -0.3845939636230469, -0.3722381591796875, -0.3598823547363281, -0.34752655029296875, -0.3351707458496094, -0.32281494140625, -0.3104591369628906, -0.29810333251953125, -0.2857475280761719, -0.2733917236328125, -0.2610359191894531, -0.24868011474609375, -0.23632431030273438, -0.223968505859375, -0.21161270141601562, -0.19925689697265625, -0.18690109252929688, -0.1745452880859375, -0.16218948364257812, -0.14983367919921875, -0.13747787475585938, -0.1251220703125, -0.11276626586914062, -0.10041046142578125, -0.08805465698242188, -0.0756988525390625, -0.06334304809570312, -0.05098724365234375, -0.038631439208984375, -0.026275634765625, -0.013919830322265625, -0.00156402587890625, 0.010791778564453125, 0.0231475830078125, 0.035503387451171875, 0.04785919189453125, 0.060214996337890625, 0.07257080078125, 0.08492660522460938, 0.09728240966796875, 0.10963821411132812, 0.1219940185546875, 0.13434982299804688, 0.14670562744140625, 0.15906143188476562, 0.171417236328125, 0.18377304077148438, 0.19612884521484375, 0.20848464965820312, 0.2208404541015625, 0.23319625854492188, 0.24555206298828125, 0.2579078674316406, 0.270263671875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 4.0, 2.0, 8.0, 10.0, 4.0, 11.0, 17.0, 23.0, 28.0, 63.0, 77.0, 88.0, 148.0, 214.0, 297.0, 481.0, 578.0, 613.0, 422.0, 325.0, 211.0, 158.0, 82.0, 59.0, 44.0, 31.0, 19.0, 15.0, 12.0, 9.0, 7.0, 3.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.174072265625, -0.1682415008544922, -0.16241073608398438, -0.15657997131347656, -0.15074920654296875, -0.14491844177246094, -0.13908767700195312, -0.1332569122314453, -0.1274261474609375, -0.12159538269042969, -0.11576461791992188, -0.10993385314941406, -0.10410308837890625, -0.09827232360839844, -0.09244155883789062, -0.08661079406738281, -0.080780029296875, -0.07494926452636719, -0.06911849975585938, -0.06328773498535156, -0.05745697021484375, -0.05162620544433594, -0.045795440673828125, -0.03996467590332031, -0.0341339111328125, -0.028303146362304688, -0.022472381591796875, -0.016641616821289062, -0.01081085205078125, -0.0049800872802734375, 0.000850677490234375, 0.0066814422607421875, 0.01251220703125, 0.018342971801757812, 0.024173736572265625, 0.030004501342773438, 0.03583526611328125, 0.04166603088378906, 0.047496795654296875, 0.05332756042480469, 0.0591583251953125, 0.06498908996582031, 0.07081985473632812, 0.07665061950683594, 0.08248138427734375, 0.08831214904785156, 0.09414291381835938, 0.09997367858886719, 0.105804443359375, 0.11163520812988281, 0.11746597290039062, 0.12329673767089844, 0.12912750244140625, 0.13495826721191406, 0.14078903198242188, 0.1466197967529297, 0.1524505615234375, 0.1582813262939453, 0.16411209106445312, 0.16994285583496094, 0.17577362060546875, 0.18160438537597656, 0.18743515014648438, 0.1932659149169922, 0.1990966796875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 2.0, 15.0, 17.0, 20.0, 54.0, 100.0, 168.0, 190.0, 188.0, 112.0, 55.0, 35.0, 23.0, 9.0, 9.0, 3.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5186384916305542, -1.4484360218048096, -1.3782334327697754, -1.3080308437347412, -1.2378283739089966, -1.167625904083252, -1.0974233150482178, -1.0272207260131836, -0.957018256187439, -0.8868157267570496, -0.8166131973266602, -0.7464106678962708, -0.6762081384658813, -0.6060056090354919, -0.5358030796051025, -0.46560055017471313, -0.39539802074432373, -0.3251954913139343, -0.2549929618835449, -0.18479043245315552, -0.11458790302276611, -0.04438537359237671, 0.025817155838012695, 0.0960196852684021, 0.1662222146987915, 0.2364247441291809, 0.3066272735595703, 0.3768298029899597, 0.4470323324203491, 0.5172348618507385, 0.5874373912811279, 0.6576399207115173, 0.7278423309326172, 0.7980448603630066, 0.868247389793396, 0.9384499192237854, 1.0086524486541748, 1.078855037689209, 1.1490575075149536, 1.2192599773406982, 1.2894625663757324, 1.3596651554107666, 1.4298676252365112, 1.5000700950622559, 1.57027268409729, 1.6404752731323242, 1.7106777429580688, 1.7808802127838135, 1.8510828018188477, 1.9212853908538818, 1.9914878606796265, 2.061690330505371, 2.1318929195404053, 2.2020955085754395, 2.2722978591918945, 2.3425004482269287, 2.412703037261963, 2.482905626296997, 2.5531082153320312, 2.6233105659484863, 2.6935131549835205, 2.7637157440185547, 2.8339180946350098, 2.904120683670044, 2.974323272705078]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 3.0, 2.0, 4.0, 6.0, 9.0, 12.0, 12.0, 17.0, 19.0, 29.0, 27.0, 36.0, 32.0, 27.0, 41.0, 50.0, 44.0, 56.0, 42.0, 60.0, 40.0, 32.0, 41.0, 58.0, 49.0, 44.0, 31.0, 31.0, 23.0, 25.0, 18.0, 19.0, 19.0, 11.0, 9.0, 9.0, 6.0, 4.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1407835483551025, -1.1096351146697998, -1.0784865617752075, -1.0473381280899048, -1.016189694404602, -0.9850411415100098, -0.953892707824707, -0.9227442145347595, -0.891595721244812, -0.8604472279548645, -0.8292987942695618, -0.7981503009796143, -0.7670018076896667, -0.7358533143997192, -0.7047048807144165, -0.673556387424469, -0.6424079537391663, -0.6112594604492188, -0.580111026763916, -0.5489625334739685, -0.517814040184021, -0.4866655766963959, -0.45551711320877075, -0.42436861991882324, -0.3932201564311981, -0.362071692943573, -0.3309231996536255, -0.29977473616600037, -0.26862627267837524, -0.23747777938842773, -0.2063293159008026, -0.1751808375120163, -0.14403241872787476, -0.11288394033908844, -0.08173546940088272, -0.050586998462677, -0.019438520073890686, 0.01170995831489563, 0.04285842180252075, 0.07400690019130707, 0.10515537858009338, 0.1363038569688797, 0.16745233535766602, 0.19860079884529114, 0.22974927723407745, 0.26089775562286377, 0.2920462191104889, 0.323194682598114, 0.3543431758880615, 0.38549163937568665, 0.41664013266563416, 0.4477885961532593, 0.4789370894432068, 0.5100855827331543, 0.541234016418457, 0.5723825097084045, 0.603531002998352, 0.6346794962882996, 0.6658279299736023, 0.6969764232635498, 0.7281249165534973, 0.7592734098434448, 0.7904218435287476, 0.8215703368186951, 0.8527187705039978]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 8.0, 5.0, 6.0, 15.0, 19.0, 21.0, 36.0, 71.0, 155.0, 204.0, 452.0, 901.0, 2527.0, 8611.0, 38434.0, 234516.0, 606068.0, 124657.0, 23025.0, 5648.0, 1715.0, 730.0, 323.0, 156.0, 87.0, 49.0, 33.0, 25.0, 15.0, 16.0, 9.0, 6.0, 4.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2086181640625, -0.2009868621826172, -0.19335556030273438, -0.18572425842285156, -0.17809295654296875, -0.17046165466308594, -0.16283035278320312, -0.1551990509033203, -0.1475677490234375, -0.1399364471435547, -0.13230514526367188, -0.12467384338378906, -0.11704254150390625, -0.10941123962402344, -0.10177993774414062, -0.09414863586425781, -0.086517333984375, -0.07888603210449219, -0.07125473022460938, -0.06362342834472656, -0.05599212646484375, -0.04836082458496094, -0.040729522705078125, -0.03309822082519531, -0.0254669189453125, -0.017835617065429688, -0.010204315185546875, -0.0025730133056640625, 0.00505828857421875, 0.012689590454101562, 0.020320892333984375, 0.027952194213867188, 0.03558349609375, 0.04321479797363281, 0.050846099853515625, 0.05847740173339844, 0.06610870361328125, 0.07374000549316406, 0.08137130737304688, 0.08900260925292969, 0.0966339111328125, 0.10426521301269531, 0.11189651489257812, 0.11952781677246094, 0.12715911865234375, 0.13479042053222656, 0.14242172241210938, 0.1500530242919922, 0.157684326171875, 0.1653156280517578, 0.17294692993164062, 0.18057823181152344, 0.18820953369140625, 0.19584083557128906, 0.20347213745117188, 0.2111034393310547, 0.2187347412109375, 0.2263660430908203, 0.23399734497070312, 0.24162864685058594, 0.24925994873046875, 0.25689125061035156, 0.2645225524902344, 0.2721538543701172, 0.27978515625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 4.0, 2.0, 5.0, 9.0, 3.0, 16.0, 21.0, 29.0, 35.0, 34.0, 36.0, 50.0, 58.0, 57.0, 62.0, 48.0, 61.0, 60.0, 59.0, 54.0, 56.0, 32.0, 37.0, 36.0, 32.0, 23.0, 21.0, 18.0, 17.0, 8.0, 9.0, 4.0, 5.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14453125, -0.140777587890625, -0.13702392578125, -0.133270263671875, -0.1295166015625, -0.125762939453125, -0.12200927734375, -0.118255615234375, -0.114501953125, -0.110748291015625, -0.10699462890625, -0.103240966796875, -0.0994873046875, -0.095733642578125, -0.09197998046875, -0.088226318359375, -0.08447265625, -0.080718994140625, -0.07696533203125, -0.073211669921875, -0.0694580078125, -0.065704345703125, -0.06195068359375, -0.058197021484375, -0.054443359375, -0.050689697265625, -0.04693603515625, -0.043182373046875, -0.0394287109375, -0.035675048828125, -0.03192138671875, -0.028167724609375, -0.0244140625, -0.020660400390625, -0.01690673828125, -0.013153076171875, -0.0093994140625, -0.005645751953125, -0.00189208984375, 0.001861572265625, 0.005615234375, 0.009368896484375, 0.01312255859375, 0.016876220703125, 0.0206298828125, 0.024383544921875, 0.02813720703125, 0.031890869140625, 0.03564453125, 0.039398193359375, 0.04315185546875, 0.046905517578125, 0.0506591796875, 0.054412841796875, 0.05816650390625, 0.061920166015625, 0.065673828125, 0.069427490234375, 0.07318115234375, 0.076934814453125, 0.0806884765625, 0.084442138671875, 0.08819580078125, 0.091949462890625, 0.095703125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 8.0, 6.0, 10.0, 14.0, 13.0, 15.0, 28.0, 50.0, 54.0, 91.0, 160.0, 212.0, 336.0, 615.0, 1237.0, 3186.0, 10714.0, 59256.0, 740058.0, 197988.0, 24418.0, 5780.0, 2016.0, 938.0, 486.0, 274.0, 176.0, 138.0, 77.0, 58.0, 36.0, 24.0, 26.0, 14.0, 14.0, 5.0, 7.0, 5.0, 2.0, 2.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.260009765625, -0.25127410888671875, -0.2425384521484375, -0.23380279541015625, -0.225067138671875, -0.21633148193359375, -0.2075958251953125, -0.19886016845703125, -0.19012451171875, -0.18138885498046875, -0.1726531982421875, -0.16391754150390625, -0.155181884765625, -0.14644622802734375, -0.1377105712890625, -0.12897491455078125, -0.1202392578125, -0.11150360107421875, -0.1027679443359375, -0.09403228759765625, -0.085296630859375, -0.07656097412109375, -0.0678253173828125, -0.05908966064453125, -0.05035400390625, -0.04161834716796875, -0.0328826904296875, -0.02414703369140625, -0.015411376953125, -0.00667572021484375, 0.0020599365234375, 0.01079559326171875, 0.01953125, 0.02826690673828125, 0.0370025634765625, 0.04573822021484375, 0.054473876953125, 0.06320953369140625, 0.0719451904296875, 0.08068084716796875, 0.08941650390625, 0.09815216064453125, 0.1068878173828125, 0.11562347412109375, 0.124359130859375, 0.13309478759765625, 0.1418304443359375, 0.15056610107421875, 0.1593017578125, 0.16803741455078125, 0.1767730712890625, 0.18550872802734375, 0.194244384765625, 0.20298004150390625, 0.2117156982421875, 0.22045135498046875, 0.22918701171875, 0.23792266845703125, 0.2466583251953125, 0.25539398193359375, 0.264129638671875, 0.27286529541015625, 0.2816009521484375, 0.29033660888671875, 0.299072265625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 2.0, 3.0, 7.0, 7.0, 10.0, 12.0, 21.0, 24.0, 33.0, 32.0, 36.0, 37.0, 46.0, 62.0, 47.0, 54.0, 59.0, 55.0, 59.0, 56.0, 55.0, 47.0, 39.0, 32.0, 29.0, 32.0, 21.0, 14.0, 12.0, 8.0, 13.0, 9.0, 4.0, 9.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.38623046875, -0.3740234375, -0.36181640625, -0.349609375, -0.33740234375, -0.3251953125, -0.31298828125, -0.30078125, -0.28857421875, -0.2763671875, -0.26416015625, -0.251953125, -0.23974609375, -0.2275390625, -0.21533203125, -0.203125, -0.19091796875, -0.1787109375, -0.16650390625, -0.154296875, -0.14208984375, -0.1298828125, -0.11767578125, -0.10546875, -0.09326171875, -0.0810546875, -0.06884765625, -0.056640625, -0.04443359375, -0.0322265625, -0.02001953125, -0.0078125, 0.00439453125, 0.0166015625, 0.02880859375, 0.041015625, 0.05322265625, 0.0654296875, 0.07763671875, 0.08984375, 0.10205078125, 0.1142578125, 0.12646484375, 0.138671875, 0.15087890625, 0.1630859375, 0.17529296875, 0.1875, 0.19970703125, 0.2119140625, 0.22412109375, 0.236328125, 0.24853515625, 0.2607421875, 0.27294921875, 0.28515625, 0.29736328125, 0.3095703125, 0.32177734375, 0.333984375, 0.34619140625, 0.3583984375, 0.37060546875, 0.3828125, 0.39501953125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 3.0, 4.0, 8.0, 6.0, 6.0, 9.0, 9.0, 22.0, 22.0, 26.0, 45.0, 51.0, 101.0, 151.0, 251.0, 452.0, 959.0, 2283.0, 7002.0, 26717.0, 185233.0, 755189.0, 52134.0, 11471.0, 3495.0, 1388.0, 610.0, 329.0, 180.0, 119.0, 60.0, 59.0, 37.0, 26.0, 22.0, 14.0, 13.0, 11.0, 4.0, 9.0, 4.0, 7.0, 4.0, 0.0, 4.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0], "bins": [-0.11676025390625, -0.11324405670166016, -0.10972785949707031, -0.10621166229248047, -0.10269546508789062, -0.09917926788330078, -0.09566307067871094, -0.0921468734741211, -0.08863067626953125, -0.0851144790649414, -0.08159828186035156, -0.07808208465576172, -0.07456588745117188, -0.07104969024658203, -0.06753349304199219, -0.06401729583740234, -0.0605010986328125, -0.056984901428222656, -0.05346870422363281, -0.04995250701904297, -0.046436309814453125, -0.04292011260986328, -0.03940391540527344, -0.035887718200683594, -0.03237152099609375, -0.028855323791503906, -0.025339126586914062, -0.02182292938232422, -0.018306732177734375, -0.014790534973144531, -0.011274337768554688, -0.007758140563964844, -0.004241943359375, -0.0007257461547851562, 0.0027904510498046875, 0.006306648254394531, 0.009822845458984375, 0.013339042663574219, 0.016855239868164062, 0.020371437072753906, 0.02388763427734375, 0.027403831481933594, 0.030920028686523438, 0.03443622589111328, 0.037952423095703125, 0.04146862030029297, 0.04498481750488281, 0.048501014709472656, 0.0520172119140625, 0.055533409118652344, 0.05904960632324219, 0.06256580352783203, 0.06608200073242188, 0.06959819793701172, 0.07311439514160156, 0.0766305923461914, 0.08014678955078125, 0.0836629867553711, 0.08717918395996094, 0.09069538116455078, 0.09421157836914062, 0.09772777557373047, 0.10124397277832031, 0.10476016998291016, 0.1082763671875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 3.0, 3.0, 7.0, 8.0, 6.0, 11.0, 20.0, 25.0, 27.0, 43.0, 68.0, 77.0, 101.0, 102.0, 124.0, 81.0, 68.0, 63.0, 45.0, 32.0, 17.0, 18.0, 9.0, 3.0, 14.0, 5.0, 7.0, 2.0, 7.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4332275390625e-05, -3.3146701753139496e-05, -3.196112811565399e-05, -3.077555447816849e-05, -2.9589980840682983e-05, -2.840440720319748e-05, -2.7218833565711975e-05, -2.603325992822647e-05, -2.4847686290740967e-05, -2.3662112653255463e-05, -2.247653901576996e-05, -2.1290965378284454e-05, -2.010539174079895e-05, -1.8919818103313446e-05, -1.7734244465827942e-05, -1.6548670828342438e-05, -1.5363097190856934e-05, -1.417752355337143e-05, -1.2991949915885925e-05, -1.1806376278400421e-05, -1.0620802640914917e-05, -9.435229003429413e-06, -8.249655365943909e-06, -7.0640817284584045e-06, -5.8785080909729e-06, -4.692934453487396e-06, -3.507360816001892e-06, -2.321787178516388e-06, -1.1362135410308838e-06, 4.936009645462036e-08, 1.2349337339401245e-06, 2.4205073714256287e-06, 3.606081008911133e-06, 4.791654646396637e-06, 5.977228283882141e-06, 7.162801921367645e-06, 8.34837555885315e-06, 9.533949196338654e-06, 1.0719522833824158e-05, 1.1905096471309662e-05, 1.3090670108795166e-05, 1.427624374628067e-05, 1.5461817383766174e-05, 1.664739102125168e-05, 1.7832964658737183e-05, 1.9018538296222687e-05, 2.020411193370819e-05, 2.1389685571193695e-05, 2.25752592086792e-05, 2.3760832846164703e-05, 2.4946406483650208e-05, 2.613198012113571e-05, 2.7317553758621216e-05, 2.850312739610672e-05, 2.9688701033592224e-05, 3.087427467107773e-05, 3.205984830856323e-05, 3.3245421946048737e-05, 3.443099558353424e-05, 3.5616569221019745e-05, 3.680214285850525e-05, 3.798771649599075e-05, 3.917329013347626e-05, 4.035886377096176e-05, 4.1544437408447266e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 3.0, 10.0, 10.0, 21.0, 29.0, 47.0, 67.0, 96.0, 167.0, 307.0, 564.0, 1171.0, 2967.0, 9546.0, 40143.0, 360013.0, 575910.0, 41927.0, 9913.0, 3095.0, 1190.0, 568.0, 308.0, 173.0, 104.0, 66.0, 44.0, 31.0, 20.0, 16.0, 8.0, 6.0, 6.0, 6.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11328125, -0.10984992980957031, -0.10641860961914062, -0.10298728942871094, -0.09955596923828125, -0.09612464904785156, -0.09269332885742188, -0.08926200866699219, -0.0858306884765625, -0.08239936828613281, -0.07896804809570312, -0.07553672790527344, -0.07210540771484375, -0.06867408752441406, -0.06524276733398438, -0.06181144714355469, -0.058380126953125, -0.05494880676269531, -0.051517486572265625, -0.04808616638183594, -0.04465484619140625, -0.04122352600097656, -0.037792205810546875, -0.03436088562011719, -0.0309295654296875, -0.027498245239257812, -0.024066925048828125, -0.020635604858398438, -0.01720428466796875, -0.013772964477539062, -0.010341644287109375, -0.0069103240966796875, -0.00347900390625, -4.76837158203125e-05, 0.003383636474609375, 0.0068149566650390625, 0.01024627685546875, 0.013677597045898438, 0.017108917236328125, 0.020540237426757812, 0.0239715576171875, 0.027402877807617188, 0.030834197998046875, 0.03426551818847656, 0.03769683837890625, 0.04112815856933594, 0.044559478759765625, 0.04799079895019531, 0.051422119140625, 0.05485343933105469, 0.058284759521484375, 0.06171607971191406, 0.06514739990234375, 0.06857872009277344, 0.07201004028320312, 0.07544136047363281, 0.0788726806640625, 0.08230400085449219, 0.08573532104492188, 0.08916664123535156, 0.09259796142578125, 0.09602928161621094, 0.09946060180664062, 0.10289192199707031, 0.1063232421875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 5.0, 5.0, 4.0, 9.0, 7.0, 10.0, 12.0, 14.0, 17.0, 33.0, 42.0, 51.0, 57.0, 67.0, 100.0, 131.0, 90.0, 81.0, 61.0, 39.0, 28.0, 22.0, 18.0, 21.0, 25.0, 10.0, 8.0, 9.0, 5.0, 4.0, 9.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.10821533203125, -0.10547161102294922, -0.10272789001464844, -0.09998416900634766, -0.09724044799804688, -0.0944967269897461, -0.09175300598144531, -0.08900928497314453, -0.08626556396484375, -0.08352184295654297, -0.08077812194824219, -0.0780344009399414, -0.07529067993164062, -0.07254695892333984, -0.06980323791503906, -0.06705951690673828, -0.0643157958984375, -0.06157207489013672, -0.05882835388183594, -0.056084632873535156, -0.053340911865234375, -0.050597190856933594, -0.04785346984863281, -0.04510974884033203, -0.04236602783203125, -0.03962230682373047, -0.03687858581542969, -0.034134864807128906, -0.031391143798828125, -0.028647422790527344, -0.025903701782226562, -0.02315998077392578, -0.020416259765625, -0.01767253875732422, -0.014928817749023438, -0.012185096740722656, -0.009441375732421875, -0.006697654724121094, -0.0039539337158203125, -0.0012102127075195312, 0.00153350830078125, 0.004277229309082031, 0.0070209503173828125, 0.009764671325683594, 0.012508392333984375, 0.015252113342285156, 0.017995834350585938, 0.02073955535888672, 0.0234832763671875, 0.02622699737548828, 0.028970718383789062, 0.031714439392089844, 0.034458160400390625, 0.037201881408691406, 0.03994560241699219, 0.04268932342529297, 0.04543304443359375, 0.04817676544189453, 0.05092048645019531, 0.053664207458496094, 0.056407928466796875, 0.059151649475097656, 0.06189537048339844, 0.06463909149169922, 0.0673828125]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 19.0, 83.0, 317.0, 482.0, 71.0, 12.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.450579643249512, -6.266711235046387, -6.0828423500061035, -5.8989739418029785, -5.715105056762695, -5.53123664855957, -5.347367763519287, -5.163499355316162, -4.979630470275879, -4.795762062072754, -4.611893177032471, -4.428024768829346, -4.2441558837890625, -4.0602874755859375, -3.8764185905456543, -3.6925501823425293, -3.508681535720825, -3.324812889099121, -3.140944242477417, -2.957075595855713, -2.773206949234009, -2.5893383026123047, -2.4054698944091797, -2.2216010093688965, -2.0377326011657715, -1.8538639545440674, -1.6699953079223633, -1.4861266613006592, -1.302258014678955, -1.118389368057251, -0.9345208406448364, -0.7506521940231323, -0.5667834281921387, -0.38291478157043457, -0.19904616475105286, -0.015177547931671143, 0.16869109869003296, 0.35255974531173706, 0.5364283323287964, 0.7202969789505005, 0.9041656255722046, 1.0880342721939087, 1.2719029188156128, 1.4557714462280273, 1.6396400928497314, 1.8235087394714355, 2.0073773860931396, 2.1912460327148438, 2.375114679336548, 2.558983325958252, 2.742851972579956, 2.92672061920166, 3.1105892658233643, 3.2944579124450684, 3.4783263206481934, 3.6621952056884766, 3.8460636138916016, 4.029932022094727, 4.21380090713501, 4.397669315338135, 4.581538200378418, 4.765406608581543, 4.949275493621826, 5.133143901824951, 5.317012786865234]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 5.0, 5.0, 5.0, 5.0, 6.0, 4.0, 9.0, 9.0, 9.0, 14.0, 12.0, 12.0, 16.0, 25.0, 18.0, 23.0, 12.0, 20.0, 38.0, 24.0, 42.0, 58.0, 82.0, 97.0, 103.0, 55.0, 31.0, 26.0, 25.0, 23.0, 17.0, 15.0, 31.0, 20.0, 20.0, 6.0, 16.0, 5.0, 13.0, 11.0, 7.0, 9.0, 9.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0], "bins": [-1.3335986137390137, -1.293694257736206, -1.2537897825241089, -1.2138853073120117, -1.173980951309204, -1.1340765953063965, -1.0941721200942993, -1.0542676448822021, -1.0143632888793945, -0.9744588732719421, -0.9345544576644897, -0.8946500420570374, -0.854745626449585, -0.8148412108421326, -0.7749367952346802, -0.7350323796272278, -0.6951279640197754, -0.655223548412323, -0.6153191328048706, -0.5754147171974182, -0.5355103015899658, -0.4956058859825134, -0.45570147037506104, -0.41579705476760864, -0.37589263916015625, -0.33598822355270386, -0.29608380794525146, -0.2561793923377991, -0.21627497673034668, -0.1763705611228943, -0.1364661455154419, -0.0965617299079895, -0.05665719509124756, -0.016752779483795166, 0.023151636123657227, 0.06305605173110962, 0.10296046733856201, 0.1428648829460144, 0.1827692985534668, 0.2226737141609192, 0.2625781297683716, 0.302482545375824, 0.34238696098327637, 0.38229137659072876, 0.42219579219818115, 0.46210020780563354, 0.5020046234130859, 0.5419090390205383, 0.5818134546279907, 0.6217178702354431, 0.6616222858428955, 0.7015267014503479, 0.7414311170578003, 0.7813355326652527, 0.8212399482727051, 0.8611443638801575, 0.9010487794876099, 0.9409531950950623, 0.9808576107025146, 1.0207619667053223, 1.0606664419174194, 1.1005709171295166, 1.1404752731323242, 1.1803796291351318, 1.220284104347229]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 4.0, 6.0, 9.0, 5.0, 14.0, 10.0, 21.0, 28.0, 47.0, 79.0, 118.0, 220.0, 449.0, 1042.0, 2538.0, 7073.0, 30959.0, 294358.0, 2829473.0, 942927.0, 67004.0, 11899.0, 3382.0, 1339.0, 552.0, 301.0, 150.0, 90.0, 56.0, 34.0, 22.0, 18.0, 14.0, 7.0, 5.0, 5.0, 7.0, 6.0, 3.0, 1.0, 2.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.256591796875, -0.2473297119140625, -0.238067626953125, -0.2288055419921875, -0.21954345703125, -0.2102813720703125, -0.201019287109375, -0.1917572021484375, -0.1824951171875, -0.1732330322265625, -0.163970947265625, -0.1547088623046875, -0.14544677734375, -0.1361846923828125, -0.126922607421875, -0.1176605224609375, -0.1083984375, -0.0991363525390625, -0.089874267578125, -0.0806121826171875, -0.07135009765625, -0.0620880126953125, -0.052825927734375, -0.0435638427734375, -0.0343017578125, -0.0250396728515625, -0.015777587890625, -0.0065155029296875, 0.00274658203125, 0.0120086669921875, 0.021270751953125, 0.0305328369140625, 0.039794921875, 0.0490570068359375, 0.058319091796875, 0.0675811767578125, 0.07684326171875, 0.0861053466796875, 0.095367431640625, 0.1046295166015625, 0.1138916015625, 0.1231536865234375, 0.132415771484375, 0.1416778564453125, 0.15093994140625, 0.1602020263671875, 0.169464111328125, 0.1787261962890625, 0.18798828125, 0.1972503662109375, 0.206512451171875, 0.2157745361328125, 0.22503662109375, 0.2342987060546875, 0.243560791015625, 0.2528228759765625, 0.2620849609375, 0.2713470458984375, 0.280609130859375, 0.2898712158203125, 0.29913330078125, 0.3083953857421875, 0.317657470703125, 0.3269195556640625, 0.336181640625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 5.0, 4.0, 5.0, 4.0, 16.0, 11.0, 20.0, 23.0, 27.0, 45.0, 46.0, 49.0, 57.0, 69.0, 65.0, 79.0, 61.0, 67.0, 50.0, 62.0, 50.0, 41.0, 32.0, 32.0, 24.0, 22.0, 15.0, 9.0, 6.0, 4.0, 6.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1160888671875, -0.11193084716796875, -0.1077728271484375, -0.10361480712890625, -0.099456787109375, -0.09529876708984375, -0.0911407470703125, -0.08698272705078125, -0.08282470703125, -0.07866668701171875, -0.0745086669921875, -0.07035064697265625, -0.066192626953125, -0.06203460693359375, -0.0578765869140625, -0.05371856689453125, -0.049560546875, -0.04540252685546875, -0.0412445068359375, -0.03708648681640625, -0.032928466796875, -0.02877044677734375, -0.0246124267578125, -0.02045440673828125, -0.01629638671875, -0.01213836669921875, -0.0079803466796875, -0.00382232666015625, 0.000335693359375, 0.00449371337890625, 0.0086517333984375, 0.01280975341796875, 0.0169677734375, 0.02112579345703125, 0.0252838134765625, 0.02944183349609375, 0.033599853515625, 0.03775787353515625, 0.0419158935546875, 0.04607391357421875, 0.05023193359375, 0.05438995361328125, 0.0585479736328125, 0.06270599365234375, 0.066864013671875, 0.07102203369140625, 0.0751800537109375, 0.07933807373046875, 0.08349609375, 0.08765411376953125, 0.0918121337890625, 0.09597015380859375, 0.100128173828125, 0.10428619384765625, 0.1084442138671875, 0.11260223388671875, 0.11676025390625, 0.12091827392578125, 0.1250762939453125, 0.12923431396484375, 0.133392333984375, 0.13755035400390625, 0.1417083740234375, 0.14586639404296875, 0.1500244140625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 6.0, 4.0, 4.0, 8.0, 7.0, 20.0, 35.0, 70.0, 147.0, 388.0, 913.0, 3120.0, 49243.0, 4121428.0, 15346.0, 2204.0, 734.0, 284.0, 152.0, 73.0, 30.0, 20.0, 17.0, 4.0, 2.0, 2.0, 5.0, 3.0, 5.0, 0.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1884765625, -1.146575927734375, -1.10467529296875, -1.062774658203125, -1.0208740234375, -0.978973388671875, -0.93707275390625, -0.895172119140625, -0.853271484375, -0.811370849609375, -0.76947021484375, -0.727569580078125, -0.6856689453125, -0.643768310546875, -0.60186767578125, -0.559967041015625, -0.51806640625, -0.476165771484375, -0.43426513671875, -0.392364501953125, -0.3504638671875, -0.308563232421875, -0.26666259765625, -0.224761962890625, -0.182861328125, -0.140960693359375, -0.09906005859375, -0.057159423828125, -0.0152587890625, 0.026641845703125, 0.06854248046875, 0.110443115234375, 0.15234375, 0.194244384765625, 0.23614501953125, 0.278045654296875, 0.3199462890625, 0.361846923828125, 0.40374755859375, 0.445648193359375, 0.487548828125, 0.529449462890625, 0.57135009765625, 0.613250732421875, 0.6551513671875, 0.697052001953125, 0.73895263671875, 0.780853271484375, 0.82275390625, 0.864654541015625, 0.90655517578125, 0.948455810546875, 0.9903564453125, 1.032257080078125, 1.07415771484375, 1.116058349609375, 1.157958984375, 1.199859619140625, 1.24176025390625, 1.283660888671875, 1.3255615234375, 1.367462158203125, 1.40936279296875, 1.451263427734375, 1.4931640625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 17.0, 25.0, 40.0, 76.0, 137.0, 291.0, 546.0, 925.0, 921.0, 508.0, 272.0, 112.0, 78.0, 45.0, 29.0, 17.0, 8.0, 9.0, 5.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50341796875, -0.48471832275390625, -0.4660186767578125, -0.44731903076171875, -0.428619384765625, -0.40991973876953125, -0.3912200927734375, -0.37252044677734375, -0.35382080078125, -0.33512115478515625, -0.3164215087890625, -0.29772186279296875, -0.279022216796875, -0.26032257080078125, -0.2416229248046875, -0.22292327880859375, -0.2042236328125, -0.18552398681640625, -0.1668243408203125, -0.14812469482421875, -0.129425048828125, -0.11072540283203125, -0.0920257568359375, -0.07332611083984375, -0.05462646484375, -0.03592681884765625, -0.0172271728515625, 0.00147247314453125, 0.020172119140625, 0.03887176513671875, 0.0575714111328125, 0.07627105712890625, 0.094970703125, 0.11367034912109375, 0.1323699951171875, 0.15106964111328125, 0.169769287109375, 0.18846893310546875, 0.2071685791015625, 0.22586822509765625, 0.24456787109375, 0.26326751708984375, 0.2819671630859375, 0.30066680908203125, 0.319366455078125, 0.33806610107421875, 0.3567657470703125, 0.37546539306640625, 0.3941650390625, 0.41286468505859375, 0.4315643310546875, 0.45026397705078125, 0.468963623046875, 0.48766326904296875, 0.5063629150390625, 0.5250625610351562, 0.54376220703125, 0.5624618530273438, 0.5811614990234375, 0.5998611450195312, 0.618560791015625, 0.6372604370117188, 0.6559600830078125, 0.6746597290039062, 0.693359375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 4.0, 5.0, 7.0, 7.0, 16.0, 20.0, 47.0, 77.0, 118.0, 198.0, 157.0, 132.0, 72.0, 37.0, 26.0, 16.0, 8.0, 8.0, 10.0, 4.0, 5.0, 3.0, 4.0, 3.0, 3.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.406118392944336, -4.267202377319336, -4.128286838531494, -3.989370822906494, -3.850454807281494, -3.7115390300750732, -3.5726232528686523, -3.4337072372436523, -3.2947914600372314, -3.1558756828308105, -3.0169596672058105, -2.8780438899993896, -2.7391281127929688, -2.6002120971679688, -2.461296319961548, -2.322380542755127, -2.183464527130127, -2.044548749923706, -1.905632734298706, -1.7667169570922852, -1.6278010606765747, -1.4888851642608643, -1.3499693870544434, -1.211053490638733, -1.0721375942230225, -0.933221697807312, -0.7943058609962463, -0.6553900241851807, -0.5164741277694702, -0.37755823135375977, -0.2386423945426941, -0.09972655773162842, 0.039189815521240234, 0.1781056821346283, 0.31702154874801636, 0.4559374153614044, 0.5948532819747925, 0.7337691783905029, 0.8726850152015686, 1.0116008520126343, 1.1505167484283447, 1.2894326448440552, 1.4283485412597656, 1.5672643184661865, 1.706180214881897, 1.8450961112976074, 1.9840118885040283, 2.122927665710449, 2.261843681335449, 2.40075945854187, 2.53967547416687, 2.678591251373291, 2.817507266998291, 2.956423044204712, 3.095338821411133, 3.234254837036133, 3.3731706142425537, 3.5120863914489746, 3.6510024070739746, 3.7899181842803955, 3.9288339614868164, 4.067749977111816, 4.206665992736816, 4.345581531524658, 4.484497547149658]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 5.0, 1.0, 7.0, 11.0, 17.0, 13.0, 23.0, 45.0, 37.0, 42.0, 69.0, 71.0, 89.0, 86.0, 110.0, 84.0, 73.0, 54.0, 48.0, 38.0, 23.0, 20.0, 10.0, 9.0, 3.0, 4.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.6779420375823975, -3.5676016807556152, -3.457261323928833, -3.346920967102051, -3.2365806102752686, -3.1262402534484863, -3.015900135040283, -2.905559539794922, -2.7952194213867188, -2.6848790645599365, -2.5745387077331543, -2.464198350906372, -2.35385799407959, -2.2435176372528076, -2.1331772804260254, -2.0228371620178223, -1.912496566772461, -1.8021562099456787, -1.6918158531188965, -1.5814754962921143, -1.471135139465332, -1.3607947826385498, -1.2504545450210571, -1.140114188194275, -1.0297738313674927, -0.9194334745407104, -0.8090931177139282, -0.6987528204917908, -0.5884124636650085, -0.4780721068382263, -0.36773180961608887, -0.25739145278930664, -0.1470508575439453, -0.03671051561832428, 0.07362982630729675, 0.1839701533317566, 0.2943105101585388, 0.40465086698532104, 0.5149911642074585, 0.6253315210342407, 0.735671877861023, 0.8460122346878052, 0.9563525915145874, 1.06669282913208, 1.1770331859588623, 1.2873735427856445, 1.3977138996124268, 1.508054256439209, 1.6183946132659912, 1.7287349700927734, 1.8390753269195557, 1.949415683746338, 2.05975604057312, 2.1700963973999023, 2.2804365158081055, 2.390777111053467, 2.50111722946167, 2.611457586288452, 2.7217979431152344, 2.8321382999420166, 2.942478656768799, 3.052819013595581, 3.1631593704223633, 3.2734994888305664, 3.3838400840759277]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 3.0, 0.0, 3.0, 5.0, 4.0, 16.0, 18.0, 22.0, 25.0, 49.0, 91.0, 165.0, 248.0, 503.0, 1212.0, 3409.0, 12143.0, 78253.0, 738597.0, 184522.0, 20966.0, 5061.0, 1801.0, 686.0, 294.0, 187.0, 98.0, 56.0, 31.0, 26.0, 16.0, 15.0, 12.0, 3.0, 2.0, 7.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.319580078125, -0.30843353271484375, -0.2972869873046875, -0.28614044189453125, -0.274993896484375, -0.26384735107421875, -0.2527008056640625, -0.24155426025390625, -0.23040771484375, -0.21926116943359375, -0.2081146240234375, -0.19696807861328125, -0.185821533203125, -0.17467498779296875, -0.1635284423828125, -0.15238189697265625, -0.1412353515625, -0.13008880615234375, -0.1189422607421875, -0.10779571533203125, -0.096649169921875, -0.08550262451171875, -0.0743560791015625, -0.06320953369140625, -0.05206298828125, -0.04091644287109375, -0.0297698974609375, -0.01862335205078125, -0.007476806640625, 0.00366973876953125, 0.0148162841796875, 0.02596282958984375, 0.037109375, 0.04825592041015625, 0.0594024658203125, 0.07054901123046875, 0.081695556640625, 0.09284210205078125, 0.1039886474609375, 0.11513519287109375, 0.12628173828125, 0.13742828369140625, 0.1485748291015625, 0.15972137451171875, 0.170867919921875, 0.18201446533203125, 0.1931610107421875, 0.20430755615234375, 0.2154541015625, 0.22660064697265625, 0.2377471923828125, 0.24889373779296875, 0.260040283203125, 0.27118682861328125, 0.2823333740234375, 0.29347991943359375, 0.30462646484375, 0.31577301025390625, 0.3269195556640625, 0.33806610107421875, 0.349212646484375, 0.36035919189453125, 0.3715057373046875, 0.38265228271484375, 0.393798828125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 3.0, 1.0, 1.0, 5.0, 4.0, 5.0, 13.0, 20.0, 30.0, 33.0, 42.0, 58.0, 72.0, 71.0, 76.0, 69.0, 100.0, 82.0, 71.0, 70.0, 52.0, 27.0, 30.0, 19.0, 20.0, 12.0, 5.0, 6.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2015380859375, -0.19476699829101562, -0.18799591064453125, -0.18122482299804688, -0.1744537353515625, -0.16768264770507812, -0.16091156005859375, -0.15414047241210938, -0.147369384765625, -0.14059829711914062, -0.13382720947265625, -0.12705612182617188, -0.1202850341796875, -0.11351394653320312, -0.10674285888671875, -0.09997177124023438, -0.09320068359375, -0.08642959594726562, -0.07965850830078125, -0.07288742065429688, -0.0661163330078125, -0.059345245361328125, -0.05257415771484375, -0.045803070068359375, -0.039031982421875, -0.032260894775390625, -0.02548980712890625, -0.018718719482421875, -0.0119476318359375, -0.005176544189453125, 0.00159454345703125, 0.008365631103515625, 0.01513671875, 0.021907806396484375, 0.02867889404296875, 0.035449981689453125, 0.0422210693359375, 0.048992156982421875, 0.05576324462890625, 0.06253433227539062, 0.069305419921875, 0.07607650756835938, 0.08284759521484375, 0.08961868286132812, 0.0963897705078125, 0.10316085815429688, 0.10993194580078125, 0.11670303344726562, 0.12347412109375, 0.13024520874023438, 0.13701629638671875, 0.14378738403320312, 0.1505584716796875, 0.15732955932617188, 0.16410064697265625, 0.17087173461914062, 0.177642822265625, 0.18441390991210938, 0.19118499755859375, 0.19795608520507812, 0.2047271728515625, 0.21149826049804688, 0.21826934814453125, 0.22504043579101562, 0.2318115234375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 6.0, 7.0, 8.0, 10.0, 5.0, 13.0, 23.0, 23.0, 37.0, 40.0, 64.0, 86.0, 118.0, 180.0, 338.0, 629.0, 1695.0, 5969.0, 41641.0, 871731.0, 111030.0, 10570.0, 2408.0, 873.0, 410.0, 211.0, 135.0, 85.0, 43.0, 50.0, 33.0, 24.0, 13.0, 9.0, 15.0, 6.0, 5.0, 4.0, 5.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.3701171875, -0.3600273132324219, -0.34993743896484375, -0.3398475646972656, -0.3297576904296875, -0.3196678161621094, -0.30957794189453125, -0.2994880676269531, -0.289398193359375, -0.2793083190917969, -0.26921844482421875, -0.2591285705566406, -0.2490386962890625, -0.23894882202148438, -0.22885894775390625, -0.21876907348632812, -0.20867919921875, -0.19858932495117188, -0.18849945068359375, -0.17840957641601562, -0.1683197021484375, -0.15822982788085938, -0.14813995361328125, -0.13805007934570312, -0.127960205078125, -0.11787033081054688, -0.10778045654296875, -0.09769058227539062, -0.0876007080078125, -0.07751083374023438, -0.06742095947265625, -0.057331085205078125, -0.0472412109375, -0.037151336669921875, -0.02706146240234375, -0.016971588134765625, -0.0068817138671875, 0.003208160400390625, 0.01329803466796875, 0.023387908935546875, 0.033477783203125, 0.043567657470703125, 0.05365753173828125, 0.06374740600585938, 0.0738372802734375, 0.08392715454101562, 0.09401702880859375, 0.10410690307617188, 0.11419677734375, 0.12428665161132812, 0.13437652587890625, 0.14446640014648438, 0.1545562744140625, 0.16464614868164062, 0.17473602294921875, 0.18482589721679688, 0.194915771484375, 0.20500564575195312, 0.21509552001953125, 0.22518539428710938, 0.2352752685546875, 0.24536514282226562, 0.25545501708984375, 0.2655448913574219, 0.275634765625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 5.0, 6.0, 8.0, 9.0, 10.0, 12.0, 20.0, 28.0, 28.0, 28.0, 38.0, 40.0, 52.0, 84.0, 89.0, 98.0, 93.0, 79.0, 57.0, 47.0, 29.0, 24.0, 19.0, 22.0, 20.0, 17.0, 9.0, 7.0, 8.0, 7.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.8486328125, -0.827789306640625, -0.80694580078125, -0.786102294921875, -0.7652587890625, -0.744415283203125, -0.72357177734375, -0.702728271484375, -0.681884765625, -0.661041259765625, -0.64019775390625, -0.619354248046875, -0.5985107421875, -0.577667236328125, -0.55682373046875, -0.535980224609375, -0.51513671875, -0.494293212890625, -0.47344970703125, -0.452606201171875, -0.4317626953125, -0.410919189453125, -0.39007568359375, -0.369232177734375, -0.348388671875, -0.327545166015625, -0.30670166015625, -0.285858154296875, -0.2650146484375, -0.244171142578125, -0.22332763671875, -0.202484130859375, -0.181640625, -0.160797119140625, -0.13995361328125, -0.119110107421875, -0.0982666015625, -0.077423095703125, -0.05657958984375, -0.035736083984375, -0.014892578125, 0.005950927734375, 0.02679443359375, 0.047637939453125, 0.0684814453125, 0.089324951171875, 0.11016845703125, 0.131011962890625, 0.15185546875, 0.172698974609375, 0.19354248046875, 0.214385986328125, 0.2352294921875, 0.256072998046875, 0.27691650390625, 0.297760009765625, 0.318603515625, 0.339447021484375, 0.36029052734375, 0.381134033203125, 0.4019775390625, 0.422821044921875, 0.44366455078125, 0.464508056640625, 0.4853515625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 5.0, 3.0, 2.0, 7.0, 6.0, 6.0, 9.0, 17.0, 16.0, 23.0, 39.0, 63.0, 90.0, 142.0, 252.0, 529.0, 1108.0, 2760.0, 8171.0, 35201.0, 833650.0, 139401.0, 18042.0, 5194.0, 1968.0, 842.0, 403.0, 226.0, 131.0, 79.0, 60.0, 30.0, 21.0, 18.0, 19.0, 6.0, 1.0, 7.0, 9.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0740966796875, -0.07213640213012695, -0.0701761245727539, -0.06821584701538086, -0.06625556945800781, -0.06429529190063477, -0.06233501434326172, -0.06037473678588867, -0.058414459228515625, -0.05645418167114258, -0.05449390411376953, -0.052533626556396484, -0.05057334899902344, -0.04861307144165039, -0.046652793884277344, -0.0446925163269043, -0.04273223876953125, -0.0407719612121582, -0.038811683654785156, -0.03685140609741211, -0.03489112854003906, -0.032930850982666016, -0.03097057342529297, -0.029010295867919922, -0.027050018310546875, -0.025089740753173828, -0.02312946319580078, -0.021169185638427734, -0.019208908081054688, -0.01724863052368164, -0.015288352966308594, -0.013328075408935547, -0.0113677978515625, -0.009407520294189453, -0.007447242736816406, -0.005486965179443359, -0.0035266876220703125, -0.0015664100646972656, 0.00039386749267578125, 0.002354145050048828, 0.004314422607421875, 0.006274700164794922, 0.008234977722167969, 0.010195255279541016, 0.012155532836914062, 0.01411581039428711, 0.016076087951660156, 0.018036365509033203, 0.01999664306640625, 0.021956920623779297, 0.023917198181152344, 0.02587747573852539, 0.027837753295898438, 0.029798030853271484, 0.03175830841064453, 0.03371858596801758, 0.035678863525390625, 0.03763914108276367, 0.03959941864013672, 0.041559696197509766, 0.04351997375488281, 0.04548025131225586, 0.047440528869628906, 0.04940080642700195, 0.051361083984375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 6.0, 7.0, 2.0, 4.0, 7.0, 9.0, 11.0, 13.0, 11.0, 23.0, 30.0, 42.0, 47.0, 46.0, 75.0, 100.0, 109.0, 78.0, 73.0, 63.0, 56.0, 53.0, 30.0, 13.0, 17.0, 15.0, 13.0, 9.0, 8.0, 4.0, 3.0, 8.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6166439056396484e-05, -2.5323592126369476e-05, -2.4480745196342468e-05, -2.363789826631546e-05, -2.2795051336288452e-05, -2.1952204406261444e-05, -2.1109357476234436e-05, -2.0266510546207428e-05, -1.942366361618042e-05, -1.8580816686153412e-05, -1.7737969756126404e-05, -1.6895122826099396e-05, -1.6052275896072388e-05, -1.520942896604538e-05, -1.4366582036018372e-05, -1.3523735105991364e-05, -1.2680888175964355e-05, -1.1838041245937347e-05, -1.099519431591034e-05, -1.0152347385883331e-05, -9.309500455856323e-06, -8.466653525829315e-06, -7.623806595802307e-06, -6.780959665775299e-06, -5.938112735748291e-06, -5.095265805721283e-06, -4.252418875694275e-06, -3.409571945667267e-06, -2.566725015640259e-06, -1.7238780856132507e-06, -8.810311555862427e-07, -3.818422555923462e-08, 8.046627044677734e-07, 1.6475096344947815e-06, 2.4903565645217896e-06, 3.3332034945487976e-06, 4.176050424575806e-06, 5.018897354602814e-06, 5.861744284629822e-06, 6.70459121465683e-06, 7.547438144683838e-06, 8.390285074710846e-06, 9.233132004737854e-06, 1.0075978934764862e-05, 1.091882586479187e-05, 1.1761672794818878e-05, 1.2604519724845886e-05, 1.3447366654872894e-05, 1.4290213584899902e-05, 1.513306051492691e-05, 1.597590744495392e-05, 1.6818754374980927e-05, 1.7661601305007935e-05, 1.8504448235034943e-05, 1.934729516506195e-05, 2.019014209508896e-05, 2.1032989025115967e-05, 2.1875835955142975e-05, 2.2718682885169983e-05, 2.356152981519699e-05, 2.4404376745224e-05, 2.5247223675251007e-05, 2.6090070605278015e-05, 2.6932917535305023e-05, 2.777576446533203e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 3.0, 4.0, 4.0, 13.0, 19.0, 14.0, 20.0, 42.0, 63.0, 84.0, 133.0, 180.0, 354.0, 569.0, 1082.0, 2085.0, 4539.0, 11174.0, 33435.0, 206948.0, 713746.0, 47890.0, 14635.0, 5699.0, 2644.0, 1335.0, 705.0, 414.0, 251.0, 147.0, 91.0, 73.0, 46.0, 26.0, 35.0, 17.0, 11.0, 11.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.041229248046875, -0.039813995361328125, -0.03839874267578125, -0.036983489990234375, -0.0355682373046875, -0.034152984619140625, -0.03273773193359375, -0.031322479248046875, -0.0299072265625, -0.028491973876953125, -0.02707672119140625, -0.025661468505859375, -0.0242462158203125, -0.022830963134765625, -0.02141571044921875, -0.020000457763671875, -0.018585205078125, -0.017169952392578125, -0.01575469970703125, -0.014339447021484375, -0.0129241943359375, -0.011508941650390625, -0.01009368896484375, -0.008678436279296875, -0.00726318359375, -0.005847930908203125, -0.00443267822265625, -0.003017425537109375, -0.0016021728515625, -0.000186920166015625, 0.00122833251953125, 0.002643585205078125, 0.004058837890625, 0.005474090576171875, 0.00688934326171875, 0.008304595947265625, 0.0097198486328125, 0.011135101318359375, 0.01255035400390625, 0.013965606689453125, 0.015380859375, 0.016796112060546875, 0.01821136474609375, 0.019626617431640625, 0.0210418701171875, 0.022457122802734375, 0.02387237548828125, 0.025287628173828125, 0.026702880859375, 0.028118133544921875, 0.02953338623046875, 0.030948638916015625, 0.0323638916015625, 0.033779144287109375, 0.03519439697265625, 0.036609649658203125, 0.03802490234375, 0.039440155029296875, 0.04085540771484375, 0.042270660400390625, 0.0436859130859375, 0.045101165771484375, 0.04651641845703125, 0.047931671142578125, 0.049346923828125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 3.0, 2.0, 9.0, 10.0, 6.0, 7.0, 17.0, 14.0, 18.0, 22.0, 27.0, 40.0, 57.0, 65.0, 92.0, 131.0, 90.0, 85.0, 70.0, 50.0, 35.0, 27.0, 21.0, 21.0, 17.0, 10.0, 9.0, 8.0, 7.0, 9.0, 3.0, 5.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05010986328125, -0.04842948913574219, -0.046749114990234375, -0.04506874084472656, -0.04338836669921875, -0.04170799255371094, -0.040027618408203125, -0.03834724426269531, -0.0366668701171875, -0.03498649597167969, -0.033306121826171875, -0.03162574768066406, -0.02994537353515625, -0.028264999389648438, -0.026584625244140625, -0.024904251098632812, -0.023223876953125, -0.021543502807617188, -0.019863128662109375, -0.018182754516601562, -0.01650238037109375, -0.014822006225585938, -0.013141632080078125, -0.011461257934570312, -0.0097808837890625, -0.008100509643554688, -0.006420135498046875, -0.0047397613525390625, -0.00305938720703125, -0.0013790130615234375, 0.000301361083984375, 0.0019817352294921875, 0.003662109375, 0.0053424835205078125, 0.007022857666015625, 0.008703231811523438, 0.01038360595703125, 0.012063980102539062, 0.013744354248046875, 0.015424728393554688, 0.0171051025390625, 0.018785476684570312, 0.020465850830078125, 0.022146224975585938, 0.02382659912109375, 0.025506973266601562, 0.027187347412109375, 0.028867721557617188, 0.030548095703125, 0.03222846984863281, 0.033908843994140625, 0.03558921813964844, 0.03726959228515625, 0.03894996643066406, 0.040630340576171875, 0.04231071472167969, 0.0439910888671875, 0.04567146301269531, 0.047351837158203125, 0.04903221130371094, 0.05071258544921875, 0.05239295959472656, 0.054073333740234375, 0.05575370788574219, 0.05743408203125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 5.0, 9.0, 17.0, 26.0, 44.0, 89.0, 398.0, 248.0, 96.0, 27.0, 14.0, 12.0, 6.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7262933254241943, -2.6408090591430664, -2.5553250312805176, -2.4698407649993896, -2.3843564987182617, -2.298872470855713, -2.213388204574585, -2.127903938293457, -2.042419910430908, -1.9569357633590698, -1.871451497077942, -1.7859673500061035, -1.7004830837249756, -1.6149989366531372, -1.5295147895812988, -1.444030523300171, -1.358546257019043, -1.2730621099472046, -1.1875778436660767, -1.1020936965942383, -1.0166094303131104, -0.931125283241272, -0.8456411361694336, -0.7601569294929504, -0.6746727228164673, -0.5891885161399841, -0.503704309463501, -0.4182201623916626, -0.33273595571517944, -0.2472517490386963, -0.1617676019668579, -0.07628339529037476, 0.0092010498046875, 0.09468524158000946, 0.18016943335533142, 0.2656536102294922, 0.35113781690597534, 0.4366220235824585, 0.5221061706542969, 0.60759037733078, 0.6930745840072632, 0.7785587906837463, 0.8640429973602295, 0.9495271444320679, 1.0350112915039062, 1.1204955577850342, 1.2059797048568726, 1.291463851928711, 1.3769481182098389, 1.4624322652816772, 1.5479165315628052, 1.6334006786346436, 1.7188849449157715, 1.8043690919876099, 1.8898532390594482, 1.9753375053405762, 2.060821533203125, 2.146305799484253, 2.2317898273468018, 2.3172740936279297, 2.4027583599090576, 2.4882426261901855, 2.5737266540527344, 2.6592109203338623, 2.7446951866149902]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 3.0, 7.0, 14.0, 14.0, 10.0, 21.0, 18.0, 24.0, 30.0, 21.0, 56.0, 98.0, 292.0, 123.0, 55.0, 34.0, 29.0, 27.0, 35.0, 19.0, 26.0, 16.0, 7.0, 5.0, 1.0, 3.0, 6.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-2.7694602012634277, -2.7011349201202393, -2.632809638977051, -2.5644843578338623, -2.496159076690674, -2.4278337955474854, -2.359508514404297, -2.2911832332611084, -2.22285795211792, -2.1545326709747314, -2.086207389831543, -2.0178821086883545, -1.949556827545166, -1.8812315464019775, -1.812906265258789, -1.7445809841156006, -1.6762555837631226, -1.607930302619934, -1.5396050214767456, -1.4712797403335571, -1.4029544591903687, -1.3346291780471802, -1.2663037776947021, -1.1979784965515137, -1.1296532154083252, -1.0613279342651367, -0.9930026531219482, -0.9246773719787598, -0.8563520908355713, -0.7880268096923828, -0.7197014689445496, -0.6513761878013611, -0.5830509662628174, -0.5147256851196289, -0.44640040397644043, -0.37807509303092957, -0.3097498118877411, -0.2414245307445526, -0.17309921979904175, -0.10477393865585327, -0.036448657512664795, 0.03187663108110428, 0.10020191967487335, 0.16852721571922302, 0.2368524968624115, 0.3051777780056, 0.37350308895111084, 0.4418283700942993, 0.5101536512374878, 0.5784789323806763, 0.6468042135238647, 0.7151294946670532, 0.7834547758102417, 0.8517800569534302, 0.9201053977012634, 0.9884306788444519, 1.0567560195922852, 1.1250813007354736, 1.193406581878662, 1.2617318630218506, 1.330057144165039, 1.3983824253082275, 1.466707706451416, 1.5350329875946045, 1.603358268737793]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 3.0, 2.0, 6.0, 7.0, 15.0, 18.0, 22.0, 23.0, 44.0, 38.0, 54.0, 63.0, 220.0, 159.0, 74.0, 57.0, 36.0, 46.0, 24.0, 20.0, 26.0, 16.0, 3.0, 11.0, 7.0, 6.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1494140625, -0.14316940307617188, -0.13692474365234375, -0.13068008422851562, -0.1244354248046875, -0.11819076538085938, -0.11194610595703125, -0.10570144653320312, -0.099456787109375, -0.09321212768554688, -0.08696746826171875, -0.08072280883789062, -0.0744781494140625, -0.06823348999023438, -0.06198883056640625, -0.055744171142578125, -0.04949951171875, -0.043254852294921875, -0.03701019287109375, -0.030765533447265625, -0.0245208740234375, -0.018276214599609375, -0.01203155517578125, -0.005786895751953125, 0.000457763671875, 0.006702423095703125, 0.01294708251953125, 0.019191741943359375, 0.0254364013671875, 0.031681060791015625, 0.03792572021484375, 0.044170379638671875, 0.0504150390625, 0.056659698486328125, 0.06290435791015625, 0.06914901733398438, 0.0753936767578125, 0.08163833618164062, 0.08788299560546875, 0.09412765502929688, 0.100372314453125, 0.10661697387695312, 0.11286163330078125, 0.11910629272460938, 0.1253509521484375, 0.13159561157226562, 0.13784027099609375, 0.14408493041992188, 0.15032958984375, 0.15657424926757812, 0.16281890869140625, 0.16906356811523438, 0.1753082275390625, 0.18155288696289062, 0.18779754638671875, 0.19404220581054688, 0.200286865234375, 0.20653152465820312, 0.21277618408203125, 0.21902084350585938, 0.2252655029296875, 0.23151016235351562, 0.23775482177734375, 0.24399948120117188, 0.250244140625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 8.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 7.0, 9.0, 5.0, 8.0, 13.0, 29.0, 42.0, 78.0, 96.0, 255.0, 985.0, 7980.0, 8365612.0, 11657.0, 1196.0, 279.0, 133.0, 81.0, 46.0, 16.0, 4.0, 8.0, 10.0, 3.0, 6.0, 5.0, 3.0, 4.0, 5.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5400357246398926, -2.4705750942230225, -2.4011144638061523, -2.3316540718078613, -2.262193441390991, -2.192732810974121, -2.12327241897583, -2.05381178855896, -1.9843511581420898, -1.9148905277252197, -1.8454300165176392, -1.7759695053100586, -1.7065088748931885, -1.6370482444763184, -1.5675877332687378, -1.4981272220611572, -1.428666591644287, -1.359205961227417, -1.2897454500198364, -1.2202849388122559, -1.1508243083953857, -1.0813636779785156, -1.011903166770935, -0.9424425959587097, -0.8729820251464844, -0.803521454334259, -0.7340608835220337, -0.6646003127098083, -0.595139741897583, -0.5256791710853577, -0.4562186002731323, -0.386758029460907, -0.31729745864868164, -0.2478368878364563, -0.17837631702423096, -0.10891574621200562, -0.03945517539978027, 0.03000539541244507, 0.09946596622467041, 0.16892653703689575, 0.2383871078491211, 0.30784767866134644, 0.3773082494735718, 0.4467688202857971, 0.5162293910980225, 0.5856899619102478, 0.6551505327224731, 0.7246111035346985, 0.7940716743469238, 0.8635322451591492, 0.9329928159713745, 1.002453327178955, 1.0719139575958252, 1.1413745880126953, 1.2108350992202759, 1.2802956104278564, 1.3497562408447266, 1.4192168712615967, 1.4886773824691772, 1.5581378936767578, 1.627598524093628, 1.697059154510498, 1.7665196657180786, 1.8359801769256592, 1.9054408073425293]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 2.0, 5.0, 4.0, 4.0, 2.0, 2.0, 6.0, 6.0, 6.0, 3.0, 12.0, 3.0, 4.0, 5.0, 2.0, 3.0, 5.0, 3.0, 5.0, 4.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.945923328399658, -3.8382351398468018, -3.7305469512939453, -3.622858762741089, -3.5151705741882324, -3.407482385635376, -3.2997941970825195, -3.192105770111084, -3.0844178199768066, -2.97672963142395, -2.8690414428710938, -2.7613532543182373, -2.653665065765381, -2.5459768772125244, -2.438288688659668, -2.3306002616882324, -2.222912073135376, -2.1152238845825195, -2.007535696029663, -1.8998475074768066, -1.7921593189239502, -1.6844711303710938, -1.5767828226089478, -1.4690946340560913, -1.3614064455032349, -1.2537182569503784, -1.146030068397522, -1.038341760635376, -0.9306536316871643, -0.8229654431343079, -0.7152771949768066, -0.6075890064239502, -0.49990105628967285, -0.3922128677368164, -0.2845246493816376, -0.17683643102645874, -0.0691482424736023, 0.03853994607925415, 0.14622819423675537, 0.2539163827896118, 0.36160457134246826, 0.4692927598953247, 0.5769809484481812, 0.6846691966056824, 0.7923573851585388, 0.9000455737113953, 1.0077338218688965, 1.115422010421753, 1.2231101989746094, 1.3307983875274658, 1.4384865760803223, 1.5461747646331787, 1.6538629531860352, 1.7615511417388916, 1.8692394495010376, 1.976927638053894, 2.084615707397461, 2.1923038959503174, 2.299992084503174, 2.4076802730560303, 2.5153684616088867, 2.623056650161743, 2.7307448387145996, 2.838433265686035, 2.9461214542388916]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 4.0, 6.0, 7.0, 11.0, 20.0, 16.0, 34.0, 44.0, 59.0, 64.0, 88.0, 89.0, 97.0, 107.0, 94.0, 60.0, 50.0, 35.0, 26.0, 29.0, 12.0, 12.0, 9.0, 12.0, 5.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08526611328125, -0.08197498321533203, -0.07868385314941406, -0.0753927230834961, -0.07210159301757812, -0.06881046295166016, -0.06551933288574219, -0.06222820281982422, -0.05893707275390625, -0.05564594268798828, -0.05235481262207031, -0.049063682556152344, -0.045772552490234375, -0.042481422424316406, -0.03919029235839844, -0.03589916229248047, -0.0326080322265625, -0.02931690216064453, -0.026025772094726562, -0.022734642028808594, -0.019443511962890625, -0.016152381896972656, -0.012861251831054688, -0.009570121765136719, -0.00627899169921875, -0.0029878616333007812, 0.0003032684326171875, 0.0035943984985351562, 0.006885528564453125, 0.010176658630371094, 0.013467788696289062, 0.01675891876220703, 0.020050048828125, 0.02334117889404297, 0.026632308959960938, 0.029923439025878906, 0.033214569091796875, 0.036505699157714844, 0.03979682922363281, 0.04308795928955078, 0.04637908935546875, 0.04967021942138672, 0.05296134948730469, 0.056252479553222656, 0.059543609619140625, 0.0628347396850586, 0.06612586975097656, 0.06941699981689453, 0.0727081298828125, 0.07599925994873047, 0.07929039001464844, 0.0825815200805664, 0.08587265014648438, 0.08916378021240234, 0.09245491027832031, 0.09574604034423828, 0.09903717041015625, 0.10232830047607422, 0.10561943054199219, 0.10891056060791016, 0.11220169067382812, 0.1154928207397461, 0.11878395080566406, 0.12207508087158203, 0.1253662109375]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 0.0, 2.0, 1.0, 6.0, 9.0, 4.0, 10.0, 22.0, 27.0, 47.0, 45.0, 97.0, 119.0, 210.0, 306.0, 469.0, 873.0, 1436.0, 2692.0, 5425.0, 11095.0, 24335.0, 55575.0, 120951.0, 151844.0, 81525.0, 35437.0, 16000.0, 7386.0, 3687.0, 1905.0, 1056.0, 571.0, 382.0, 241.0, 132.0, 111.0, 80.0, 49.0, 27.0, 21.0, 21.0, 10.0, 10.0, 12.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.75634765625, -0.7342529296875, -0.712158203125, -0.6900634765625, -0.66796875, -0.6458740234375, -0.623779296875, -0.6016845703125, -0.57958984375, -0.5574951171875, -0.535400390625, -0.5133056640625, -0.4912109375, -0.4691162109375, -0.447021484375, -0.4249267578125, -0.40283203125, -0.3807373046875, -0.358642578125, -0.3365478515625, -0.314453125, -0.2923583984375, -0.270263671875, -0.2481689453125, -0.22607421875, -0.2039794921875, -0.181884765625, -0.1597900390625, -0.1376953125, -0.1156005859375, -0.093505859375, -0.0714111328125, -0.04931640625, -0.0272216796875, -0.005126953125, 0.0169677734375, 0.0390625, 0.0611572265625, 0.083251953125, 0.1053466796875, 0.12744140625, 0.1495361328125, 0.171630859375, 0.1937255859375, 0.2158203125, 0.2379150390625, 0.260009765625, 0.2821044921875, 0.30419921875, 0.3262939453125, 0.348388671875, 0.3704833984375, 0.392578125, 0.4146728515625, 0.436767578125, 0.4588623046875, 0.48095703125, 0.5030517578125, 0.525146484375, 0.5472412109375, 0.5693359375, 0.5914306640625, 0.613525390625, 0.6356201171875, 0.65771484375]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 5.0, 6.0, 8.0, 5.0, 14.0, 12.0, 24.0, 21.0, 26.0, 29.0, 39.0, 60.0, 53.0, 69.0, 84.0, 62.0, 80.0, 68.0, 81.0, 57.0, 43.0, 40.0, 31.0, 25.0, 13.0, 12.0, 11.0, 13.0, 3.0, 3.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.2122802734375, -0.20678329467773438, -0.20128631591796875, -0.19578933715820312, -0.1902923583984375, -0.18479537963867188, -0.17929840087890625, -0.17380142211914062, -0.168304443359375, -0.16280746459960938, -0.15731048583984375, -0.15181350708007812, -0.1463165283203125, -0.14081954956054688, -0.13532257080078125, -0.12982559204101562, -0.12432861328125, -0.11883163452148438, -0.11333465576171875, -0.10783767700195312, -0.1023406982421875, -0.09684371948242188, -0.09134674072265625, -0.08584976196289062, -0.080352783203125, -0.07485580444335938, -0.06935882568359375, -0.06386184692382812, -0.0583648681640625, -0.052867889404296875, -0.04737091064453125, -0.041873931884765625, -0.036376953125, -0.030879974365234375, -0.02538299560546875, -0.019886016845703125, -0.0143890380859375, -0.008892059326171875, -0.00339508056640625, 0.002101898193359375, 0.007598876953125, 0.013095855712890625, 0.01859283447265625, 0.024089813232421875, 0.0295867919921875, 0.035083770751953125, 0.04058074951171875, 0.046077728271484375, 0.05157470703125, 0.057071685791015625, 0.06256866455078125, 0.06806564331054688, 0.0735626220703125, 0.07905960083007812, 0.08455657958984375, 0.09005355834960938, 0.095550537109375, 0.10104751586914062, 0.10654449462890625, 0.11204147338867188, 0.1175384521484375, 0.12303543090820312, 0.12853240966796875, 0.13402938842773438, 0.1395263671875]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 7.0, 4.0, 18.0, 23.0, 41.0, 84.0, 93.0, 90.0, 56.0, 25.0, 12.0, 8.0, 10.0, 6.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8905225992202759, -0.8457006216049194, -0.8008787035942078, -0.7560567855834961, -0.7112348079681396, -0.6664128303527832, -0.6215909123420715, -0.5767689943313599, -0.5319470167160034, -0.48712506890296936, -0.4423031210899353, -0.39748117327690125, -0.3526592254638672, -0.30783727765083313, -0.2630153298377991, -0.21819338202476501, -0.17337143421173096, -0.1285494863986969, -0.08372753858566284, -0.038905590772628784, 0.0059163570404052734, 0.05073830485343933, 0.09556025266647339, 0.14038220047950745, 0.1852041482925415, 0.23002609610557556, 0.2748480439186096, 0.3196699917316437, 0.36449193954467773, 0.4093138873577118, 0.45413583517074585, 0.4989577829837799, 0.5437796115875244, 0.5886015892028809, 0.6334235072135925, 0.6782454252243042, 0.7230674028396606, 0.7678893804550171, 0.8127112984657288, 0.8575332164764404, 0.9023551940917969, 0.9471771717071533, 0.991999089717865, 1.0368210077285767, 1.081642985343933, 1.1264649629592896, 1.1712868213653564, 1.216108798980713, 1.2609307765960693, 1.3057527542114258, 1.3505747318267822, 1.3953965902328491, 1.4402185678482056, 1.485040545463562, 1.529862403869629, 1.5746843814849854, 1.6195063591003418, 1.6643283367156982, 1.7091503143310547, 1.7539721727371216, 1.798794150352478, 1.8436161279678345, 1.8884379863739014, 1.9332599639892578, 1.9780819416046143]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 3.0, 0.0, 4.0, 3.0, 3.0, 10.0, 7.0, 6.0, 6.0, 16.0, 31.0, 25.0, 41.0, 48.0, 43.0, 48.0, 34.0, 35.0, 30.0, 16.0, 16.0, 10.0, 7.0, 11.0, 3.0, 3.0, 1.0, 1.0, 5.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.5323032736778259, -0.5148088335990906, -0.49731433391571045, -0.4798198640346527, -0.46232539415359497, -0.4448309540748596, -0.4273364841938019, -0.40984201431274414, -0.3923475444316864, -0.37485307455062866, -0.3573586046695709, -0.3398641347885132, -0.32236969470977783, -0.3048751950263977, -0.28738075494766235, -0.2698862850666046, -0.2523918151855469, -0.23489734530448914, -0.2174028754234314, -0.19990842044353485, -0.1824139505624771, -0.16491948068141937, -0.14742502570152283, -0.1299305558204651, -0.11243608593940735, -0.09494161605834961, -0.07744715362787247, -0.059952687472105026, -0.042458221316337585, -0.024963751435279846, -0.007469289004802704, 0.010025173425674438, 0.027519702911376953, 0.045014169067144394, 0.06250863522291183, 0.08000309765338898, 0.09749756753444672, 0.11499203741550446, 0.132486492395401, 0.14998096227645874, 0.16747543215751648, 0.18496990203857422, 0.20246437191963196, 0.2199588268995285, 0.23745329678058624, 0.2549477815628052, 0.2724422216415405, 0.28993669152259827, 0.307431161403656, 0.32492563128471375, 0.3424201011657715, 0.3599145710468292, 0.37740904092788696, 0.3949034810066223, 0.41239795088768005, 0.4298924207687378, 0.44738689064979553, 0.46488136053085327, 0.482375830411911, 0.49987030029296875, 0.5173647403717041, 0.5348592400550842, 0.5523536801338196, 0.5698481798171997, 0.5873426198959351]}, "train/train_runtime": 5009.4893, "train/train_samples_per_second": 5.697, "train/train_steps_per_second": 0.178, "train/total_flos": 0.0, "train/train_loss": 4.8473983449786235, "eval/loss": 3.5855588912963867, "eval/wer": 1.32929393097977, "eval/runtime": 681.9871, "eval/samples_per_second": 3.874, "eval/steps_per_second": 0.485} \ No newline at end of file