diff --git "a/wandb/run-20220505_173818-i9acyhfo/files/wandb-summary.json" "b/wandb/run-20220505_173818-i9acyhfo/files/wandb-summary.json" --- "a/wandb/run-20220505_173818-i9acyhfo/files/wandb-summary.json" +++ "b/wandb/run-20220505_173818-i9acyhfo/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 1.0364, "train/learning_rate": 2.525229357798165e-05, "train/epoch": 2.78, "train/global_step": 4500, "_runtime": 64734, "_timestamp": 1651837032, "_step": 4508, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 3.0, 15.0, 61.0, 148.0, 221.0, 273.0, 171.0, 90.0, 29.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1353365182876587, -0.9496013522148132, -0.7638661861419678, -0.5781310796737671, -0.39239591360092163, -0.20666074752807617, -0.02092564105987549, 0.16480958461761475, 0.35054469108581543, 0.5362798571586609, 0.7220150232315063, 0.907750129699707, 1.0934853553771973, 1.279220461845398, 1.4649555683135986, 1.6506907939910889, 1.8364259004592896, 2.0221610069274902, 2.2078962326049805, 2.3936314582824707, 2.579366445541382, 2.765101671218872, 2.950836658477783, 3.1365718841552734, 3.3223071098327637, 3.508042335510254, 3.693777322769165, 3.8795125484466553, 4.065247535705566, 4.250982761383057, 4.436717987060547, 4.622453212738037, 4.808187961578369, 4.993923187255859, 5.17965841293335, 5.36539363861084, 5.551128387451172, 5.736863613128662, 5.922598838806152, 6.108334064483643, 6.294069290161133, 6.479804515838623, 6.665539741516113, 6.851274490356445, 7.0370097160339355, 7.222744941711426, 7.408480167388916, 7.594215393066406, 7.779950141906738, 7.9656853675842285, 8.151420593261719, 8.33715534210205, 8.5228910446167, 8.708625793457031, 8.89436149597168, 9.080096244812012, 9.26583194732666, 9.451566696166992, 9.63730239868164, 9.823037147521973, 10.008772850036621, 10.194507598876953, 10.380243301391602, 10.565978050231934, 10.751712799072266]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 8.0, 4.0, 6.0, 11.0, 8.0, 14.0, 10.0, 15.0, 18.0, 16.0, 13.0, 28.0, 28.0, 34.0, 26.0, 38.0, 29.0, 36.0, 40.0, 58.0, 39.0, 35.0, 45.0, 49.0, 39.0, 33.0, 30.0, 30.0, 38.0, 33.0, 24.0, 17.0, 25.0, 23.0, 13.0, 19.0, 15.0, 11.0, 12.0, 10.0, 4.0, 7.0, 7.0, 3.0, 0.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8245123624801636, -1.7663763761520386, -1.7082405090332031, -1.6501045227050781, -1.5919686555862427, -1.5338326692581177, -1.4756968021392822, -1.4175608158111572, -1.3594249486923218, -1.3012889623641968, -1.2431530952453613, -1.1850171089172363, -1.1268812417984009, -1.0687452554702759, -1.0106093883514404, -0.9524734020233154, -0.8943374752998352, -0.836201548576355, -0.7780656218528748, -0.7199296951293945, -0.6617937684059143, -0.6036578416824341, -0.5455218553543091, -0.48738595843315125, -0.429250031709671, -0.3711141049861908, -0.31297817826271057, -0.25484222173690796, -0.19670630991458893, -0.1385703682899475, -0.08043444156646729, -0.02229851484298706, 0.035837411880493164, 0.09397333860397339, 0.1521092653274536, 0.21024520695209503, 0.26838111877441406, 0.3265170753002167, 0.3846530020236969, 0.4427889287471771, 0.500924825668335, 0.5590607523918152, 0.6171966791152954, 0.6753326058387756, 0.7334685325622559, 0.7916045188903809, 0.8497403860092163, 0.9078763723373413, 0.9660122990608215, 1.0241482257843018, 1.0822842121124268, 1.1404200792312622, 1.1985560655593872, 1.2566919326782227, 1.3148279190063477, 1.372963786125183, 1.431099772453308, 1.489235758781433, 1.5473716259002686, 1.6055076122283936, 1.663643479347229, 1.721779465675354, 1.7799153327941895, 1.8380513191223145, 1.89618718624115]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 6.0, 6.0, 6.0, 9.0, 5.0, 16.0, 24.0, 28.0, 54.0, 86.0, 156.0, 224.0, 365.0, 592.0, 1170.0, 2104.0, 4120.0, 8333.0, 18769.0, 46320.0, 133166.0, 487299.0, 1931996.0, 1147121.0, 274746.0, 82744.0, 30181.0, 12620.0, 5903.0, 2832.0, 1484.0, 778.0, 407.0, 251.0, 128.0, 80.0, 53.0, 32.0, 32.0, 15.0, 8.0, 11.0, 3.0, 6.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-2.810546875, -2.729736328125, -2.64892578125, -2.568115234375, -2.4873046875, -2.406494140625, -2.32568359375, -2.244873046875, -2.1640625, -2.083251953125, -2.00244140625, -1.921630859375, -1.8408203125, -1.760009765625, -1.67919921875, -1.598388671875, -1.517578125, -1.436767578125, -1.35595703125, -1.275146484375, -1.1943359375, -1.113525390625, -1.03271484375, -0.951904296875, -0.87109375, -0.790283203125, -0.70947265625, -0.628662109375, -0.5478515625, -0.467041015625, -0.38623046875, -0.305419921875, -0.224609375, -0.143798828125, -0.06298828125, 0.017822265625, 0.0986328125, 0.179443359375, 0.26025390625, 0.341064453125, 0.421875, 0.502685546875, 0.58349609375, 0.664306640625, 0.7451171875, 0.825927734375, 0.90673828125, 0.987548828125, 1.068359375, 1.149169921875, 1.22998046875, 1.310791015625, 1.3916015625, 1.472412109375, 1.55322265625, 1.634033203125, 1.71484375, 1.795654296875, 1.87646484375, 1.957275390625, 2.0380859375, 2.118896484375, 2.19970703125, 2.280517578125, 2.361328125]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 5.0, 9.0, 13.0, 10.0, 8.0, 2.0, 17.0, 13.0, 34.0, 15.0, 23.0, 34.0, 29.0, 39.0, 22.0, 41.0, 24.0, 37.0, 55.0, 40.0, 44.0, 42.0, 56.0, 49.0, 49.0, 37.0, 30.0, 26.0, 24.0, 27.0, 28.0, 15.0, 25.0, 17.0, 9.0, 8.0, 10.0, 7.0, 5.0, 9.0, 6.0, 5.0, 3.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.85546875, -2.770599365234375, -2.68572998046875, -2.600860595703125, -2.5159912109375, -2.431121826171875, -2.34625244140625, -2.261383056640625, -2.176513671875, -2.091644287109375, -2.00677490234375, -1.921905517578125, -1.8370361328125, -1.752166748046875, -1.66729736328125, -1.582427978515625, -1.49755859375, -1.412689208984375, -1.32781982421875, -1.242950439453125, -1.1580810546875, -1.073211669921875, -0.98834228515625, -0.903472900390625, -0.818603515625, -0.733734130859375, -0.64886474609375, -0.563995361328125, -0.4791259765625, -0.394256591796875, -0.30938720703125, -0.224517822265625, -0.1396484375, -0.054779052734375, 0.03009033203125, 0.114959716796875, 0.1998291015625, 0.284698486328125, 0.36956787109375, 0.454437255859375, 0.539306640625, 0.624176025390625, 0.70904541015625, 0.793914794921875, 0.8787841796875, 0.963653564453125, 1.04852294921875, 1.133392333984375, 1.21826171875, 1.303131103515625, 1.38800048828125, 1.472869873046875, 1.5577392578125, 1.642608642578125, 1.72747802734375, 1.812347412109375, 1.897216796875, 1.982086181640625, 2.06695556640625, 2.151824951171875, 2.2366943359375, 2.321563720703125, 2.40643310546875, 2.491302490234375, 2.576171875]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 5.0, 0.0, 3.0, 6.0, 10.0, 10.0, 14.0, 33.0, 35.0, 67.0, 113.0, 154.0, 435.0, 4304.0, 4186829.0, 1565.0, 309.0, 148.0, 87.0, 54.0, 33.0, 18.0, 22.0, 13.0, 11.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.8125, -37.34130859375, -35.8701171875, -34.39892578125, -32.927734375, -31.45654296875, -29.9853515625, -28.51416015625, -27.04296875, -25.57177734375, -24.1005859375, -22.62939453125, -21.158203125, -19.68701171875, -18.2158203125, -16.74462890625, -15.2734375, -13.80224609375, -12.3310546875, -10.85986328125, -9.388671875, -7.91748046875, -6.4462890625, -4.97509765625, -3.50390625, -2.03271484375, -0.5615234375, 0.90966796875, 2.380859375, 3.85205078125, 5.3232421875, 6.79443359375, 8.265625, 9.73681640625, 11.2080078125, 12.67919921875, 14.150390625, 15.62158203125, 17.0927734375, 18.56396484375, 20.03515625, 21.50634765625, 22.9775390625, 24.44873046875, 25.919921875, 27.39111328125, 28.8623046875, 30.33349609375, 31.8046875, 33.27587890625, 34.7470703125, 36.21826171875, 37.689453125, 39.16064453125, 40.6318359375, 42.10302734375, 43.57421875, 45.04541015625, 46.5166015625, 47.98779296875, 49.458984375, 50.93017578125, 52.4013671875, 53.87255859375, 55.34375]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 7.0, 5.0, 10.0, 6.0, 14.0, 22.0, 27.0, 28.0, 65.0, 77.0, 108.0, 197.0, 362.0, 811.0, 1131.0, 520.0, 215.0, 136.0, 102.0, 70.0, 49.0, 25.0, 17.0, 17.0, 20.0, 16.0, 3.0, 7.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0400390625, -0.9989013671875, -0.957763671875, -0.9166259765625, -0.87548828125, -0.8343505859375, -0.793212890625, -0.7520751953125, -0.7109375, -0.6697998046875, -0.628662109375, -0.5875244140625, -0.54638671875, -0.5052490234375, -0.464111328125, -0.4229736328125, -0.3818359375, -0.3406982421875, -0.299560546875, -0.2584228515625, -0.21728515625, -0.1761474609375, -0.135009765625, -0.0938720703125, -0.052734375, -0.0115966796875, 0.029541015625, 0.0706787109375, 0.11181640625, 0.1529541015625, 0.194091796875, 0.2352294921875, 0.2763671875, 0.3175048828125, 0.358642578125, 0.3997802734375, 0.44091796875, 0.4820556640625, 0.523193359375, 0.5643310546875, 0.60546875, 0.6466064453125, 0.687744140625, 0.7288818359375, 0.77001953125, 0.8111572265625, 0.852294921875, 0.8934326171875, 0.9345703125, 0.9757080078125, 1.016845703125, 1.0579833984375, 1.09912109375, 1.1402587890625, 1.181396484375, 1.2225341796875, 1.263671875, 1.3048095703125, 1.345947265625, 1.3870849609375, 1.42822265625, 1.4693603515625, 1.510498046875, 1.5516357421875, 1.5927734375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 8.0, 10.0, 14.0, 16.0, 20.0, 34.0, 34.0, 41.0, 52.0, 52.0, 69.0, 61.0, 59.0, 70.0, 68.0, 69.0, 62.0, 55.0, 42.0, 37.0, 30.0, 32.0, 16.0, 13.0, 11.0, 7.0, 8.0, 8.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.690121650695801, -4.5727458000183105, -4.45536994934082, -4.33799409866333, -4.22061824798584, -4.10324239730835, -3.9858665466308594, -3.868490695953369, -3.751114845275879, -3.6337389945983887, -3.5163631439208984, -3.398987293243408, -3.281611442565918, -3.1642355918884277, -3.0468597412109375, -2.9294838905334473, -2.812108039855957, -2.694732189178467, -2.5773563385009766, -2.4599804878234863, -2.342604637145996, -2.225228786468506, -2.1078529357910156, -1.9904770851135254, -1.873100996017456, -1.7557251453399658, -1.6383492946624756, -1.5209734439849854, -1.4035975933074951, -1.2862217426300049, -1.1688458919525146, -1.0514700412750244, -0.9340941905975342, -0.816718339920044, -0.6993424892425537, -0.5819666385650635, -0.46459075808525085, -0.34721487760543823, -0.229839026927948, -0.11246317625045776, 0.004912674427032471, 0.1222885325551033, 0.23966439068317413, 0.35704025626182556, 0.4744161069393158, 0.5917919874191284, 0.7091678380966187, 0.8265436887741089, 0.9439195394515991, 1.0612953901290894, 1.1786712408065796, 1.2960470914840698, 1.41342294216156, 1.5307989120483398, 1.64817476272583, 1.7655506134033203, 1.8829264640808105, 2.000302314758301, 2.117678165435791, 2.2350540161132812, 2.3524298667907715, 2.4698057174682617, 2.587181568145752, 2.704557418823242, 2.8219332695007324]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 10.0, 8.0, 8.0, 4.0, 8.0, 10.0, 9.0, 17.0, 18.0, 30.0, 19.0, 27.0, 28.0, 35.0, 35.0, 41.0, 52.0, 49.0, 43.0, 51.0, 37.0, 39.0, 43.0, 42.0, 32.0, 36.0, 20.0, 38.0, 29.0, 27.0, 26.0, 26.0, 25.0, 16.0, 16.0, 17.0, 15.0, 5.0, 4.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5703699588775635, -2.4822986125946045, -2.3942270278930664, -2.3061556816101074, -2.2180840969085693, -2.1300127506256104, -2.0419411659240723, -1.9538698196411133, -1.8657983541488647, -1.7777268886566162, -1.6896554231643677, -1.6015839576721191, -1.5135126113891602, -1.425441026687622, -1.337369680404663, -1.2492982149124146, -1.161226749420166, -1.0731552839279175, -0.985083818435669, -0.8970124125480652, -0.8089409470558167, -0.7208694815635681, -0.6327980756759644, -0.5447266101837158, -0.4566551446914673, -0.36858367919921875, -0.2805122435092926, -0.19244080781936646, -0.10436934232711792, -0.016297876834869385, 0.07177352905273438, 0.1598449945449829, 0.24791669845581055, 0.3359881639480591, 0.42405959963798523, 0.5121310353279114, 0.6002025008201599, 0.6882739663124084, 0.7763453722000122, 0.8644168376922607, 0.9524883031845093, 1.0405597686767578, 1.1286312341690063, 1.2167026996612549, 1.3047740459442139, 1.392845630645752, 1.480916976928711, 1.5689884424209595, 1.657059907913208, 1.7451313734054565, 1.833202838897705, 1.921274185180664, 2.009345769882202, 2.097417116165161, 2.185488700866699, 2.273560047149658, 2.361631393432617, 2.449702739715576, 2.5377743244171143, 2.6258456707000732, 2.7139172554016113, 2.8019886016845703, 2.8900599479675293, 2.9781315326690674, 3.0662031173706055]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 4.0, 8.0, 11.0, 15.0, 24.0, 50.0, 78.0, 122.0, 164.0, 293.0, 467.0, 726.0, 1254.0, 2063.0, 3390.0, 6025.0, 10959.0, 20958.0, 41669.0, 83854.0, 160516.0, 258093.0, 214746.0, 118542.0, 59995.0, 29880.0, 15111.0, 8232.0, 4582.0, 2647.0, 1541.0, 957.0, 607.0, 379.0, 220.0, 130.0, 89.0, 69.0, 28.0, 25.0, 11.0, 7.0, 7.0, 6.0, 5.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.86865234375, -0.8384475708007812, -0.8082427978515625, -0.7780380249023438, -0.747833251953125, -0.7176284790039062, -0.6874237060546875, -0.6572189331054688, -0.62701416015625, -0.5968093872070312, -0.5666046142578125, -0.5363998413085938, -0.506195068359375, -0.47599029541015625, -0.4457855224609375, -0.41558074951171875, -0.3853759765625, -0.35517120361328125, -0.3249664306640625, -0.29476165771484375, -0.264556884765625, -0.23435211181640625, -0.2041473388671875, -0.17394256591796875, -0.14373779296875, -0.11353302001953125, -0.0833282470703125, -0.05312347412109375, -0.022918701171875, 0.00728607177734375, 0.0374908447265625, 0.06769561767578125, 0.097900390625, 0.12810516357421875, 0.1583099365234375, 0.18851470947265625, 0.218719482421875, 0.24892425537109375, 0.2791290283203125, 0.30933380126953125, 0.33953857421875, 0.36974334716796875, 0.3999481201171875, 0.43015289306640625, 0.460357666015625, 0.49056243896484375, 0.5207672119140625, 0.5509719848632812, 0.5811767578125, 0.6113815307617188, 0.6415863037109375, 0.6717910766601562, 0.701995849609375, 0.7322006225585938, 0.7624053955078125, 0.7926101684570312, 0.82281494140625, 0.8530197143554688, 0.8832244873046875, 0.9134292602539062, 0.943634033203125, 0.9738388061523438, 1.0040435791015625, 1.0342483520507812, 1.064453125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 7.0, 4.0, 9.0, 7.0, 8.0, 7.0, 9.0, 8.0, 9.0, 15.0, 21.0, 23.0, 31.0, 36.0, 30.0, 40.0, 39.0, 54.0, 42.0, 40.0, 49.0, 44.0, 44.0, 37.0, 49.0, 29.0, 30.0, 36.0, 30.0, 30.0, 30.0, 22.0, 22.0, 17.0, 15.0, 20.0, 16.0, 10.0, 9.0, 7.0, 5.0, 6.0, 7.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9521484375, -1.8882904052734375, -1.824432373046875, -1.7605743408203125, -1.69671630859375, -1.6328582763671875, -1.569000244140625, -1.5051422119140625, -1.4412841796875, -1.3774261474609375, -1.313568115234375, -1.2497100830078125, -1.18585205078125, -1.1219940185546875, -1.058135986328125, -0.9942779541015625, -0.930419921875, -0.8665618896484375, -0.802703857421875, -0.7388458251953125, -0.67498779296875, -0.6111297607421875, -0.547271728515625, -0.4834136962890625, -0.4195556640625, -0.3556976318359375, -0.291839599609375, -0.2279815673828125, -0.16412353515625, -0.1002655029296875, -0.036407470703125, 0.0274505615234375, 0.09130859375, 0.1551666259765625, 0.219024658203125, 0.2828826904296875, 0.34674072265625, 0.4105987548828125, 0.474456787109375, 0.5383148193359375, 0.6021728515625, 0.6660308837890625, 0.729888916015625, 0.7937469482421875, 0.85760498046875, 0.9214630126953125, 0.985321044921875, 1.0491790771484375, 1.113037109375, 1.1768951416015625, 1.240753173828125, 1.3046112060546875, 1.36846923828125, 1.4323272705078125, 1.496185302734375, 1.5600433349609375, 1.6239013671875, 1.6877593994140625, 1.751617431640625, 1.8154754638671875, 1.87933349609375, 1.9431915283203125, 2.007049560546875, 2.0709075927734375, 2.134765625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 4.0, 8.0, 7.0, 17.0, 25.0, 31.0, 29.0, 69.0, 110.0, 194.0, 436.0, 1075.0, 3701.0, 18046.0, 163852.0, 725623.0, 116100.0, 14131.0, 3260.0, 964.0, 440.0, 189.0, 90.0, 51.0, 42.0, 24.0, 13.0, 8.0, 7.0, 3.0, 2.0, 5.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.96875, -2.889434814453125, -2.81011962890625, -2.730804443359375, -2.6514892578125, -2.572174072265625, -2.49285888671875, -2.413543701171875, -2.334228515625, -2.254913330078125, -2.17559814453125, -2.096282958984375, -2.0169677734375, -1.937652587890625, -1.85833740234375, -1.779022216796875, -1.69970703125, -1.620391845703125, -1.54107666015625, -1.461761474609375, -1.3824462890625, -1.303131103515625, -1.22381591796875, -1.144500732421875, -1.065185546875, -0.985870361328125, -0.90655517578125, -0.827239990234375, -0.7479248046875, -0.668609619140625, -0.58929443359375, -0.509979248046875, -0.4306640625, -0.351348876953125, -0.27203369140625, -0.192718505859375, -0.1134033203125, -0.034088134765625, 0.04522705078125, 0.124542236328125, 0.203857421875, 0.283172607421875, 0.36248779296875, 0.441802978515625, 0.5211181640625, 0.600433349609375, 0.67974853515625, 0.759063720703125, 0.83837890625, 0.917694091796875, 0.99700927734375, 1.076324462890625, 1.1556396484375, 1.234954833984375, 1.31427001953125, 1.393585205078125, 1.472900390625, 1.552215576171875, 1.63153076171875, 1.710845947265625, 1.7901611328125, 1.869476318359375, 1.94879150390625, 2.028106689453125, 2.107421875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 5.0, 3.0, 9.0, 11.0, 2.0, 5.0, 18.0, 16.0, 23.0, 15.0, 11.0, 26.0, 23.0, 21.0, 30.0, 39.0, 44.0, 34.0, 34.0, 36.0, 39.0, 33.0, 44.0, 36.0, 42.0, 42.0, 36.0, 27.0, 33.0, 33.0, 24.0, 33.0, 19.0, 30.0, 24.0, 11.0, 17.0, 15.0, 9.0, 13.0, 7.0, 7.0, 7.0, 6.0, 6.0, 0.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-3.931640625, -3.8089599609375, -3.686279296875, -3.5635986328125, -3.44091796875, -3.3182373046875, -3.195556640625, -3.0728759765625, -2.9501953125, -2.8275146484375, -2.704833984375, -2.5821533203125, -2.45947265625, -2.3367919921875, -2.214111328125, -2.0914306640625, -1.96875, -1.8460693359375, -1.723388671875, -1.6007080078125, -1.47802734375, -1.3553466796875, -1.232666015625, -1.1099853515625, -0.9873046875, -0.8646240234375, -0.741943359375, -0.6192626953125, -0.49658203125, -0.3739013671875, -0.251220703125, -0.1285400390625, -0.005859375, 0.1168212890625, 0.239501953125, 0.3621826171875, 0.48486328125, 0.6075439453125, 0.730224609375, 0.8529052734375, 0.9755859375, 1.0982666015625, 1.220947265625, 1.3436279296875, 1.46630859375, 1.5889892578125, 1.711669921875, 1.8343505859375, 1.95703125, 2.0797119140625, 2.202392578125, 2.3250732421875, 2.44775390625, 2.5704345703125, 2.693115234375, 2.8157958984375, 2.9384765625, 3.0611572265625, 3.183837890625, 3.3065185546875, 3.42919921875, 3.5518798828125, 3.674560546875, 3.7972412109375, 3.919921875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 2.0, 5.0, 6.0, 8.0, 10.0, 22.0, 28.0, 30.0, 49.0, 70.0, 92.0, 158.0, 240.0, 386.0, 582.0, 1039.0, 1852.0, 3764.0, 8673.0, 24318.0, 101768.0, 566776.0, 264254.0, 48006.0, 14312.0, 5739.0, 2726.0, 1414.0, 812.0, 509.0, 329.0, 171.0, 131.0, 68.0, 54.0, 51.0, 35.0, 20.0, 14.0, 11.0, 4.0, 3.0, 3.0, 4.0, 2.0, 7.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.8603515625, -0.835601806640625, -0.81085205078125, -0.786102294921875, -0.7613525390625, -0.736602783203125, -0.71185302734375, -0.687103271484375, -0.662353515625, -0.637603759765625, -0.61285400390625, -0.588104248046875, -0.5633544921875, -0.538604736328125, -0.51385498046875, -0.489105224609375, -0.46435546875, -0.439605712890625, -0.41485595703125, -0.390106201171875, -0.3653564453125, -0.340606689453125, -0.31585693359375, -0.291107177734375, -0.266357421875, -0.241607666015625, -0.21685791015625, -0.192108154296875, -0.1673583984375, -0.142608642578125, -0.11785888671875, -0.093109130859375, -0.068359375, -0.043609619140625, -0.01885986328125, 0.005889892578125, 0.0306396484375, 0.055389404296875, 0.08013916015625, 0.104888916015625, 0.129638671875, 0.154388427734375, 0.17913818359375, 0.203887939453125, 0.2286376953125, 0.253387451171875, 0.27813720703125, 0.302886962890625, 0.32763671875, 0.352386474609375, 0.37713623046875, 0.401885986328125, 0.4266357421875, 0.451385498046875, 0.47613525390625, 0.500885009765625, 0.525634765625, 0.550384521484375, 0.57513427734375, 0.599884033203125, 0.6246337890625, 0.649383544921875, 0.67413330078125, 0.698883056640625, 0.7236328125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 6.0, 5.0, 7.0, 6.0, 12.0, 18.0, 42.0, 74.0, 151.0, 265.0, 186.0, 109.0, 51.0, 27.0, 16.0, 18.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0010919570922851562, -0.0010637789964675903, -0.0010356009006500244, -0.0010074228048324585, -0.0009792447090148926, -0.0009510666131973267, -0.0009228885173797607, -0.0008947104215621948, -0.0008665323257446289, -0.000838354229927063, -0.0008101761341094971, -0.0007819980382919312, -0.0007538199424743652, -0.0007256418466567993, -0.0006974637508392334, -0.0006692856550216675, -0.0006411075592041016, -0.0006129294633865356, -0.0005847513675689697, -0.0005565732717514038, -0.0005283951759338379, -0.000500217080116272, -0.00047203898429870605, -0.00044386088848114014, -0.0004156827926635742, -0.0003875046968460083, -0.0003593266010284424, -0.00033114850521087646, -0.00030297040939331055, -0.00027479231357574463, -0.0002466142177581787, -0.0002184361219406128, -0.00019025802612304688, -0.00016207993030548096, -0.00013390183448791504, -0.00010572373867034912, -7.75456428527832e-05, -4.9367547035217285e-05, -2.1189451217651367e-05, 6.988644599914551e-06, 3.516674041748047e-05, 6.334483623504639e-05, 9.15229320526123e-05, 0.00011970102787017822, 0.00014787912368774414, 0.00017605721950531006, 0.00020423531532287598, 0.0002324134111404419, 0.0002605915069580078, 0.00028876960277557373, 0.00031694769859313965, 0.00034512579441070557, 0.0003733038902282715, 0.0004014819860458374, 0.0004296600818634033, 0.00045783817768096924, 0.00048601627349853516, 0.0005141943693161011, 0.000542372465133667, 0.0005705505609512329, 0.0005987286567687988, 0.0006269067525863647, 0.0006550848484039307, 0.0006832629442214966, 0.0007114410400390625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 3.0, 6.0, 9.0, 12.0, 17.0, 21.0, 20.0, 25.0, 68.0, 119.0, 326.0, 1170.0, 6216.0, 101671.0, 888566.0, 44876.0, 4057.0, 813.0, 252.0, 100.0, 59.0, 32.0, 24.0, 18.0, 9.0, 12.0, 10.0, 10.0, 10.0, 6.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9833984375, -1.9135284423828125, -1.843658447265625, -1.7737884521484375, -1.70391845703125, -1.6340484619140625, -1.564178466796875, -1.4943084716796875, -1.4244384765625, -1.3545684814453125, -1.284698486328125, -1.2148284912109375, -1.14495849609375, -1.0750885009765625, -1.005218505859375, -0.9353485107421875, -0.865478515625, -0.7956085205078125, -0.725738525390625, -0.6558685302734375, -0.58599853515625, -0.5161285400390625, -0.446258544921875, -0.3763885498046875, -0.3065185546875, -0.2366485595703125, -0.166778564453125, -0.0969085693359375, -0.02703857421875, 0.0428314208984375, 0.112701416015625, 0.1825714111328125, 0.25244140625, 0.3223114013671875, 0.392181396484375, 0.4620513916015625, 0.53192138671875, 0.6017913818359375, 0.671661376953125, 0.7415313720703125, 0.8114013671875, 0.8812713623046875, 0.951141357421875, 1.0210113525390625, 1.09088134765625, 1.1607513427734375, 1.230621337890625, 1.3004913330078125, 1.370361328125, 1.4402313232421875, 1.510101318359375, 1.5799713134765625, 1.64984130859375, 1.7197113037109375, 1.789581298828125, 1.8594512939453125, 1.9293212890625, 1.9991912841796875, 2.069061279296875, 2.1389312744140625, 2.20880126953125, 2.2786712646484375, 2.348541259765625, 2.4184112548828125, 2.48828125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 6.0, 5.0, 10.0, 10.0, 20.0, 15.0, 25.0, 33.0, 38.0, 53.0, 75.0, 80.0, 105.0, 117.0, 89.0, 64.0, 42.0, 40.0, 31.0, 25.0, 24.0, 14.0, 7.0, 13.0, 6.0, 9.0, 5.0, 6.0, 7.0, 6.0, 4.0, 3.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.212890625, -0.20503997802734375, -0.1971893310546875, -0.18933868408203125, -0.181488037109375, -0.17363739013671875, -0.1657867431640625, -0.15793609619140625, -0.15008544921875, -0.14223480224609375, -0.1343841552734375, -0.12653350830078125, -0.118682861328125, -0.11083221435546875, -0.1029815673828125, -0.09513092041015625, -0.0872802734375, -0.07942962646484375, -0.0715789794921875, -0.06372833251953125, -0.055877685546875, -0.04802703857421875, -0.0401763916015625, -0.03232574462890625, -0.02447509765625, -0.01662445068359375, -0.0087738037109375, -0.00092315673828125, 0.006927490234375, 0.01477813720703125, 0.0226287841796875, 0.03047943115234375, 0.038330078125, 0.04618072509765625, 0.0540313720703125, 0.06188201904296875, 0.069732666015625, 0.07758331298828125, 0.0854339599609375, 0.09328460693359375, 0.10113525390625, 0.10898590087890625, 0.1168365478515625, 0.12468719482421875, 0.132537841796875, 0.14038848876953125, 0.1482391357421875, 0.15608978271484375, 0.1639404296875, 0.17179107666015625, 0.1796417236328125, 0.18749237060546875, 0.195343017578125, 0.20319366455078125, 0.2110443115234375, 0.21889495849609375, 0.22674560546875, 0.23459625244140625, 0.2424468994140625, 0.25029754638671875, 0.258148193359375, 0.26599884033203125, 0.2738494873046875, 0.28170013427734375, 0.28955078125]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 8.0, 12.0, 27.0, 82.0, 179.0, 241.0, 237.0, 130.0, 54.0, 23.0, 12.0, 7.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.870283126831055, -13.573585510253906, -13.276887893676758, -12.980191230773926, -12.683493614196777, -12.386795997619629, -12.090099334716797, -11.793401718139648, -11.4967041015625, -11.200006484985352, -10.903308868408203, -10.606612205505371, -10.309914588928223, -10.013216972351074, -9.716520309448242, -9.419822692871094, -9.123125076293945, -8.826427459716797, -8.529729843139648, -8.233033180236816, -7.936335563659668, -7.6396379470825195, -7.342940807342529, -7.046243667602539, -6.749546051025391, -6.452848434448242, -6.156151294708252, -5.859454154968262, -5.562756538391113, -5.266058921813965, -4.969361782073975, -4.672664642333984, -4.375966548919678, -4.0792694091796875, -3.782571792602539, -3.4858744144439697, -3.1891770362854004, -2.892479658126831, -2.5957822799682617, -2.2990849018096924, -2.002387523651123, -1.7056901454925537, -1.4089927673339844, -1.112295389175415, -0.8155980110168457, -0.5189006328582764, -0.22220325469970703, 0.0744941234588623, 0.37119150161743164, 0.667888879776001, 0.9645862579345703, 1.2612836360931396, 1.557981014251709, 1.8546783924102783, 2.1513757705688477, 2.448073148727417, 2.7447705268859863, 3.0414679050445557, 3.338165283203125, 3.6348626613616943, 3.9315600395202637, 4.228257179260254, 4.524954795837402, 4.821652412414551, 5.118349552154541]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 4.0, 3.0, 7.0, 9.0, 16.0, 15.0, 18.0, 20.0, 16.0, 27.0, 28.0, 43.0, 36.0, 41.0, 32.0, 37.0, 45.0, 53.0, 58.0, 61.0, 42.0, 37.0, 37.0, 45.0, 43.0, 44.0, 29.0, 26.0, 25.0, 22.0, 18.0, 15.0, 9.0, 11.0, 10.0, 7.0, 2.0, 6.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.871025562286377, -1.798896312713623, -1.7267670631408691, -1.6546378135681152, -1.5825085639953613, -1.5103793144226074, -1.438250184059143, -1.3661209344863892, -1.2939916849136353, -1.2218624353408813, -1.1497331857681274, -1.0776039361953735, -1.0054748058319092, -0.9333454966545105, -0.8612163066864014, -0.7890870571136475, -0.7169578075408936, -0.6448285579681396, -0.5726993083953857, -0.5005701184272766, -0.4284408688545227, -0.3563116192817688, -0.2841823995113373, -0.21205317974090576, -0.13992393016815186, -0.06779469549655914, 0.004334539175033569, 0.07646377384662628, 0.148593008518219, 0.2207222580909729, 0.2928514778614044, 0.36498069763183594, 0.43711018562316895, 0.5092394351959229, 0.5813686847686768, 0.6534978747367859, 0.7256271243095398, 0.7977563738822937, 0.8698855638504028, 0.9420148134231567, 1.0141440629959106, 1.0862733125686646, 1.1584025621414185, 1.2305318117141724, 1.3026609420776367, 1.3747901916503906, 1.4469194412231445, 1.5190486907958984, 1.5911779403686523, 1.6633071899414062, 1.7354364395141602, 1.807565689086914, 1.879694938659668, 1.9518241882324219, 2.023953437805176, 2.0960826873779297, 2.1682119369506836, 2.2403411865234375, 2.3124704360961914, 2.3845996856689453, 2.456728935241699, 2.528858184814453, 2.600987434387207, 2.673116683959961, 2.7452456951141357]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 6.0, 8.0, 15.0, 13.0, 15.0, 23.0, 30.0, 33.0, 60.0, 90.0, 141.0, 203.0, 270.0, 400.0, 589.0, 943.0, 1375.0, 2447.0, 4285.0, 8690.0, 20454.0, 50774.0, 131401.0, 271245.0, 294601.0, 153426.0, 60700.0, 24169.0, 10195.0, 4880.0, 2556.0, 1506.0, 966.0, 690.0, 411.0, 271.0, 208.0, 142.0, 88.0, 90.0, 47.0, 31.0, 16.0, 18.0, 9.0, 11.0, 4.0, 8.0, 2.0, 0.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1474609375, -1.1093292236328125, -1.071197509765625, -1.0330657958984375, -0.99493408203125, -0.9568023681640625, -0.918670654296875, -0.8805389404296875, -0.8424072265625, -0.8042755126953125, -0.766143798828125, -0.7280120849609375, -0.68988037109375, -0.6517486572265625, -0.613616943359375, -0.5754852294921875, -0.537353515625, -0.4992218017578125, -0.461090087890625, -0.4229583740234375, -0.38482666015625, -0.3466949462890625, -0.308563232421875, -0.2704315185546875, -0.2322998046875, -0.1941680908203125, -0.156036376953125, -0.1179046630859375, -0.07977294921875, -0.0416412353515625, -0.003509521484375, 0.0346221923828125, 0.07275390625, 0.1108856201171875, 0.149017333984375, 0.1871490478515625, 0.22528076171875, 0.2634124755859375, 0.301544189453125, 0.3396759033203125, 0.3778076171875, 0.4159393310546875, 0.454071044921875, 0.4922027587890625, 0.53033447265625, 0.5684661865234375, 0.606597900390625, 0.6447296142578125, 0.682861328125, 0.7209930419921875, 0.759124755859375, 0.7972564697265625, 0.83538818359375, 0.8735198974609375, 0.911651611328125, 0.9497833251953125, 0.9879150390625, 1.0260467529296875, 1.064178466796875, 1.1023101806640625, 1.14044189453125, 1.1785736083984375, 1.216705322265625, 1.2548370361328125, 1.29296875]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 11.0, 10.0, 10.0, 10.0, 28.0, 17.0, 24.0, 25.0, 30.0, 41.0, 36.0, 41.0, 40.0, 42.0, 55.0, 63.0, 52.0, 48.0, 42.0, 42.0, 42.0, 44.0, 31.0, 32.0, 39.0, 34.0, 21.0, 14.0, 14.0, 17.0, 10.0, 6.0, 8.0, 9.0, 2.0, 6.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.578125, -11.2093505859375, -10.840576171875, -10.4718017578125, -10.10302734375, -9.7342529296875, -9.365478515625, -8.9967041015625, -8.6279296875, -8.2591552734375, -7.890380859375, -7.5216064453125, -7.15283203125, -6.7840576171875, -6.415283203125, -6.0465087890625, -5.677734375, -5.3089599609375, -4.940185546875, -4.5714111328125, -4.20263671875, -3.8338623046875, -3.465087890625, -3.0963134765625, -2.7275390625, -2.3587646484375, -1.989990234375, -1.6212158203125, -1.25244140625, -0.8836669921875, -0.514892578125, -0.1461181640625, 0.22265625, 0.5914306640625, 0.960205078125, 1.3289794921875, 1.69775390625, 2.0665283203125, 2.435302734375, 2.8040771484375, 3.1728515625, 3.5416259765625, 3.910400390625, 4.2791748046875, 4.64794921875, 5.0167236328125, 5.385498046875, 5.7542724609375, 6.123046875, 6.4918212890625, 6.860595703125, 7.2293701171875, 7.59814453125, 7.9669189453125, 8.335693359375, 8.7044677734375, 9.0732421875, 9.4420166015625, 9.810791015625, 10.1795654296875, 10.54833984375, 10.9171142578125, 11.285888671875, 11.6546630859375, 12.0234375]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 6.0, 2.0, 4.0, 4.0, 5.0, 3.0, 11.0, 5.0, 9.0, 17.0, 19.0, 25.0, 31.0, 40.0, 52.0, 68.0, 97.0, 148.0, 225.0, 306.0, 597.0, 2537.0, 64918.0, 949342.0, 26930.0, 1654.0, 562.0, 269.0, 193.0, 131.0, 83.0, 63.0, 42.0, 43.0, 32.0, 23.0, 13.0, 13.0, 10.0, 11.0, 7.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-5.95703125, -5.7611083984375, -5.565185546875, -5.3692626953125, -5.17333984375, -4.9774169921875, -4.781494140625, -4.5855712890625, -4.3896484375, -4.1937255859375, -3.997802734375, -3.8018798828125, -3.60595703125, -3.4100341796875, -3.214111328125, -3.0181884765625, -2.822265625, -2.6263427734375, -2.430419921875, -2.2344970703125, -2.03857421875, -1.8426513671875, -1.646728515625, -1.4508056640625, -1.2548828125, -1.0589599609375, -0.863037109375, -0.6671142578125, -0.47119140625, -0.2752685546875, -0.079345703125, 0.1165771484375, 0.3125, 0.5084228515625, 0.704345703125, 0.9002685546875, 1.09619140625, 1.2921142578125, 1.488037109375, 1.6839599609375, 1.8798828125, 2.0758056640625, 2.271728515625, 2.4676513671875, 2.66357421875, 2.8594970703125, 3.055419921875, 3.2513427734375, 3.447265625, 3.6431884765625, 3.839111328125, 4.0350341796875, 4.23095703125, 4.4268798828125, 4.622802734375, 4.8187255859375, 5.0146484375, 5.2105712890625, 5.406494140625, 5.6024169921875, 5.79833984375, 5.9942626953125, 6.190185546875, 6.3861083984375, 6.58203125]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 4.0, 2.0, 5.0, 5.0, 11.0, 6.0, 15.0, 13.0, 23.0, 30.0, 35.0, 34.0, 46.0, 52.0, 60.0, 57.0, 56.0, 46.0, 67.0, 60.0, 58.0, 47.0, 44.0, 38.0, 41.0, 27.0, 34.0, 20.0, 11.0, 11.0, 15.0, 11.0, 10.0, 6.0, 5.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.28125, -11.8748779296875, -11.468505859375, -11.0621337890625, -10.65576171875, -10.2493896484375, -9.843017578125, -9.4366455078125, -9.0302734375, -8.6239013671875, -8.217529296875, -7.8111572265625, -7.40478515625, -6.9984130859375, -6.592041015625, -6.1856689453125, -5.779296875, -5.3729248046875, -4.966552734375, -4.5601806640625, -4.15380859375, -3.7474365234375, -3.341064453125, -2.9346923828125, -2.5283203125, -2.1219482421875, -1.715576171875, -1.3092041015625, -0.90283203125, -0.4964599609375, -0.090087890625, 0.3162841796875, 0.72265625, 1.1290283203125, 1.535400390625, 1.9417724609375, 2.34814453125, 2.7545166015625, 3.160888671875, 3.5672607421875, 3.9736328125, 4.3800048828125, 4.786376953125, 5.1927490234375, 5.59912109375, 6.0054931640625, 6.411865234375, 6.8182373046875, 7.224609375, 7.6309814453125, 8.037353515625, 8.4437255859375, 8.85009765625, 9.2564697265625, 9.662841796875, 10.0692138671875, 10.4755859375, 10.8819580078125, 11.288330078125, 11.6947021484375, 12.10107421875, 12.5074462890625, 12.913818359375, 13.3201904296875, 13.7265625]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 7.0, 9.0, 7.0, 12.0, 22.0, 42.0, 49.0, 56.0, 110.0, 206.0, 481.0, 1382.0, 4653.0, 25017.0, 766287.0, 229479.0, 15436.0, 3422.0, 1050.0, 379.0, 173.0, 111.0, 58.0, 35.0, 23.0, 10.0, 10.0, 10.0, 7.0, 3.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.572265625, -0.5524444580078125, -0.532623291015625, -0.5128021240234375, -0.49298095703125, -0.4731597900390625, -0.453338623046875, -0.4335174560546875, -0.4136962890625, -0.3938751220703125, -0.374053955078125, -0.3542327880859375, -0.33441162109375, -0.3145904541015625, -0.294769287109375, -0.2749481201171875, -0.255126953125, -0.2353057861328125, -0.215484619140625, -0.1956634521484375, -0.17584228515625, -0.1560211181640625, -0.136199951171875, -0.1163787841796875, -0.0965576171875, -0.0767364501953125, -0.056915283203125, -0.0370941162109375, -0.01727294921875, 0.0025482177734375, 0.022369384765625, 0.0421905517578125, 0.06201171875, 0.0818328857421875, 0.101654052734375, 0.1214752197265625, 0.14129638671875, 0.1611175537109375, 0.180938720703125, 0.2007598876953125, 0.2205810546875, 0.2404022216796875, 0.260223388671875, 0.2800445556640625, 0.29986572265625, 0.3196868896484375, 0.339508056640625, 0.3593292236328125, 0.379150390625, 0.3989715576171875, 0.418792724609375, 0.4386138916015625, 0.45843505859375, 0.4782562255859375, 0.498077392578125, 0.5178985595703125, 0.5377197265625, 0.5575408935546875, 0.577362060546875, 0.5971832275390625, 0.61700439453125, 0.6368255615234375, 0.656646728515625, 0.6764678955078125, 0.6962890625]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 6.0, 7.0, 13.0, 28.0, 39.0, 84.0, 177.0, 284.0, 185.0, 90.0, 47.0, 20.0, 14.0, 6.0, 7.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00018215179443359375, -0.00017787236720323563, -0.0001735929399728775, -0.00016931351274251938, -0.00016503408551216125, -0.00016075465828180313, -0.000156475231051445, -0.00015219580382108688, -0.00014791637659072876, -0.00014363694936037064, -0.0001393575221300125, -0.0001350780948996544, -0.00013079866766929626, -0.00012651924043893814, -0.00012223981320858002, -0.0001179603859782219, -0.00011368095874786377, -0.00010940153151750565, -0.00010512210428714752, -0.0001008426770567894, -9.656324982643127e-05, -9.228382259607315e-05, -8.800439536571503e-05, -8.37249681353569e-05, -7.944554090499878e-05, -7.516611367464066e-05, -7.088668644428253e-05, -6.660725921392441e-05, -6.232783198356628e-05, -5.804840475320816e-05, -5.376897752285004e-05, -4.948955029249191e-05, -4.521012306213379e-05, -4.0930695831775665e-05, -3.665126860141754e-05, -3.237184137105942e-05, -2.8092414140701294e-05, -2.381298691034317e-05, -1.9533559679985046e-05, -1.5254132449626923e-05, -1.0974705219268799e-05, -6.695277988910675e-06, -2.4158507585525513e-06, 1.8635764718055725e-06, 6.143003702163696e-06, 1.042243093252182e-05, 1.4701858162879944e-05, 1.8981285393238068e-05, 2.326071262359619e-05, 2.7540139853954315e-05, 3.181956708431244e-05, 3.609899431467056e-05, 4.0378421545028687e-05, 4.465784877538681e-05, 4.8937276005744934e-05, 5.321670323610306e-05, 5.749613046646118e-05, 6.17755576968193e-05, 6.605498492717743e-05, 7.033441215753555e-05, 7.461383938789368e-05, 7.88932666182518e-05, 8.317269384860992e-05, 8.745212107896805e-05, 9.173154830932617e-05]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 3.0, 7.0, 6.0, 16.0, 25.0, 23.0, 62.0, 113.0, 226.0, 544.0, 1425.0, 4788.0, 21875.0, 562636.0, 429006.0, 20831.0, 4623.0, 1376.0, 491.0, 240.0, 88.0, 52.0, 38.0, 21.0, 4.0, 11.0, 8.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.6376953125, -0.6183624267578125, -0.599029541015625, -0.5796966552734375, -0.56036376953125, -0.5410308837890625, -0.521697998046875, -0.5023651123046875, -0.4830322265625, -0.4636993408203125, -0.444366455078125, -0.4250335693359375, -0.40570068359375, -0.3863677978515625, -0.367034912109375, -0.3477020263671875, -0.328369140625, -0.3090362548828125, -0.289703369140625, -0.2703704833984375, -0.25103759765625, -0.2317047119140625, -0.212371826171875, -0.1930389404296875, -0.1737060546875, -0.1543731689453125, -0.135040283203125, -0.1157073974609375, -0.09637451171875, -0.0770416259765625, -0.057708740234375, -0.0383758544921875, -0.01904296875, 0.0002899169921875, 0.019622802734375, 0.0389556884765625, 0.05828857421875, 0.0776214599609375, 0.096954345703125, 0.1162872314453125, 0.1356201171875, 0.1549530029296875, 0.174285888671875, 0.1936187744140625, 0.21295166015625, 0.2322845458984375, 0.251617431640625, 0.2709503173828125, 0.290283203125, 0.3096160888671875, 0.328948974609375, 0.3482818603515625, 0.36761474609375, 0.3869476318359375, 0.406280517578125, 0.4256134033203125, 0.4449462890625, 0.4642791748046875, 0.483612060546875, 0.5029449462890625, 0.52227783203125, 0.5416107177734375, 0.560943603515625, 0.5802764892578125, 0.599609375]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 6.0, 1.0, 1.0, 4.0, 5.0, 8.0, 4.0, 10.0, 7.0, 21.0, 16.0, 29.0, 34.0, 58.0, 87.0, 131.0, 195.0, 131.0, 88.0, 46.0, 29.0, 29.0, 12.0, 15.0, 15.0, 4.0, 6.0, 2.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1639404296875, -0.15889549255371094, -0.15385055541992188, -0.1488056182861328, -0.14376068115234375, -0.1387157440185547, -0.13367080688476562, -0.12862586975097656, -0.1235809326171875, -0.11853599548339844, -0.11349105834960938, -0.10844612121582031, -0.10340118408203125, -0.09835624694824219, -0.09331130981445312, -0.08826637268066406, -0.083221435546875, -0.07817649841308594, -0.07313156127929688, -0.06808662414550781, -0.06304168701171875, -0.05799674987792969, -0.052951812744140625, -0.04790687561035156, -0.0428619384765625, -0.03781700134277344, -0.032772064208984375, -0.027727127075195312, -0.02268218994140625, -0.017637252807617188, -0.012592315673828125, -0.0075473785400390625, -0.00250244140625, 0.0025424957275390625, 0.007587432861328125, 0.012632369995117188, 0.01767730712890625, 0.022722244262695312, 0.027767181396484375, 0.03281211853027344, 0.0378570556640625, 0.04290199279785156, 0.047946929931640625, 0.05299186706542969, 0.05803680419921875, 0.06308174133300781, 0.06812667846679688, 0.07317161560058594, 0.078216552734375, 0.08326148986816406, 0.08830642700195312, 0.09335136413574219, 0.09839630126953125, 0.10344123840332031, 0.10848617553710938, 0.11353111267089844, 0.1185760498046875, 0.12362098693847656, 0.12866592407226562, 0.1337108612060547, 0.13875579833984375, 0.1438007354736328, 0.14884567260742188, 0.15389060974121094, 0.158935546875]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 19.0, 835.0, 168.0], "bins": [-163.92906188964844, -161.3145751953125, -158.70008850097656, -156.08560180664062, -153.4711151123047, -150.8566436767578, -148.24215698242188, -145.62767028808594, -143.01318359375, -140.39869689941406, -137.78421020507812, -135.1697235107422, -132.55523681640625, -129.94076538085938, -127.3262710571289, -124.7117919921875, -122.09730529785156, -119.48281860351562, -116.86833190917969, -114.25385284423828, -111.63936614990234, -109.0248794555664, -106.41039276123047, -103.79591369628906, -101.1814193725586, -98.56693267822266, -95.95244598388672, -93.33796691894531, -90.72348022460938, -88.10899353027344, -85.4945068359375, -82.88002014160156, -80.26554870605469, -77.65106201171875, -75.03657531738281, -72.4220962524414, -69.80760955810547, -67.19312286376953, -64.5786361694336, -61.96415328979492, -59.349666595458984, -56.73517990112305, -54.120697021484375, -51.50621032714844, -48.891727447509766, -46.27724075317383, -43.662757873535156, -41.04827117919922, -38.43378448486328, -35.819297790527344, -33.20481491088867, -30.590328216552734, -27.975845336914062, -25.361358642578125, -22.74687385559082, -20.132389068603516, -17.517906188964844, -14.903421401977539, -12.288936614990234, -9.674450874328613, -7.059966087341309, -4.445481300354004, -1.8309955596923828, 0.7834892272949219, 3.3979740142822266]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 5.0, 1.0, 3.0, 5.0, 5.0, 6.0, 5.0, 12.0, 12.0, 17.0, 27.0, 26.0, 32.0, 25.0, 18.0, 33.0, 38.0, 31.0, 38.0, 46.0, 51.0, 36.0, 50.0, 41.0, 32.0, 39.0, 35.0, 32.0, 34.0, 29.0, 37.0, 24.0, 30.0, 16.0, 30.0, 20.0, 8.0, 14.0, 12.0, 12.0, 10.0, 9.0, 4.0, 11.0, 4.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.770748138427734, -12.32409381866455, -11.877439498901367, -11.430785179138184, -10.984130859375, -10.537476539611816, -10.090822219848633, -9.64416790008545, -9.197513580322266, -8.750859260559082, -8.304204940795898, -7.857550621032715, -7.410896301269531, -6.964241981506348, -6.517587661743164, -6.0709333419799805, -5.624278545379639, -5.177624225616455, -4.7309699058532715, -4.284315586090088, -3.8376612663269043, -3.3910067081451416, -2.944352388381958, -2.4976980686187744, -2.051043748855591, -1.6043894290924072, -1.1577351093292236, -0.7110806703567505, -0.2644263505935669, 0.18222808837890625, 0.6288824081420898, 1.0755367279052734, 1.522191047668457, 1.9688453674316406, 2.415499687194824, 2.862154006958008, 3.3088083267211914, 3.755462884902954, 4.202116966247559, 4.648771286010742, 5.095425605773926, 5.542079925537109, 5.988734245300293, 6.435388565063477, 6.88204288482666, 7.328697204589844, 7.775351524353027, 8.222005844116211, 8.668661117553711, 9.115315437316895, 9.561969757080078, 10.008624076843262, 10.455278396606445, 10.901932716369629, 11.348587036132812, 11.795241355895996, 12.24189567565918, 12.688549995422363, 13.135204315185547, 13.58185863494873, 14.028512954711914, 14.475167274475098, 14.921821594238281, 15.368475914001465, 15.815130233764648]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 6.0, 6.0, 7.0, 6.0, 18.0, 25.0, 30.0, 39.0, 76.0, 128.0, 214.0, 529.0, 1366.0, 5521.0, 36752.0, 957872.0, 3074641.0, 102383.0, 10777.0, 2500.0, 743.0, 302.0, 135.0, 71.0, 53.0, 27.0, 18.0, 14.0, 10.0, 13.0, 7.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.796875, -6.6141357421875, -6.431396484375, -6.2486572265625, -6.06591796875, -5.8831787109375, -5.700439453125, -5.5177001953125, -5.3349609375, -5.1522216796875, -4.969482421875, -4.7867431640625, -4.60400390625, -4.4212646484375, -4.238525390625, -4.0557861328125, -3.873046875, -3.6903076171875, -3.507568359375, -3.3248291015625, -3.14208984375, -2.9593505859375, -2.776611328125, -2.5938720703125, -2.4111328125, -2.2283935546875, -2.045654296875, -1.8629150390625, -1.68017578125, -1.4974365234375, -1.314697265625, -1.1319580078125, -0.94921875, -0.7664794921875, -0.583740234375, -0.4010009765625, -0.21826171875, -0.0355224609375, 0.147216796875, 0.3299560546875, 0.5126953125, 0.6954345703125, 0.878173828125, 1.0609130859375, 1.24365234375, 1.4263916015625, 1.609130859375, 1.7918701171875, 1.974609375, 2.1573486328125, 2.340087890625, 2.5228271484375, 2.70556640625, 2.8883056640625, 3.071044921875, 3.2537841796875, 3.4365234375, 3.6192626953125, 3.802001953125, 3.9847412109375, 4.16748046875, 4.3502197265625, 4.532958984375, 4.7156982421875, 4.8984375]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 8.0, 13.0, 8.0, 11.0, 18.0, 19.0, 40.0, 43.0, 53.0, 59.0, 44.0, 54.0, 72.0, 64.0, 83.0, 85.0, 55.0, 50.0, 42.0, 43.0, 42.0, 22.0, 20.0, 29.0, 8.0, 13.0, 8.0, 3.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.677734375, -3.56591796875, -3.4541015625, -3.34228515625, -3.23046875, -3.11865234375, -3.0068359375, -2.89501953125, -2.783203125, -2.67138671875, -2.5595703125, -2.44775390625, -2.3359375, -2.22412109375, -2.1123046875, -2.00048828125, -1.888671875, -1.77685546875, -1.6650390625, -1.55322265625, -1.44140625, -1.32958984375, -1.2177734375, -1.10595703125, -0.994140625, -0.88232421875, -0.7705078125, -0.65869140625, -0.546875, -0.43505859375, -0.3232421875, -0.21142578125, -0.099609375, 0.01220703125, 0.1240234375, 0.23583984375, 0.34765625, 0.45947265625, 0.5712890625, 0.68310546875, 0.794921875, 0.90673828125, 1.0185546875, 1.13037109375, 1.2421875, 1.35400390625, 1.4658203125, 1.57763671875, 1.689453125, 1.80126953125, 1.9130859375, 2.02490234375, 2.13671875, 2.24853515625, 2.3603515625, 2.47216796875, 2.583984375, 2.69580078125, 2.8076171875, 2.91943359375, 3.03125, 3.14306640625, 3.2548828125, 3.36669921875, 3.478515625]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 5.0, 4.0, 3.0, 14.0, 23.0, 63.0, 180.0, 879.0, 4191183.0, 1571.0, 209.0, 61.0, 33.0, 12.0, 8.0, 9.0, 3.0, 5.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.90625, -35.462890625, -34.01953125, -32.576171875, -31.1328125, -29.689453125, -28.24609375, -26.802734375, -25.359375, -23.916015625, -22.47265625, -21.029296875, -19.5859375, -18.142578125, -16.69921875, -15.255859375, -13.8125, -12.369140625, -10.92578125, -9.482421875, -8.0390625, -6.595703125, -5.15234375, -3.708984375, -2.265625, -0.822265625, 0.62109375, 2.064453125, 3.5078125, 4.951171875, 6.39453125, 7.837890625, 9.28125, 10.724609375, 12.16796875, 13.611328125, 15.0546875, 16.498046875, 17.94140625, 19.384765625, 20.828125, 22.271484375, 23.71484375, 25.158203125, 26.6015625, 28.044921875, 29.48828125, 30.931640625, 32.375, 33.818359375, 35.26171875, 36.705078125, 38.1484375, 39.591796875, 41.03515625, 42.478515625, 43.921875, 45.365234375, 46.80859375, 48.251953125, 49.6953125, 51.138671875, 52.58203125, 54.025390625, 55.46875]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 6.0, 1.0, 6.0, 10.0, 12.0, 37.0, 28.0, 62.0, 84.0, 171.0, 265.0, 514.0, 988.0, 779.0, 460.0, 236.0, 155.0, 94.0, 60.0, 38.0, 24.0, 19.0, 8.0, 9.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.083984375, -1.04644775390625, -1.0089111328125, -0.97137451171875, -0.933837890625, -0.89630126953125, -0.8587646484375, -0.82122802734375, -0.78369140625, -0.74615478515625, -0.7086181640625, -0.67108154296875, -0.633544921875, -0.59600830078125, -0.5584716796875, -0.52093505859375, -0.4833984375, -0.44586181640625, -0.4083251953125, -0.37078857421875, -0.333251953125, -0.29571533203125, -0.2581787109375, -0.22064208984375, -0.18310546875, -0.14556884765625, -0.1080322265625, -0.07049560546875, -0.032958984375, 0.00457763671875, 0.0421142578125, 0.07965087890625, 0.1171875, 0.15472412109375, 0.1922607421875, 0.22979736328125, 0.267333984375, 0.30487060546875, 0.3424072265625, 0.37994384765625, 0.41748046875, 0.45501708984375, 0.4925537109375, 0.53009033203125, 0.567626953125, 0.60516357421875, 0.6427001953125, 0.68023681640625, 0.7177734375, 0.75531005859375, 0.7928466796875, 0.83038330078125, 0.867919921875, 0.90545654296875, 0.9429931640625, 0.98052978515625, 1.01806640625, 1.05560302734375, 1.0931396484375, 1.13067626953125, 1.168212890625, 1.20574951171875, 1.2432861328125, 1.28082275390625, 1.318359375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 8.0, 19.0, 34.0, 33.0, 86.0, 136.0, 178.0, 145.0, 125.0, 95.0, 68.0, 37.0, 17.0, 13.0, 7.0, 3.0, 4.0, 2.0], "bins": [-11.495306968688965, -11.279047966003418, -11.062788963317871, -10.846529960632324, -10.630270957946777, -10.41401195526123, -10.197752952575684, -9.981493949890137, -9.76523494720459, -9.548975944519043, -9.332716941833496, -9.11645793914795, -8.900198936462402, -8.683939933776855, -8.467680931091309, -8.251421928405762, -8.035163879394531, -7.818904876708984, -7.6026458740234375, -7.386386871337891, -7.170127868652344, -6.953868865966797, -6.73760986328125, -6.521350860595703, -6.305091857910156, -6.088832855224609, -5.8725738525390625, -5.656314849853516, -5.440055847167969, -5.223796844482422, -5.007537841796875, -4.791278839111328, -4.575019836425781, -4.358760833740234, -4.1425018310546875, -3.9262428283691406, -3.7099838256835938, -3.493724822998047, -3.277466058731079, -3.0612070560455322, -2.8449482917785645, -2.6286892890930176, -2.4124302864074707, -2.196171283721924, -1.9799124002456665, -1.7636533975601196, -1.5473945140838623, -1.3311355113983154, -1.1148765087127686, -0.8986175060272217, -0.6823585629463196, -0.4660996198654175, -0.2498406171798706, -0.03358161449432373, 0.1826772689819336, 0.39893627166748047, 0.6151952743530273, 0.8314542770385742, 1.047713279724121, 1.2639721632003784, 1.4802311658859253, 1.6964901685714722, 1.9127490520477295, 2.1290080547332764, 2.3452670574188232]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 8.0, 8.0, 17.0, 17.0, 21.0, 23.0, 25.0, 37.0, 26.0, 47.0, 52.0, 53.0, 66.0, 55.0, 83.0, 73.0, 73.0, 46.0, 39.0, 48.0, 40.0, 31.0, 31.0, 29.0, 16.0, 13.0, 10.0, 13.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.450479745864868, -3.341418504714966, -3.2323570251464844, -3.123295783996582, -3.0142343044281006, -2.9051730632781982, -2.796111583709717, -2.6870503425598145, -2.577988862991333, -2.4689276218414307, -2.359866142272949, -2.250804901123047, -2.1417434215545654, -2.032682180404663, -1.9236207008361816, -1.8145594596862793, -1.7054980993270874, -1.5964367389678955, -1.4873753786087036, -1.3783140182495117, -1.2692526578903198, -1.160191297531128, -1.0511300563812256, -0.9420686364173889, -0.833007276058197, -0.7239459156990051, -0.6148845553398132, -0.5058232545852661, -0.39676186442375183, -0.2877005338668823, -0.17863917350769043, -0.06957781314849854, 0.03948354721069336, 0.14854490756988525, 0.25760626792907715, 0.36666759848594666, 0.47572895884513855, 0.5847902894020081, 0.6938516497612, 0.8029130101203918, 0.9119743704795837, 1.0210356712341309, 1.1300970315933228, 1.2391583919525146, 1.3482197523117065, 1.4572811126708984, 1.5663424730300903, 1.6754038333892822, 1.7844651937484741, 1.893526554107666, 2.0025877952575684, 2.11164927482605, 2.220710515975952, 2.3297719955444336, 2.438833236694336, 2.5478947162628174, 2.6569559574127197, 2.766017198562622, 2.8750786781311035, 2.984139919281006, 3.0932013988494873, 3.2022626399993896, 3.311324119567871, 3.4203853607177734, 3.529446840286255]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 4.0, 11.0, 25.0, 31.0, 31.0, 72.0, 125.0, 212.0, 337.0, 695.0, 1305.0, 2523.0, 5495.0, 12619.0, 32359.0, 86453.0, 226955.0, 377775.0, 185391.0, 70039.0, 26149.0, 10451.0, 4659.0, 2274.0, 1192.0, 622.0, 296.0, 190.0, 104.0, 57.0, 37.0, 20.0, 17.0, 8.0, 6.0, 6.0, 3.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2705078125, -1.2335662841796875, -1.196624755859375, -1.1596832275390625, -1.12274169921875, -1.0858001708984375, -1.048858642578125, -1.0119171142578125, -0.9749755859375, -0.9380340576171875, -0.901092529296875, -0.8641510009765625, -0.82720947265625, -0.7902679443359375, -0.753326416015625, -0.7163848876953125, -0.679443359375, -0.6425018310546875, -0.605560302734375, -0.5686187744140625, -0.53167724609375, -0.4947357177734375, -0.457794189453125, -0.4208526611328125, -0.3839111328125, -0.3469696044921875, -0.310028076171875, -0.2730865478515625, -0.23614501953125, -0.1992034912109375, -0.162261962890625, -0.1253204345703125, -0.08837890625, -0.0514373779296875, -0.014495849609375, 0.0224456787109375, 0.05938720703125, 0.0963287353515625, 0.133270263671875, 0.1702117919921875, 0.2071533203125, 0.2440948486328125, 0.281036376953125, 0.3179779052734375, 0.35491943359375, 0.3918609619140625, 0.428802490234375, 0.4657440185546875, 0.502685546875, 0.5396270751953125, 0.576568603515625, 0.6135101318359375, 0.65045166015625, 0.6873931884765625, 0.724334716796875, 0.7612762451171875, 0.7982177734375, 0.8351593017578125, 0.872100830078125, 0.9090423583984375, 0.94598388671875, 0.9829254150390625, 1.019866943359375, 1.0568084716796875, 1.09375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 5.0, 6.0, 19.0, 27.0, 14.0, 30.0, 27.0, 33.0, 43.0, 52.0, 68.0, 80.0, 74.0, 70.0, 74.0, 67.0, 61.0, 50.0, 42.0, 45.0, 24.0, 28.0, 17.0, 21.0, 13.0, 7.0, 1.0, 4.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.220703125, -2.139556884765625, -2.05841064453125, -1.977264404296875, -1.8961181640625, -1.814971923828125, -1.73382568359375, -1.652679443359375, -1.571533203125, -1.490386962890625, -1.40924072265625, -1.328094482421875, -1.2469482421875, -1.165802001953125, -1.08465576171875, -1.003509521484375, -0.92236328125, -0.841217041015625, -0.76007080078125, -0.678924560546875, -0.5977783203125, -0.516632080078125, -0.43548583984375, -0.354339599609375, -0.273193359375, -0.192047119140625, -0.11090087890625, -0.029754638671875, 0.0513916015625, 0.132537841796875, 0.21368408203125, 0.294830322265625, 0.3759765625, 0.457122802734375, 0.53826904296875, 0.619415283203125, 0.7005615234375, 0.781707763671875, 0.86285400390625, 0.944000244140625, 1.025146484375, 1.106292724609375, 1.18743896484375, 1.268585205078125, 1.3497314453125, 1.430877685546875, 1.51202392578125, 1.593170166015625, 1.67431640625, 1.755462646484375, 1.83660888671875, 1.917755126953125, 1.9989013671875, 2.080047607421875, 2.16119384765625, 2.242340087890625, 2.323486328125, 2.404632568359375, 2.48577880859375, 2.566925048828125, 2.6480712890625, 2.729217529296875, 2.81036376953125, 2.891510009765625, 2.97265625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 7.0, 3.0, 5.0, 4.0, 10.0, 15.0, 18.0, 19.0, 31.0, 40.0, 44.0, 75.0, 95.0, 202.0, 251.0, 454.0, 860.0, 1716.0, 4037.0, 11517.0, 40840.0, 177868.0, 536123.0, 205824.0, 47040.0, 12914.0, 4439.0, 1850.0, 857.0, 521.0, 285.0, 183.0, 116.0, 84.0, 46.0, 36.0, 34.0, 26.0, 26.0, 9.0, 6.0, 8.0, 5.0, 5.0, 4.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.3779296875, -1.33685302734375, -1.2957763671875, -1.25469970703125, -1.213623046875, -1.17254638671875, -1.1314697265625, -1.09039306640625, -1.04931640625, -1.00823974609375, -0.9671630859375, -0.92608642578125, -0.885009765625, -0.84393310546875, -0.8028564453125, -0.76177978515625, -0.720703125, -0.67962646484375, -0.6385498046875, -0.59747314453125, -0.556396484375, -0.51531982421875, -0.4742431640625, -0.43316650390625, -0.39208984375, -0.35101318359375, -0.3099365234375, -0.26885986328125, -0.227783203125, -0.18670654296875, -0.1456298828125, -0.10455322265625, -0.0634765625, -0.02239990234375, 0.0186767578125, 0.05975341796875, 0.100830078125, 0.14190673828125, 0.1829833984375, 0.22406005859375, 0.26513671875, 0.30621337890625, 0.3472900390625, 0.38836669921875, 0.429443359375, 0.47052001953125, 0.5115966796875, 0.55267333984375, 0.59375, 0.63482666015625, 0.6759033203125, 0.71697998046875, 0.758056640625, 0.79913330078125, 0.8402099609375, 0.88128662109375, 0.92236328125, 0.96343994140625, 1.0045166015625, 1.04559326171875, 1.086669921875, 1.12774658203125, 1.1688232421875, 1.20989990234375, 1.2509765625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 4.0, 7.0, 3.0, 6.0, 4.0, 5.0, 5.0, 15.0, 14.0, 17.0, 13.0, 21.0, 24.0, 28.0, 33.0, 35.0, 39.0, 33.0, 48.0, 36.0, 54.0, 39.0, 45.0, 35.0, 46.0, 40.0, 38.0, 35.0, 40.0, 32.0, 30.0, 21.0, 24.0, 29.0, 20.0, 13.0, 13.0, 14.0, 9.0, 8.0, 9.0, 3.0, 6.0, 4.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.001953125, -2.90283203125, -2.8037109375, -2.70458984375, -2.60546875, -2.50634765625, -2.4072265625, -2.30810546875, -2.208984375, -2.10986328125, -2.0107421875, -1.91162109375, -1.8125, -1.71337890625, -1.6142578125, -1.51513671875, -1.416015625, -1.31689453125, -1.2177734375, -1.11865234375, -1.01953125, -0.92041015625, -0.8212890625, -0.72216796875, -0.623046875, -0.52392578125, -0.4248046875, -0.32568359375, -0.2265625, -0.12744140625, -0.0283203125, 0.07080078125, 0.169921875, 0.26904296875, 0.3681640625, 0.46728515625, 0.56640625, 0.66552734375, 0.7646484375, 0.86376953125, 0.962890625, 1.06201171875, 1.1611328125, 1.26025390625, 1.359375, 1.45849609375, 1.5576171875, 1.65673828125, 1.755859375, 1.85498046875, 1.9541015625, 2.05322265625, 2.15234375, 2.25146484375, 2.3505859375, 2.44970703125, 2.548828125, 2.64794921875, 2.7470703125, 2.84619140625, 2.9453125, 3.04443359375, 3.1435546875, 3.24267578125, 3.341796875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 3.0, 6.0, 6.0, 12.0, 20.0, 26.0, 42.0, 52.0, 117.0, 135.0, 249.0, 412.0, 691.0, 1388.0, 2788.0, 6033.0, 16358.0, 57628.0, 300299.0, 514160.0, 105442.0, 25801.0, 8956.0, 3858.0, 1813.0, 915.0, 549.0, 297.0, 162.0, 113.0, 71.0, 57.0, 38.0, 21.0, 14.0, 8.0, 7.0, 7.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5087890625, -0.491363525390625, -0.47393798828125, -0.456512451171875, -0.4390869140625, -0.421661376953125, -0.40423583984375, -0.386810302734375, -0.369384765625, -0.351959228515625, -0.33453369140625, -0.317108154296875, -0.2996826171875, -0.282257080078125, -0.26483154296875, -0.247406005859375, -0.22998046875, -0.212554931640625, -0.19512939453125, -0.177703857421875, -0.1602783203125, -0.142852783203125, -0.12542724609375, -0.108001708984375, -0.090576171875, -0.073150634765625, -0.05572509765625, -0.038299560546875, -0.0208740234375, -0.003448486328125, 0.01397705078125, 0.031402587890625, 0.048828125, 0.066253662109375, 0.08367919921875, 0.101104736328125, 0.1185302734375, 0.135955810546875, 0.15338134765625, 0.170806884765625, 0.188232421875, 0.205657958984375, 0.22308349609375, 0.240509033203125, 0.2579345703125, 0.275360107421875, 0.29278564453125, 0.310211181640625, 0.32763671875, 0.345062255859375, 0.36248779296875, 0.379913330078125, 0.3973388671875, 0.414764404296875, 0.43218994140625, 0.449615478515625, 0.467041015625, 0.484466552734375, 0.50189208984375, 0.519317626953125, 0.5367431640625, 0.554168701171875, 0.57159423828125, 0.589019775390625, 0.6064453125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 6.0, 12.0, 12.0, 26.0, 32.0, 61.0, 94.0, 165.0, 180.0, 163.0, 92.0, 65.0, 32.0, 26.0, 9.0, 6.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0005164146423339844, -0.000498257577419281, -0.00048010051250457764, -0.00046194344758987427, -0.0004437863826751709, -0.00042562931776046753, -0.00040747225284576416, -0.0003893151879310608, -0.0003711581230163574, -0.00035300105810165405, -0.0003348439931869507, -0.0003166869282722473, -0.00029852986335754395, -0.0002803727984428406, -0.0002622157335281372, -0.00024405866861343384, -0.00022590160369873047, -0.0002077445387840271, -0.00018958747386932373, -0.00017143040895462036, -0.000153273344039917, -0.00013511627912521362, -0.00011695921421051025, -9.880214929580688e-05, -8.064508438110352e-05, -6.248801946640015e-05, -4.433095455169678e-05, -2.6173889636993408e-05, -8.016824722290039e-06, 1.014024019241333e-05, 2.82973051071167e-05, 4.645437002182007e-05, 6.461143493652344e-05, 8.27684998512268e-05, 0.00010092556476593018, 0.00011908262968063354, 0.00013723969459533691, 0.00015539675951004028, 0.00017355382442474365, 0.00019171088933944702, 0.0002098679542541504, 0.00022802501916885376, 0.00024618208408355713, 0.0002643391489982605, 0.00028249621391296387, 0.00030065327882766724, 0.0003188103437423706, 0.000336967408657074, 0.00035512447357177734, 0.0003732815384864807, 0.0003914386034011841, 0.00040959566831588745, 0.0004277527332305908, 0.0004459097981452942, 0.00046406686305999756, 0.00048222392797470093, 0.0005003809928894043, 0.0005185380578041077, 0.000536695122718811, 0.0005548521876335144, 0.0005730092525482178, 0.0005911663174629211, 0.0006093233823776245, 0.0006274804472923279, 0.0006456375122070312]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 4.0, 5.0, 3.0, 5.0, 6.0, 21.0, 36.0, 75.0, 313.0, 28583.0, 1017246.0, 1994.0, 133.0, 38.0, 35.0, 8.0, 5.0, 8.0, 4.0, 4.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.849609375, -3.722503662109375, -3.59539794921875, -3.468292236328125, -3.3411865234375, -3.214080810546875, -3.08697509765625, -2.959869384765625, -2.832763671875, -2.705657958984375, -2.57855224609375, -2.451446533203125, -2.3243408203125, -2.197235107421875, -2.07012939453125, -1.943023681640625, -1.81591796875, -1.688812255859375, -1.56170654296875, -1.434600830078125, -1.3074951171875, -1.180389404296875, -1.05328369140625, -0.926177978515625, -0.799072265625, -0.671966552734375, -0.54486083984375, -0.417755126953125, -0.2906494140625, -0.163543701171875, -0.03643798828125, 0.090667724609375, 0.2177734375, 0.344879150390625, 0.47198486328125, 0.599090576171875, 0.7261962890625, 0.853302001953125, 0.98040771484375, 1.107513427734375, 1.234619140625, 1.361724853515625, 1.48883056640625, 1.615936279296875, 1.7430419921875, 1.870147705078125, 1.99725341796875, 2.124359130859375, 2.25146484375, 2.378570556640625, 2.50567626953125, 2.632781982421875, 2.7598876953125, 2.886993408203125, 3.01409912109375, 3.141204833984375, 3.268310546875, 3.395416259765625, 3.52252197265625, 3.649627685546875, 3.7767333984375, 3.903839111328125, 4.03094482421875, 4.158050537109375, 4.28515625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 1.0, 1.0, 6.0, 7.0, 1.0, 3.0, 3.0, 5.0, 8.0, 9.0, 13.0, 12.0, 23.0, 24.0, 33.0, 34.0, 52.0, 45.0, 79.0, 74.0, 81.0, 83.0, 62.0, 62.0, 64.0, 45.0, 34.0, 28.0, 17.0, 22.0, 16.0, 11.0, 6.0, 11.0, 5.0, 5.0, 3.0, 4.0, 1.0, 3.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1431884765625, -0.13840293884277344, -0.13361740112304688, -0.1288318634033203, -0.12404632568359375, -0.11926078796386719, -0.11447525024414062, -0.10968971252441406, -0.1049041748046875, -0.10011863708496094, -0.09533309936523438, -0.09054756164550781, -0.08576202392578125, -0.08097648620605469, -0.07619094848632812, -0.07140541076660156, -0.066619873046875, -0.06183433532714844, -0.057048797607421875, -0.05226325988769531, -0.04747772216796875, -0.04269218444824219, -0.037906646728515625, -0.03312110900878906, -0.0283355712890625, -0.023550033569335938, -0.018764495849609375, -0.013978958129882812, -0.00919342041015625, -0.0044078826904296875, 0.000377655029296875, 0.0051631927490234375, 0.00994873046875, 0.014734268188476562, 0.019519805908203125, 0.024305343627929688, 0.02909088134765625, 0.03387641906738281, 0.038661956787109375, 0.04344749450683594, 0.0482330322265625, 0.05301856994628906, 0.057804107666015625, 0.06258964538574219, 0.06737518310546875, 0.07216072082519531, 0.07694625854492188, 0.08173179626464844, 0.086517333984375, 0.09130287170410156, 0.09608840942382812, 0.10087394714355469, 0.10565948486328125, 0.11044502258300781, 0.11523056030273438, 0.12001609802246094, 0.1248016357421875, 0.12958717346191406, 0.13437271118164062, 0.1391582489013672, 0.14394378662109375, 0.1487293243408203, 0.15351486206054688, 0.15830039978027344, 0.1630859375]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 6.0, 9.0, 33.0, 74.0, 130.0, 202.0, 259.0, 143.0, 61.0, 45.0, 19.0, 9.0, 9.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.1501359939575195, -6.976284980773926, -6.802433490753174, -6.628582000732422, -6.454730987548828, -6.280879974365234, -6.107028484344482, -5.9331769943237305, -5.759325981140137, -5.585474967956543, -5.411623477935791, -5.237771987915039, -5.063920974731445, -4.890069961547852, -4.7162184715271, -4.542366981506348, -4.368515968322754, -4.19466495513916, -4.020813465118408, -3.8469622135162354, -3.6731109619140625, -3.4992597103118896, -3.325408458709717, -3.151557207107544, -2.977705955505371, -2.8038547039031982, -2.6300034523010254, -2.4561522006988525, -2.2823009490966797, -2.108449697494507, -1.934598445892334, -1.7607471942901611, -1.5868961811065674, -1.4130449295043945, -1.2391936779022217, -1.0653424263000488, -0.891491174697876, -0.7176399230957031, -0.5437886714935303, -0.3699374198913574, -0.19608616828918457, -0.02223491668701172, 0.15161633491516113, 0.325467586517334, 0.49931883811950684, 0.6731700897216797, 0.8470213413238525, 1.0208725929260254, 1.1947238445281982, 1.368575096130371, 1.542426347732544, 1.7162775993347168, 1.8901288509368896, 2.0639801025390625, 2.2378313541412354, 2.411682605743408, 2.585533857345581, 2.759385108947754, 2.9332363605499268, 3.1070876121520996, 3.2809388637542725, 3.4547901153564453, 3.628641366958618, 3.802492618560791, 3.976343870162964]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 9.0, 3.0, 11.0, 9.0, 24.0, 27.0, 30.0, 25.0, 45.0, 48.0, 53.0, 61.0, 61.0, 83.0, 91.0, 65.0, 46.0, 64.0, 64.0, 38.0, 30.0, 34.0, 24.0, 22.0, 14.0, 7.0, 11.0, 3.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.413825511932373, -2.331449270248413, -2.2490732669830322, -2.1666970252990723, -2.0843210220336914, -2.0019447803497314, -1.919568657875061, -1.8371925354003906, -1.7548162937164307, -1.6724401712417603, -1.5900640487670898, -1.5076878070831299, -1.4253116846084595, -1.342935562133789, -1.2605594396591187, -1.1781833171844482, -1.0958071947097778, -1.0134310722351074, -0.9310548901557922, -0.8486787676811218, -0.7663025856018066, -0.6839264631271362, -0.6015503406524658, -0.5191741585731506, -0.4367980360984802, -0.3544218838214874, -0.27204573154449463, -0.18966960906982422, -0.10729345679283142, -0.024917304515838623, 0.05745881795883179, 0.13983500003814697, 0.22221112251281738, 0.3045872747898102, 0.386963427066803, 0.4693395495414734, 0.5517157316207886, 0.634091854095459, 0.7164679765701294, 0.7988441586494446, 0.881220281124115, 0.9635964035987854, 1.0459725856781006, 1.128348708152771, 1.2107248306274414, 1.2931010723114014, 1.3754770755767822, 1.4578533172607422, 1.5402294397354126, 1.622605562210083, 1.7049816846847534, 1.7873578071594238, 1.8697340488433838, 1.9521101713180542, 2.0344862937927246, 2.1168625354766846, 2.1992385387420654, 2.2816147804260254, 2.3639907836914062, 2.446367025375366, 2.528743028640747, 2.611119270324707, 2.693495273590088, 2.775871515274048, 2.858247756958008]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 7.0, 4.0, 13.0, 18.0, 19.0, 28.0, 49.0, 91.0, 183.0, 357.0, 710.0, 1272.0, 2684.0, 5716.0, 13061.0, 34654.0, 111573.0, 459299.0, 302297.0, 73079.0, 24782.0, 9849.0, 4382.0, 2109.0, 1068.0, 614.0, 264.0, 145.0, 89.0, 50.0, 29.0, 14.0, 12.0, 11.0, 7.0, 4.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.65625, -1.60870361328125, -1.5611572265625, -1.51361083984375, -1.466064453125, -1.41851806640625, -1.3709716796875, -1.32342529296875, -1.27587890625, -1.22833251953125, -1.1807861328125, -1.13323974609375, -1.085693359375, -1.03814697265625, -0.9906005859375, -0.94305419921875, -0.8955078125, -0.84796142578125, -0.8004150390625, -0.75286865234375, -0.705322265625, -0.65777587890625, -0.6102294921875, -0.56268310546875, -0.51513671875, -0.46759033203125, -0.4200439453125, -0.37249755859375, -0.324951171875, -0.27740478515625, -0.2298583984375, -0.18231201171875, -0.134765625, -0.08721923828125, -0.0396728515625, 0.00787353515625, 0.055419921875, 0.10296630859375, 0.1505126953125, 0.19805908203125, 0.24560546875, 0.29315185546875, 0.3406982421875, 0.38824462890625, 0.435791015625, 0.48333740234375, 0.5308837890625, 0.57843017578125, 0.6259765625, 0.67352294921875, 0.7210693359375, 0.76861572265625, 0.816162109375, 0.86370849609375, 0.9112548828125, 0.95880126953125, 1.00634765625, 1.05389404296875, 1.1014404296875, 1.14898681640625, 1.196533203125, 1.24407958984375, 1.2916259765625, 1.33917236328125, 1.38671875]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [5.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 4.0, 5.0, 13.0, 17.0, 20.0, 11.0, 31.0, 27.0, 24.0, 29.0, 24.0, 30.0, 41.0, 47.0, 40.0, 47.0, 42.0, 38.0, 45.0, 39.0, 44.0, 41.0, 41.0, 33.0, 42.0, 31.0, 27.0, 33.0, 21.0, 19.0, 21.0, 16.0, 13.0, 8.0, 4.0, 9.0, 6.0, 2.0, 8.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.21875, -4.05718994140625, -3.8956298828125, -3.73406982421875, -3.572509765625, -3.41094970703125, -3.2493896484375, -3.08782958984375, -2.92626953125, -2.76470947265625, -2.6031494140625, -2.44158935546875, -2.280029296875, -2.11846923828125, -1.9569091796875, -1.79534912109375, -1.6337890625, -1.47222900390625, -1.3106689453125, -1.14910888671875, -0.987548828125, -0.82598876953125, -0.6644287109375, -0.50286865234375, -0.34130859375, -0.17974853515625, -0.0181884765625, 0.14337158203125, 0.304931640625, 0.46649169921875, 0.6280517578125, 0.78961181640625, 0.951171875, 1.11273193359375, 1.2742919921875, 1.43585205078125, 1.597412109375, 1.75897216796875, 1.9205322265625, 2.08209228515625, 2.24365234375, 2.40521240234375, 2.5667724609375, 2.72833251953125, 2.889892578125, 3.05145263671875, 3.2130126953125, 3.37457275390625, 3.5361328125, 3.69769287109375, 3.8592529296875, 4.02081298828125, 4.182373046875, 4.34393310546875, 4.5054931640625, 4.66705322265625, 4.82861328125, 4.99017333984375, 5.1517333984375, 5.31329345703125, 5.474853515625, 5.63641357421875, 5.7979736328125, 5.95953369140625, 6.12109375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 2.0, 3.0, 6.0, 7.0, 12.0, 27.0, 46.0, 77.0, 174.0, 870.0, 1046940.0, 166.0, 107.0, 54.0, 20.0, 21.0, 5.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.8125, -85.166015625, -82.51953125, -79.873046875, -77.2265625, -74.580078125, -71.93359375, -69.287109375, -66.640625, -63.994140625, -61.34765625, -58.701171875, -56.0546875, -53.408203125, -50.76171875, -48.115234375, -45.46875, -42.822265625, -40.17578125, -37.529296875, -34.8828125, -32.236328125, -29.58984375, -26.943359375, -24.296875, -21.650390625, -19.00390625, -16.357421875, -13.7109375, -11.064453125, -8.41796875, -5.771484375, -3.125, -0.478515625, 2.16796875, 4.814453125, 7.4609375, 10.107421875, 12.75390625, 15.400390625, 18.046875, 20.693359375, 23.33984375, 25.986328125, 28.6328125, 31.279296875, 33.92578125, 36.572265625, 39.21875, 41.865234375, 44.51171875, 47.158203125, 49.8046875, 52.451171875, 55.09765625, 57.744140625, 60.390625, 63.037109375, 65.68359375, 68.330078125, 70.9765625, 73.623046875, 76.26953125, 78.916015625, 81.5625]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 2.0, 3.0, 6.0, 7.0, 13.0, 28.0, 48.0, 79.0, 141.0, 167.0, 160.0, 125.0, 106.0, 48.0, 25.0, 22.0, 5.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.765625, -24.989013671875, -24.21240234375, -23.435791015625, -22.6591796875, -21.882568359375, -21.10595703125, -20.329345703125, -19.552734375, -18.776123046875, -17.99951171875, -17.222900390625, -16.4462890625, -15.669677734375, -14.89306640625, -14.116455078125, -13.33984375, -12.563232421875, -11.78662109375, -11.010009765625, -10.2333984375, -9.456787109375, -8.68017578125, -7.903564453125, -7.126953125, -6.350341796875, -5.57373046875, -4.797119140625, -4.0205078125, -3.243896484375, -2.46728515625, -1.690673828125, -0.9140625, -0.137451171875, 0.63916015625, 1.415771484375, 2.1923828125, 2.968994140625, 3.74560546875, 4.522216796875, 5.298828125, 6.075439453125, 6.85205078125, 7.628662109375, 8.4052734375, 9.181884765625, 9.95849609375, 10.735107421875, 11.51171875, 12.288330078125, 13.06494140625, 13.841552734375, 14.6181640625, 15.394775390625, 16.17138671875, 16.947998046875, 17.724609375, 18.501220703125, 19.27783203125, 20.054443359375, 20.8310546875, 21.607666015625, 22.38427734375, 23.160888671875, 23.9375]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 7.0, 5.0, 6.0, 8.0, 13.0, 23.0, 20.0, 39.0, 65.0, 112.0, 266.0, 1193.0, 10580.0, 729627.0, 297675.0, 7445.0, 947.0, 231.0, 112.0, 59.0, 29.0, 20.0, 16.0, 11.0, 6.0, 5.0, 6.0, 4.0, 5.0, 6.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3447265625, -1.2998046875, -1.2548828125, -1.2099609375, -1.1650390625, -1.1201171875, -1.0751953125, -1.0302734375, -0.9853515625, -0.9404296875, -0.8955078125, -0.8505859375, -0.8056640625, -0.7607421875, -0.7158203125, -0.6708984375, -0.6259765625, -0.5810546875, -0.5361328125, -0.4912109375, -0.4462890625, -0.4013671875, -0.3564453125, -0.3115234375, -0.2666015625, -0.2216796875, -0.1767578125, -0.1318359375, -0.0869140625, -0.0419921875, 0.0029296875, 0.0478515625, 0.0927734375, 0.1376953125, 0.1826171875, 0.2275390625, 0.2724609375, 0.3173828125, 0.3623046875, 0.4072265625, 0.4521484375, 0.4970703125, 0.5419921875, 0.5869140625, 0.6318359375, 0.6767578125, 0.7216796875, 0.7666015625, 0.8115234375, 0.8564453125, 0.9013671875, 0.9462890625, 0.9912109375, 1.0361328125, 1.0810546875, 1.1259765625, 1.1708984375, 1.2158203125, 1.2607421875, 1.3056640625, 1.3505859375, 1.3955078125, 1.4404296875, 1.4853515625, 1.5302734375]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 6.0, 7.0, 9.0, 18.0, 23.0, 49.0, 87.0, 196.0, 275.0, 161.0, 92.0, 37.0, 19.0, 13.0, 5.0, 4.0, 2.0, 1.0, 0.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.912252426147461e-05, -9.371433407068253e-05, -8.830614387989044e-05, -8.289795368909836e-05, -7.748976349830627e-05, -7.208157330751419e-05, -6.667338311672211e-05, -6.126519292593002e-05, -5.585700273513794e-05, -5.0448812544345856e-05, -4.504062235355377e-05, -3.963243216276169e-05, -3.4224241971969604e-05, -2.881605178117752e-05, -2.3407861590385437e-05, -1.7999671399593353e-05, -1.259148120880127e-05, -7.183291018009186e-06, -1.775100827217102e-06, 3.6330893635749817e-06, 9.041279554367065e-06, 1.444946974515915e-05, 1.9857659935951233e-05, 2.5265850126743317e-05, 3.06740403175354e-05, 3.6082230508327484e-05, 4.149042069911957e-05, 4.689861088991165e-05, 5.2306801080703735e-05, 5.771499127149582e-05, 6.31231814622879e-05, 6.853137165307999e-05, 7.393956184387207e-05, 7.934775203466415e-05, 8.475594222545624e-05, 9.016413241624832e-05, 9.55723226070404e-05, 0.00010098051279783249, 0.00010638870298862457, 0.00011179689317941666, 0.00011720508337020874, 0.00012261327356100082, 0.0001280214637517929, 0.000133429653942585, 0.00013883784413337708, 0.00014424603432416916, 0.00014965422451496124, 0.00015506241470575333, 0.0001604706048965454, 0.0001658787950873375, 0.00017128698527812958, 0.00017669517546892166, 0.00018210336565971375, 0.00018751155585050583, 0.0001929197460412979, 0.00019832793623209, 0.00020373612642288208, 0.00020914431661367416, 0.00021455250680446625, 0.00021996069699525833, 0.00022536888718605042, 0.0002307770773768425, 0.00023618526756763458, 0.00024159345775842667, 0.00024700164794921875]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 3.0, 3.0, 6.0, 11.0, 21.0, 31.0, 47.0, 130.0, 609.0, 10831.0, 975372.0, 59746.0, 1370.0, 224.0, 84.0, 26.0, 11.0, 16.0, 5.0, 8.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8193359375, -1.7619171142578125, -1.704498291015625, -1.6470794677734375, -1.58966064453125, -1.5322418212890625, -1.474822998046875, -1.4174041748046875, -1.3599853515625, -1.3025665283203125, -1.245147705078125, -1.1877288818359375, -1.13031005859375, -1.0728912353515625, -1.015472412109375, -0.9580535888671875, -0.900634765625, -0.8432159423828125, -0.785797119140625, -0.7283782958984375, -0.67095947265625, -0.6135406494140625, -0.556121826171875, -0.4987030029296875, -0.4412841796875, -0.3838653564453125, -0.326446533203125, -0.2690277099609375, -0.21160888671875, -0.1541900634765625, -0.096771240234375, -0.0393524169921875, 0.01806640625, 0.0754852294921875, 0.132904052734375, 0.1903228759765625, 0.24774169921875, 0.3051605224609375, 0.362579345703125, 0.4199981689453125, 0.4774169921875, 0.5348358154296875, 0.592254638671875, 0.6496734619140625, 0.70709228515625, 0.7645111083984375, 0.821929931640625, 0.8793487548828125, 0.936767578125, 0.9941864013671875, 1.051605224609375, 1.1090240478515625, 1.16644287109375, 1.2238616943359375, 1.281280517578125, 1.3386993408203125, 1.3961181640625, 1.4535369873046875, 1.510955810546875, 1.5683746337890625, 1.62579345703125, 1.6832122802734375, 1.740631103515625, 1.7980499267578125, 1.85546875]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 8.0, 4.0, 14.0, 11.0, 14.0, 14.0, 20.0, 28.0, 32.0, 58.0, 68.0, 119.0, 215.0, 109.0, 81.0, 41.0, 40.0, 31.0, 24.0, 20.0, 11.0, 9.0, 10.0, 4.0, 1.0, 5.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.181640625, -0.17502784729003906, -0.16841506958007812, -0.1618022918701172, -0.15518951416015625, -0.1485767364501953, -0.14196395874023438, -0.13535118103027344, -0.1287384033203125, -0.12212562561035156, -0.11551284790039062, -0.10890007019042969, -0.10228729248046875, -0.09567451477050781, -0.08906173706054688, -0.08244895935058594, -0.075836181640625, -0.06922340393066406, -0.06261062622070312, -0.05599784851074219, -0.04938507080078125, -0.04277229309082031, -0.036159515380859375, -0.029546737670898438, -0.0229339599609375, -0.016321182250976562, -0.009708404541015625, -0.0030956268310546875, 0.00351715087890625, 0.010129928588867188, 0.016742706298828125, 0.023355484008789062, 0.02996826171875, 0.03658103942871094, 0.043193817138671875, 0.04980659484863281, 0.05641937255859375, 0.06303215026855469, 0.06964492797851562, 0.07625770568847656, 0.0828704833984375, 0.08948326110839844, 0.09609603881835938, 0.10270881652832031, 0.10932159423828125, 0.11593437194824219, 0.12254714965820312, 0.12915992736816406, 0.135772705078125, 0.14238548278808594, 0.14899826049804688, 0.1556110382080078, 0.16222381591796875, 0.1688365936279297, 0.17544937133789062, 0.18206214904785156, 0.1886749267578125, 0.19528770446777344, 0.20190048217773438, 0.2085132598876953, 0.21512603759765625, 0.2217388153076172, 0.22835159301757812, 0.23496437072753906, 0.2415771484375]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 152.0, 743.0, 113.0, 9.0], "bins": [-88.92949676513672, -87.48173522949219, -86.03398132324219, -84.58621978759766, -83.13846588134766, -81.69070434570312, -80.24295043945312, -78.7951889038086, -77.34742736816406, -75.89966583251953, -74.45191192626953, -73.004150390625, -71.556396484375, -70.10863494873047, -68.66087341308594, -67.21311950683594, -65.76536560058594, -64.3176040649414, -62.869850158691406, -61.422088623046875, -59.97433090209961, -58.526573181152344, -57.07881546020508, -55.63105773925781, -54.18329620361328, -52.735538482666016, -51.28778076171875, -49.84001922607422, -48.39226150512695, -46.94450378417969, -45.49674606323242, -44.048988342285156, -42.60123062133789, -41.153472900390625, -39.70571517944336, -38.257957458496094, -36.81019592285156, -35.3624382019043, -33.91468048095703, -32.466922760009766, -31.019163131713867, -29.5714054107666, -28.123645782470703, -26.675888061523438, -25.228130340576172, -23.780372619628906, -22.332612991333008, -20.884855270385742, -19.437095642089844, -17.989337921142578, -16.54157829284668, -15.093820571899414, -13.646062850952148, -12.198304176330566, -10.750545501708984, -9.302787780761719, -7.855030059814453, -6.407271862030029, -4.9595136642456055, -3.5117549896240234, -2.0639967918395996, -0.6162385940551758, 0.8315200805664062, 2.279277801513672, 3.727036714553833]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 4.0, 7.0, 5.0, 10.0, 19.0, 13.0, 18.0, 11.0, 21.0, 23.0, 23.0, 33.0, 32.0, 23.0, 52.0, 29.0, 42.0, 25.0, 45.0, 46.0, 52.0, 46.0, 51.0, 48.0, 38.0, 38.0, 33.0, 32.0, 29.0, 19.0, 22.0, 21.0, 16.0, 15.0, 15.0, 17.0, 8.0, 5.0, 3.0, 4.0, 2.0, 4.0, 5.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.628915786743164, -7.366003513336182, -7.103091716766357, -6.840179443359375, -6.577267169952393, -6.31435489654541, -6.051443099975586, -5.7885308265686035, -5.525618553161621, -5.262706279754639, -4.9997944831848145, -4.736882209777832, -4.47396993637085, -4.211057662963867, -3.948145866394043, -3.6852335929870605, -3.4223217964172363, -3.159409761428833, -2.8964974880218506, -2.6335854530334473, -2.370673179626465, -2.1077611446380615, -1.8448491096496582, -1.5819369554519653, -1.3190248012542725, -1.0561126470565796, -0.7932005524635315, -0.5302884578704834, -0.2673763036727905, -0.004464149475097656, 0.25844788551330566, 0.5213600397109985, 0.7842721939086914, 1.0471843481063843, 1.3100965023040771, 1.5730085372924805, 1.8359206914901733, 2.098832845687866, 2.3617448806762695, 2.624657154083252, 2.8875691890716553, 3.1504812240600586, 3.413393497467041, 3.6763055324554443, 3.9392175674438477, 4.20212984085083, 4.4650421142578125, 4.727953910827637, 4.990866184234619, 5.253778457641602, 5.516690254211426, 5.779602527618408, 6.042514801025391, 6.305426597595215, 6.568338871002197, 6.83125114440918, 7.094162940979004, 7.357075214385986, 7.6199870109558105, 7.882899284362793, 8.145811080932617, 8.408723831176758, 8.671635627746582, 8.934547424316406, 9.197460174560547]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 6.0, 9.0, 7.0, 12.0, 10.0, 8.0, 21.0, 20.0, 14.0, 27.0, 23.0, 26.0, 51.0, 83.0, 131.0, 303.0, 860.0, 3260.0, 18613.0, 255490.0, 3616158.0, 274277.0, 19615.0, 3662.0, 924.0, 261.0, 110.0, 68.0, 41.0, 43.0, 25.0, 27.0, 14.0, 16.0, 17.0, 14.0, 7.0, 8.0, 7.0, 4.0, 5.0, 7.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.26953125, -5.102294921875, -4.93505859375, -4.767822265625, -4.6005859375, -4.433349609375, -4.26611328125, -4.098876953125, -3.931640625, -3.764404296875, -3.59716796875, -3.429931640625, -3.2626953125, -3.095458984375, -2.92822265625, -2.760986328125, -2.59375, -2.426513671875, -2.25927734375, -2.092041015625, -1.9248046875, -1.757568359375, -1.59033203125, -1.423095703125, -1.255859375, -1.088623046875, -0.92138671875, -0.754150390625, -0.5869140625, -0.419677734375, -0.25244140625, -0.085205078125, 0.08203125, 0.249267578125, 0.41650390625, 0.583740234375, 0.7509765625, 0.918212890625, 1.08544921875, 1.252685546875, 1.419921875, 1.587158203125, 1.75439453125, 1.921630859375, 2.0888671875, 2.256103515625, 2.42333984375, 2.590576171875, 2.7578125, 2.925048828125, 3.09228515625, 3.259521484375, 3.4267578125, 3.593994140625, 3.76123046875, 3.928466796875, 4.095703125, 4.262939453125, 4.43017578125, 4.597412109375, 4.7646484375, 4.931884765625, 5.09912109375, 5.266357421875, 5.43359375]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 9.0, 7.0, 13.0, 9.0, 15.0, 20.0, 32.0, 36.0, 49.0, 49.0, 61.0, 64.0, 81.0, 87.0, 83.0, 80.0, 63.0, 44.0, 52.0, 44.0, 30.0, 19.0, 15.0, 18.0, 10.0, 7.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.27734375, -3.1876220703125, -3.097900390625, -3.0081787109375, -2.91845703125, -2.8287353515625, -2.739013671875, -2.6492919921875, -2.5595703125, -2.4698486328125, -2.380126953125, -2.2904052734375, -2.20068359375, -2.1109619140625, -2.021240234375, -1.9315185546875, -1.841796875, -1.7520751953125, -1.662353515625, -1.5726318359375, -1.48291015625, -1.3931884765625, -1.303466796875, -1.2137451171875, -1.1240234375, -1.0343017578125, -0.944580078125, -0.8548583984375, -0.76513671875, -0.6754150390625, -0.585693359375, -0.4959716796875, -0.40625, -0.3165283203125, -0.226806640625, -0.1370849609375, -0.04736328125, 0.0423583984375, 0.132080078125, 0.2218017578125, 0.3115234375, 0.4012451171875, 0.490966796875, 0.5806884765625, 0.67041015625, 0.7601318359375, 0.849853515625, 0.9395751953125, 1.029296875, 1.1190185546875, 1.208740234375, 1.2984619140625, 1.38818359375, 1.4779052734375, 1.567626953125, 1.6573486328125, 1.7470703125, 1.8367919921875, 1.926513671875, 2.0162353515625, 2.10595703125, 2.1956787109375, 2.285400390625, 2.3751220703125, 2.46484375]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 0.0, 3.0, 7.0, 5.0, 2.0, 11.0, 13.0, 52.0, 304.0, 154433.0, 4038917.0, 426.0, 79.0, 14.0, 11.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.3125, -39.25390625, -38.1953125, -37.13671875, -36.078125, -35.01953125, -33.9609375, -32.90234375, -31.84375, -30.78515625, -29.7265625, -28.66796875, -27.609375, -26.55078125, -25.4921875, -24.43359375, -23.375, -22.31640625, -21.2578125, -20.19921875, -19.140625, -18.08203125, -17.0234375, -15.96484375, -14.90625, -13.84765625, -12.7890625, -11.73046875, -10.671875, -9.61328125, -8.5546875, -7.49609375, -6.4375, -5.37890625, -4.3203125, -3.26171875, -2.203125, -1.14453125, -0.0859375, 0.97265625, 2.03125, 3.08984375, 4.1484375, 5.20703125, 6.265625, 7.32421875, 8.3828125, 9.44140625, 10.5, 11.55859375, 12.6171875, 13.67578125, 14.734375, 15.79296875, 16.8515625, 17.91015625, 18.96875, 20.02734375, 21.0859375, 22.14453125, 23.203125, 24.26171875, 25.3203125, 26.37890625, 27.4375]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 6.0, 5.0, 5.0, 8.0, 11.0, 15.0, 14.0, 26.0, 23.0, 43.0, 43.0, 55.0, 91.0, 105.0, 156.0, 273.0, 359.0, 558.0, 640.0, 533.0, 343.0, 205.0, 167.0, 111.0, 70.0, 47.0, 33.0, 40.0, 22.0, 19.0, 12.0, 10.0, 6.0, 3.0, 7.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.78369140625, -0.7608795166015625, -0.738067626953125, -0.7152557373046875, -0.69244384765625, -0.6696319580078125, -0.646820068359375, -0.6240081787109375, -0.6011962890625, -0.5783843994140625, -0.555572509765625, -0.5327606201171875, -0.50994873046875, -0.4871368408203125, -0.464324951171875, -0.4415130615234375, -0.418701171875, -0.3958892822265625, -0.373077392578125, -0.3502655029296875, -0.32745361328125, -0.3046417236328125, -0.281829833984375, -0.2590179443359375, -0.2362060546875, -0.2133941650390625, -0.190582275390625, -0.1677703857421875, -0.14495849609375, -0.1221466064453125, -0.099334716796875, -0.0765228271484375, -0.0537109375, -0.0308990478515625, -0.008087158203125, 0.0147247314453125, 0.03753662109375, 0.0603485107421875, 0.083160400390625, 0.1059722900390625, 0.1287841796875, 0.1515960693359375, 0.174407958984375, 0.1972198486328125, 0.22003173828125, 0.2428436279296875, 0.265655517578125, 0.2884674072265625, 0.311279296875, 0.3340911865234375, 0.356903076171875, 0.3797149658203125, 0.40252685546875, 0.4253387451171875, 0.448150634765625, 0.4709625244140625, 0.4937744140625, 0.5165863037109375, 0.539398193359375, 0.5622100830078125, 0.58502197265625, 0.6078338623046875, 0.630645751953125, 0.6534576416015625, 0.67626953125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 7.0, 5.0, 9.0, 17.0, 15.0, 21.0, 33.0, 40.0, 75.0, 78.0, 89.0, 110.0, 111.0, 99.0, 76.0, 73.0, 43.0, 25.0, 28.0, 16.0, 15.0, 11.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.463042259216309, -4.342831134796143, -4.222620010375977, -4.1024088859558105, -3.9821975231170654, -3.8619863986968994, -3.7417752742767334, -3.6215641498565674, -3.5013530254364014, -3.3811419010162354, -3.2609307765960693, -3.140719413757324, -3.020508289337158, -2.900297164916992, -2.780086040496826, -2.65987491607666, -2.539663791656494, -2.419452667236328, -2.299241542816162, -2.179030418395996, -2.058819055557251, -1.938607931137085, -1.818396806716919, -1.698185682296753, -1.5779743194580078, -1.4577631950378418, -1.3375519514083862, -1.2173408269882202, -1.0971297025680542, -0.9769185185432434, -0.8567073345184326, -0.7364962100982666, -0.6162850856781006, -0.4960739314556122, -0.3758627772331238, -0.255651593208313, -0.13544043898582458, -0.015229284763336182, 0.10498189926147461, 0.22519302368164062, 0.3454042077064514, 0.4656153619289398, 0.5858265161514282, 0.706037700176239, 0.8262488842010498, 0.9464600086212158, 1.0666711330413818, 1.1868822574615479, 1.3070935010910034, 1.4273046255111694, 1.547515869140625, 1.667726993560791, 1.787938117980957, 1.908149242401123, 2.028360366821289, 2.148571491241455, 2.2687828540802, 2.388993978500366, 2.5092051029205322, 2.6294164657592773, 2.7496275901794434, 2.8698387145996094, 2.9900498390197754, 3.1102609634399414, 3.2304720878601074]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 10.0, 12.0, 12.0, 10.0, 12.0, 26.0, 20.0, 23.0, 19.0, 26.0, 45.0, 40.0, 51.0, 48.0, 66.0, 49.0, 54.0, 54.0, 47.0, 42.0, 52.0, 31.0, 45.0, 39.0, 38.0, 34.0, 25.0, 11.0, 18.0, 10.0, 9.0, 9.0, 3.0, 4.0, 6.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.323835849761963, -2.2528347969055176, -2.1818339824676514, -2.110832929611206, -2.03983211517334, -1.9688310623168945, -1.8978301286697388, -1.826829195022583, -1.7558281421661377, -1.684827208518982, -1.6138262748718262, -1.5428252220153809, -1.471824288368225, -1.4008233547210693, -1.3298224210739136, -1.2588214874267578, -1.187820553779602, -1.1168196201324463, -1.0458186864852905, -0.97481769323349, -0.9038166999816895, -0.8328157663345337, -0.7618148326873779, -0.6908138990402222, -0.6198129057884216, -0.5488119721412659, -0.47781097888946533, -0.40681004524230957, -0.3358090817928314, -0.26480811834335327, -0.1938071846961975, -0.12280622124671936, -0.05180525779724121, 0.01919569820165634, 0.0901966542005539, 0.16119760274887085, 0.232198566198349, 0.30319952964782715, 0.3742004632949829, 0.44520142674446106, 0.5162023901939392, 0.587203323841095, 0.6582043170928955, 0.7292052507400513, 0.800206184387207, 0.8712071776390076, 0.9422081112861633, 1.0132091045379639, 1.0842100381851196, 1.1552109718322754, 1.2262119054794312, 1.297212839126587, 1.3682138919830322, 1.439214825630188, 1.5102157592773438, 1.5812166929244995, 1.6522176265716553, 1.723218560218811, 1.7942194938659668, 1.865220546722412, 1.9362214803695679, 2.0072224140167236, 2.07822322845459, 2.149224281311035, 2.2202253341674805]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 11.0, 10.0, 7.0, 12.0, 41.0, 57.0, 170.0, 476.0, 1944.0, 11731.0, 113449.0, 727284.0, 173712.0, 16112.0, 2629.0, 576.0, 176.0, 68.0, 30.0, 24.0, 11.0, 12.0, 8.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.083984375, -2.02001953125, -1.9560546875, -1.89208984375, -1.828125, -1.76416015625, -1.7001953125, -1.63623046875, -1.572265625, -1.50830078125, -1.4443359375, -1.38037109375, -1.31640625, -1.25244140625, -1.1884765625, -1.12451171875, -1.060546875, -0.99658203125, -0.9326171875, -0.86865234375, -0.8046875, -0.74072265625, -0.6767578125, -0.61279296875, -0.548828125, -0.48486328125, -0.4208984375, -0.35693359375, -0.29296875, -0.22900390625, -0.1650390625, -0.10107421875, -0.037109375, 0.02685546875, 0.0908203125, 0.15478515625, 0.21875, 0.28271484375, 0.3466796875, 0.41064453125, 0.474609375, 0.53857421875, 0.6025390625, 0.66650390625, 0.73046875, 0.79443359375, 0.8583984375, 0.92236328125, 0.986328125, 1.05029296875, 1.1142578125, 1.17822265625, 1.2421875, 1.30615234375, 1.3701171875, 1.43408203125, 1.498046875, 1.56201171875, 1.6259765625, 1.68994140625, 1.75390625, 1.81787109375, 1.8818359375, 1.94580078125, 2.009765625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 6.0, 1.0, 5.0, 26.0, 15.0, 37.0, 43.0, 76.0, 100.0, 101.0, 124.0, 114.0, 100.0, 91.0, 65.0, 42.0, 26.0, 21.0, 13.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.515625, -4.4208984375, -4.326171875, -4.2314453125, -4.13671875, -4.0419921875, -3.947265625, -3.8525390625, -3.7578125, -3.6630859375, -3.568359375, -3.4736328125, -3.37890625, -3.2841796875, -3.189453125, -3.0947265625, -3.0, -2.9052734375, -2.810546875, -2.7158203125, -2.62109375, -2.5263671875, -2.431640625, -2.3369140625, -2.2421875, -2.1474609375, -2.052734375, -1.9580078125, -1.86328125, -1.7685546875, -1.673828125, -1.5791015625, -1.484375, -1.3896484375, -1.294921875, -1.2001953125, -1.10546875, -1.0107421875, -0.916015625, -0.8212890625, -0.7265625, -0.6318359375, -0.537109375, -0.4423828125, -0.34765625, -0.2529296875, -0.158203125, -0.0634765625, 0.03125, 0.1259765625, 0.220703125, 0.3154296875, 0.41015625, 0.5048828125, 0.599609375, 0.6943359375, 0.7890625, 0.8837890625, 0.978515625, 1.0732421875, 1.16796875, 1.2626953125, 1.357421875, 1.4521484375, 1.546875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 8.0, 6.0, 7.0, 10.0, 21.0, 24.0, 33.0, 45.0, 62.0, 79.0, 162.0, 207.0, 423.0, 760.0, 1915.0, 4982.0, 16812.0, 80455.0, 471531.0, 387246.0, 62336.0, 13806.0, 4245.0, 1587.0, 762.0, 393.0, 216.0, 113.0, 86.0, 62.0, 47.0, 35.0, 23.0, 11.0, 11.0, 11.0, 5.0, 5.0, 6.0, 4.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.0419921875, -1.0093536376953125, -0.976715087890625, -0.9440765380859375, -0.91143798828125, -0.8787994384765625, -0.846160888671875, -0.8135223388671875, -0.7808837890625, -0.7482452392578125, -0.715606689453125, -0.6829681396484375, -0.65032958984375, -0.6176910400390625, -0.585052490234375, -0.5524139404296875, -0.519775390625, -0.4871368408203125, -0.454498291015625, -0.4218597412109375, -0.38922119140625, -0.3565826416015625, -0.323944091796875, -0.2913055419921875, -0.2586669921875, -0.2260284423828125, -0.193389892578125, -0.1607513427734375, -0.12811279296875, -0.0954742431640625, -0.062835693359375, -0.0301971435546875, 0.00244140625, 0.0350799560546875, 0.067718505859375, 0.1003570556640625, 0.13299560546875, 0.1656341552734375, 0.198272705078125, 0.2309112548828125, 0.2635498046875, 0.2961883544921875, 0.328826904296875, 0.3614654541015625, 0.39410400390625, 0.4267425537109375, 0.459381103515625, 0.4920196533203125, 0.524658203125, 0.5572967529296875, 0.589935302734375, 0.6225738525390625, 0.65521240234375, 0.6878509521484375, 0.720489501953125, 0.7531280517578125, 0.7857666015625, 0.8184051513671875, 0.851043701171875, 0.8836822509765625, 0.91632080078125, 0.9489593505859375, 0.981597900390625, 1.0142364501953125, 1.046875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 5.0, 3.0, 3.0, 5.0, 5.0, 9.0, 15.0, 9.0, 14.0, 24.0, 24.0, 16.0, 23.0, 24.0, 35.0, 29.0, 32.0, 45.0, 39.0, 40.0, 37.0, 44.0, 49.0, 47.0, 56.0, 35.0, 49.0, 32.0, 32.0, 38.0, 33.0, 30.0, 19.0, 16.0, 22.0, 12.0, 15.0, 10.0, 11.0, 8.0, 6.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.158203125, -2.08453369140625, -2.0108642578125, -1.93719482421875, -1.863525390625, -1.78985595703125, -1.7161865234375, -1.64251708984375, -1.56884765625, -1.49517822265625, -1.4215087890625, -1.34783935546875, -1.274169921875, -1.20050048828125, -1.1268310546875, -1.05316162109375, -0.9794921875, -0.90582275390625, -0.8321533203125, -0.75848388671875, -0.684814453125, -0.61114501953125, -0.5374755859375, -0.46380615234375, -0.39013671875, -0.31646728515625, -0.2427978515625, -0.16912841796875, -0.095458984375, -0.02178955078125, 0.0518798828125, 0.12554931640625, 0.19921875, 0.27288818359375, 0.3465576171875, 0.42022705078125, 0.493896484375, 0.56756591796875, 0.6412353515625, 0.71490478515625, 0.78857421875, 0.86224365234375, 0.9359130859375, 1.00958251953125, 1.083251953125, 1.15692138671875, 1.2305908203125, 1.30426025390625, 1.3779296875, 1.45159912109375, 1.5252685546875, 1.59893798828125, 1.672607421875, 1.74627685546875, 1.8199462890625, 1.89361572265625, 1.96728515625, 2.04095458984375, 2.1146240234375, 2.18829345703125, 2.261962890625, 2.33563232421875, 2.4093017578125, 2.48297119140625, 2.556640625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 8.0, 8.0, 21.0, 15.0, 46.0, 78.0, 143.0, 315.0, 757.0, 1958.0, 6803.0, 31957.0, 308264.0, 615996.0, 66342.0, 11037.0, 3031.0, 1032.0, 389.0, 187.0, 76.0, 47.0, 23.0, 12.0, 8.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.642578125, -0.6243133544921875, -0.606048583984375, -0.5877838134765625, -0.56951904296875, -0.5512542724609375, -0.532989501953125, -0.5147247314453125, -0.4964599609375, -0.4781951904296875, -0.459930419921875, -0.4416656494140625, -0.42340087890625, -0.4051361083984375, -0.386871337890625, -0.3686065673828125, -0.350341796875, -0.3320770263671875, -0.313812255859375, -0.2955474853515625, -0.27728271484375, -0.2590179443359375, -0.240753173828125, -0.2224884033203125, -0.2042236328125, -0.1859588623046875, -0.167694091796875, -0.1494293212890625, -0.13116455078125, -0.1128997802734375, -0.094635009765625, -0.0763702392578125, -0.05810546875, -0.0398406982421875, -0.021575927734375, -0.0033111572265625, 0.01495361328125, 0.0332183837890625, 0.051483154296875, 0.0697479248046875, 0.0880126953125, 0.1062774658203125, 0.124542236328125, 0.1428070068359375, 0.16107177734375, 0.1793365478515625, 0.197601318359375, 0.2158660888671875, 0.234130859375, 0.2523956298828125, 0.270660400390625, 0.2889251708984375, 0.30718994140625, 0.3254547119140625, 0.343719482421875, 0.3619842529296875, 0.3802490234375, 0.3985137939453125, 0.416778564453125, 0.4350433349609375, 0.45330810546875, 0.4715728759765625, 0.489837646484375, 0.5081024169921875, 0.5263671875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 6.0, 10.0, 10.0, 27.0, 23.0, 64.0, 109.0, 108.0, 160.0, 163.0, 125.0, 74.0, 48.0, 31.0, 17.0, 7.0, 5.0, 4.0, 6.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004119873046875, -0.0004004649817943573, -0.0003889426589012146, -0.0003774203360080719, -0.0003658980131149292, -0.0003543756902217865, -0.0003428533673286438, -0.0003313310444355011, -0.0003198087215423584, -0.0003082863986492157, -0.000296764075756073, -0.0002852417528629303, -0.0002737194299697876, -0.0002621971070766449, -0.0002506747841835022, -0.0002391524612903595, -0.0002276301383972168, -0.0002161078155040741, -0.0002045854926109314, -0.0001930631697177887, -0.000181540846824646, -0.0001700185239315033, -0.0001584962010383606, -0.0001469738781452179, -0.0001354515552520752, -0.0001239292323589325, -0.0001124069094657898, -0.0001008845865726471, -8.93622636795044e-05, -7.78399407863617e-05, -6.6317617893219e-05, -5.4795295000076294e-05, -4.3272972106933594e-05, -3.1750649213790894e-05, -2.0228326320648193e-05, -8.706003427505493e-06, 2.816319465637207e-06, 1.4338642358779907e-05, 2.5860965251922607e-05, 3.738328814506531e-05, 4.890561103820801e-05, 6.042793393135071e-05, 7.195025682449341e-05, 8.347257971763611e-05, 9.499490261077881e-05, 0.00010651722550392151, 0.00011803954839706421, 0.0001295618712902069, 0.0001410841941833496, 0.0001526065170764923, 0.000164128839969635, 0.0001756511628627777, 0.0001871734857559204, 0.0001986958086490631, 0.0002102181315422058, 0.0002217404544353485, 0.0002332627773284912, 0.0002447851002216339, 0.0002563074231147766, 0.0002678297460079193, 0.000279352068901062, 0.0002908743917942047, 0.0003023967146873474, 0.0003139190375804901, 0.0003254413604736328]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 5.0, 10.0, 6.0, 6.0, 8.0, 17.0, 16.0, 36.0, 44.0, 67.0, 140.0, 211.0, 339.0, 610.0, 1128.0, 2373.0, 5271.0, 13815.0, 43945.0, 183962.0, 502367.0, 216816.0, 50600.0, 15579.0, 5857.0, 2502.0, 1252.0, 636.0, 330.0, 215.0, 131.0, 90.0, 50.0, 34.0, 25.0, 15.0, 15.0, 10.0, 6.0, 8.0, 3.0, 5.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.379638671875, -0.3679771423339844, -0.35631561279296875, -0.3446540832519531, -0.3329925537109375, -0.3213310241699219, -0.30966949462890625, -0.2980079650878906, -0.286346435546875, -0.2746849060058594, -0.26302337646484375, -0.2513618469238281, -0.2397003173828125, -0.22803878784179688, -0.21637725830078125, -0.20471572875976562, -0.19305419921875, -0.18139266967773438, -0.16973114013671875, -0.15806961059570312, -0.1464080810546875, -0.13474655151367188, -0.12308502197265625, -0.11142349243164062, -0.099761962890625, -0.08810043334960938, -0.07643890380859375, -0.06477737426757812, -0.0531158447265625, -0.041454315185546875, -0.02979278564453125, -0.018131256103515625, -0.0064697265625, 0.005191802978515625, 0.01685333251953125, 0.028514862060546875, 0.0401763916015625, 0.051837921142578125, 0.06349945068359375, 0.07516098022460938, 0.086822509765625, 0.09848403930664062, 0.11014556884765625, 0.12180709838867188, 0.1334686279296875, 0.14513015747070312, 0.15679168701171875, 0.16845321655273438, 0.18011474609375, 0.19177627563476562, 0.20343780517578125, 0.21509933471679688, 0.2267608642578125, 0.23842239379882812, 0.25008392333984375, 0.2617454528808594, 0.273406982421875, 0.2850685119628906, 0.29673004150390625, 0.3083915710449219, 0.3200531005859375, 0.3317146301269531, 0.34337615966796875, 0.3550376892089844, 0.36669921875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 0.0, 2.0, 2.0, 10.0, 6.0, 10.0, 15.0, 17.0, 19.0, 27.0, 25.0, 39.0, 68.0, 72.0, 77.0, 96.0, 88.0, 92.0, 72.0, 61.0, 49.0, 40.0, 34.0, 21.0, 14.0, 14.0, 9.0, 12.0, 6.0, 3.0, 7.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08636474609375, -0.08329296112060547, -0.08022117614746094, -0.0771493911743164, -0.07407760620117188, -0.07100582122802734, -0.06793403625488281, -0.06486225128173828, -0.06179046630859375, -0.05871868133544922, -0.05564689636230469, -0.052575111389160156, -0.049503326416015625, -0.046431541442871094, -0.04335975646972656, -0.04028797149658203, -0.0372161865234375, -0.03414440155029297, -0.031072616577148438, -0.028000831604003906, -0.024929046630859375, -0.021857261657714844, -0.018785476684570312, -0.01571369171142578, -0.01264190673828125, -0.009570121765136719, -0.0064983367919921875, -0.0034265518188476562, -0.000354766845703125, 0.0027170181274414062, 0.0057888031005859375, 0.008860588073730469, 0.011932373046875, 0.015004158020019531, 0.018075942993164062, 0.021147727966308594, 0.024219512939453125, 0.027291297912597656, 0.030363082885742188, 0.03343486785888672, 0.03650665283203125, 0.03957843780517578, 0.04265022277832031, 0.045722007751464844, 0.048793792724609375, 0.051865577697753906, 0.05493736267089844, 0.05800914764404297, 0.0610809326171875, 0.06415271759033203, 0.06722450256347656, 0.0702962875366211, 0.07336807250976562, 0.07643985748291016, 0.07951164245605469, 0.08258342742919922, 0.08565521240234375, 0.08872699737548828, 0.09179878234863281, 0.09487056732177734, 0.09794235229492188, 0.1010141372680664, 0.10408592224121094, 0.10715770721435547, 0.1102294921875]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 8.0, 5.0, 9.0, 20.0, 33.0, 36.0, 79.0, 128.0, 165.0, 178.0, 135.0, 84.0, 52.0, 25.0, 17.0, 13.0, 10.0, 5.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.156867027282715, -4.0504069328308105, -3.9439468383789062, -3.837486743927002, -3.7310266494750977, -3.6245665550231934, -3.51810622215271, -3.4116461277008057, -3.3051860332489014, -3.198725938796997, -3.0922658443450928, -2.9858057498931885, -2.879345417022705, -2.772885322570801, -2.6664252281188965, -2.559965133666992, -2.453505039215088, -2.3470449447631836, -2.2405848503112793, -2.134124755859375, -2.0276646614074707, -1.9212044477462769, -1.814744234085083, -1.7082841396331787, -1.6018240451812744, -1.4953639507293701, -1.3889038562774658, -1.282443642616272, -1.1759835481643677, -1.0695234537124634, -0.9630632996559143, -0.8566031455993652, -0.75014328956604, -0.6436831951141357, -0.5372230410575867, -0.43076291680336, -0.3243027925491333, -0.217842698097229, -0.11138254404067993, -0.004922389984130859, 0.10153770446777344, 0.20799782872200012, 0.3144579529762268, 0.4209180772304535, 0.5273782014846802, 0.6338382959365845, 0.7402984499931335, 0.8467586040496826, 0.9532186985015869, 1.0596787929534912, 1.1661388874053955, 1.2725991010665894, 1.3790591955184937, 1.485519289970398, 1.5919795036315918, 1.698439598083496, 1.8048996925354004, 1.9113597869873047, 2.017819881439209, 2.1242799758911133, 2.2307400703430176, 2.337200164794922, 2.4436604976654053, 2.5501205921173096, 2.656580686569214]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 6.0, 16.0, 25.0, 27.0, 36.0, 42.0, 73.0, 87.0, 108.0, 118.0, 97.0, 96.0, 76.0, 75.0, 44.0, 30.0, 23.0, 12.0, 8.0, 8.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.5842669010162354, -3.5020751953125, -3.4198837280273438, -3.3376920223236084, -3.255500555038452, -3.173308849334717, -3.0911173820495605, -3.008925676345825, -2.926734209060669, -2.8445425033569336, -2.7623510360717773, -2.680159330368042, -2.5979678630828857, -2.5157761573791504, -2.433584690093994, -2.351392984390259, -2.2692012786865234, -2.187009572982788, -2.104818105697632, -2.0226263999938965, -1.9404349327087402, -1.8582433462142944, -1.7760517597198486, -1.6938600540161133, -1.611668586730957, -1.5294770002365112, -1.4472854137420654, -1.3650938272476196, -1.2829022407531738, -1.200710654258728, -1.1185190677642822, -1.0363273620605469, -0.9541360139846802, -0.8719444274902344, -0.7897528409957886, -0.7075612545013428, -0.625369668006897, -0.5431780815124512, -0.4609864354133606, -0.3787948489189148, -0.296603262424469, -0.2144116759300232, -0.1322200745344162, -0.050028473138809204, 0.0321631133556366, 0.1143546998500824, 0.19654631614685059, 0.2787379026412964, 0.3609294891357422, 0.443121075630188, 0.5253126621246338, 0.6075042486190796, 0.6896958351135254, 0.7718874216079712, 0.8540790677070618, 0.9362706542015076, 1.0184621810913086, 1.1006537675857544, 1.1828453540802002, 1.265036940574646, 1.3472285270690918, 1.4294201135635376, 1.5116117000579834, 1.5938034057617188, 1.6759949922561646]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 5.0, 2.0, 3.0, 3.0, 4.0, 9.0, 18.0, 23.0, 33.0, 46.0, 70.0, 198.0, 523.0, 1611.0, 5869.0, 27454.0, 168200.0, 656680.0, 154157.0, 25645.0, 5578.0, 1472.0, 519.0, 187.0, 99.0, 53.0, 36.0, 17.0, 18.0, 10.0, 5.0, 8.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5927734375, -1.5302581787109375, -1.467742919921875, -1.4052276611328125, -1.34271240234375, -1.2801971435546875, -1.217681884765625, -1.1551666259765625, -1.0926513671875, -1.0301361083984375, -0.967620849609375, -0.9051055908203125, -0.84259033203125, -0.7800750732421875, -0.717559814453125, -0.6550445556640625, -0.592529296875, -0.5300140380859375, -0.467498779296875, -0.4049835205078125, -0.34246826171875, -0.2799530029296875, -0.217437744140625, -0.1549224853515625, -0.0924072265625, -0.0298919677734375, 0.032623291015625, 0.0951385498046875, 0.15765380859375, 0.2201690673828125, 0.282684326171875, 0.3451995849609375, 0.40771484375, 0.4702301025390625, 0.532745361328125, 0.5952606201171875, 0.65777587890625, 0.7202911376953125, 0.782806396484375, 0.8453216552734375, 0.9078369140625, 0.9703521728515625, 1.032867431640625, 1.0953826904296875, 1.15789794921875, 1.2204132080078125, 1.282928466796875, 1.3454437255859375, 1.407958984375, 1.4704742431640625, 1.532989501953125, 1.5955047607421875, 1.65802001953125, 1.7205352783203125, 1.783050537109375, 1.8455657958984375, 1.9080810546875, 1.9705963134765625, 2.033111572265625, 2.0956268310546875, 2.15814208984375, 2.2206573486328125, 2.283172607421875, 2.3456878662109375, 2.408203125]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 5.0, 6.0, 12.0, 10.0, 25.0, 28.0, 39.0, 49.0, 72.0, 92.0, 108.0, 90.0, 107.0, 86.0, 83.0, 62.0, 47.0, 34.0, 21.0, 20.0, 6.0, 7.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.953125, -7.75701904296875, -7.5609130859375, -7.36480712890625, -7.168701171875, -6.97259521484375, -6.7764892578125, -6.58038330078125, -6.38427734375, -6.18817138671875, -5.9920654296875, -5.79595947265625, -5.599853515625, -5.40374755859375, -5.2076416015625, -5.01153564453125, -4.8154296875, -4.61932373046875, -4.4232177734375, -4.22711181640625, -4.031005859375, -3.83489990234375, -3.6387939453125, -3.44268798828125, -3.24658203125, -3.05047607421875, -2.8543701171875, -2.65826416015625, -2.462158203125, -2.26605224609375, -2.0699462890625, -1.87384033203125, -1.677734375, -1.48162841796875, -1.2855224609375, -1.08941650390625, -0.893310546875, -0.69720458984375, -0.5010986328125, -0.30499267578125, -0.10888671875, 0.08721923828125, 0.2833251953125, 0.47943115234375, 0.675537109375, 0.87164306640625, 1.0677490234375, 1.26385498046875, 1.4599609375, 1.65606689453125, 1.8521728515625, 2.04827880859375, 2.244384765625, 2.44049072265625, 2.6365966796875, 2.83270263671875, 3.02880859375, 3.22491455078125, 3.4210205078125, 3.61712646484375, 3.813232421875, 4.00933837890625, 4.2054443359375, 4.40155029296875, 4.59765625]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 7.0, 3.0, 8.0, 8.0, 13.0, 11.0, 11.0, 15.0, 21.0, 24.0, 32.0, 31.0, 40.0, 52.0, 39.0, 37.0, 49.0, 116.0, 4480.0, 1041986.0, 1113.0, 96.0, 35.0, 36.0, 49.0, 42.0, 28.0, 32.0, 28.0, 18.0, 17.0, 17.0, 8.0, 15.0, 9.0, 10.0, 6.0, 4.0, 3.0, 2.0, 2.0, 3.0, 1.0, 4.0, 2.0], "bins": [-15.140625, -14.7462158203125, -14.351806640625, -13.9573974609375, -13.56298828125, -13.1685791015625, -12.774169921875, -12.3797607421875, -11.9853515625, -11.5909423828125, -11.196533203125, -10.8021240234375, -10.40771484375, -10.0133056640625, -9.618896484375, -9.2244873046875, -8.830078125, -8.4356689453125, -8.041259765625, -7.6468505859375, -7.25244140625, -6.8580322265625, -6.463623046875, -6.0692138671875, -5.6748046875, -5.2803955078125, -4.885986328125, -4.4915771484375, -4.09716796875, -3.7027587890625, -3.308349609375, -2.9139404296875, -2.51953125, -2.1251220703125, -1.730712890625, -1.3363037109375, -0.94189453125, -0.5474853515625, -0.153076171875, 0.2413330078125, 0.6357421875, 1.0301513671875, 1.424560546875, 1.8189697265625, 2.21337890625, 2.6077880859375, 3.002197265625, 3.3966064453125, 3.791015625, 4.1854248046875, 4.579833984375, 4.9742431640625, 5.36865234375, 5.7630615234375, 6.157470703125, 6.5518798828125, 6.9462890625, 7.3406982421875, 7.735107421875, 8.1295166015625, 8.52392578125, 8.9183349609375, 9.312744140625, 9.7071533203125, 10.1015625]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 3.0, 6.0, 11.0, 11.0, 10.0, 9.0, 18.0, 14.0, 33.0, 19.0, 36.0, 33.0, 40.0, 42.0, 39.0, 40.0, 32.0, 51.0, 53.0, 45.0, 50.0, 45.0, 48.0, 36.0, 41.0, 26.0, 30.0, 36.0, 26.0, 21.0, 15.0, 16.0, 11.0, 19.0, 7.0, 6.0, 10.0, 2.0, 1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 1.0], "bins": [-4.3828125, -4.26727294921875, -4.1517333984375, -4.03619384765625, -3.920654296875, -3.80511474609375, -3.6895751953125, -3.57403564453125, -3.45849609375, -3.34295654296875, -3.2274169921875, -3.11187744140625, -2.996337890625, -2.88079833984375, -2.7652587890625, -2.64971923828125, -2.5341796875, -2.41864013671875, -2.3031005859375, -2.18756103515625, -2.072021484375, -1.95648193359375, -1.8409423828125, -1.72540283203125, -1.60986328125, -1.49432373046875, -1.3787841796875, -1.26324462890625, -1.147705078125, -1.03216552734375, -0.9166259765625, -0.80108642578125, -0.685546875, -0.57000732421875, -0.4544677734375, -0.33892822265625, -0.223388671875, -0.10784912109375, 0.0076904296875, 0.12322998046875, 0.23876953125, 0.35430908203125, 0.4698486328125, 0.58538818359375, 0.700927734375, 0.81646728515625, 0.9320068359375, 1.04754638671875, 1.1630859375, 1.27862548828125, 1.3941650390625, 1.50970458984375, 1.625244140625, 1.74078369140625, 1.8563232421875, 1.97186279296875, 2.08740234375, 2.20294189453125, 2.3184814453125, 2.43402099609375, 2.549560546875, 2.66510009765625, 2.7806396484375, 2.89617919921875, 3.01171875]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 6.0, 1.0, 7.0, 12.0, 15.0, 9.0, 20.0, 29.0, 47.0, 65.0, 100.0, 161.0, 276.0, 514.0, 1002.0, 2388.0, 5999.0, 20817.0, 109187.0, 615614.0, 239199.0, 37825.0, 9260.0, 3185.0, 1269.0, 605.0, 328.0, 206.0, 104.0, 74.0, 50.0, 39.0, 28.0, 24.0, 19.0, 19.0, 7.0, 11.0, 8.0, 4.0, 3.0, 0.0, 7.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.53515625, -0.5182723999023438, -0.5013885498046875, -0.48450469970703125, -0.467620849609375, -0.45073699951171875, -0.4338531494140625, -0.41696929931640625, -0.40008544921875, -0.38320159912109375, -0.3663177490234375, -0.34943389892578125, -0.332550048828125, -0.31566619873046875, -0.2987823486328125, -0.28189849853515625, -0.2650146484375, -0.24813079833984375, -0.2312469482421875, -0.21436309814453125, -0.197479248046875, -0.18059539794921875, -0.1637115478515625, -0.14682769775390625, -0.12994384765625, -0.11305999755859375, -0.0961761474609375, -0.07929229736328125, -0.062408447265625, -0.04552459716796875, -0.0286407470703125, -0.01175689697265625, 0.005126953125, 0.02201080322265625, 0.0388946533203125, 0.05577850341796875, 0.072662353515625, 0.08954620361328125, 0.1064300537109375, 0.12331390380859375, 0.14019775390625, 0.15708160400390625, 0.1739654541015625, 0.19084930419921875, 0.207733154296875, 0.22461700439453125, 0.2415008544921875, 0.25838470458984375, 0.2752685546875, 0.29215240478515625, 0.3090362548828125, 0.32592010498046875, 0.342803955078125, 0.35968780517578125, 0.3765716552734375, 0.39345550537109375, 0.41033935546875, 0.42722320556640625, 0.4441070556640625, 0.46099090576171875, 0.477874755859375, 0.49475860595703125, 0.5116424560546875, 0.5285263061523438, 0.54541015625]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 9.0, 6.0, 3.0, 6.0, 20.0, 22.0, 38.0, 82.0, 90.0, 134.0, 152.0, 148.0, 100.0, 66.0, 45.0, 25.0, 14.0, 19.0, 11.0, 4.0, 5.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013756752014160156, -0.00013367179781198502, -0.00012977607548236847, -0.00012588035315275192, -0.00012198463082313538, -0.00011808890849351883, -0.00011419318616390228, -0.00011029746383428574, -0.00010640174150466919, -0.00010250601917505264, -9.86102968454361e-05, -9.471457451581955e-05, -9.0818852186203e-05, -8.692312985658646e-05, -8.302740752696991e-05, -7.913168519735336e-05, -7.523596286773682e-05, -7.134024053812027e-05, -6.744451820850372e-05, -6.354879587888718e-05, -5.965307354927063e-05, -5.575735121965408e-05, -5.186162889003754e-05, -4.796590656042099e-05, -4.407018423080444e-05, -4.01744619011879e-05, -3.627873957157135e-05, -3.2383017241954803e-05, -2.8487294912338257e-05, -2.459157258272171e-05, -2.0695850253105164e-05, -1.6800127923488617e-05, -1.290440559387207e-05, -9.008683264255524e-06, -5.112960934638977e-06, -1.2172386050224304e-06, 2.678483724594116e-06, 6.574206054210663e-06, 1.046992838382721e-05, 1.4365650713443756e-05, 1.8261373043060303e-05, 2.215709537267685e-05, 2.6052817702293396e-05, 2.9948540031909943e-05, 3.384426236152649e-05, 3.7739984691143036e-05, 4.163570702075958e-05, 4.553142935037613e-05, 4.9427151679992676e-05, 5.332287400960922e-05, 5.721859633922577e-05, 6.111431866884232e-05, 6.501004099845886e-05, 6.890576332807541e-05, 7.280148565769196e-05, 7.66972079873085e-05, 8.059293031692505e-05, 8.44886526465416e-05, 8.838437497615814e-05, 9.228009730577469e-05, 9.617581963539124e-05, 0.00010007154196500778, 0.00010396726429462433, 0.00010786298662424088, 0.00011175870895385742]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 2.0, 5.0, 4.0, 13.0, 19.0, 27.0, 32.0, 46.0, 78.0, 135.0, 253.0, 422.0, 804.0, 1710.0, 3955.0, 11558.0, 40230.0, 183802.0, 569785.0, 177786.0, 39194.0, 11206.0, 3978.0, 1668.0, 756.0, 422.0, 244.0, 151.0, 96.0, 57.0, 30.0, 27.0, 24.0, 12.0, 7.0, 3.0, 4.0, 3.0, 5.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3974609375, -0.3844261169433594, -0.37139129638671875, -0.3583564758300781, -0.3453216552734375, -0.3322868347167969, -0.31925201416015625, -0.3062171936035156, -0.293182373046875, -0.2801475524902344, -0.26711273193359375, -0.2540779113769531, -0.2410430908203125, -0.22800827026367188, -0.21497344970703125, -0.20193862915039062, -0.18890380859375, -0.17586898803710938, -0.16283416748046875, -0.14979934692382812, -0.1367645263671875, -0.12372970581054688, -0.11069488525390625, -0.09766006469726562, -0.084625244140625, -0.07159042358398438, -0.05855560302734375, -0.045520782470703125, -0.0324859619140625, -0.019451141357421875, -0.00641632080078125, 0.006618499755859375, 0.0196533203125, 0.032688140869140625, 0.04572296142578125, 0.058757781982421875, 0.0717926025390625, 0.08482742309570312, 0.09786224365234375, 0.11089706420898438, 0.123931884765625, 0.13696670532226562, 0.15000152587890625, 0.16303634643554688, 0.1760711669921875, 0.18910598754882812, 0.20214080810546875, 0.21517562866210938, 0.22821044921875, 0.24124526977539062, 0.25428009033203125, 0.2673149108886719, 0.2803497314453125, 0.2933845520019531, 0.30641937255859375, 0.3194541931152344, 0.332489013671875, 0.3455238342285156, 0.35855865478515625, 0.3715934753417969, 0.3846282958984375, 0.3976631164550781, 0.41069793701171875, 0.4237327575683594, 0.436767578125]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 5.0, 3.0, 4.0, 9.0, 10.0, 16.0, 22.0, 24.0, 30.0, 43.0, 46.0, 79.0, 71.0, 93.0, 105.0, 90.0, 74.0, 60.0, 54.0, 43.0, 31.0, 25.0, 15.0, 10.0, 11.0, 9.0, 4.0, 7.0, 7.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1700439453125, -0.1636524200439453, -0.15726089477539062, -0.15086936950683594, -0.14447784423828125, -0.13808631896972656, -0.13169479370117188, -0.1253032684326172, -0.1189117431640625, -0.11252021789550781, -0.10612869262695312, -0.09973716735839844, -0.09334564208984375, -0.08695411682128906, -0.08056259155273438, -0.07417106628417969, -0.067779541015625, -0.06138801574707031, -0.054996490478515625, -0.04860496520996094, -0.04221343994140625, -0.03582191467285156, -0.029430389404296875, -0.023038864135742188, -0.0166473388671875, -0.010255813598632812, -0.003864288330078125, 0.0025272369384765625, 0.00891876220703125, 0.015310287475585938, 0.021701812744140625, 0.028093338012695312, 0.03448486328125, 0.04087638854980469, 0.047267913818359375, 0.05365943908691406, 0.06005096435546875, 0.06644248962402344, 0.07283401489257812, 0.07922554016113281, 0.0856170654296875, 0.09200859069824219, 0.09840011596679688, 0.10479164123535156, 0.11118316650390625, 0.11757469177246094, 0.12396621704101562, 0.1303577423095703, 0.136749267578125, 0.1431407928466797, 0.14953231811523438, 0.15592384338378906, 0.16231536865234375, 0.16870689392089844, 0.17509841918945312, 0.1814899444580078, 0.1878814697265625, 0.1942729949951172, 0.20066452026367188, 0.20705604553222656, 0.21344757080078125, 0.21983909606933594, 0.22623062133789062, 0.2326221466064453, 0.239013671875]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 19.0, 26.0, 58.0, 107.0, 195.0, 257.0, 155.0, 98.0, 42.0, 26.0, 9.0, 6.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.347673416137695, -14.044269561767578, -13.740865707397461, -13.437461853027344, -13.134057998657227, -12.83065414428711, -12.527250289916992, -12.223846435546875, -11.920442581176758, -11.61703872680664, -11.313634872436523, -11.010231018066406, -10.706827163696289, -10.403423309326172, -10.100019454956055, -9.796615600585938, -9.49321174621582, -9.189807891845703, -8.886404037475586, -8.583000183105469, -8.279596328735352, -7.976192474365234, -7.672788619995117, -7.369384765625, -7.065979957580566, -6.762576103210449, -6.459172248840332, -6.155768394470215, -5.852364540100098, -5.5489606857299805, -5.245556831359863, -4.942152976989746, -4.638749599456787, -4.33534574508667, -4.031941890716553, -3.7285380363464355, -3.4251341819763184, -3.121730327606201, -2.818326234817505, -2.5149223804473877, -2.2115185260772705, -1.9081146717071533, -1.6047108173370361, -1.3013068437576294, -0.9979029893875122, -0.694499135017395, -0.3910951614379883, -0.0876913070678711, 0.2157125473022461, 0.5191164016723633, 0.8225203156471252, 1.1259242296218872, 1.4293280839920044, 1.7327319383621216, 2.0361359119415283, 2.3395397663116455, 2.6429436206817627, 2.94634747505188, 3.249751329421997, 3.5531554222106934, 3.8565592765808105, 4.159963130950928, 4.463366985321045, 4.766770839691162, 5.070174694061279]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 6.0, 3.0, 3.0, 9.0, 8.0, 10.0, 15.0, 11.0, 19.0, 19.0, 29.0, 35.0, 38.0, 43.0, 31.0, 38.0, 39.0, 47.0, 56.0, 55.0, 52.0, 50.0, 46.0, 57.0, 37.0, 41.0, 40.0, 24.0, 26.0, 19.0, 15.0, 12.0, 12.0, 14.0, 12.0, 4.0, 10.0, 7.0, 3.0, 3.0, 4.0, 4.0, 2.0, 5.0, 0.0, 1.0], "bins": [-6.61086368560791, -6.436980247497559, -6.263096809387207, -6.0892133712768555, -5.915329933166504, -5.741446018218994, -5.567562580108643, -5.393679141998291, -5.2197957038879395, -5.045912265777588, -4.872028827667236, -4.698145389556885, -4.524261474609375, -4.350378036499023, -4.176494598388672, -4.00261116027832, -3.8287277221679688, -3.654844284057617, -3.4809608459472656, -3.307077169418335, -3.1331937313079834, -2.959310293197632, -2.785426616668701, -2.6115431785583496, -2.437659740447998, -2.2637763023376465, -2.089892864227295, -1.9160091876983643, -1.7421257495880127, -1.5682423114776611, -1.39435875415802, -1.220475196838379, -1.0465917587280273, -0.872708261013031, -0.6988247632980347, -0.5249412655830383, -0.351057767868042, -0.17717427015304565, -0.0032907724380493164, 0.1705927848815918, 0.34447622299194336, 0.5183597207069397, 0.692243218421936, 0.8661267161369324, 1.0400102138519287, 1.2138936519622803, 1.3877772092819214, 1.5616607666015625, 1.735544204711914, 1.9094276428222656, 2.083311080932617, 2.257194757461548, 2.4310781955718994, 2.604961633682251, 2.7788453102111816, 2.952728748321533, 3.1266121864318848, 3.3004956245422363, 3.474379062652588, 3.6482627391815186, 3.82214617729187, 3.9960296154022217, 4.169913291931152, 4.343796730041504, 4.5176801681518555]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 5.0, 5.0, 7.0, 6.0, 15.0, 21.0, 23.0, 25.0, 63.0, 81.0, 122.0, 210.0, 359.0, 679.0, 1412.0, 3378.0, 10035.0, 40214.0, 316434.0, 2942835.0, 774698.0, 78702.0, 16415.0, 4844.0, 1771.0, 838.0, 430.0, 232.0, 140.0, 109.0, 60.0, 52.0, 27.0, 18.0, 14.0, 7.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.388671875, -2.299102783203125, -2.20953369140625, -2.119964599609375, -2.0303955078125, -1.940826416015625, -1.85125732421875, -1.761688232421875, -1.672119140625, -1.582550048828125, -1.49298095703125, -1.403411865234375, -1.3138427734375, -1.224273681640625, -1.13470458984375, -1.045135498046875, -0.95556640625, -0.865997314453125, -0.77642822265625, -0.686859130859375, -0.5972900390625, -0.507720947265625, -0.41815185546875, -0.328582763671875, -0.239013671875, -0.149444580078125, -0.05987548828125, 0.029693603515625, 0.1192626953125, 0.208831787109375, 0.29840087890625, 0.387969970703125, 0.4775390625, 0.567108154296875, 0.65667724609375, 0.746246337890625, 0.8358154296875, 0.925384521484375, 1.01495361328125, 1.104522705078125, 1.194091796875, 1.283660888671875, 1.37322998046875, 1.462799072265625, 1.5523681640625, 1.641937255859375, 1.73150634765625, 1.821075439453125, 1.91064453125, 2.000213623046875, 2.08978271484375, 2.179351806640625, 2.2689208984375, 2.358489990234375, 2.44805908203125, 2.537628173828125, 2.627197265625, 2.716766357421875, 2.80633544921875, 2.895904541015625, 2.9854736328125, 3.075042724609375, 3.16461181640625, 3.254180908203125, 3.34375]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 9.0, 9.0, 5.0, 21.0, 26.0, 30.0, 25.0, 39.0, 68.0, 86.0, 84.0, 87.0, 74.0, 98.0, 78.0, 60.0, 67.0, 40.0, 27.0, 15.0, 19.0, 14.0, 7.0, 9.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.556640625, -2.474456787109375, -2.39227294921875, -2.310089111328125, -2.2279052734375, -2.145721435546875, -2.06353759765625, -1.981353759765625, -1.899169921875, -1.816986083984375, -1.73480224609375, -1.652618408203125, -1.5704345703125, -1.488250732421875, -1.40606689453125, -1.323883056640625, -1.24169921875, -1.159515380859375, -1.07733154296875, -0.995147705078125, -0.9129638671875, -0.830780029296875, -0.74859619140625, -0.666412353515625, -0.584228515625, -0.502044677734375, -0.41986083984375, -0.337677001953125, -0.2554931640625, -0.173309326171875, -0.09112548828125, -0.008941650390625, 0.0732421875, 0.155426025390625, 0.23760986328125, 0.319793701171875, 0.4019775390625, 0.484161376953125, 0.56634521484375, 0.648529052734375, 0.730712890625, 0.812896728515625, 0.89508056640625, 0.977264404296875, 1.0594482421875, 1.141632080078125, 1.22381591796875, 1.305999755859375, 1.38818359375, 1.470367431640625, 1.55255126953125, 1.634735107421875, 1.7169189453125, 1.799102783203125, 1.88128662109375, 1.963470458984375, 2.045654296875, 2.127838134765625, 2.21002197265625, 2.292205810546875, 2.3743896484375, 2.456573486328125, 2.53875732421875, 2.620941162109375, 2.703125]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 5.0, 3.0, 5.0, 7.0, 13.0, 12.0, 16.0, 31.0, 27.0, 57.0, 96.0, 140.0, 280.0, 751.0, 3681.0, 58935.0, 3970915.0, 151626.0, 5866.0, 1000.0, 378.0, 154.0, 104.0, 62.0, 38.0, 29.0, 17.0, 9.0, 5.0, 5.0, 6.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.51171875, -4.32061767578125, -4.1295166015625, -3.93841552734375, -3.747314453125, -3.55621337890625, -3.3651123046875, -3.17401123046875, -2.98291015625, -2.79180908203125, -2.6007080078125, -2.40960693359375, -2.218505859375, -2.02740478515625, -1.8363037109375, -1.64520263671875, -1.4541015625, -1.26300048828125, -1.0718994140625, -0.88079833984375, -0.689697265625, -0.49859619140625, -0.3074951171875, -0.11639404296875, 0.07470703125, 0.26580810546875, 0.4569091796875, 0.64801025390625, 0.839111328125, 1.03021240234375, 1.2213134765625, 1.41241455078125, 1.603515625, 1.79461669921875, 1.9857177734375, 2.17681884765625, 2.367919921875, 2.55902099609375, 2.7501220703125, 2.94122314453125, 3.13232421875, 3.32342529296875, 3.5145263671875, 3.70562744140625, 3.896728515625, 4.08782958984375, 4.2789306640625, 4.47003173828125, 4.6611328125, 4.85223388671875, 5.0433349609375, 5.23443603515625, 5.425537109375, 5.61663818359375, 5.8077392578125, 5.99884033203125, 6.18994140625, 6.38104248046875, 6.5721435546875, 6.76324462890625, 6.954345703125, 7.14544677734375, 7.3365478515625, 7.52764892578125, 7.71875]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 2.0, 8.0, 9.0, 7.0, 16.0, 22.0, 52.0, 53.0, 96.0, 122.0, 200.0, 337.0, 602.0, 797.0, 657.0, 403.0, 231.0, 158.0, 104.0, 65.0, 50.0, 22.0, 18.0, 12.0, 12.0, 3.0, 1.0, 6.0, 7.0, 3.0, 1.0, 2.0, 2.0], "bins": [-1.1611328125, -1.1351089477539062, -1.1090850830078125, -1.0830612182617188, -1.057037353515625, -1.0310134887695312, -1.0049896240234375, -0.9789657592773438, -0.95294189453125, -0.9269180297851562, -0.9008941650390625, -0.8748703002929688, -0.848846435546875, -0.8228225708007812, -0.7967987060546875, -0.7707748413085938, -0.7447509765625, -0.7187271118164062, -0.6927032470703125, -0.6666793823242188, -0.640655517578125, -0.6146316528320312, -0.5886077880859375, -0.5625839233398438, -0.53656005859375, -0.5105361938476562, -0.4845123291015625, -0.45848846435546875, -0.432464599609375, -0.40644073486328125, -0.3804168701171875, -0.35439300537109375, -0.328369140625, -0.30234527587890625, -0.2763214111328125, -0.25029754638671875, -0.224273681640625, -0.19824981689453125, -0.1722259521484375, -0.14620208740234375, -0.12017822265625, -0.09415435791015625, -0.0681304931640625, -0.04210662841796875, -0.016082763671875, 0.00994110107421875, 0.0359649658203125, 0.06198883056640625, 0.0880126953125, 0.11403656005859375, 0.1400604248046875, 0.16608428955078125, 0.192108154296875, 0.21813201904296875, 0.2441558837890625, 0.27017974853515625, 0.29620361328125, 0.32222747802734375, 0.3482513427734375, 0.37427520751953125, 0.400299072265625, 0.42632293701171875, 0.4523468017578125, 0.47837066650390625, 0.50439453125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 6.0, 6.0, 5.0, 12.0, 23.0, 35.0, 60.0, 72.0, 116.0, 140.0, 156.0, 131.0, 69.0, 60.0, 31.0, 24.0, 19.0, 14.0, 4.0, 6.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.216501712799072, -4.09208869934082, -3.9676756858825684, -3.8432626724243164, -3.7188496589660645, -3.5944366455078125, -3.4700236320495605, -3.3456106185913086, -3.2211976051330566, -3.0967845916748047, -2.9723715782165527, -2.847958564758301, -2.723545551300049, -2.599132537841797, -2.474719524383545, -2.350306510925293, -2.225893497467041, -2.101480484008789, -1.977067470550537, -1.8526544570922852, -1.7282414436340332, -1.6038284301757812, -1.4794154167175293, -1.3550024032592773, -1.2305893898010254, -1.1061763763427734, -0.9817633628845215, -0.8573503494262695, -0.7329373359680176, -0.6085243225097656, -0.48411130905151367, -0.3596982955932617, -0.23528552055358887, -0.11087250709533691, 0.013540506362915039, 0.137953519821167, 0.26236653327941895, 0.3867795467376709, 0.5111925601959229, 0.6356055736541748, 0.7600185871124268, 0.8844316005706787, 1.0088446140289307, 1.1332576274871826, 1.2576706409454346, 1.3820836544036865, 1.5064966678619385, 1.6309096813201904, 1.7553226947784424, 1.8797357082366943, 2.0041487216949463, 2.1285617351531982, 2.25297474861145, 2.377387762069702, 2.501800775527954, 2.626213788986206, 2.750626802444458, 2.87503981590271, 2.999452829360962, 3.123865842819214, 3.248278856277466, 3.3726918697357178, 3.4971048831939697, 3.6215178966522217, 3.7459309101104736]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 6.0, 13.0, 13.0, 14.0, 15.0, 23.0, 20.0, 24.0, 38.0, 41.0, 40.0, 65.0, 65.0, 70.0, 74.0, 67.0, 58.0, 43.0, 62.0, 40.0, 43.0, 26.0, 35.0, 20.0, 30.0, 13.0, 11.0, 8.0, 8.0, 7.0, 2.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.40828537940979, -2.340625762939453, -2.272966146469116, -2.2053065299987793, -2.1376471519470215, -2.0699875354766846, -2.0023279190063477, -1.9346683025360107, -1.8670086860656738, -1.799349069595337, -1.731689453125, -1.6640299558639526, -1.5963703393936157, -1.5287107229232788, -1.4610512256622314, -1.3933916091918945, -1.3257319927215576, -1.2580723762512207, -1.1904127597808838, -1.1227532625198364, -1.0550936460494995, -0.9874340295791626, -0.9197744727134705, -0.8521149158477783, -0.7844552993774414, -0.7167956829071045, -0.6491361260414124, -0.5814765691757202, -0.5138169527053833, -0.4461573660373688, -0.37849777936935425, -0.3108381927013397, -0.2431783676147461, -0.17551878094673157, -0.10785919427871704, -0.040199607610702515, 0.02745997905731201, 0.09511956572532654, 0.16277915239334106, 0.2304387390613556, 0.2980983257293701, 0.36575791239738464, 0.43341749906539917, 0.5010770559310913, 0.5687366724014282, 0.6363962888717651, 0.7040558457374573, 0.7717154026031494, 0.8393750190734863, 0.9070346355438232, 0.9746941924095154, 1.0423537492752075, 1.1100133657455444, 1.1776729822158813, 1.2453324794769287, 1.3129920959472656, 1.3806517124176025, 1.4483113288879395, 1.5159709453582764, 1.5836304426193237, 1.6512900590896606, 1.7189496755599976, 1.786609172821045, 1.8542687892913818, 1.9219284057617188]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 7.0, 5.0, 9.0, 11.0, 13.0, 45.0, 62.0, 83.0, 172.0, 348.0, 707.0, 1635.0, 4695.0, 16041.0, 73412.0, 458585.0, 405734.0, 65079.0, 14604.0, 4336.0, 1584.0, 695.0, 313.0, 159.0, 82.0, 43.0, 28.0, 19.0, 23.0, 8.0, 5.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.146484375, -1.1136932373046875, -1.080902099609375, -1.0481109619140625, -1.01531982421875, -0.9825286865234375, -0.949737548828125, -0.9169464111328125, -0.8841552734375, -0.8513641357421875, -0.818572998046875, -0.7857818603515625, -0.75299072265625, -0.7201995849609375, -0.687408447265625, -0.6546173095703125, -0.621826171875, -0.5890350341796875, -0.556243896484375, -0.5234527587890625, -0.49066162109375, -0.4578704833984375, -0.425079345703125, -0.3922882080078125, -0.3594970703125, -0.3267059326171875, -0.293914794921875, -0.2611236572265625, -0.22833251953125, -0.1955413818359375, -0.162750244140625, -0.1299591064453125, -0.09716796875, -0.0643768310546875, -0.031585693359375, 0.0012054443359375, 0.03399658203125, 0.0667877197265625, 0.099578857421875, 0.1323699951171875, 0.1651611328125, 0.1979522705078125, 0.230743408203125, 0.2635345458984375, 0.29632568359375, 0.3291168212890625, 0.361907958984375, 0.3946990966796875, 0.427490234375, 0.4602813720703125, 0.493072509765625, 0.5258636474609375, 0.55865478515625, 0.5914459228515625, 0.624237060546875, 0.6570281982421875, 0.6898193359375, 0.7226104736328125, 0.755401611328125, 0.7881927490234375, 0.82098388671875, 0.8537750244140625, 0.886566162109375, 0.9193572998046875, 0.9521484375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 6.0, 6.0, 11.0, 13.0, 16.0, 28.0, 30.0, 26.0, 37.0, 61.0, 65.0, 81.0, 74.0, 70.0, 89.0, 76.0, 59.0, 55.0, 60.0, 28.0, 18.0, 28.0, 19.0, 18.0, 10.0, 4.0, 7.0, 2.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6826171875, -1.6324615478515625, -1.582305908203125, -1.5321502685546875, -1.48199462890625, -1.4318389892578125, -1.381683349609375, -1.3315277099609375, -1.2813720703125, -1.2312164306640625, -1.181060791015625, -1.1309051513671875, -1.08074951171875, -1.0305938720703125, -0.980438232421875, -0.9302825927734375, -0.880126953125, -0.8299713134765625, -0.779815673828125, -0.7296600341796875, -0.67950439453125, -0.6293487548828125, -0.579193115234375, -0.5290374755859375, -0.4788818359375, -0.4287261962890625, -0.378570556640625, -0.3284149169921875, -0.27825927734375, -0.2281036376953125, -0.177947998046875, -0.1277923583984375, -0.07763671875, -0.0274810791015625, 0.022674560546875, 0.0728302001953125, 0.12298583984375, 0.1731414794921875, 0.223297119140625, 0.2734527587890625, 0.3236083984375, 0.3737640380859375, 0.423919677734375, 0.4740753173828125, 0.52423095703125, 0.5743865966796875, 0.624542236328125, 0.6746978759765625, 0.724853515625, 0.7750091552734375, 0.825164794921875, 0.8753204345703125, 0.92547607421875, 0.9756317138671875, 1.025787353515625, 1.0759429931640625, 1.1260986328125, 1.1762542724609375, 1.226409912109375, 1.2765655517578125, 1.32672119140625, 1.3768768310546875, 1.427032470703125, 1.4771881103515625, 1.52734375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 6.0, 8.0, 3.0, 3.0, 6.0, 15.0, 16.0, 16.0, 26.0, 40.0, 63.0, 86.0, 134.0, 226.0, 332.0, 595.0, 1051.0, 2442.0, 6409.0, 20858.0, 89376.0, 474141.0, 360254.0, 66392.0, 16309.0, 5274.0, 2073.0, 1014.0, 509.0, 289.0, 174.0, 119.0, 89.0, 60.0, 46.0, 19.0, 19.0, 18.0, 11.0, 6.0, 4.0, 6.0, 6.0, 5.0, 3.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.6259765625, -0.60504150390625, -0.5841064453125, -0.56317138671875, -0.542236328125, -0.52130126953125, -0.5003662109375, -0.47943115234375, -0.45849609375, -0.43756103515625, -0.4166259765625, -0.39569091796875, -0.374755859375, -0.35382080078125, -0.3328857421875, -0.31195068359375, -0.291015625, -0.27008056640625, -0.2491455078125, -0.22821044921875, -0.207275390625, -0.18634033203125, -0.1654052734375, -0.14447021484375, -0.12353515625, -0.10260009765625, -0.0816650390625, -0.06072998046875, -0.039794921875, -0.01885986328125, 0.0020751953125, 0.02301025390625, 0.0439453125, 0.06488037109375, 0.0858154296875, 0.10675048828125, 0.127685546875, 0.14862060546875, 0.1695556640625, 0.19049072265625, 0.21142578125, 0.23236083984375, 0.2532958984375, 0.27423095703125, 0.295166015625, 0.31610107421875, 0.3370361328125, 0.35797119140625, 0.37890625, 0.39984130859375, 0.4207763671875, 0.44171142578125, 0.462646484375, 0.48358154296875, 0.5045166015625, 0.52545166015625, 0.54638671875, 0.56732177734375, 0.5882568359375, 0.60919189453125, 0.630126953125, 0.65106201171875, 0.6719970703125, 0.69293212890625, 0.7138671875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 4.0, 3.0, 7.0, 10.0, 11.0, 8.0, 4.0, 15.0, 13.0, 19.0, 19.0, 18.0, 32.0, 28.0, 27.0, 27.0, 32.0, 35.0, 46.0, 37.0, 42.0, 43.0, 44.0, 44.0, 42.0, 28.0, 40.0, 41.0, 35.0, 36.0, 24.0, 24.0, 24.0, 27.0, 28.0, 15.0, 18.0, 14.0, 8.0, 8.0, 10.0, 3.0, 4.0, 4.0, 3.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.74609375, -1.6920013427734375, -1.637908935546875, -1.5838165283203125, -1.52972412109375, -1.4756317138671875, -1.421539306640625, -1.3674468994140625, -1.3133544921875, -1.2592620849609375, -1.205169677734375, -1.1510772705078125, -1.09698486328125, -1.0428924560546875, -0.988800048828125, -0.9347076416015625, -0.880615234375, -0.8265228271484375, -0.772430419921875, -0.7183380126953125, -0.66424560546875, -0.6101531982421875, -0.556060791015625, -0.5019683837890625, -0.4478759765625, -0.3937835693359375, -0.339691162109375, -0.2855987548828125, -0.23150634765625, -0.1774139404296875, -0.123321533203125, -0.0692291259765625, -0.01513671875, 0.0389556884765625, 0.093048095703125, 0.1471405029296875, 0.20123291015625, 0.2553253173828125, 0.309417724609375, 0.3635101318359375, 0.4176025390625, 0.4716949462890625, 0.525787353515625, 0.5798797607421875, 0.63397216796875, 0.6880645751953125, 0.742156982421875, 0.7962493896484375, 0.850341796875, 0.9044342041015625, 0.958526611328125, 1.0126190185546875, 1.06671142578125, 1.1208038330078125, 1.174896240234375, 1.2289886474609375, 1.2830810546875, 1.3371734619140625, 1.391265869140625, 1.4453582763671875, 1.49945068359375, 1.5535430908203125, 1.607635498046875, 1.6617279052734375, 1.7158203125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 9.0, 9.0, 12.0, 18.0, 33.0, 55.0, 98.0, 202.0, 439.0, 1183.0, 3506.0, 12827.0, 72587.0, 653267.0, 262427.0, 31349.0, 6982.0, 2159.0, 758.0, 286.0, 172.0, 70.0, 43.0, 21.0, 14.0, 13.0, 7.0, 2.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.276123046875, -0.26399993896484375, -0.2518768310546875, -0.23975372314453125, -0.227630615234375, -0.21550750732421875, -0.2033843994140625, -0.19126129150390625, -0.17913818359375, -0.16701507568359375, -0.1548919677734375, -0.14276885986328125, -0.130645751953125, -0.11852264404296875, -0.1063995361328125, -0.09427642822265625, -0.0821533203125, -0.07003021240234375, -0.0579071044921875, -0.04578399658203125, -0.033660888671875, -0.02153778076171875, -0.0094146728515625, 0.00270843505859375, 0.01483154296875, 0.02695465087890625, 0.0390777587890625, 0.05120086669921875, 0.063323974609375, 0.07544708251953125, 0.0875701904296875, 0.09969329833984375, 0.11181640625, 0.12393951416015625, 0.1360626220703125, 0.14818572998046875, 0.160308837890625, 0.17243194580078125, 0.1845550537109375, 0.19667816162109375, 0.20880126953125, 0.22092437744140625, 0.2330474853515625, 0.24517059326171875, 0.257293701171875, 0.26941680908203125, 0.2815399169921875, 0.29366302490234375, 0.3057861328125, 0.31790924072265625, 0.3300323486328125, 0.34215545654296875, 0.354278564453125, 0.36640167236328125, 0.3785247802734375, 0.39064788818359375, 0.40277099609375, 0.41489410400390625, 0.4270172119140625, 0.43914031982421875, 0.451263427734375, 0.46338653564453125, 0.4755096435546875, 0.48763275146484375, 0.499755859375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 8.0, 9.0, 9.0, 10.0, 24.0, 30.0, 31.0, 63.0, 85.0, 123.0, 139.0, 147.0, 113.0, 77.0, 44.0, 26.0, 23.0, 10.0, 11.0, 7.0, 7.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002465248107910156, -0.0002396702766418457, -0.00023281574249267578, -0.00022596120834350586, -0.00021910667419433594, -0.00021225214004516602, -0.0002053976058959961, -0.00019854307174682617, -0.00019168853759765625, -0.00018483400344848633, -0.0001779794692993164, -0.00017112493515014648, -0.00016427040100097656, -0.00015741586685180664, -0.00015056133270263672, -0.0001437067985534668, -0.00013685226440429688, -0.00012999773025512695, -0.00012314319610595703, -0.00011628866195678711, -0.00010943412780761719, -0.00010257959365844727, -9.572505950927734e-05, -8.887052536010742e-05, -8.20159912109375e-05, -7.516145706176758e-05, -6.830692291259766e-05, -6.145238876342773e-05, -5.459785461425781e-05, -4.774332046508789e-05, -4.088878631591797e-05, -3.403425216674805e-05, -2.7179718017578125e-05, -2.0325183868408203e-05, -1.3470649719238281e-05, -6.616115570068359e-06, 2.384185791015625e-07, 7.092952728271484e-06, 1.3947486877441406e-05, 2.0802021026611328e-05, 2.765655517578125e-05, 3.451108932495117e-05, 4.1365623474121094e-05, 4.8220157623291016e-05, 5.507469177246094e-05, 6.192922592163086e-05, 6.878376007080078e-05, 7.56382942199707e-05, 8.249282836914062e-05, 8.934736251831055e-05, 9.620189666748047e-05, 0.00010305643081665039, 0.00010991096496582031, 0.00011676549911499023, 0.00012362003326416016, 0.00013047456741333008, 0.0001373291015625, 0.00014418363571166992, 0.00015103816986083984, 0.00015789270401000977, 0.0001647472381591797, 0.0001716017723083496, 0.00017845630645751953, 0.00018531084060668945, 0.00019216537475585938]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 2.0, 3.0, 5.0, 6.0, 6.0, 7.0, 6.0, 16.0, 15.0, 24.0, 44.0, 77.0, 157.0, 284.0, 545.0, 1366.0, 3789.0, 12151.0, 51463.0, 350543.0, 525942.0, 77318.0, 16773.0, 4924.0, 1727.0, 653.0, 299.0, 166.0, 82.0, 42.0, 32.0, 22.0, 19.0, 11.0, 12.0, 4.0, 3.0, 4.0, 2.0, 2.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.33203125, -0.3206291198730469, -0.30922698974609375, -0.2978248596191406, -0.2864227294921875, -0.2750205993652344, -0.26361846923828125, -0.2522163391113281, -0.240814208984375, -0.22941207885742188, -0.21800994873046875, -0.20660781860351562, -0.1952056884765625, -0.18380355834960938, -0.17240142822265625, -0.16099929809570312, -0.14959716796875, -0.13819503784179688, -0.12679290771484375, -0.11539077758789062, -0.1039886474609375, -0.09258651733398438, -0.08118438720703125, -0.06978225708007812, -0.058380126953125, -0.046977996826171875, -0.03557586669921875, -0.024173736572265625, -0.0127716064453125, -0.001369476318359375, 0.01003265380859375, 0.021434783935546875, 0.0328369140625, 0.044239044189453125, 0.05564117431640625, 0.06704330444335938, 0.0784454345703125, 0.08984756469726562, 0.10124969482421875, 0.11265182495117188, 0.124053955078125, 0.13545608520507812, 0.14685821533203125, 0.15826034545898438, 0.1696624755859375, 0.18106460571289062, 0.19246673583984375, 0.20386886596679688, 0.21527099609375, 0.22667312622070312, 0.23807525634765625, 0.24947738647460938, 0.2608795166015625, 0.2722816467285156, 0.28368377685546875, 0.2950859069824219, 0.306488037109375, 0.3178901672363281, 0.32929229736328125, 0.3406944274902344, 0.3520965576171875, 0.3634986877441406, 0.37490081787109375, 0.3863029479980469, 0.397705078125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 12.0, 5.0, 8.0, 10.0, 10.0, 15.0, 23.0, 35.0, 45.0, 56.0, 105.0, 120.0, 108.0, 101.0, 84.0, 72.0, 55.0, 29.0, 18.0, 16.0, 12.0, 11.0, 10.0, 7.0, 6.0, 1.0, 4.0, 6.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.0899658203125, -0.0876321792602539, -0.08529853820800781, -0.08296489715576172, -0.08063125610351562, -0.07829761505126953, -0.07596397399902344, -0.07363033294677734, -0.07129669189453125, -0.06896305084228516, -0.06662940979003906, -0.06429576873779297, -0.061962127685546875, -0.05962848663330078, -0.05729484558105469, -0.054961204528808594, -0.0526275634765625, -0.050293922424316406, -0.04796028137207031, -0.04562664031982422, -0.043292999267578125, -0.04095935821533203, -0.03862571716308594, -0.036292076110839844, -0.03395843505859375, -0.031624794006347656, -0.029291152954101562, -0.02695751190185547, -0.024623870849609375, -0.02229022979736328, -0.019956588745117188, -0.017622947692871094, -0.015289306640625, -0.012955665588378906, -0.010622024536132812, -0.008288383483886719, -0.005954742431640625, -0.0036211013793945312, -0.0012874603271484375, 0.0010461807250976562, 0.00337982177734375, 0.005713462829589844, 0.008047103881835938, 0.010380744934082031, 0.012714385986328125, 0.015048027038574219, 0.017381668090820312, 0.019715309143066406, 0.0220489501953125, 0.024382591247558594, 0.026716232299804688, 0.02904987335205078, 0.031383514404296875, 0.03371715545654297, 0.03605079650878906, 0.038384437561035156, 0.04071807861328125, 0.043051719665527344, 0.04538536071777344, 0.04771900177001953, 0.050052642822265625, 0.05238628387451172, 0.05471992492675781, 0.057053565979003906, 0.05938720703125]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 8.0, 15.0, 9.0, 14.0, 43.0, 50.0, 123.0, 163.0, 195.0, 146.0, 89.0, 50.0, 30.0, 20.0, 14.0, 10.0, 9.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.110883951187134, -3.022636651992798, -2.934389352798462, -2.846141815185547, -2.757894515991211, -2.669647216796875, -2.581399917602539, -2.493152618408203, -2.404905080795288, -2.316657781600952, -2.228410482406616, -2.140162944793701, -2.0519156455993652, -1.9636683464050293, -1.8754210472106934, -1.7871736288070679, -1.698926329612732, -1.610679030418396, -1.5224316120147705, -1.4341843128204346, -1.345936894416809, -1.2576895952224731, -1.1694421768188477, -1.0811948776245117, -0.992947518825531, -0.9047001600265503, -0.8164528012275696, -0.7282054424285889, -0.6399581432342529, -0.5517107248306274, -0.4634634256362915, -0.3752160668373108, -0.2869687080383301, -0.19872134923934937, -0.11047400534152985, -0.022226661443710327, 0.06602069735527039, 0.1542680561542511, 0.24251538515090942, 0.33076274394989014, 0.41901010274887085, 0.5072574615478516, 0.5955048203468323, 0.683752179145813, 0.7719994783401489, 0.8602468967437744, 0.9484941959381104, 1.0367414951324463, 1.1249889135360718, 1.2132362127304077, 1.3014836311340332, 1.3897309303283691, 1.4779783487319946, 1.5662256479263306, 1.654473066329956, 1.742720365524292, 1.830967664718628, 1.9192149639129639, 2.0074622631073, 2.095709800720215, 2.183957099914551, 2.2722043991088867, 2.3604516983032227, 2.4486989974975586, 2.5369465351104736]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 8.0, 4.0, 5.0, 12.0, 17.0, 18.0, 26.0, 34.0, 34.0, 45.0, 66.0, 84.0, 75.0, 88.0, 73.0, 74.0, 75.0, 55.0, 48.0, 47.0, 25.0, 20.0, 18.0, 18.0, 14.0, 7.0, 3.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.7245286703109741, -1.6751431226730347, -1.6257575750350952, -1.5763720273971558, -1.5269863605499268, -1.4776008129119873, -1.4282152652740479, -1.3788297176361084, -1.329444169998169, -1.2800586223602295, -1.23067307472229, -1.1812875270843506, -1.1319019794464111, -1.0825163125991821, -1.0331307649612427, -0.9837452173233032, -0.9343596696853638, -0.8849741220474243, -0.8355885744094849, -0.7862029671669006, -0.7368174195289612, -0.6874318718910217, -0.6380462646484375, -0.588660717010498, -0.5392751693725586, -0.48988962173461914, -0.4405040442943573, -0.39111846685409546, -0.341732919216156, -0.29234737157821655, -0.2429617941379547, -0.19357621669769287, -0.14419054985046387, -0.09480498731136322, -0.04541942477226257, 0.003966137766838074, 0.05335170030593872, 0.10273726284503937, 0.15212282538414001, 0.20150840282440186, 0.2508939504623413, 0.30027949810028076, 0.3496650755405426, 0.39905065298080444, 0.4484362006187439, 0.49782174825668335, 0.5472073554992676, 0.596592903137207, 0.6459784507751465, 0.6953639984130859, 0.7447495460510254, 0.7941351532936096, 0.8435207009315491, 0.8929062485694885, 0.9422918558120728, 0.9916774034500122, 1.0410629510879517, 1.0904484987258911, 1.1398340463638306, 1.18921959400177, 1.238605260848999, 1.2879908084869385, 1.337376356124878, 1.3867619037628174, 1.4361474514007568]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 7.0, 7.0, 5.0, 9.0, 15.0, 49.0, 64.0, 153.0, 326.0, 835.0, 2464.0, 8725.0, 38566.0, 289302.0, 605313.0, 80914.0, 15492.0, 4068.0, 1356.0, 496.0, 187.0, 77.0, 46.0, 23.0, 17.0, 6.0, 7.0, 2.0, 5.0, 4.0, 3.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-3.04296875, -2.96728515625, -2.8916015625, -2.81591796875, -2.740234375, -2.66455078125, -2.5888671875, -2.51318359375, -2.4375, -2.36181640625, -2.2861328125, -2.21044921875, -2.134765625, -2.05908203125, -1.9833984375, -1.90771484375, -1.83203125, -1.75634765625, -1.6806640625, -1.60498046875, -1.529296875, -1.45361328125, -1.3779296875, -1.30224609375, -1.2265625, -1.15087890625, -1.0751953125, -0.99951171875, -0.923828125, -0.84814453125, -0.7724609375, -0.69677734375, -0.62109375, -0.54541015625, -0.4697265625, -0.39404296875, -0.318359375, -0.24267578125, -0.1669921875, -0.09130859375, -0.015625, 0.06005859375, 0.1357421875, 0.21142578125, 0.287109375, 0.36279296875, 0.4384765625, 0.51416015625, 0.58984375, 0.66552734375, 0.7412109375, 0.81689453125, 0.892578125, 0.96826171875, 1.0439453125, 1.11962890625, 1.1953125, 1.27099609375, 1.3466796875, 1.42236328125, 1.498046875, 1.57373046875, 1.6494140625, 1.72509765625, 1.80078125]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 6.0, 5.0, 9.0, 5.0, 9.0, 18.0, 21.0, 32.0, 31.0, 37.0, 55.0, 59.0, 87.0, 83.0, 75.0, 82.0, 62.0, 68.0, 43.0, 45.0, 39.0, 25.0, 20.0, 21.0, 20.0, 10.0, 11.0, 6.0, 5.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.419921875, -3.321441650390625, -3.22296142578125, -3.124481201171875, -3.0260009765625, -2.927520751953125, -2.82904052734375, -2.730560302734375, -2.632080078125, -2.533599853515625, -2.43511962890625, -2.336639404296875, -2.2381591796875, -2.139678955078125, -2.04119873046875, -1.942718505859375, -1.84423828125, -1.745758056640625, -1.64727783203125, -1.548797607421875, -1.4503173828125, -1.351837158203125, -1.25335693359375, -1.154876708984375, -1.056396484375, -0.957916259765625, -0.85943603515625, -0.760955810546875, -0.6624755859375, -0.563995361328125, -0.46551513671875, -0.367034912109375, -0.2685546875, -0.170074462890625, -0.07159423828125, 0.026885986328125, 0.1253662109375, 0.223846435546875, 0.32232666015625, 0.420806884765625, 0.519287109375, 0.617767333984375, 0.71624755859375, 0.814727783203125, 0.9132080078125, 1.011688232421875, 1.11016845703125, 1.208648681640625, 1.30712890625, 1.405609130859375, 1.50408935546875, 1.602569580078125, 1.7010498046875, 1.799530029296875, 1.89801025390625, 1.996490478515625, 2.094970703125, 2.193450927734375, 2.29193115234375, 2.390411376953125, 2.4888916015625, 2.587371826171875, 2.68585205078125, 2.784332275390625, 2.8828125]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 7.0, 8.0, 8.0, 5.0, 9.0, 15.0, 13.0, 7.0, 21.0, 21.0, 28.0, 38.0, 46.0, 51.0, 70.0, 106.0, 343.0, 6608.0, 1011515.0, 28506.0, 589.0, 138.0, 62.0, 51.0, 51.0, 39.0, 40.0, 39.0, 18.0, 26.0, 18.0, 17.0, 13.0, 6.0, 9.0, 7.0, 6.0, 4.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.5078125, -7.24560546875, -6.9833984375, -6.72119140625, -6.458984375, -6.19677734375, -5.9345703125, -5.67236328125, -5.41015625, -5.14794921875, -4.8857421875, -4.62353515625, -4.361328125, -4.09912109375, -3.8369140625, -3.57470703125, -3.3125, -3.05029296875, -2.7880859375, -2.52587890625, -2.263671875, -2.00146484375, -1.7392578125, -1.47705078125, -1.21484375, -0.95263671875, -0.6904296875, -0.42822265625, -0.166015625, 0.09619140625, 0.3583984375, 0.62060546875, 0.8828125, 1.14501953125, 1.4072265625, 1.66943359375, 1.931640625, 2.19384765625, 2.4560546875, 2.71826171875, 2.98046875, 3.24267578125, 3.5048828125, 3.76708984375, 4.029296875, 4.29150390625, 4.5537109375, 4.81591796875, 5.078125, 5.34033203125, 5.6025390625, 5.86474609375, 6.126953125, 6.38916015625, 6.6513671875, 6.91357421875, 7.17578125, 7.43798828125, 7.7001953125, 7.96240234375, 8.224609375, 8.48681640625, 8.7490234375, 9.01123046875, 9.2734375]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 6.0, 8.0, 8.0, 14.0, 14.0, 8.0, 14.0, 16.0, 19.0, 36.0, 35.0, 50.0, 44.0, 38.0, 47.0, 43.0, 46.0, 46.0, 50.0, 41.0, 35.0, 56.0, 40.0, 47.0, 46.0, 33.0, 27.0, 25.0, 19.0, 22.0, 22.0, 12.0, 14.0, 2.0, 6.0, 6.0, 4.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.42578125, -2.343658447265625, -2.26153564453125, -2.179412841796875, -2.0972900390625, -2.015167236328125, -1.93304443359375, -1.850921630859375, -1.768798828125, -1.686676025390625, -1.60455322265625, -1.522430419921875, -1.4403076171875, -1.358184814453125, -1.27606201171875, -1.193939208984375, -1.11181640625, -1.029693603515625, -0.94757080078125, -0.865447998046875, -0.7833251953125, -0.701202392578125, -0.61907958984375, -0.536956787109375, -0.454833984375, -0.372711181640625, -0.29058837890625, -0.208465576171875, -0.1263427734375, -0.044219970703125, 0.03790283203125, 0.120025634765625, 0.2021484375, 0.284271240234375, 0.36639404296875, 0.448516845703125, 0.5306396484375, 0.612762451171875, 0.69488525390625, 0.777008056640625, 0.859130859375, 0.941253662109375, 1.02337646484375, 1.105499267578125, 1.1876220703125, 1.269744873046875, 1.35186767578125, 1.433990478515625, 1.51611328125, 1.598236083984375, 1.68035888671875, 1.762481689453125, 1.8446044921875, 1.926727294921875, 2.00885009765625, 2.090972900390625, 2.173095703125, 2.255218505859375, 2.33734130859375, 2.419464111328125, 2.5015869140625, 2.583709716796875, 2.66583251953125, 2.747955322265625, 2.830078125]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 2.0, 3.0, 7.0, 9.0, 7.0, 10.0, 19.0, 26.0, 28.0, 42.0, 53.0, 77.0, 140.0, 225.0, 441.0, 955.0, 2470.0, 7907.0, 38751.0, 350951.0, 562266.0, 66823.0, 11539.0, 3327.0, 1232.0, 575.0, 252.0, 156.0, 80.0, 52.0, 47.0, 27.0, 15.0, 17.0, 6.0, 6.0, 5.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.53466796875, -0.5174942016601562, -0.5003204345703125, -0.48314666748046875, -0.465972900390625, -0.44879913330078125, -0.4316253662109375, -0.41445159912109375, -0.39727783203125, -0.38010406494140625, -0.3629302978515625, -0.34575653076171875, -0.328582763671875, -0.31140899658203125, -0.2942352294921875, -0.27706146240234375, -0.2598876953125, -0.24271392822265625, -0.2255401611328125, -0.20836639404296875, -0.191192626953125, -0.17401885986328125, -0.1568450927734375, -0.13967132568359375, -0.12249755859375, -0.10532379150390625, -0.0881500244140625, -0.07097625732421875, -0.053802490234375, -0.03662872314453125, -0.0194549560546875, -0.00228118896484375, 0.014892578125, 0.03206634521484375, 0.0492401123046875, 0.06641387939453125, 0.083587646484375, 0.10076141357421875, 0.1179351806640625, 0.13510894775390625, 0.15228271484375, 0.16945648193359375, 0.1866302490234375, 0.20380401611328125, 0.220977783203125, 0.23815155029296875, 0.2553253173828125, 0.27249908447265625, 0.2896728515625, 0.30684661865234375, 0.3240203857421875, 0.34119415283203125, 0.358367919921875, 0.37554168701171875, 0.3927154541015625, 0.40988922119140625, 0.42706298828125, 0.44423675537109375, 0.4614105224609375, 0.47858428955078125, 0.495758056640625, 0.5129318237304688, 0.5301055908203125, 0.5472793579101562, 0.564453125]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 2.0, 2.0, 4.0, 11.0, 10.0, 12.0, 12.0, 23.0, 25.0, 39.0, 58.0, 77.0, 90.0, 94.0, 98.0, 102.0, 71.0, 72.0, 31.0, 42.0, 30.0, 22.0, 27.0, 11.0, 8.0, 5.0, 5.0, 4.0, 3.0, 2.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-8.857250213623047e-05, -8.637551218271255e-05, -8.417852222919464e-05, -8.198153227567673e-05, -7.978454232215881e-05, -7.75875523686409e-05, -7.539056241512299e-05, -7.319357246160507e-05, -7.099658250808716e-05, -6.879959255456924e-05, -6.660260260105133e-05, -6.440561264753342e-05, -6.22086226940155e-05, -6.001163274049759e-05, -5.7814642786979675e-05, -5.561765283346176e-05, -5.342066287994385e-05, -5.1223672926425934e-05, -4.902668297290802e-05, -4.6829693019390106e-05, -4.463270306587219e-05, -4.243571311235428e-05, -4.0238723158836365e-05, -3.804173320531845e-05, -3.584474325180054e-05, -3.364775329828262e-05, -3.145076334476471e-05, -2.9253773391246796e-05, -2.7056783437728882e-05, -2.4859793484210968e-05, -2.2662803530693054e-05, -2.046581357717514e-05, -1.8268823623657227e-05, -1.6071833670139313e-05, -1.3874843716621399e-05, -1.1677853763103485e-05, -9.480863809585571e-06, -7.2838738560676575e-06, -5.086883902549744e-06, -2.88989394903183e-06, -6.92903995513916e-07, 1.5040859580039978e-06, 3.7010759115219116e-06, 5.8980658650398254e-06, 8.09505581855774e-06, 1.0292045772075653e-05, 1.2489035725593567e-05, 1.468602567911148e-05, 1.6883015632629395e-05, 1.908000558614731e-05, 2.1276995539665222e-05, 2.3473985493183136e-05, 2.567097544670105e-05, 2.7867965400218964e-05, 3.0064955353736877e-05, 3.226194530725479e-05, 3.4458935260772705e-05, 3.665592521429062e-05, 3.885291516780853e-05, 4.1049905121326447e-05, 4.324689507484436e-05, 4.5443885028362274e-05, 4.764087498188019e-05, 4.98378649353981e-05, 5.2034854888916016e-05]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 8.0, 9.0, 13.0, 21.0, 18.0, 33.0, 61.0, 109.0, 169.0, 415.0, 879.0, 2432.0, 8714.0, 55740.0, 595422.0, 344661.0, 30850.0, 5839.0, 1748.0, 704.0, 337.0, 160.0, 74.0, 48.0, 41.0, 12.0, 15.0, 8.0, 4.0, 5.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.671875, -0.6526031494140625, -0.633331298828125, -0.6140594482421875, -0.59478759765625, -0.5755157470703125, -0.556243896484375, -0.5369720458984375, -0.5177001953125, -0.4984283447265625, -0.479156494140625, -0.4598846435546875, -0.44061279296875, -0.4213409423828125, -0.402069091796875, -0.3827972412109375, -0.363525390625, -0.3442535400390625, -0.324981689453125, -0.3057098388671875, -0.28643798828125, -0.2671661376953125, -0.247894287109375, -0.2286224365234375, -0.2093505859375, -0.1900787353515625, -0.170806884765625, -0.1515350341796875, -0.13226318359375, -0.1129913330078125, -0.093719482421875, -0.0744476318359375, -0.05517578125, -0.0359039306640625, -0.016632080078125, 0.0026397705078125, 0.02191162109375, 0.0411834716796875, 0.060455322265625, 0.0797271728515625, 0.0989990234375, 0.1182708740234375, 0.137542724609375, 0.1568145751953125, 0.17608642578125, 0.1953582763671875, 0.214630126953125, 0.2339019775390625, 0.253173828125, 0.2724456787109375, 0.291717529296875, 0.3109893798828125, 0.33026123046875, 0.3495330810546875, 0.368804931640625, 0.3880767822265625, 0.4073486328125, 0.4266204833984375, 0.445892333984375, 0.4651641845703125, 0.48443603515625, 0.5037078857421875, 0.522979736328125, 0.5422515869140625, 0.5615234375]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 4.0, 1.0, 3.0, 5.0, 13.0, 9.0, 10.0, 19.0, 17.0, 34.0, 34.0, 42.0, 35.0, 64.0, 64.0, 67.0, 75.0, 87.0, 82.0, 75.0, 48.0, 43.0, 38.0, 30.0, 21.0, 26.0, 21.0, 11.0, 5.0, 9.0, 5.0, 3.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1644287109375, -0.15834617614746094, -0.15226364135742188, -0.1461811065673828, -0.14009857177734375, -0.1340160369873047, -0.12793350219726562, -0.12185096740722656, -0.1157684326171875, -0.10968589782714844, -0.10360336303710938, -0.09752082824707031, -0.09143829345703125, -0.08535575866699219, -0.07927322387695312, -0.07319068908691406, -0.067108154296875, -0.06102561950683594, -0.054943084716796875, -0.04886054992675781, -0.04277801513671875, -0.03669548034667969, -0.030612945556640625, -0.024530410766601562, -0.0184478759765625, -0.012365341186523438, -0.006282806396484375, -0.0002002716064453125, 0.00588226318359375, 0.011964797973632812, 0.018047332763671875, 0.024129867553710938, 0.03021240234375, 0.03629493713378906, 0.042377471923828125, 0.04846000671386719, 0.05454254150390625, 0.06062507629394531, 0.06670761108398438, 0.07279014587402344, 0.0788726806640625, 0.08495521545410156, 0.09103775024414062, 0.09712028503417969, 0.10320281982421875, 0.10928535461425781, 0.11536788940429688, 0.12145042419433594, 0.127532958984375, 0.13361549377441406, 0.13969802856445312, 0.1457805633544922, 0.15186309814453125, 0.1579456329345703, 0.16402816772460938, 0.17011070251464844, 0.1761932373046875, 0.18227577209472656, 0.18835830688476562, 0.1944408416748047, 0.20052337646484375, 0.2066059112548828, 0.21268844604492188, 0.21877098083496094, 0.224853515625]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 5.0, 20.0, 56.0, 323.0, 450.0, 112.0, 32.0, 11.0, 5.0, 0.0, 0.0, 0.0, 2.0], "bins": [-30.545673370361328, -29.992050170898438, -29.438426971435547, -28.884803771972656, -28.331180572509766, -27.777557373046875, -27.223934173583984, -26.670310974121094, -26.116687774658203, -25.563064575195312, -25.009441375732422, -24.45581817626953, -23.90219497680664, -23.34857177734375, -22.79494857788086, -22.24132537841797, -21.687702178955078, -21.134078979492188, -20.580455780029297, -20.026832580566406, -19.473209381103516, -18.919586181640625, -18.365962982177734, -17.812339782714844, -17.258718490600586, -16.705095291137695, -16.151472091674805, -15.597848892211914, -15.044225692749023, -14.490602493286133, -13.936979293823242, -13.383356094360352, -12.829732894897461, -12.27610969543457, -11.72248649597168, -11.168863296508789, -10.615240097045898, -10.061616897583008, -9.507993698120117, -8.954370498657227, -8.400747299194336, -7.847124099731445, -7.293500900268555, -6.739877700805664, -6.186254501342773, -5.632631301879883, -5.07900857925415, -4.52538537979126, -3.971762180328369, -3.4181389808654785, -2.864515781402588, -2.3108928203582764, -1.7572696208953857, -1.2036464214324951, -0.6500234603881836, -0.09640026092529297, 0.45722293853759766, 1.0108461380004883, 1.5644692182540894, 2.1180922985076904, 2.671715497970581, 3.2253386974334717, 3.778961658477783, 4.332584857940674, 4.8862080574035645]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 7.0, 7.0, 6.0, 9.0, 12.0, 20.0, 18.0, 24.0, 35.0, 36.0, 46.0, 32.0, 33.0, 42.0, 44.0, 39.0, 47.0, 48.0, 40.0, 64.0, 40.0, 41.0, 35.0, 36.0, 24.0, 32.0, 25.0, 25.0, 30.0, 18.0, 14.0, 15.0, 9.0, 9.0, 7.0, 3.0, 4.0, 5.0, 5.0, 9.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.7735114097595215, -4.635075092315674, -4.496638774871826, -4.358202934265137, -4.219766616821289, -4.081330299377441, -3.9428939819335938, -3.804457664489746, -3.6660215854644775, -3.52758526802063, -3.3891491889953613, -3.2507128715515137, -3.112276554107666, -2.9738404750823975, -2.83540415763855, -2.6969680786132812, -2.5585317611694336, -2.420095443725586, -2.2816593647003174, -2.1432230472564697, -2.004786968231201, -1.8663506507873535, -1.7279143333435059, -1.5894781351089478, -1.4510419368743896, -1.3126057386398315, -1.1741695404052734, -1.0357332229614258, -0.8972970247268677, -0.7588608264923096, -0.6204245686531067, -0.4819883108139038, -0.3435521125793457, -0.2051158845424652, -0.06667965650558472, 0.07175657153129578, 0.21019279956817627, 0.3486289978027344, 0.48706525564193726, 0.6255015134811401, 0.7639377117156982, 0.9023739099502563, 1.0408101081848145, 1.179246425628662, 1.3176826238632202, 1.4561188220977783, 1.594555139541626, 1.732991337776184, 1.8714275360107422, 2.00986385345459, 2.1482999324798584, 2.286736249923706, 2.4251723289489746, 2.5636086463928223, 2.70204496383667, 2.8404812812805176, 2.978917360305786, 3.117353677749634, 3.2557897567749023, 3.39422607421875, 3.5326623916625977, 3.671098470687866, 3.809534788131714, 3.9479708671569824, 4.08640718460083]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 10.0, 10.0, 7.0, 13.0, 13.0, 29.0, 26.0, 40.0, 41.0, 63.0, 82.0, 149.0, 267.0, 432.0, 965.0, 2200.0, 6438.0, 23319.0, 140991.0, 2174317.0, 1702468.0, 113040.0, 19853.0, 5467.0, 1982.0, 827.0, 451.0, 246.0, 140.0, 104.0, 72.0, 54.0, 40.0, 27.0, 23.0, 22.0, 11.0, 8.0, 8.0, 5.0, 7.0, 4.0, 2.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.34765625, -2.269287109375, -2.19091796875, -2.112548828125, -2.0341796875, -1.955810546875, -1.87744140625, -1.799072265625, -1.720703125, -1.642333984375, -1.56396484375, -1.485595703125, -1.4072265625, -1.328857421875, -1.25048828125, -1.172119140625, -1.09375, -1.015380859375, -0.93701171875, -0.858642578125, -0.7802734375, -0.701904296875, -0.62353515625, -0.545166015625, -0.466796875, -0.388427734375, -0.31005859375, -0.231689453125, -0.1533203125, -0.074951171875, 0.00341796875, 0.081787109375, 0.16015625, 0.238525390625, 0.31689453125, 0.395263671875, 0.4736328125, 0.552001953125, 0.63037109375, 0.708740234375, 0.787109375, 0.865478515625, 0.94384765625, 1.022216796875, 1.1005859375, 1.178955078125, 1.25732421875, 1.335693359375, 1.4140625, 1.492431640625, 1.57080078125, 1.649169921875, 1.7275390625, 1.805908203125, 1.88427734375, 1.962646484375, 2.041015625, 2.119384765625, 2.19775390625, 2.276123046875, 2.3544921875, 2.432861328125, 2.51123046875, 2.589599609375, 2.66796875]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 4.0, 7.0, 10.0, 13.0, 16.0, 28.0, 46.0, 43.0, 60.0, 60.0, 81.0, 79.0, 91.0, 82.0, 79.0, 65.0, 56.0, 47.0, 37.0, 27.0, 16.0, 19.0, 13.0, 8.0, 5.0, 4.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.048828125, -1.97723388671875, -1.9056396484375, -1.83404541015625, -1.762451171875, -1.69085693359375, -1.6192626953125, -1.54766845703125, -1.47607421875, -1.40447998046875, -1.3328857421875, -1.26129150390625, -1.189697265625, -1.11810302734375, -1.0465087890625, -0.97491455078125, -0.9033203125, -0.83172607421875, -0.7601318359375, -0.68853759765625, -0.616943359375, -0.54534912109375, -0.4737548828125, -0.40216064453125, -0.33056640625, -0.25897216796875, -0.1873779296875, -0.11578369140625, -0.044189453125, 0.02740478515625, 0.0989990234375, 0.17059326171875, 0.2421875, 0.31378173828125, 0.3853759765625, 0.45697021484375, 0.528564453125, 0.60015869140625, 0.6717529296875, 0.74334716796875, 0.81494140625, 0.88653564453125, 0.9581298828125, 1.02972412109375, 1.101318359375, 1.17291259765625, 1.2445068359375, 1.31610107421875, 1.3876953125, 1.45928955078125, 1.5308837890625, 1.60247802734375, 1.674072265625, 1.74566650390625, 1.8172607421875, 1.88885498046875, 1.96044921875, 2.03204345703125, 2.1036376953125, 2.17523193359375, 2.246826171875, 2.31842041015625, 2.3900146484375, 2.46160888671875, 2.533203125]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 4.0, 4.0, 2.0, 8.0, 6.0, 15.0, 19.0, 21.0, 37.0, 36.0, 79.0, 135.0, 333.0, 1386.0, 37555.0, 4127597.0, 25189.0, 1171.0, 309.0, 155.0, 77.0, 44.0, 40.0, 23.0, 11.0, 10.0, 2.0, 3.0, 4.0, 7.0, 3.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.2734375, -9.01910400390625, -8.7647705078125, -8.51043701171875, -8.256103515625, -8.00177001953125, -7.7474365234375, -7.49310302734375, -7.23876953125, -6.98443603515625, -6.7301025390625, -6.47576904296875, -6.221435546875, -5.96710205078125, -5.7127685546875, -5.45843505859375, -5.2041015625, -4.94976806640625, -4.6954345703125, -4.44110107421875, -4.186767578125, -3.93243408203125, -3.6781005859375, -3.42376708984375, -3.16943359375, -2.91510009765625, -2.6607666015625, -2.40643310546875, -2.152099609375, -1.89776611328125, -1.6434326171875, -1.38909912109375, -1.134765625, -0.88043212890625, -0.6260986328125, -0.37176513671875, -0.117431640625, 0.13690185546875, 0.3912353515625, 0.64556884765625, 0.89990234375, 1.15423583984375, 1.4085693359375, 1.66290283203125, 1.917236328125, 2.17156982421875, 2.4259033203125, 2.68023681640625, 2.9345703125, 3.18890380859375, 3.4432373046875, 3.69757080078125, 3.951904296875, 4.20623779296875, 4.4605712890625, 4.71490478515625, 4.96923828125, 5.22357177734375, 5.4779052734375, 5.73223876953125, 5.986572265625, 6.24090576171875, 6.4952392578125, 6.74957275390625, 7.00390625]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 10.0, 10.0, 9.0, 12.0, 13.0, 36.0, 42.0, 34.0, 58.0, 86.0, 128.0, 167.0, 305.0, 435.0, 710.0, 652.0, 449.0, 287.0, 187.0, 125.0, 89.0, 51.0, 37.0, 33.0, 15.0, 13.0, 22.0, 16.0, 10.0, 8.0, 5.0, 3.0, 2.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53271484375, -0.5160064697265625, -0.499298095703125, -0.4825897216796875, -0.46588134765625, -0.4491729736328125, -0.432464599609375, -0.4157562255859375, -0.3990478515625, -0.3823394775390625, -0.365631103515625, -0.3489227294921875, -0.33221435546875, -0.3155059814453125, -0.298797607421875, -0.2820892333984375, -0.265380859375, -0.2486724853515625, -0.231964111328125, -0.2152557373046875, -0.19854736328125, -0.1818389892578125, -0.165130615234375, -0.1484222412109375, -0.1317138671875, -0.1150054931640625, -0.098297119140625, -0.0815887451171875, -0.06488037109375, -0.0481719970703125, -0.031463623046875, -0.0147552490234375, 0.001953125, 0.0186614990234375, 0.035369873046875, 0.0520782470703125, 0.06878662109375, 0.0854949951171875, 0.102203369140625, 0.1189117431640625, 0.1356201171875, 0.1523284912109375, 0.169036865234375, 0.1857452392578125, 0.20245361328125, 0.2191619873046875, 0.235870361328125, 0.2525787353515625, 0.269287109375, 0.2859954833984375, 0.302703857421875, 0.3194122314453125, 0.33612060546875, 0.3528289794921875, 0.369537353515625, 0.3862457275390625, 0.4029541015625, 0.4196624755859375, 0.436370849609375, 0.4530792236328125, 0.46978759765625, 0.4864959716796875, 0.503204345703125, 0.5199127197265625, 0.53662109375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 8.0, 6.0, 8.0, 12.0, 13.0, 34.0, 46.0, 97.0, 118.0, 158.0, 155.0, 156.0, 65.0, 41.0, 26.0, 13.0, 15.0, 7.0, 10.0, 8.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.9439401626586914, -3.8267722129821777, -3.709604263305664, -3.5924363136291504, -3.4752683639526367, -3.358100414276123, -3.2409324645996094, -3.1237645149230957, -3.006596565246582, -2.8894286155700684, -2.7722606658935547, -2.655092716217041, -2.5379247665405273, -2.4207568168640137, -2.3035888671875, -2.1864209175109863, -2.0692527294158936, -1.9520847797393799, -1.8349168300628662, -1.7177488803863525, -1.6005809307098389, -1.4834129810333252, -1.366244912147522, -1.2490769624710083, -1.1319090127944946, -1.014741063117981, -0.8975731134414673, -0.7804051041603088, -0.6632371544837952, -0.5460692048072815, -0.42890119552612305, -0.3117332458496094, -0.1945650577545166, -0.07739709317684174, 0.03977087140083313, 0.1569388508796692, 0.27410680055618286, 0.39127475023269653, 0.508442759513855, 0.6256107091903687, 0.7427786588668823, 0.859946608543396, 0.9771145582199097, 1.094282627105713, 1.2114505767822266, 1.3286185264587402, 1.445786476135254, 1.5629544258117676, 1.6801223754882812, 1.797290325164795, 1.9144582748413086, 2.0316262245178223, 2.148794174194336, 2.2659621238708496, 2.3831300735473633, 2.500298023223877, 2.6174659729003906, 2.7346339225769043, 2.851801872253418, 2.9689698219299316, 3.0861377716064453, 3.203305721282959, 3.3204736709594727, 3.4376416206359863, 3.554809808731079]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 4.0, 14.0, 13.0, 15.0, 15.0, 24.0, 12.0, 30.0, 46.0, 41.0, 49.0, 36.0, 56.0, 59.0, 57.0, 68.0, 47.0, 69.0, 53.0, 46.0, 41.0, 34.0, 37.0, 19.0, 28.0, 21.0, 12.0, 14.0, 11.0, 7.0, 6.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.8450766801834106, -1.787838101387024, -1.7305995225906372, -1.6733609437942505, -1.6161224842071533, -1.5588839054107666, -1.5016453266143799, -1.4444067478179932, -1.3871681690216064, -1.3299295902252197, -1.272691011428833, -1.2154524326324463, -1.1582138538360596, -1.1009752750396729, -1.0437368154525757, -0.986498236656189, -0.9292596578598022, -0.8720210790634155, -0.8147825002670288, -0.7575439810752869, -0.7003054022789001, -0.6430668234825134, -0.5858283042907715, -0.5285897254943848, -0.47135114669799805, -0.41411256790161133, -0.356874018907547, -0.29963546991348267, -0.24239689111709595, -0.18515831232070923, -0.1279197633266449, -0.07068121433258057, -0.013442754745483398, 0.043795809149742126, 0.10103437304496765, 0.15827293694019318, 0.2155115008354187, 0.2727500796318054, 0.32998862862586975, 0.3872271776199341, 0.4444657564163208, 0.5017043352127075, 0.5589429140090942, 0.6161814332008362, 0.6734200119972229, 0.7306585907936096, 0.7878971099853516, 0.8451356887817383, 0.902374267578125, 0.9596128463745117, 1.0168514251708984, 1.0740900039672852, 1.1313285827636719, 1.1885671615600586, 1.2458056211471558, 1.3030441999435425, 1.3602827787399292, 1.417521357536316, 1.4747599363327026, 1.5319985151290894, 1.5892369747161865, 1.6464755535125732, 1.70371413230896, 1.7609527111053467, 1.8181912899017334]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 5.0, 2.0, 5.0, 4.0, 8.0, 18.0, 19.0, 32.0, 55.0, 119.0, 223.0, 586.0, 1423.0, 4386.0, 14915.0, 60879.0, 330299.0, 513129.0, 92089.0, 21147.0, 5924.0, 1962.0, 732.0, 293.0, 145.0, 67.0, 36.0, 28.0, 12.0, 6.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62255859375, -0.601898193359375, -0.58123779296875, -0.560577392578125, -0.5399169921875, -0.519256591796875, -0.49859619140625, -0.477935791015625, -0.457275390625, -0.436614990234375, -0.41595458984375, -0.395294189453125, -0.3746337890625, -0.353973388671875, -0.33331298828125, -0.312652587890625, -0.2919921875, -0.271331787109375, -0.25067138671875, -0.230010986328125, -0.2093505859375, -0.188690185546875, -0.16802978515625, -0.147369384765625, -0.126708984375, -0.106048583984375, -0.08538818359375, -0.064727783203125, -0.0440673828125, -0.023406982421875, -0.00274658203125, 0.017913818359375, 0.03857421875, 0.059234619140625, 0.07989501953125, 0.100555419921875, 0.1212158203125, 0.141876220703125, 0.16253662109375, 0.183197021484375, 0.203857421875, 0.224517822265625, 0.24517822265625, 0.265838623046875, 0.2864990234375, 0.307159423828125, 0.32781982421875, 0.348480224609375, 0.369140625, 0.389801025390625, 0.41046142578125, 0.431121826171875, 0.4517822265625, 0.472442626953125, 0.49310302734375, 0.513763427734375, 0.534423828125, 0.555084228515625, 0.57574462890625, 0.596405029296875, 0.6170654296875, 0.637725830078125, 0.65838623046875, 0.679046630859375, 0.69970703125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 3.0, 9.0, 9.0, 8.0, 15.0, 27.0, 19.0, 29.0, 40.0, 52.0, 54.0, 53.0, 74.0, 85.0, 85.0, 92.0, 60.0, 48.0, 44.0, 56.0, 35.0, 23.0, 28.0, 16.0, 8.0, 10.0, 3.0, 4.0, 4.0, 0.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.353515625, -1.3069610595703125, -1.260406494140625, -1.2138519287109375, -1.16729736328125, -1.1207427978515625, -1.074188232421875, -1.0276336669921875, -0.9810791015625, -0.9345245361328125, -0.887969970703125, -0.8414154052734375, -0.79486083984375, -0.7483062744140625, -0.701751708984375, -0.6551971435546875, -0.608642578125, -0.5620880126953125, -0.515533447265625, -0.4689788818359375, -0.42242431640625, -0.3758697509765625, -0.329315185546875, -0.2827606201171875, -0.2362060546875, -0.1896514892578125, -0.143096923828125, -0.0965423583984375, -0.04998779296875, -0.0034332275390625, 0.043121337890625, 0.0896759033203125, 0.13623046875, 0.1827850341796875, 0.229339599609375, 0.2758941650390625, 0.32244873046875, 0.3690032958984375, 0.415557861328125, 0.4621124267578125, 0.5086669921875, 0.5552215576171875, 0.601776123046875, 0.6483306884765625, 0.69488525390625, 0.7414398193359375, 0.787994384765625, 0.8345489501953125, 0.881103515625, 0.9276580810546875, 0.974212646484375, 1.0207672119140625, 1.06732177734375, 1.1138763427734375, 1.160430908203125, 1.2069854736328125, 1.2535400390625, 1.3000946044921875, 1.346649169921875, 1.3932037353515625, 1.43975830078125, 1.4863128662109375, 1.532867431640625, 1.5794219970703125, 1.6259765625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 7.0, 3.0, 9.0, 10.0, 8.0, 16.0, 20.0, 16.0, 38.0, 34.0, 57.0, 73.0, 106.0, 134.0, 199.0, 339.0, 702.0, 1226.0, 3126.0, 9577.0, 35832.0, 170001.0, 583718.0, 187547.0, 38993.0, 10197.0, 3398.0, 1332.0, 635.0, 372.0, 238.0, 166.0, 130.0, 71.0, 51.0, 43.0, 32.0, 17.0, 20.0, 16.0, 8.0, 11.0, 7.0, 6.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.4404296875, -0.42551422119140625, -0.4105987548828125, -0.39568328857421875, -0.380767822265625, -0.36585235595703125, -0.3509368896484375, -0.33602142333984375, -0.32110595703125, -0.30619049072265625, -0.2912750244140625, -0.27635955810546875, -0.261444091796875, -0.24652862548828125, -0.2316131591796875, -0.21669769287109375, -0.2017822265625, -0.18686676025390625, -0.1719512939453125, -0.15703582763671875, -0.142120361328125, -0.12720489501953125, -0.1122894287109375, -0.09737396240234375, -0.08245849609375, -0.06754302978515625, -0.0526275634765625, -0.03771209716796875, -0.022796630859375, -0.00788116455078125, 0.0070343017578125, 0.02194976806640625, 0.036865234375, 0.05178070068359375, 0.0666961669921875, 0.08161163330078125, 0.096527099609375, 0.11144256591796875, 0.1263580322265625, 0.14127349853515625, 0.15618896484375, 0.17110443115234375, 0.1860198974609375, 0.20093536376953125, 0.215850830078125, 0.23076629638671875, 0.2456817626953125, 0.26059722900390625, 0.2755126953125, 0.29042816162109375, 0.3053436279296875, 0.32025909423828125, 0.335174560546875, 0.35009002685546875, 0.3650054931640625, 0.37992095947265625, 0.39483642578125, 0.40975189208984375, 0.4246673583984375, 0.43958282470703125, 0.454498291015625, 0.46941375732421875, 0.4843292236328125, 0.49924468994140625, 0.51416015625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 5.0, 9.0, 4.0, 4.0, 8.0, 13.0, 10.0, 12.0, 12.0, 24.0, 36.0, 24.0, 34.0, 38.0, 34.0, 38.0, 51.0, 54.0, 54.0, 57.0, 48.0, 43.0, 54.0, 44.0, 35.0, 41.0, 41.0, 33.0, 29.0, 27.0, 16.0, 14.0, 14.0, 8.0, 7.0, 6.0, 8.0, 8.0, 5.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9140625, -1.8472900390625, -1.780517578125, -1.7137451171875, -1.64697265625, -1.5802001953125, -1.513427734375, -1.4466552734375, -1.3798828125, -1.3131103515625, -1.246337890625, -1.1795654296875, -1.11279296875, -1.0460205078125, -0.979248046875, -0.9124755859375, -0.845703125, -0.7789306640625, -0.712158203125, -0.6453857421875, -0.57861328125, -0.5118408203125, -0.445068359375, -0.3782958984375, -0.3115234375, -0.2447509765625, -0.177978515625, -0.1112060546875, -0.04443359375, 0.0223388671875, 0.089111328125, 0.1558837890625, 0.22265625, 0.2894287109375, 0.356201171875, 0.4229736328125, 0.48974609375, 0.5565185546875, 0.623291015625, 0.6900634765625, 0.7568359375, 0.8236083984375, 0.890380859375, 0.9571533203125, 1.02392578125, 1.0906982421875, 1.157470703125, 1.2242431640625, 1.291015625, 1.3577880859375, 1.424560546875, 1.4913330078125, 1.55810546875, 1.6248779296875, 1.691650390625, 1.7584228515625, 1.8251953125, 1.8919677734375, 1.958740234375, 2.0255126953125, 2.09228515625, 2.1590576171875, 2.225830078125, 2.2926025390625, 2.359375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 12.0, 14.0, 18.0, 41.0, 53.0, 78.0, 121.0, 197.0, 362.0, 661.0, 1307.0, 2859.0, 7785.0, 25659.0, 121336.0, 636230.0, 197248.0, 37286.0, 10211.0, 3723.0, 1587.0, 730.0, 399.0, 239.0, 126.0, 100.0, 50.0, 33.0, 21.0, 24.0, 13.0, 7.0, 5.0, 5.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.205810546875, -0.19808197021484375, -0.1903533935546875, -0.18262481689453125, -0.174896240234375, -0.16716766357421875, -0.1594390869140625, -0.15171051025390625, -0.14398193359375, -0.13625335693359375, -0.1285247802734375, -0.12079620361328125, -0.113067626953125, -0.10533905029296875, -0.0976104736328125, -0.08988189697265625, -0.0821533203125, -0.07442474365234375, -0.0666961669921875, -0.05896759033203125, -0.051239013671875, -0.04351043701171875, -0.0357818603515625, -0.02805328369140625, -0.02032470703125, -0.01259613037109375, -0.0048675537109375, 0.00286102294921875, 0.010589599609375, 0.01831817626953125, 0.0260467529296875, 0.03377532958984375, 0.04150390625, 0.04923248291015625, 0.0569610595703125, 0.06468963623046875, 0.072418212890625, 0.08014678955078125, 0.0878753662109375, 0.09560394287109375, 0.10333251953125, 0.11106109619140625, 0.1187896728515625, 0.12651824951171875, 0.134246826171875, 0.14197540283203125, 0.1497039794921875, 0.15743255615234375, 0.1651611328125, 0.17288970947265625, 0.1806182861328125, 0.18834686279296875, 0.196075439453125, 0.20380401611328125, 0.2115325927734375, 0.21926116943359375, 0.22698974609375, 0.23471832275390625, 0.2424468994140625, 0.25017547607421875, 0.257904052734375, 0.26563262939453125, 0.2733612060546875, 0.28108978271484375, 0.288818359375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 5.0, 3.0, 5.0, 6.0, 10.0, 7.0, 9.0, 24.0, 21.0, 35.0, 56.0, 47.0, 72.0, 111.0, 121.0, 108.0, 102.0, 62.0, 43.0, 30.0, 27.0, 19.0, 27.0, 4.0, 9.0, 9.0, 5.0, 6.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011730194091796875, -0.00011357758194208145, -0.00010985322296619415, -0.00010612886399030685, -0.00010240450501441956, -9.868014603853226e-05, -9.495578706264496e-05, -9.123142808675766e-05, -8.750706911087036e-05, -8.378271013498306e-05, -8.005835115909576e-05, -7.633399218320847e-05, -7.260963320732117e-05, -6.888527423143387e-05, -6.516091525554657e-05, -6.143655627965927e-05, -5.771219730377197e-05, -5.3987838327884674e-05, -5.0263479351997375e-05, -4.653912037611008e-05, -4.281476140022278e-05, -3.909040242433548e-05, -3.536604344844818e-05, -3.164168447256088e-05, -2.7917325496673584e-05, -2.4192966520786285e-05, -2.0468607544898987e-05, -1.6744248569011688e-05, -1.301988959312439e-05, -9.295530617237091e-06, -5.5711716413497925e-06, -1.846812665462494e-06, 1.8775463104248047e-06, 5.601905286312103e-06, 9.326264262199402e-06, 1.30506232380867e-05, 1.6774982213974e-05, 2.0499341189861298e-05, 2.4223700165748596e-05, 2.7948059141635895e-05, 3.167241811752319e-05, 3.539677709341049e-05, 3.912113606929779e-05, 4.284549504518509e-05, 4.656985402107239e-05, 5.0294212996959686e-05, 5.4018571972846985e-05, 5.7742930948734283e-05, 6.146728992462158e-05, 6.519164890050888e-05, 6.891600787639618e-05, 7.264036685228348e-05, 7.636472582817078e-05, 8.008908480405807e-05, 8.381344377994537e-05, 8.753780275583267e-05, 9.126216173171997e-05, 9.498652070760727e-05, 9.871087968349457e-05, 0.00010243523865938187, 0.00010615959763526917, 0.00010988395661115646, 0.00011360831558704376, 0.00011733267456293106, 0.00012105703353881836]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 8.0, 2.0, 3.0, 10.0, 10.0, 16.0, 26.0, 36.0, 87.0, 129.0, 385.0, 957.0, 4034.0, 27831.0, 511328.0, 471561.0, 26627.0, 3834.0, 1007.0, 341.0, 144.0, 87.0, 42.0, 28.0, 8.0, 6.0, 7.0, 1.0, 7.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42578125, -0.4105682373046875, -0.395355224609375, -0.3801422119140625, -0.36492919921875, -0.3497161865234375, -0.334503173828125, -0.3192901611328125, -0.3040771484375, -0.2888641357421875, -0.273651123046875, -0.2584381103515625, -0.24322509765625, -0.2280120849609375, -0.212799072265625, -0.1975860595703125, -0.182373046875, -0.1671600341796875, -0.151947021484375, -0.1367340087890625, -0.12152099609375, -0.1063079833984375, -0.091094970703125, -0.0758819580078125, -0.0606689453125, -0.0454559326171875, -0.030242919921875, -0.0150299072265625, 0.00018310546875, 0.0153961181640625, 0.030609130859375, 0.0458221435546875, 0.06103515625, 0.0762481689453125, 0.091461181640625, 0.1066741943359375, 0.12188720703125, 0.1371002197265625, 0.152313232421875, 0.1675262451171875, 0.1827392578125, 0.1979522705078125, 0.213165283203125, 0.2283782958984375, 0.24359130859375, 0.2588043212890625, 0.274017333984375, 0.2892303466796875, 0.304443359375, 0.3196563720703125, 0.334869384765625, 0.3500823974609375, 0.36529541015625, 0.3805084228515625, 0.395721435546875, 0.4109344482421875, 0.4261474609375, 0.4413604736328125, 0.456573486328125, 0.4717864990234375, 0.48699951171875, 0.5022125244140625, 0.517425537109375, 0.5326385498046875, 0.5478515625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 6.0, 1.0, 5.0, 5.0, 9.0, 8.0, 21.0, 21.0, 30.0, 40.0, 56.0, 72.0, 89.0, 129.0, 121.0, 88.0, 82.0, 59.0, 43.0, 37.0, 19.0, 21.0, 11.0, 14.0, 6.0, 8.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08258056640625, -0.08029365539550781, -0.07800674438476562, -0.07571983337402344, -0.07343292236328125, -0.07114601135253906, -0.06885910034179688, -0.06657218933105469, -0.0642852783203125, -0.06199836730957031, -0.059711456298828125, -0.05742454528808594, -0.05513763427734375, -0.05285072326660156, -0.050563812255859375, -0.04827690124511719, -0.045989990234375, -0.04370307922363281, -0.041416168212890625, -0.03912925720214844, -0.03684234619140625, -0.03455543518066406, -0.032268524169921875, -0.029981613159179688, -0.0276947021484375, -0.025407791137695312, -0.023120880126953125, -0.020833969116210938, -0.01854705810546875, -0.016260147094726562, -0.013973236083984375, -0.011686325073242188, -0.0093994140625, -0.0071125030517578125, -0.004825592041015625, -0.0025386810302734375, -0.00025177001953125, 0.0020351409912109375, 0.004322052001953125, 0.0066089630126953125, 0.0088958740234375, 0.011182785034179688, 0.013469696044921875, 0.015756607055664062, 0.01804351806640625, 0.020330429077148438, 0.022617340087890625, 0.024904251098632812, 0.027191162109375, 0.029478073120117188, 0.031764984130859375, 0.03405189514160156, 0.03633880615234375, 0.03862571716308594, 0.040912628173828125, 0.04319953918457031, 0.0454864501953125, 0.04777336120605469, 0.050060272216796875, 0.05234718322753906, 0.05463409423828125, 0.05692100524902344, 0.059207916259765625, 0.06149482727050781, 0.06378173828125]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 4.0, 5.0, 11.0, 10.0, 23.0, 45.0, 86.0, 165.0, 241.0, 200.0, 103.0, 38.0, 27.0, 17.0, 12.0, 4.0, 7.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.844099760055542, -3.7415194511413574, -3.638939142227173, -3.5363588333129883, -3.4337782859802246, -3.331198215484619, -3.2286176681518555, -3.126037359237671, -3.0234570503234863, -2.9208767414093018, -2.818296432495117, -2.7157161235809326, -2.613135814666748, -2.5105552673339844, -2.4079749584198, -2.3053946495056152, -2.2028143405914307, -2.100234031677246, -1.9976537227630615, -1.8950732946395874, -1.7924929857254028, -1.6899126768112183, -1.5873322486877441, -1.4847519397735596, -1.382171630859375, -1.2795913219451904, -1.1770110130310059, -1.0744305849075317, -0.9718502759933472, -0.8692699670791626, -0.7666895985603333, -0.6641092300415039, -0.5615291595458984, -0.4589488208293915, -0.3563684821128845, -0.25378814339637756, -0.1512078046798706, -0.048627495765686035, 0.05395287275314331, 0.15653324127197266, 0.2591135501861572, 0.3616938889026642, 0.46427422761917114, 0.5668545961380005, 0.6694349050521851, 0.7720152139663696, 0.874595582485199, 0.9771759510040283, 1.079756259918213, 1.1823365688323975, 1.284916877746582, 1.3874973058700562, 1.4900776147842407, 1.5926579236984253, 1.6952383518218994, 1.797818660736084, 1.9003989696502686, 2.002979278564453, 2.1055595874786377, 2.2081398963928223, 2.310720443725586, 2.4133005142211914, 2.515881061553955, 2.6184613704681396, 2.721041679382324]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 2.0, 3.0, 8.0, 9.0, 13.0, 24.0, 23.0, 32.0, 26.0, 45.0, 66.0, 74.0, 70.0, 81.0, 73.0, 92.0, 79.0, 66.0, 40.0, 44.0, 30.0, 28.0, 28.0, 16.0, 9.0, 6.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6934717893600464, -1.6462887525558472, -1.5991058349609375, -1.5519227981567383, -1.5047398805618286, -1.4575568437576294, -1.4103739261627197, -1.3631908893585205, -1.3160078525543213, -1.268824815750122, -1.2216418981552124, -1.1744588613510132, -1.1272759437561035, -1.0800929069519043, -1.032909870147705, -0.9857269525527954, -0.9385440349578857, -0.8913610577583313, -0.8441780805587769, -0.7969950437545776, -0.749812126159668, -0.7026290893554688, -0.6554461121559143, -0.6082631349563599, -0.5610801577568054, -0.513897180557251, -0.46671420335769653, -0.4195311963558197, -0.37234821915626526, -0.3251652419567108, -0.277982234954834, -0.23079925775527954, -0.1836162805557251, -0.13643330335617065, -0.08925031125545502, -0.04206731915473938, 0.0051156580448150635, 0.05229863524436951, 0.09948164224624634, 0.14666461944580078, 0.19384759664535522, 0.24103057384490967, 0.2882135510444641, 0.33539655804634094, 0.3825795352458954, 0.42976251244544983, 0.47694551944732666, 0.5241284966468811, 0.5713114738464355, 0.61849445104599, 0.6656774282455444, 0.7128604650497437, 0.7600433826446533, 0.8072264194488525, 0.854409396648407, 0.9015923738479614, 0.9487753510475159, 0.9959583282470703, 1.0431413650512695, 1.0903242826461792, 1.1375073194503784, 1.184690237045288, 1.2318732738494873, 1.2790563106536865, 1.3262392282485962]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 4.0, 3.0, 7.0, 6.0, 11.0, 16.0, 9.0, 12.0, 19.0, 21.0, 28.0, 40.0, 65.0, 192.0, 2611.0, 448245.0, 593629.0, 3184.0, 214.0, 61.0, 38.0, 30.0, 16.0, 16.0, 15.0, 11.0, 10.0, 13.0, 5.0, 9.0, 5.0, 3.0, 6.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.91796875, -5.73876953125, -5.5595703125, -5.38037109375, -5.201171875, -5.02197265625, -4.8427734375, -4.66357421875, -4.484375, -4.30517578125, -4.1259765625, -3.94677734375, -3.767578125, -3.58837890625, -3.4091796875, -3.22998046875, -3.05078125, -2.87158203125, -2.6923828125, -2.51318359375, -2.333984375, -2.15478515625, -1.9755859375, -1.79638671875, -1.6171875, -1.43798828125, -1.2587890625, -1.07958984375, -0.900390625, -0.72119140625, -0.5419921875, -0.36279296875, -0.18359375, -0.00439453125, 0.1748046875, 0.35400390625, 0.533203125, 0.71240234375, 0.8916015625, 1.07080078125, 1.25, 1.42919921875, 1.6083984375, 1.78759765625, 1.966796875, 2.14599609375, 2.3251953125, 2.50439453125, 2.68359375, 2.86279296875, 3.0419921875, 3.22119140625, 3.400390625, 3.57958984375, 3.7587890625, 3.93798828125, 4.1171875, 4.29638671875, 4.4755859375, 4.65478515625, 4.833984375, 5.01318359375, 5.1923828125, 5.37158203125, 5.55078125]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 14.0, 20.0, 45.0, 55.0, 79.0, 128.0, 149.0, 154.0, 137.0, 78.0, 63.0, 42.0, 20.0, 6.0, 10.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-10.671875, -10.458282470703125, -10.24468994140625, -10.031097412109375, -9.8175048828125, -9.603912353515625, -9.39031982421875, -9.176727294921875, -8.963134765625, -8.749542236328125, -8.53594970703125, -8.322357177734375, -8.1087646484375, -7.895172119140625, -7.68157958984375, -7.467987060546875, -7.25439453125, -7.040802001953125, -6.82720947265625, -6.613616943359375, -6.4000244140625, -6.186431884765625, -5.97283935546875, -5.759246826171875, -5.545654296875, -5.332061767578125, -5.11846923828125, -4.904876708984375, -4.6912841796875, -4.477691650390625, -4.26409912109375, -4.050506591796875, -3.8369140625, -3.623321533203125, -3.40972900390625, -3.196136474609375, -2.9825439453125, -2.768951416015625, -2.55535888671875, -2.341766357421875, -2.128173828125, -1.914581298828125, -1.70098876953125, -1.487396240234375, -1.2738037109375, -1.060211181640625, -0.84661865234375, -0.633026123046875, -0.41943359375, -0.205841064453125, 0.00775146484375, 0.221343994140625, 0.4349365234375, 0.648529052734375, 0.86212158203125, 1.075714111328125, 1.289306640625, 1.502899169921875, 1.71649169921875, 1.930084228515625, 2.1436767578125, 2.357269287109375, 2.57086181640625, 2.784454345703125, 2.998046875]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 1.0, 7.0, 0.0, 4.0, 8.0, 7.0, 9.0, 13.0, 17.0, 17.0, 27.0, 30.0, 40.0, 47.0, 41.0, 64.0, 69.0, 79.0, 82.0, 130.0, 255.0, 752.0, 7056.0, 424035.0, 604420.0, 9429.0, 926.0, 244.0, 121.0, 105.0, 79.0, 66.0, 56.0, 54.0, 45.0, 37.0, 41.0, 30.0, 30.0, 15.0, 16.0, 12.0, 19.0, 8.0, 5.0, 5.0, 3.0, 0.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.021484375, -2.920928955078125, -2.82037353515625, -2.719818115234375, -2.6192626953125, -2.518707275390625, -2.41815185546875, -2.317596435546875, -2.217041015625, -2.116485595703125, -2.01593017578125, -1.915374755859375, -1.8148193359375, -1.714263916015625, -1.61370849609375, -1.513153076171875, -1.41259765625, -1.312042236328125, -1.21148681640625, -1.110931396484375, -1.0103759765625, -0.909820556640625, -0.80926513671875, -0.708709716796875, -0.608154296875, -0.507598876953125, -0.40704345703125, -0.306488037109375, -0.2059326171875, -0.105377197265625, -0.00482177734375, 0.095733642578125, 0.1962890625, 0.296844482421875, 0.39739990234375, 0.497955322265625, 0.5985107421875, 0.699066162109375, 0.79962158203125, 0.900177001953125, 1.000732421875, 1.101287841796875, 1.20184326171875, 1.302398681640625, 1.4029541015625, 1.503509521484375, 1.60406494140625, 1.704620361328125, 1.80517578125, 1.905731201171875, 2.00628662109375, 2.106842041015625, 2.2073974609375, 2.307952880859375, 2.40850830078125, 2.509063720703125, 2.609619140625, 2.710174560546875, 2.81072998046875, 2.911285400390625, 3.0118408203125, 3.112396240234375, 3.21295166015625, 3.313507080078125, 3.4140625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 11.0, 11.0, 8.0, 15.0, 6.0, 16.0, 15.0, 20.0, 23.0, 26.0, 29.0, 35.0, 32.0, 32.0, 45.0, 38.0, 48.0, 41.0, 38.0, 45.0, 49.0, 49.0, 36.0, 41.0, 39.0, 26.0, 38.0, 34.0, 23.0, 23.0, 20.0, 17.0, 19.0, 12.0, 10.0, 4.0, 7.0, 4.0, 3.0, 1.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.279296875, -2.201141357421875, -2.12298583984375, -2.044830322265625, -1.9666748046875, -1.888519287109375, -1.81036376953125, -1.732208251953125, -1.654052734375, -1.575897216796875, -1.49774169921875, -1.419586181640625, -1.3414306640625, -1.263275146484375, -1.18511962890625, -1.106964111328125, -1.02880859375, -0.950653076171875, -0.87249755859375, -0.794342041015625, -0.7161865234375, -0.638031005859375, -0.55987548828125, -0.481719970703125, -0.403564453125, -0.325408935546875, -0.24725341796875, -0.169097900390625, -0.0909423828125, -0.012786865234375, 0.06536865234375, 0.143524169921875, 0.2216796875, 0.299835205078125, 0.37799072265625, 0.456146240234375, 0.5343017578125, 0.612457275390625, 0.69061279296875, 0.768768310546875, 0.846923828125, 0.925079345703125, 1.00323486328125, 1.081390380859375, 1.1595458984375, 1.237701416015625, 1.31585693359375, 1.394012451171875, 1.47216796875, 1.550323486328125, 1.62847900390625, 1.706634521484375, 1.7847900390625, 1.862945556640625, 1.94110107421875, 2.019256591796875, 2.097412109375, 2.175567626953125, 2.25372314453125, 2.331878662109375, 2.4100341796875, 2.488189697265625, 2.56634521484375, 2.644500732421875, 2.72265625]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 4.0, 4.0, 2.0, 3.0, 4.0, 9.0, 8.0, 16.0, 23.0, 28.0, 28.0, 46.0, 68.0, 82.0, 160.0, 274.0, 475.0, 928.0, 2067.0, 5348.0, 17760.0, 70915.0, 320483.0, 465766.0, 122174.0, 28316.0, 8070.0, 2844.0, 1264.0, 538.0, 322.0, 172.0, 109.0, 74.0, 35.0, 40.0, 20.0, 14.0, 11.0, 10.0, 10.0, 9.0, 4.0, 4.0, 4.0, 4.0, 0.0, 3.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.270751953125, -0.26177978515625, -0.2528076171875, -0.24383544921875, -0.23486328125, -0.22589111328125, -0.2169189453125, -0.20794677734375, -0.198974609375, -0.19000244140625, -0.1810302734375, -0.17205810546875, -0.1630859375, -0.15411376953125, -0.1451416015625, -0.13616943359375, -0.127197265625, -0.11822509765625, -0.1092529296875, -0.10028076171875, -0.09130859375, -0.08233642578125, -0.0733642578125, -0.06439208984375, -0.055419921875, -0.04644775390625, -0.0374755859375, -0.02850341796875, -0.01953125, -0.01055908203125, -0.0015869140625, 0.00738525390625, 0.016357421875, 0.02532958984375, 0.0343017578125, 0.04327392578125, 0.05224609375, 0.06121826171875, 0.0701904296875, 0.07916259765625, 0.088134765625, 0.09710693359375, 0.1060791015625, 0.11505126953125, 0.1240234375, 0.13299560546875, 0.1419677734375, 0.15093994140625, 0.159912109375, 0.16888427734375, 0.1778564453125, 0.18682861328125, 0.19580078125, 0.20477294921875, 0.2137451171875, 0.22271728515625, 0.231689453125, 0.24066162109375, 0.2496337890625, 0.25860595703125, 0.267578125, 0.27655029296875, 0.2855224609375, 0.29449462890625, 0.303466796875]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 2.0, 8.0, 7.0, 7.0, 13.0, 15.0, 12.0, 22.0, 28.0, 37.0, 41.0, 48.0, 66.0, 71.0, 90.0, 92.0, 86.0, 74.0, 64.0, 53.0, 32.0, 34.0, 18.0, 19.0, 17.0, 14.0, 10.0, 7.0, 3.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.2928924560546875e-05, -5.1293522119522095e-05, -4.9658119678497314e-05, -4.8022717237472534e-05, -4.6387314796447754e-05, -4.4751912355422974e-05, -4.311650991439819e-05, -4.148110747337341e-05, -3.984570503234863e-05, -3.821030259132385e-05, -3.657490015029907e-05, -3.493949770927429e-05, -3.330409526824951e-05, -3.166869282722473e-05, -3.003329038619995e-05, -2.839788794517517e-05, -2.676248550415039e-05, -2.512708306312561e-05, -2.349168062210083e-05, -2.185627818107605e-05, -2.022087574005127e-05, -1.858547329902649e-05, -1.695007085800171e-05, -1.531466841697693e-05, -1.3679265975952148e-05, -1.2043863534927368e-05, -1.0408461093902588e-05, -8.773058652877808e-06, -7.137656211853027e-06, -5.502253770828247e-06, -3.866851329803467e-06, -2.2314488887786865e-06, -5.960464477539062e-07, 1.039355993270874e-06, 2.6747584342956543e-06, 4.3101608753204346e-06, 5.945563316345215e-06, 7.580965757369995e-06, 9.216368198394775e-06, 1.0851770639419556e-05, 1.2487173080444336e-05, 1.4122575521469116e-05, 1.5757977962493896e-05, 1.7393380403518677e-05, 1.9028782844543457e-05, 2.0664185285568237e-05, 2.2299587726593018e-05, 2.3934990167617798e-05, 2.5570392608642578e-05, 2.720579504966736e-05, 2.884119749069214e-05, 3.047659993171692e-05, 3.21120023727417e-05, 3.374740481376648e-05, 3.538280725479126e-05, 3.701820969581604e-05, 3.865361213684082e-05, 4.02890145778656e-05, 4.192441701889038e-05, 4.355981945991516e-05, 4.519522190093994e-05, 4.683062434196472e-05, 4.84660267829895e-05, 5.010142922401428e-05, 5.173683166503906e-05]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 6.0, 5.0, 7.0, 11.0, 23.0, 28.0, 33.0, 58.0, 78.0, 166.0, 329.0, 555.0, 1297.0, 3545.0, 12743.0, 63995.0, 424260.0, 452803.0, 68647.0, 13563.0, 3769.0, 1330.0, 610.0, 290.0, 152.0, 85.0, 53.0, 38.0, 25.0, 16.0, 9.0, 9.0, 5.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.410888671875, -0.39881134033203125, -0.3867340087890625, -0.37465667724609375, -0.362579345703125, -0.35050201416015625, -0.3384246826171875, -0.32634735107421875, -0.31427001953125, -0.30219268798828125, -0.2901153564453125, -0.27803802490234375, -0.265960693359375, -0.25388336181640625, -0.2418060302734375, -0.22972869873046875, -0.2176513671875, -0.20557403564453125, -0.1934967041015625, -0.18141937255859375, -0.169342041015625, -0.15726470947265625, -0.1451873779296875, -0.13311004638671875, -0.12103271484375, -0.10895538330078125, -0.0968780517578125, -0.08480072021484375, -0.072723388671875, -0.06064605712890625, -0.0485687255859375, -0.03649139404296875, -0.0244140625, -0.01233673095703125, -0.0002593994140625, 0.01181793212890625, 0.023895263671875, 0.03597259521484375, 0.0480499267578125, 0.06012725830078125, 0.07220458984375, 0.08428192138671875, 0.0963592529296875, 0.10843658447265625, 0.120513916015625, 0.13259124755859375, 0.1446685791015625, 0.15674591064453125, 0.1688232421875, 0.18090057373046875, 0.1929779052734375, 0.20505523681640625, 0.217132568359375, 0.22920989990234375, 0.2412872314453125, 0.25336456298828125, 0.26544189453125, 0.27751922607421875, 0.2895965576171875, 0.30167388916015625, 0.313751220703125, 0.32582855224609375, 0.3379058837890625, 0.34998321533203125, 0.362060546875]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 2.0, 2.0, 3.0, 4.0, 3.0, 10.0, 15.0, 15.0, 15.0, 24.0, 19.0, 34.0, 39.0, 50.0, 63.0, 90.0, 98.0, 107.0, 86.0, 79.0, 61.0, 43.0, 31.0, 36.0, 14.0, 18.0, 12.0, 7.0, 3.0, 5.0, 2.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1387939453125, -0.13367843627929688, -0.12856292724609375, -0.12344741821289062, -0.1183319091796875, -0.11321640014648438, -0.10810089111328125, -0.10298538208007812, -0.097869873046875, -0.09275436401367188, -0.08763885498046875, -0.08252334594726562, -0.0774078369140625, -0.07229232788085938, -0.06717681884765625, -0.062061309814453125, -0.05694580078125, -0.051830291748046875, -0.04671478271484375, -0.041599273681640625, -0.0364837646484375, -0.031368255615234375, -0.02625274658203125, -0.021137237548828125, -0.016021728515625, -0.010906219482421875, -0.00579071044921875, -0.000675201416015625, 0.0044403076171875, 0.009555816650390625, 0.01467132568359375, 0.019786834716796875, 0.02490234375, 0.030017852783203125, 0.03513336181640625, 0.040248870849609375, 0.0453643798828125, 0.050479888916015625, 0.05559539794921875, 0.060710906982421875, 0.065826416015625, 0.07094192504882812, 0.07605743408203125, 0.08117294311523438, 0.0862884521484375, 0.09140396118164062, 0.09651947021484375, 0.10163497924804688, 0.10675048828125, 0.11186599731445312, 0.11698150634765625, 0.12209701538085938, 0.1272125244140625, 0.13232803344726562, 0.13744354248046875, 0.14255905151367188, 0.147674560546875, 0.15279006958007812, 0.15790557861328125, 0.16302108764648438, 0.1681365966796875, 0.17325210571289062, 0.17836761474609375, 0.18348312377929688, 0.1885986328125]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 8.0, 34.0, 142.0, 458.0, 279.0, 56.0, 20.0, 8.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.326007843017578, -23.855466842651367, -23.38492774963379, -22.914386749267578, -22.443845748901367, -21.973304748535156, -21.502765655517578, -21.032224655151367, -20.561683654785156, -20.091142654418945, -19.620603561401367, -19.150062561035156, -18.679521560668945, -18.208980560302734, -17.738441467285156, -17.267900466918945, -16.797361373901367, -16.326820373535156, -15.856280326843262, -15.385740280151367, -14.915199279785156, -14.444659233093262, -13.974119186401367, -13.503578186035156, -13.033038139343262, -12.562498092651367, -12.091957092285156, -11.621417045593262, -11.150876998901367, -10.680335998535156, -10.209795951843262, -9.739255905151367, -9.268714904785156, -8.798174858093262, -8.32763385772705, -7.857093811035156, -7.3865532875061035, -6.916012763977051, -6.445472717285156, -5.9749321937561035, -5.504391193389893, -5.03385066986084, -4.563310623168945, -4.092770099639893, -3.62222957611084, -3.151689052581787, -2.6811487674713135, -2.21060848236084, -1.740067958831787, -1.269527554512024, -0.7989871501922607, -0.32844674587249756, 0.14209365844726562, 0.6126341819763184, 1.083174467086792, 1.5537147521972656, 2.0242552757263184, 2.494795799255371, 2.9653360843658447, 3.4358763694763184, 3.906416893005371, 4.376957416534424, 4.847497940063477, 5.318037986755371, 5.788578510284424]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 7.0, 5.0, 6.0, 18.0, 13.0, 22.0, 26.0, 33.0, 46.0, 44.0, 57.0, 61.0, 79.0, 69.0, 87.0, 67.0, 61.0, 52.0, 60.0, 31.0, 40.0, 34.0, 29.0, 17.0, 13.0, 11.0, 6.0, 9.0, 3.0, 3.0, 1.0, 1.0, 1.0], "bins": [-9.796515464782715, -9.579832077026367, -9.36314868927002, -9.146465301513672, -8.929780960083008, -8.71309757232666, -8.496414184570312, -8.279730796813965, -8.063047409057617, -7.8463640213012695, -7.629680633544922, -7.412996768951416, -7.196313381195068, -6.979629993438721, -6.762946128845215, -6.546262741088867, -6.3295793533325195, -6.112895965576172, -5.896212577819824, -5.679528713226318, -5.462845325469971, -5.246161937713623, -5.029478073120117, -4.8127946853637695, -4.596111297607422, -4.379427909851074, -4.162744522094727, -3.9460606575012207, -3.729377269744873, -3.5126938819885254, -3.2960102558135986, -3.079326629638672, -2.8626437187194824, -2.6459603309631348, -2.429276704788208, -2.2125930786132812, -1.9959096908569336, -1.7792261838912964, -1.5625426769256592, -1.345859169960022, -1.1291756629943848, -0.9124921560287476, -0.6958086490631104, -0.47912514209747314, -0.26244163513183594, -0.04575812816619873, 0.17092537879943848, 0.3876088857650757, 0.6042923927307129, 0.8209758996963501, 1.0376594066619873, 1.2543429136276245, 1.4710264205932617, 1.687709927558899, 1.9043934345245361, 2.121077060699463, 2.3377604484558105, 2.554443836212158, 2.771127462387085, 2.9878110885620117, 3.2044944763183594, 3.421177864074707, 3.637861490249634, 3.8545451164245605, 4.071228504180908]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 6.0, 5.0, 4.0, 9.0, 10.0, 22.0, 25.0, 29.0, 30.0, 36.0, 58.0, 70.0, 117.0, 143.0, 225.0, 366.0, 586.0, 1106.0, 2254.0, 5148.0, 14781.0, 57716.0, 398974.0, 3019775.0, 589451.0, 74171.0, 17770.0, 5893.0, 2452.0, 1203.0, 618.0, 390.0, 226.0, 145.0, 109.0, 92.0, 64.0, 53.0, 38.0, 27.0, 19.0, 12.0, 15.0, 13.0, 12.0, 5.0, 8.0, 4.0, 0.0, 1.0, 1.0, 3.0], "bins": [-2.09375, -2.0348968505859375, -1.976043701171875, -1.9171905517578125, -1.85833740234375, -1.7994842529296875, -1.740631103515625, -1.6817779541015625, -1.6229248046875, -1.5640716552734375, -1.505218505859375, -1.4463653564453125, -1.38751220703125, -1.3286590576171875, -1.269805908203125, -1.2109527587890625, -1.152099609375, -1.0932464599609375, -1.034393310546875, -0.9755401611328125, -0.91668701171875, -0.8578338623046875, -0.798980712890625, -0.7401275634765625, -0.6812744140625, -0.6224212646484375, -0.563568115234375, -0.5047149658203125, -0.44586181640625, -0.3870086669921875, -0.328155517578125, -0.2693023681640625, -0.21044921875, -0.1515960693359375, -0.092742919921875, -0.0338897705078125, 0.02496337890625, 0.0838165283203125, 0.142669677734375, 0.2015228271484375, 0.2603759765625, 0.3192291259765625, 0.378082275390625, 0.4369354248046875, 0.49578857421875, 0.5546417236328125, 0.613494873046875, 0.6723480224609375, 0.731201171875, 0.7900543212890625, 0.848907470703125, 0.9077606201171875, 0.96661376953125, 1.0254669189453125, 1.084320068359375, 1.1431732177734375, 1.2020263671875, 1.2608795166015625, 1.319732666015625, 1.3785858154296875, 1.43743896484375, 1.4962921142578125, 1.555145263671875, 1.6139984130859375, 1.6728515625]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 0.0, 3.0, 0.0, 1.0, 5.0, 5.0, 8.0, 8.0, 8.0, 18.0, 19.0, 34.0, 39.0, 33.0, 51.0, 56.0, 68.0, 79.0, 78.0, 86.0, 76.0, 56.0, 53.0, 54.0, 44.0, 23.0, 17.0, 21.0, 18.0, 12.0, 8.0, 7.0, 7.0, 4.0, 1.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.7919921875, -1.73406982421875, -1.6761474609375, -1.61822509765625, -1.560302734375, -1.50238037109375, -1.4444580078125, -1.38653564453125, -1.32861328125, -1.27069091796875, -1.2127685546875, -1.15484619140625, -1.096923828125, -1.03900146484375, -0.9810791015625, -0.92315673828125, -0.865234375, -0.80731201171875, -0.7493896484375, -0.69146728515625, -0.633544921875, -0.57562255859375, -0.5177001953125, -0.45977783203125, -0.40185546875, -0.34393310546875, -0.2860107421875, -0.22808837890625, -0.170166015625, -0.11224365234375, -0.0543212890625, 0.00360107421875, 0.0615234375, 0.11944580078125, 0.1773681640625, 0.23529052734375, 0.293212890625, 0.35113525390625, 0.4090576171875, 0.46697998046875, 0.52490234375, 0.58282470703125, 0.6407470703125, 0.69866943359375, 0.756591796875, 0.81451416015625, 0.8724365234375, 0.93035888671875, 0.98828125, 1.04620361328125, 1.1041259765625, 1.16204833984375, 1.219970703125, 1.27789306640625, 1.3358154296875, 1.39373779296875, 1.45166015625, 1.50958251953125, 1.5675048828125, 1.62542724609375, 1.683349609375, 1.74127197265625, 1.7991943359375, 1.85711669921875, 1.9150390625]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 2.0, 5.0, 13.0, 5.0, 17.0, 12.0, 18.0, 40.0, 57.0, 74.0, 121.0, 238.0, 576.0, 2350.0, 24950.0, 3640921.0, 512255.0, 10328.0, 1405.0, 409.0, 167.0, 103.0, 69.0, 24.0, 37.0, 18.0, 10.0, 10.0, 12.0, 9.0, 6.0, 2.0, 4.0, 7.0, 4.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.5, -4.36297607421875, -4.2259521484375, -4.08892822265625, -3.951904296875, -3.81488037109375, -3.6778564453125, -3.54083251953125, -3.40380859375, -3.26678466796875, -3.1297607421875, -2.99273681640625, -2.855712890625, -2.71868896484375, -2.5816650390625, -2.44464111328125, -2.3076171875, -2.17059326171875, -2.0335693359375, -1.89654541015625, -1.759521484375, -1.62249755859375, -1.4854736328125, -1.34844970703125, -1.21142578125, -1.07440185546875, -0.9373779296875, -0.80035400390625, -0.663330078125, -0.52630615234375, -0.3892822265625, -0.25225830078125, -0.115234375, 0.02178955078125, 0.1588134765625, 0.29583740234375, 0.432861328125, 0.56988525390625, 0.7069091796875, 0.84393310546875, 0.98095703125, 1.11798095703125, 1.2550048828125, 1.39202880859375, 1.529052734375, 1.66607666015625, 1.8031005859375, 1.94012451171875, 2.0771484375, 2.21417236328125, 2.3511962890625, 2.48822021484375, 2.625244140625, 2.76226806640625, 2.8992919921875, 3.03631591796875, 3.17333984375, 3.31036376953125, 3.4473876953125, 3.58441162109375, 3.721435546875, 3.85845947265625, 3.9954833984375, 4.13250732421875, 4.26953125]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 5.0, 1.0, 6.0, 6.0, 6.0, 5.0, 12.0, 11.0, 21.0, 28.0, 22.0, 40.0, 66.0, 82.0, 149.0, 239.0, 400.0, 672.0, 760.0, 574.0, 355.0, 199.0, 118.0, 88.0, 61.0, 43.0, 28.0, 24.0, 15.0, 14.0, 11.0, 5.0, 4.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.419189453125, -0.4032707214355469, -0.38735198974609375, -0.3714332580566406, -0.3555145263671875, -0.3395957946777344, -0.32367706298828125, -0.3077583312988281, -0.291839599609375, -0.2759208679199219, -0.26000213623046875, -0.24408340454101562, -0.2281646728515625, -0.21224594116210938, -0.19632720947265625, -0.18040847778320312, -0.16448974609375, -0.14857101440429688, -0.13265228271484375, -0.11673355102539062, -0.1008148193359375, -0.08489608764648438, -0.06897735595703125, -0.053058624267578125, -0.037139892578125, -0.021221160888671875, -0.00530242919921875, 0.010616302490234375, 0.0265350341796875, 0.042453765869140625, 0.05837249755859375, 0.07429122924804688, 0.0902099609375, 0.10612869262695312, 0.12204742431640625, 0.13796615600585938, 0.1538848876953125, 0.16980361938476562, 0.18572235107421875, 0.20164108276367188, 0.217559814453125, 0.23347854614257812, 0.24939727783203125, 0.2653160095214844, 0.2812347412109375, 0.2971534729003906, 0.31307220458984375, 0.3289909362792969, 0.34490966796875, 0.3608283996582031, 0.37674713134765625, 0.3926658630371094, 0.4085845947265625, 0.4245033264160156, 0.44042205810546875, 0.4563407897949219, 0.472259521484375, 0.4881782531738281, 0.5040969848632812, 0.5200157165527344, 0.5359344482421875, 0.5518531799316406, 0.5677719116210938, 0.5836906433105469, 0.599609375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 6.0, 3.0, 8.0, 14.0, 19.0, 37.0, 69.0, 118.0, 188.0, 200.0, 153.0, 89.0, 27.0, 29.0, 17.0, 9.0, 7.0, 7.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.525543689727783, -4.396544456481934, -4.267545223236084, -4.138545513153076, -4.009546279907227, -3.880547046661377, -3.7515478134155273, -3.6225483417510986, -3.49354887008667, -3.3645496368408203, -3.2355501651763916, -3.106550931930542, -2.9775514602661133, -2.8485522270202637, -2.719552993774414, -2.5905535221099854, -2.4615542888641357, -2.332555055618286, -2.2035555839538574, -2.074556350708008, -1.945556879043579, -1.8165576457977295, -1.6875582933425903, -1.5585589408874512, -1.429559588432312, -1.3005602359771729, -1.1715608835220337, -1.0425615310668945, -0.9135622382164001, -0.784562885761261, -0.6555635929107666, -0.5265642404556274, -0.3975648880004883, -0.2685655355453491, -0.13956621289253235, -0.010566890239715576, 0.11843246221542358, 0.24743181467056274, 0.37643110752105713, 0.5054304599761963, 0.6344298124313354, 0.7634291648864746, 0.8924285173416138, 1.021427869796753, 1.1504271030426025, 1.2794265747070312, 1.4084258079528809, 1.53742516040802, 1.6664245128631592, 1.7954238653182983, 1.9244232177734375, 2.053422451019287, 2.182421922683716, 2.3114211559295654, 2.440420627593994, 2.5694198608398438, 2.6984190940856934, 2.827418327331543, 2.9564177989959717, 3.0854170322418213, 3.21441650390625, 3.3434157371520996, 3.472414970397949, 3.601414442062378, 3.7304139137268066]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 10.0, 10.0, 11.0, 19.0, 21.0, 26.0, 24.0, 41.0, 36.0, 51.0, 35.0, 66.0, 57.0, 85.0, 61.0, 66.0, 57.0, 45.0, 43.0, 43.0, 35.0, 30.0, 24.0, 24.0, 18.0, 14.0, 8.0, 9.0, 10.0, 7.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.5486196279525757, -1.4949066638946533, -1.4411938190460205, -1.3874808549880981, -1.3337680101394653, -1.280055046081543, -1.2263422012329102, -1.1726292371749878, -1.1189162731170654, -1.065203309059143, -1.0114904642105103, -0.9577775001525879, -0.9040646553039551, -0.8503516912460327, -0.7966387867927551, -0.7429258823394775, -0.6892130374908447, -0.6355001330375671, -0.5817872285842896, -0.5280742645263672, -0.474361389875412, -0.4206484854221344, -0.3669355511665344, -0.31322264671325684, -0.25950974225997925, -0.20579683780670166, -0.15208391845226288, -0.0983709990978241, -0.04465809464454651, 0.009054809808731079, 0.06276774406433105, 0.11648064851760864, 0.17019367218017578, 0.22390657663345337, 0.27761948108673096, 0.33133241534233093, 0.3850453197956085, 0.4387582242488861, 0.4924711585044861, 0.5461840629577637, 0.5998969674110413, 0.6536098718643188, 0.7073227763175964, 0.761035680770874, 0.8147486448287964, 0.8684614896774292, 0.9221744537353516, 0.9758873581886292, 1.0296002626419067, 1.083313226699829, 1.137026071548462, 1.1907390356063843, 1.244451880455017, 1.2981648445129395, 1.3518776893615723, 1.4055906534194946, 1.459303617477417, 1.5130165815353394, 1.5667294263839722, 1.6204423904418945, 1.6741552352905273, 1.7278681993484497, 1.781581163406372, 1.8352940082550049, 1.8890068531036377]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 4.0, 4.0, 5.0, 17.0, 41.0, 90.0, 241.0, 774.0, 3017.0, 17622.0, 344019.0, 654343.0, 23268.0, 3768.0, 885.0, 259.0, 93.0, 43.0, 22.0, 13.0, 5.0, 9.0, 7.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3916015625, -1.349517822265625, -1.30743408203125, -1.265350341796875, -1.2232666015625, -1.181182861328125, -1.13909912109375, -1.097015380859375, -1.054931640625, -1.012847900390625, -0.97076416015625, -0.928680419921875, -0.8865966796875, -0.844512939453125, -0.80242919921875, -0.760345458984375, -0.71826171875, -0.676177978515625, -0.63409423828125, -0.592010498046875, -0.5499267578125, -0.507843017578125, -0.46575927734375, -0.423675537109375, -0.381591796875, -0.339508056640625, -0.29742431640625, -0.255340576171875, -0.2132568359375, -0.171173095703125, -0.12908935546875, -0.087005615234375, -0.044921875, -0.002838134765625, 0.03924560546875, 0.081329345703125, 0.1234130859375, 0.165496826171875, 0.20758056640625, 0.249664306640625, 0.291748046875, 0.333831787109375, 0.37591552734375, 0.417999267578125, 0.4600830078125, 0.502166748046875, 0.54425048828125, 0.586334228515625, 0.62841796875, 0.670501708984375, 0.71258544921875, 0.754669189453125, 0.7967529296875, 0.838836669921875, 0.88092041015625, 0.923004150390625, 0.965087890625, 1.007171630859375, 1.04925537109375, 1.091339111328125, 1.1334228515625, 1.175506591796875, 1.21759033203125, 1.259674072265625, 1.3017578125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 9.0, 19.0, 26.0, 39.0, 55.0, 77.0, 90.0, 125.0, 132.0, 114.0, 91.0, 72.0, 50.0, 42.0, 29.0, 12.0, 10.0, 7.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.896484375, -2.8283843994140625, -2.760284423828125, -2.6921844482421875, -2.62408447265625, -2.5559844970703125, -2.487884521484375, -2.4197845458984375, -2.3516845703125, -2.2835845947265625, -2.215484619140625, -2.1473846435546875, -2.07928466796875, -2.0111846923828125, -1.943084716796875, -1.8749847412109375, -1.806884765625, -1.7387847900390625, -1.670684814453125, -1.6025848388671875, -1.53448486328125, -1.4663848876953125, -1.398284912109375, -1.3301849365234375, -1.2620849609375, -1.1939849853515625, -1.125885009765625, -1.0577850341796875, -0.98968505859375, -0.9215850830078125, -0.853485107421875, -0.7853851318359375, -0.71728515625, -0.6491851806640625, -0.581085205078125, -0.5129852294921875, -0.44488525390625, -0.3767852783203125, -0.308685302734375, -0.2405853271484375, -0.1724853515625, -0.1043853759765625, -0.036285400390625, 0.0318145751953125, 0.09991455078125, 0.1680145263671875, 0.236114501953125, 0.3042144775390625, 0.372314453125, 0.4404144287109375, 0.508514404296875, 0.5766143798828125, 0.64471435546875, 0.7128143310546875, 0.780914306640625, 0.8490142822265625, 0.9171142578125, 0.9852142333984375, 1.053314208984375, 1.1214141845703125, 1.18951416015625, 1.2576141357421875, 1.325714111328125, 1.3938140869140625, 1.4619140625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 3.0, 3.0, 1.0, 1.0, 4.0, 4.0, 5.0, 4.0, 8.0, 10.0, 17.0, 21.0, 35.0, 51.0, 55.0, 103.0, 163.0, 308.0, 635.0, 1561.0, 4510.0, 15816.0, 100338.0, 799133.0, 102245.0, 16055.0, 4441.0, 1569.0, 665.0, 303.0, 146.0, 110.0, 61.0, 51.0, 45.0, 23.0, 13.0, 10.0, 11.0, 6.0, 4.0, 6.0, 4.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62939453125, -0.6094131469726562, -0.5894317626953125, -0.5694503784179688, -0.549468994140625, -0.5294876098632812, -0.5095062255859375, -0.48952484130859375, -0.46954345703125, -0.44956207275390625, -0.4295806884765625, -0.40959930419921875, -0.389617919921875, -0.36963653564453125, -0.3496551513671875, -0.32967376708984375, -0.3096923828125, -0.28971099853515625, -0.2697296142578125, -0.24974822998046875, -0.229766845703125, -0.20978546142578125, -0.1898040771484375, -0.16982269287109375, -0.14984130859375, -0.12985992431640625, -0.1098785400390625, -0.08989715576171875, -0.069915771484375, -0.04993438720703125, -0.0299530029296875, -0.00997161865234375, 0.010009765625, 0.02999114990234375, 0.0499725341796875, 0.06995391845703125, 0.089935302734375, 0.10991668701171875, 0.1298980712890625, 0.14987945556640625, 0.16986083984375, 0.18984222412109375, 0.2098236083984375, 0.22980499267578125, 0.249786376953125, 0.26976776123046875, 0.2897491455078125, 0.30973052978515625, 0.3297119140625, 0.34969329833984375, 0.3696746826171875, 0.38965606689453125, 0.409637451171875, 0.42961883544921875, 0.4496002197265625, 0.46958160400390625, 0.48956298828125, 0.5095443725585938, 0.5295257568359375, 0.5495071411132812, 0.569488525390625, 0.5894699096679688, 0.6094512939453125, 0.6294326782226562, 0.6494140625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 6.0, 7.0, 13.0, 17.0, 14.0, 29.0, 25.0, 37.0, 35.0, 50.0, 60.0, 82.0, 70.0, 73.0, 60.0, 68.0, 75.0, 62.0, 49.0, 38.0, 34.0, 26.0, 22.0, 10.0, 9.0, 9.0, 8.0, 9.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.109375, -3.02386474609375, -2.9383544921875, -2.85284423828125, -2.767333984375, -2.68182373046875, -2.5963134765625, -2.51080322265625, -2.42529296875, -2.33978271484375, -2.2542724609375, -2.16876220703125, -2.083251953125, -1.99774169921875, -1.9122314453125, -1.82672119140625, -1.7412109375, -1.65570068359375, -1.5701904296875, -1.48468017578125, -1.399169921875, -1.31365966796875, -1.2281494140625, -1.14263916015625, -1.05712890625, -0.97161865234375, -0.8861083984375, -0.80059814453125, -0.715087890625, -0.62957763671875, -0.5440673828125, -0.45855712890625, -0.373046875, -0.28753662109375, -0.2020263671875, -0.11651611328125, -0.031005859375, 0.05450439453125, 0.1400146484375, 0.22552490234375, 0.31103515625, 0.39654541015625, 0.4820556640625, 0.56756591796875, 0.653076171875, 0.73858642578125, 0.8240966796875, 0.90960693359375, 0.9951171875, 1.08062744140625, 1.1661376953125, 1.25164794921875, 1.337158203125, 1.42266845703125, 1.5081787109375, 1.59368896484375, 1.67919921875, 1.76470947265625, 1.8502197265625, 1.93572998046875, 2.021240234375, 2.10675048828125, 2.1922607421875, 2.27777099609375, 2.36328125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 8.0, 7.0, 5.0, 4.0, 10.0, 9.0, 18.0, 19.0, 29.0, 36.0, 44.0, 75.0, 100.0, 156.0, 237.0, 389.0, 655.0, 1245.0, 2234.0, 4466.0, 9934.0, 25349.0, 87874.0, 490563.0, 326809.0, 62593.0, 19535.0, 8083.0, 3558.0, 1863.0, 1063.0, 596.0, 340.0, 207.0, 135.0, 100.0, 58.0, 46.0, 31.0, 17.0, 18.0, 12.0, 7.0, 7.0, 5.0, 4.0, 7.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.142822265625, -0.13834190368652344, -0.13386154174804688, -0.1293811798095703, -0.12490081787109375, -0.12042045593261719, -0.11594009399414062, -0.11145973205566406, -0.1069793701171875, -0.10249900817871094, -0.09801864624023438, -0.09353828430175781, -0.08905792236328125, -0.08457756042480469, -0.08009719848632812, -0.07561683654785156, -0.071136474609375, -0.06665611267089844, -0.062175750732421875, -0.05769538879394531, -0.05321502685546875, -0.04873466491699219, -0.044254302978515625, -0.03977394104003906, -0.0352935791015625, -0.030813217163085938, -0.026332855224609375, -0.021852493286132812, -0.01737213134765625, -0.012891769409179688, -0.008411407470703125, -0.0039310455322265625, 0.00054931640625, 0.0050296783447265625, 0.009510040283203125, 0.013990402221679688, 0.01847076416015625, 0.022951126098632812, 0.027431488037109375, 0.03191184997558594, 0.0363922119140625, 0.04087257385253906, 0.045352935791015625, 0.04983329772949219, 0.05431365966796875, 0.05879402160644531, 0.06327438354492188, 0.06775474548339844, 0.072235107421875, 0.07671546936035156, 0.08119583129882812, 0.08567619323730469, 0.09015655517578125, 0.09463691711425781, 0.09911727905273438, 0.10359764099121094, 0.1080780029296875, 0.11255836486816406, 0.11703872680664062, 0.12151908874511719, 0.12599945068359375, 0.1304798126220703, 0.13496017456054688, 0.13944053649902344, 0.1439208984375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 5.0, 6.0, 8.0, 8.0, 16.0, 20.0, 36.0, 45.0, 61.0, 84.0, 119.0, 159.0, 113.0, 89.0, 73.0, 33.0, 35.0, 14.0, 23.0, 17.0, 11.0, 7.0, 8.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.952617645263672e-05, -8.650124073028564e-05, -8.347630500793457e-05, -8.04513692855835e-05, -7.742643356323242e-05, -7.440149784088135e-05, -7.137656211853027e-05, -6.83516263961792e-05, -6.532669067382812e-05, -6.230175495147705e-05, -5.9276819229125977e-05, -5.62518835067749e-05, -5.322694778442383e-05, -5.0202012062072754e-05, -4.717707633972168e-05, -4.4152140617370605e-05, -4.112720489501953e-05, -3.810226917266846e-05, -3.507733345031738e-05, -3.205239772796631e-05, -2.9027462005615234e-05, -2.600252628326416e-05, -2.2977590560913086e-05, -1.9952654838562012e-05, -1.6927719116210938e-05, -1.3902783393859863e-05, -1.0877847671508789e-05, -7.852911949157715e-06, -4.827976226806641e-06, -1.8030405044555664e-06, 1.2218952178955078e-06, 4.246830940246582e-06, 7.271766662597656e-06, 1.029670238494873e-05, 1.3321638107299805e-05, 1.634657382965088e-05, 1.9371509552001953e-05, 2.2396445274353027e-05, 2.54213809967041e-05, 2.8446316719055176e-05, 3.147125244140625e-05, 3.4496188163757324e-05, 3.75211238861084e-05, 4.054605960845947e-05, 4.357099533081055e-05, 4.659593105316162e-05, 4.9620866775512695e-05, 5.264580249786377e-05, 5.5670738220214844e-05, 5.869567394256592e-05, 6.172060966491699e-05, 6.474554538726807e-05, 6.777048110961914e-05, 7.079541683197021e-05, 7.382035255432129e-05, 7.684528827667236e-05, 7.987022399902344e-05, 8.289515972137451e-05, 8.592009544372559e-05, 8.894503116607666e-05, 9.196996688842773e-05, 9.499490261077881e-05, 9.801983833312988e-05, 0.00010104477405548096, 0.00010406970977783203]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 6.0, 2.0, 8.0, 15.0, 13.0, 34.0, 66.0, 97.0, 214.0, 565.0, 1531.0, 5132.0, 21916.0, 163566.0, 757902.0, 78948.0, 13302.0, 3344.0, 1100.0, 421.0, 166.0, 96.0, 45.0, 29.0, 12.0, 4.0, 5.0, 7.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.276123046875, -0.26758575439453125, -0.2590484619140625, -0.25051116943359375, -0.241973876953125, -0.23343658447265625, -0.2248992919921875, -0.21636199951171875, -0.20782470703125, -0.19928741455078125, -0.1907501220703125, -0.18221282958984375, -0.173675537109375, -0.16513824462890625, -0.1566009521484375, -0.14806365966796875, -0.1395263671875, -0.13098907470703125, -0.1224517822265625, -0.11391448974609375, -0.105377197265625, -0.09683990478515625, -0.0883026123046875, -0.07976531982421875, -0.07122802734375, -0.06269073486328125, -0.0541534423828125, -0.04561614990234375, -0.037078857421875, -0.02854156494140625, -0.0200042724609375, -0.01146697998046875, -0.0029296875, 0.00560760498046875, 0.0141448974609375, 0.02268218994140625, 0.031219482421875, 0.03975677490234375, 0.0482940673828125, 0.05683135986328125, 0.06536865234375, 0.07390594482421875, 0.0824432373046875, 0.09098052978515625, 0.099517822265625, 0.10805511474609375, 0.1165924072265625, 0.12512969970703125, 0.1336669921875, 0.14220428466796875, 0.1507415771484375, 0.15927886962890625, 0.167816162109375, 0.17635345458984375, 0.1848907470703125, 0.19342803955078125, 0.20196533203125, 0.21050262451171875, 0.2190399169921875, 0.22757720947265625, 0.236114501953125, 0.24465179443359375, 0.2531890869140625, 0.26172637939453125, 0.270263671875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 4.0, 2.0, 2.0, 3.0, 5.0, 5.0, 4.0, 6.0, 6.0, 18.0, 18.0, 18.0, 30.0, 44.0, 52.0, 70.0, 99.0, 133.0, 122.0, 105.0, 60.0, 37.0, 26.0, 23.0, 28.0, 19.0, 15.0, 5.0, 7.0, 2.0, 11.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0367431640625, -0.03550910949707031, -0.034275054931640625, -0.03304100036621094, -0.03180694580078125, -0.030572891235351562, -0.029338836669921875, -0.028104782104492188, -0.0268707275390625, -0.025636672973632812, -0.024402618408203125, -0.023168563842773438, -0.02193450927734375, -0.020700454711914062, -0.019466400146484375, -0.018232345581054688, -0.016998291015625, -0.015764236450195312, -0.014530181884765625, -0.013296127319335938, -0.01206207275390625, -0.010828018188476562, -0.009593963623046875, -0.008359909057617188, -0.0071258544921875, -0.0058917999267578125, -0.004657745361328125, -0.0034236907958984375, -0.00218963623046875, -0.0009555816650390625, 0.000278472900390625, 0.0015125274658203125, 0.00274658203125, 0.0039806365966796875, 0.005214691162109375, 0.0064487457275390625, 0.00768280029296875, 0.008916854858398438, 0.010150909423828125, 0.011384963989257812, 0.0126190185546875, 0.013853073120117188, 0.015087127685546875, 0.016321182250976562, 0.01755523681640625, 0.018789291381835938, 0.020023345947265625, 0.021257400512695312, 0.022491455078125, 0.023725509643554688, 0.024959564208984375, 0.026193618774414062, 0.02742767333984375, 0.028661727905273438, 0.029895782470703125, 0.031129837036132812, 0.0323638916015625, 0.03359794616699219, 0.034832000732421875, 0.03606605529785156, 0.03730010986328125, 0.03853416442871094, 0.039768218994140625, 0.04100227355957031, 0.042236328125]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 4.0, 8.0, 14.0, 19.0, 38.0, 89.0, 193.0, 254.0, 202.0, 88.0, 37.0, 18.0, 12.0, 11.0, 10.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6881020069122314, -3.584131956100464, -3.4801621437072754, -3.376192092895508, -3.2722220420837402, -3.1682519912719727, -3.064281940460205, -2.9603121280670166, -2.856342077255249, -2.7523720264434814, -2.648402214050293, -2.5444321632385254, -2.440462112426758, -2.3364920616149902, -2.2325220108032227, -2.128552198410034, -2.0245821475982666, -1.920612096786499, -1.816642165184021, -1.712672233581543, -1.6087021827697754, -1.5047321319580078, -1.4007622003555298, -1.2967922687530518, -1.1928222179412842, -1.0888521671295166, -0.9848822355270386, -0.8809122443199158, -0.776942253112793, -0.6729722619056702, -0.5690022706985474, -0.46503227949142456, -0.36106252670288086, -0.25709253549575806, -0.15312254428863525, -0.04915255308151245, 0.05481743812561035, 0.15878742933273315, 0.26275742053985596, 0.36672741174697876, 0.47069740295410156, 0.5746673941612244, 0.6786373853683472, 0.78260737657547, 0.8865773677825928, 0.9905473589897156, 1.0945173501968384, 1.1984872817993164, 1.302457332611084, 1.4064273834228516, 1.5103973150253296, 1.6143672466278076, 1.7183372974395752, 1.8223073482513428, 1.9262772798538208, 2.030247211456299, 2.1342172622680664, 2.238187313079834, 2.3421573638916016, 2.44612717628479, 2.5500972270965576, 2.654067277908325, 2.7580370903015137, 2.8620071411132812, 2.965977191925049]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 8.0, 6.0, 13.0, 18.0, 32.0, 40.0, 54.0, 73.0, 64.0, 113.0, 123.0, 92.0, 103.0, 65.0, 61.0, 42.0, 34.0, 22.0, 16.0, 11.0, 5.0, 12.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.192941188812256, -2.1362147331237793, -2.079488515853882, -2.0227620601654053, -1.9660356044769287, -1.9093092679977417, -1.8525829315185547, -1.7958564758300781, -1.7391301393508911, -1.682403802871704, -1.6256773471832275, -1.5689510107040405, -1.5122246742248535, -1.455498218536377, -1.39877188205719, -1.342045545578003, -1.2853190898895264, -1.2285927534103394, -1.1718662977218628, -1.1151399612426758, -1.0584135055541992, -1.0016871690750122, -0.9449608325958252, -0.8882344365119934, -0.8315080404281616, -0.7747816443443298, -0.718055248260498, -0.661328911781311, -0.6046025156974792, -0.5478761196136475, -0.49114975333213806, -0.43442338705062866, -0.3776971101760864, -0.32097071409225464, -0.26424434781074524, -0.20751796662807465, -0.15079158544540405, -0.09406518936157227, -0.037338823080062866, 0.019387543201446533, 0.07611393928527832, 0.1328403204679489, 0.1895667016506195, 0.2462930828332901, 0.3030194640159607, 0.3597458600997925, 0.4164722263813019, 0.4731985926628113, 0.5299249887466431, 0.5866513848304749, 0.6433777809143066, 0.7001041173934937, 0.7568305134773254, 0.8135569095611572, 0.8702832460403442, 0.927009642124176, 0.9837360382080078, 1.0404623746871948, 1.0971888303756714, 1.1539151668548584, 1.210641622543335, 1.267367959022522, 1.324094295501709, 1.3808207511901855, 1.4375470876693726]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 3.0, 10.0, 4.0, 4.0, 5.0, 13.0, 15.0, 13.0, 17.0, 20.0, 30.0, 65.0, 206.0, 1857.0, 201843.0, 839717.0, 4125.0, 334.0, 80.0, 40.0, 29.0, 20.0, 17.0, 11.0, 13.0, 10.0, 6.0, 11.0, 5.0, 5.0, 8.0, 5.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.50390625, -5.3377685546875, -5.171630859375, -5.0054931640625, -4.83935546875, -4.6732177734375, -4.507080078125, -4.3409423828125, -4.1748046875, -4.0086669921875, -3.842529296875, -3.6763916015625, -3.51025390625, -3.3441162109375, -3.177978515625, -3.0118408203125, -2.845703125, -2.6795654296875, -2.513427734375, -2.3472900390625, -2.18115234375, -2.0150146484375, -1.848876953125, -1.6827392578125, -1.5166015625, -1.3504638671875, -1.184326171875, -1.0181884765625, -0.85205078125, -0.6859130859375, -0.519775390625, -0.3536376953125, -0.1875, -0.0213623046875, 0.144775390625, 0.3109130859375, 0.47705078125, 0.6431884765625, 0.809326171875, 0.9754638671875, 1.1416015625, 1.3077392578125, 1.473876953125, 1.6400146484375, 1.80615234375, 1.9722900390625, 2.138427734375, 2.3045654296875, 2.470703125, 2.6368408203125, 2.802978515625, 2.9691162109375, 3.13525390625, 3.3013916015625, 3.467529296875, 3.6336669921875, 3.7998046875, 3.9659423828125, 4.132080078125, 4.2982177734375, 4.46435546875, 4.6304931640625, 4.796630859375, 4.9627685546875, 5.12890625]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 12.0, 28.0, 56.0, 88.0, 154.0, 214.0, 165.0, 148.0, 68.0, 39.0, 19.0, 15.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-13.4375, -13.177886962890625, -12.91827392578125, -12.658660888671875, -12.3990478515625, -12.139434814453125, -11.87982177734375, -11.620208740234375, -11.360595703125, -11.100982666015625, -10.84136962890625, -10.581756591796875, -10.3221435546875, -10.062530517578125, -9.80291748046875, -9.543304443359375, -9.28369140625, -9.024078369140625, -8.76446533203125, -8.504852294921875, -8.2452392578125, -7.985626220703125, -7.72601318359375, -7.466400146484375, -7.206787109375, -6.947174072265625, -6.68756103515625, -6.427947998046875, -6.1683349609375, -5.908721923828125, -5.64910888671875, -5.389495849609375, -5.1298828125, -4.870269775390625, -4.61065673828125, -4.351043701171875, -4.0914306640625, -3.831817626953125, -3.57220458984375, -3.312591552734375, -3.052978515625, -2.793365478515625, -2.53375244140625, -2.274139404296875, -2.0145263671875, -1.754913330078125, -1.49530029296875, -1.235687255859375, -0.97607421875, -0.716461181640625, -0.45684814453125, -0.197235107421875, 0.0623779296875, 0.321990966796875, 0.58160400390625, 0.841217041015625, 1.100830078125, 1.360443115234375, 1.62005615234375, 1.879669189453125, 2.1392822265625, 2.398895263671875, 2.65850830078125, 2.918121337890625, 3.177734375]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 5.0, 8.0, 21.0, 21.0, 25.0, 31.0, 25.0, 45.0, 61.0, 67.0, 97.0, 160.0, 285.0, 568.0, 1347.0, 4329.0, 20899.0, 179108.0, 691407.0, 127487.0, 16311.0, 3695.0, 1208.0, 504.0, 298.0, 149.0, 99.0, 73.0, 53.0, 27.0, 23.0, 26.0, 18.0, 15.0, 9.0, 11.0, 6.0, 7.0, 6.0, 5.0, 0.0, 5.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2158203125, -1.1783294677734375, -1.140838623046875, -1.1033477783203125, -1.06585693359375, -1.0283660888671875, -0.990875244140625, -0.9533843994140625, -0.9158935546875, -0.8784027099609375, -0.840911865234375, -0.8034210205078125, -0.76593017578125, -0.7284393310546875, -0.690948486328125, -0.6534576416015625, -0.615966796875, -0.5784759521484375, -0.540985107421875, -0.5034942626953125, -0.46600341796875, -0.4285125732421875, -0.391021728515625, -0.3535308837890625, -0.3160400390625, -0.2785491943359375, -0.241058349609375, -0.2035675048828125, -0.16607666015625, -0.1285858154296875, -0.091094970703125, -0.0536041259765625, -0.01611328125, 0.0213775634765625, 0.058868408203125, 0.0963592529296875, 0.13385009765625, 0.1713409423828125, 0.208831787109375, 0.2463226318359375, 0.2838134765625, 0.3213043212890625, 0.358795166015625, 0.3962860107421875, 0.43377685546875, 0.4712677001953125, 0.508758544921875, 0.5462493896484375, 0.583740234375, 0.6212310791015625, 0.658721923828125, 0.6962127685546875, 0.73370361328125, 0.7711944580078125, 0.808685302734375, 0.8461761474609375, 0.8836669921875, 0.9211578369140625, 0.958648681640625, 0.9961395263671875, 1.03363037109375, 1.0711212158203125, 1.108612060546875, 1.1461029052734375, 1.18359375]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 5.0, 13.0, 10.0, 8.0, 12.0, 21.0, 13.0, 16.0, 16.0, 16.0, 16.0, 24.0, 30.0, 25.0, 33.0, 29.0, 37.0, 39.0, 30.0, 42.0, 36.0, 44.0, 46.0, 28.0, 35.0, 40.0, 48.0, 35.0, 24.0, 27.0, 22.0, 24.0, 20.0, 22.0, 21.0, 12.0, 7.0, 9.0, 8.0, 7.0, 8.0, 6.0, 6.0, 10.0, 4.0, 3.0, 5.0, 1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0], "bins": [-2.0546875, -1.985748291015625, -1.91680908203125, -1.847869873046875, -1.7789306640625, -1.709991455078125, -1.64105224609375, -1.572113037109375, -1.503173828125, -1.434234619140625, -1.36529541015625, -1.296356201171875, -1.2274169921875, -1.158477783203125, -1.08953857421875, -1.020599365234375, -0.95166015625, -0.882720947265625, -0.81378173828125, -0.744842529296875, -0.6759033203125, -0.606964111328125, -0.53802490234375, -0.469085693359375, -0.400146484375, -0.331207275390625, -0.26226806640625, -0.193328857421875, -0.1243896484375, -0.055450439453125, 0.01348876953125, 0.082427978515625, 0.1513671875, 0.220306396484375, 0.28924560546875, 0.358184814453125, 0.4271240234375, 0.496063232421875, 0.56500244140625, 0.633941650390625, 0.702880859375, 0.771820068359375, 0.84075927734375, 0.909698486328125, 0.9786376953125, 1.047576904296875, 1.11651611328125, 1.185455322265625, 1.25439453125, 1.323333740234375, 1.39227294921875, 1.461212158203125, 1.5301513671875, 1.599090576171875, 1.66802978515625, 1.736968994140625, 1.805908203125, 1.874847412109375, 1.94378662109375, 2.012725830078125, 2.0816650390625, 2.150604248046875, 2.21954345703125, 2.288482666015625, 2.357421875]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 8.0, 14.0, 18.0, 17.0, 28.0, 45.0, 64.0, 99.0, 177.0, 289.0, 628.0, 1345.0, 3268.0, 11069.0, 55705.0, 415289.0, 476163.0, 65586.0, 12225.0, 3632.0, 1407.0, 646.0, 299.0, 197.0, 109.0, 76.0, 44.0, 25.0, 22.0, 16.0, 10.0, 4.0, 8.0, 3.0, 0.0, 2.0, 6.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0], "bins": [-0.367919921875, -0.3571128845214844, -0.34630584716796875, -0.3354988098144531, -0.3246917724609375, -0.3138847351074219, -0.30307769775390625, -0.2922706604003906, -0.281463623046875, -0.2706565856933594, -0.25984954833984375, -0.24904251098632812, -0.2382354736328125, -0.22742843627929688, -0.21662139892578125, -0.20581436157226562, -0.19500732421875, -0.18420028686523438, -0.17339324951171875, -0.16258621215820312, -0.1517791748046875, -0.14097213745117188, -0.13016510009765625, -0.11935806274414062, -0.108551025390625, -0.09774398803710938, -0.08693695068359375, -0.07612991333007812, -0.0653228759765625, -0.054515838623046875, -0.04370880126953125, -0.032901763916015625, -0.0220947265625, -0.011287689208984375, -0.00048065185546875, 0.010326385498046875, 0.0211334228515625, 0.031940460205078125, 0.04274749755859375, 0.053554534912109375, 0.064361572265625, 0.07516860961914062, 0.08597564697265625, 0.09678268432617188, 0.1075897216796875, 0.11839675903320312, 0.12920379638671875, 0.14001083374023438, 0.15081787109375, 0.16162490844726562, 0.17243194580078125, 0.18323898315429688, 0.1940460205078125, 0.20485305786132812, 0.21566009521484375, 0.22646713256835938, 0.237274169921875, 0.24808120727539062, 0.25888824462890625, 0.2696952819824219, 0.2805023193359375, 0.2913093566894531, 0.30211639404296875, 0.3129234313964844, 0.32373046875]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 5.0, 6.0, 9.0, 17.0, 18.0, 17.0, 34.0, 51.0, 60.0, 81.0, 118.0, 117.0, 124.0, 105.0, 71.0, 51.0, 29.0, 24.0, 20.0, 18.0, 8.0, 6.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.0617923736572266e-05, -5.8498233556747437e-05, -5.637854337692261e-05, -5.425885319709778e-05, -5.213916301727295e-05, -5.001947283744812e-05, -4.789978265762329e-05, -4.578009247779846e-05, -4.366040229797363e-05, -4.1540712118148804e-05, -3.9421021938323975e-05, -3.7301331758499146e-05, -3.5181641578674316e-05, -3.306195139884949e-05, -3.094226121902466e-05, -2.882257103919983e-05, -2.6702880859375e-05, -2.458319067955017e-05, -2.2463500499725342e-05, -2.0343810319900513e-05, -1.8224120140075684e-05, -1.6104429960250854e-05, -1.3984739780426025e-05, -1.1865049600601196e-05, -9.745359420776367e-06, -7.625669240951538e-06, -5.505979061126709e-06, -3.38628888130188e-06, -1.2665987014770508e-06, 8.530914783477783e-07, 2.9727816581726074e-06, 5.0924718379974365e-06, 7.212162017822266e-06, 9.331852197647095e-06, 1.1451542377471924e-05, 1.3571232557296753e-05, 1.5690922737121582e-05, 1.781061291694641e-05, 1.993030309677124e-05, 2.204999327659607e-05, 2.41696834564209e-05, 2.6289373636245728e-05, 2.8409063816070557e-05, 3.0528753995895386e-05, 3.2648444175720215e-05, 3.4768134355545044e-05, 3.688782453536987e-05, 3.90075147151947e-05, 4.112720489501953e-05, 4.324689507484436e-05, 4.536658525466919e-05, 4.748627543449402e-05, 4.960596561431885e-05, 5.172565579414368e-05, 5.3845345973968506e-05, 5.5965036153793335e-05, 5.8084726333618164e-05, 6.020441651344299e-05, 6.232410669326782e-05, 6.444379687309265e-05, 6.656348705291748e-05, 6.868317723274231e-05, 7.080286741256714e-05, 7.292255759239197e-05, 7.50422477722168e-05]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 6.0, 5.0, 2.0, 6.0, 13.0, 5.0, 30.0, 28.0, 54.0, 91.0, 144.0, 245.0, 476.0, 1118.0, 3057.0, 10220.0, 48706.0, 390259.0, 509198.0, 65691.0, 12886.0, 3643.0, 1365.0, 612.0, 267.0, 173.0, 109.0, 47.0, 33.0, 27.0, 16.0, 9.0, 6.0, 7.0, 6.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.454345703125, -0.442718505859375, -0.43109130859375, -0.419464111328125, -0.4078369140625, -0.396209716796875, -0.38458251953125, -0.372955322265625, -0.361328125, -0.349700927734375, -0.33807373046875, -0.326446533203125, -0.3148193359375, -0.303192138671875, -0.29156494140625, -0.279937744140625, -0.268310546875, -0.256683349609375, -0.24505615234375, -0.233428955078125, -0.2218017578125, -0.210174560546875, -0.19854736328125, -0.186920166015625, -0.17529296875, -0.163665771484375, -0.15203857421875, -0.140411376953125, -0.1287841796875, -0.117156982421875, -0.10552978515625, -0.093902587890625, -0.082275390625, -0.070648193359375, -0.05902099609375, -0.047393798828125, -0.0357666015625, -0.024139404296875, -0.01251220703125, -0.000885009765625, 0.0107421875, 0.022369384765625, 0.03399658203125, 0.045623779296875, 0.0572509765625, 0.068878173828125, 0.08050537109375, 0.092132568359375, 0.103759765625, 0.115386962890625, 0.12701416015625, 0.138641357421875, 0.1502685546875, 0.161895751953125, 0.17352294921875, 0.185150146484375, 0.19677734375, 0.208404541015625, 0.22003173828125, 0.231658935546875, 0.2432861328125, 0.254913330078125, 0.26654052734375, 0.278167724609375, 0.289794921875]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 4.0, 4.0, 12.0, 10.0, 13.0, 25.0, 24.0, 41.0, 58.0, 80.0, 92.0, 109.0, 123.0, 90.0, 89.0, 62.0, 40.0, 37.0, 27.0, 21.0, 14.0, 14.0, 6.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1436767578125, -0.1374645233154297, -0.13125228881835938, -0.12504005432128906, -0.11882781982421875, -0.11261558532714844, -0.10640335083007812, -0.10019111633300781, -0.0939788818359375, -0.08776664733886719, -0.08155441284179688, -0.07534217834472656, -0.06912994384765625, -0.06291770935058594, -0.056705474853515625, -0.05049324035644531, -0.044281005859375, -0.03806877136230469, -0.031856536865234375, -0.025644302368164062, -0.01943206787109375, -0.013219833374023438, -0.007007598876953125, -0.0007953643798828125, 0.0054168701171875, 0.011629104614257812, 0.017841339111328125, 0.024053573608398438, 0.03026580810546875, 0.03647804260253906, 0.042690277099609375, 0.04890251159667969, 0.05511474609375, 0.06132698059082031, 0.06753921508789062, 0.07375144958496094, 0.07996368408203125, 0.08617591857910156, 0.09238815307617188, 0.09860038757324219, 0.1048126220703125, 0.11102485656738281, 0.11723709106445312, 0.12344932556152344, 0.12966156005859375, 0.13587379455566406, 0.14208602905273438, 0.1482982635498047, 0.154510498046875, 0.1607227325439453, 0.16693496704101562, 0.17314720153808594, 0.17935943603515625, 0.18557167053222656, 0.19178390502929688, 0.1979961395263672, 0.2042083740234375, 0.2104206085205078, 0.21663284301757812, 0.22284507751464844, 0.22905731201171875, 0.23526954650878906, 0.24148178100585938, 0.2476940155029297, 0.25390625]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 16.0, 54.0, 243.0, 489.0, 150.0, 29.0, 19.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-21.15981101989746, -20.730831146240234, -20.301849365234375, -19.87286949157715, -19.443889617919922, -19.014909744262695, -18.585927963256836, -18.15694808959961, -17.727968215942383, -17.298988342285156, -16.870006561279297, -16.44102668762207, -16.012046813964844, -15.5830659866333, -15.154085159301758, -14.725105285644531, -14.296124458312988, -13.867143630981445, -13.438163757324219, -13.009182929992676, -12.58020305633545, -12.151222229003906, -11.72224235534668, -11.293261528015137, -10.864280700683594, -10.43529987335205, -10.006319999694824, -9.577339172363281, -9.148359298706055, -8.719378471374512, -8.290397644042969, -7.861417770385742, -7.432438850402832, -7.003458499908447, -6.5744781494140625, -6.1454973220825195, -5.716517448425293, -5.28753662109375, -4.858556270599365, -4.4295759201049805, -4.000595569610596, -3.571615219116211, -3.142634868621826, -2.7136542797088623, -2.2846739292144775, -1.8556935787200928, -1.426712989807129, -0.9977326393127441, -0.5687522888183594, -0.13977187871932983, 0.2892085313796997, 0.718189001083374, 1.1471693515777588, 1.5761497020721436, 2.0051302909851074, 2.434110641479492, 2.863090991973877, 3.2920713424682617, 3.7210516929626465, 4.150032043457031, 4.579012870788574, 5.007992744445801, 5.436973571777344, 5.8659539222717285, 6.294934272766113]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 9.0, 13.0, 14.0, 29.0, 24.0, 42.0, 50.0, 65.0, 70.0, 79.0, 85.0, 92.0, 76.0, 77.0, 59.0, 63.0, 33.0, 39.0, 34.0, 18.0, 17.0, 8.0, 6.0, 3.0, 1.0, 1.0, 3.0, 1.0], "bins": [-12.702086448669434, -12.432903289794922, -12.163719177246094, -11.894535064697266, -11.625351905822754, -11.356168746948242, -11.086984634399414, -10.817800521850586, -10.548617362976074, -10.279434204101562, -10.010250091552734, -9.741065979003906, -9.471882820129395, -9.202699661254883, -8.933515548706055, -8.664331436157227, -8.395148277282715, -8.125965118408203, -7.856781005859375, -7.587597370147705, -7.318413734436035, -7.049230098724365, -6.780046463012695, -6.510862827301025, -6.2416791915893555, -5.9724955558776855, -5.703311920166016, -5.434128284454346, -5.164944648742676, -4.895761013031006, -4.626577377319336, -4.357393741607666, -4.088210582733154, -3.8190269470214844, -3.5498433113098145, -3.2806596755981445, -3.0114760398864746, -2.7422924041748047, -2.4731087684631348, -2.203925132751465, -1.934741497039795, -1.665557861328125, -1.396374225616455, -1.1271905899047852, -0.8580069541931152, -0.5888233184814453, -0.3196396827697754, -0.05045604705810547, 0.21872758865356445, 0.4879112243652344, 0.7570948600769043, 1.0262784957885742, 1.2954621315002441, 1.564645767211914, 1.833829402923584, 2.103013038635254, 2.372196674346924, 2.6413803100585938, 2.9105639457702637, 3.1797475814819336, 3.4489312171936035, 3.7181148529052734, 3.9872984886169434, 4.256482124328613, 4.525665760040283]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 3.0, 8.0, 6.0, 14.0, 14.0, 25.0, 35.0, 49.0, 81.0, 111.0, 175.0, 291.0, 502.0, 785.0, 1554.0, 3415.0, 8100.0, 23450.0, 109344.0, 1200413.0, 2595917.0, 197890.0, 33832.0, 10035.0, 3866.0, 1848.0, 972.0, 548.0, 359.0, 224.0, 152.0, 94.0, 55.0, 32.0, 18.0, 18.0, 18.0, 12.0, 6.0, 5.0, 5.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8720703125, -1.8155975341796875, -1.759124755859375, -1.7026519775390625, -1.64617919921875, -1.5897064208984375, -1.533233642578125, -1.4767608642578125, -1.4202880859375, -1.3638153076171875, -1.307342529296875, -1.2508697509765625, -1.19439697265625, -1.1379241943359375, -1.081451416015625, -1.0249786376953125, -0.968505859375, -0.9120330810546875, -0.855560302734375, -0.7990875244140625, -0.74261474609375, -0.6861419677734375, -0.629669189453125, -0.5731964111328125, -0.5167236328125, -0.4602508544921875, -0.403778076171875, -0.3473052978515625, -0.29083251953125, -0.2343597412109375, -0.177886962890625, -0.1214141845703125, -0.06494140625, -0.0084686279296875, 0.048004150390625, 0.1044769287109375, 0.16094970703125, 0.2174224853515625, 0.273895263671875, 0.3303680419921875, 0.3868408203125, 0.4433135986328125, 0.499786376953125, 0.5562591552734375, 0.61273193359375, 0.6692047119140625, 0.725677490234375, 0.7821502685546875, 0.838623046875, 0.8950958251953125, 0.951568603515625, 1.0080413818359375, 1.06451416015625, 1.1209869384765625, 1.177459716796875, 1.2339324951171875, 1.2904052734375, 1.3468780517578125, 1.403350830078125, 1.4598236083984375, 1.51629638671875, 1.5727691650390625, 1.629241943359375, 1.6857147216796875, 1.7421875]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 7.0, 6.0, 16.0, 22.0, 22.0, 25.0, 39.0, 44.0, 48.0, 70.0, 91.0, 78.0, 96.0, 66.0, 87.0, 66.0, 53.0, 41.0, 34.0, 23.0, 20.0, 12.0, 7.0, 6.0, 5.0, 9.0, 6.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4091796875, -1.3536224365234375, -1.298065185546875, -1.2425079345703125, -1.18695068359375, -1.1313934326171875, -1.075836181640625, -1.0202789306640625, -0.9647216796875, -0.9091644287109375, -0.853607177734375, -0.7980499267578125, -0.74249267578125, -0.6869354248046875, -0.631378173828125, -0.5758209228515625, -0.520263671875, -0.4647064208984375, -0.409149169921875, -0.3535919189453125, -0.29803466796875, -0.2424774169921875, -0.186920166015625, -0.1313629150390625, -0.0758056640625, -0.0202484130859375, 0.035308837890625, 0.0908660888671875, 0.14642333984375, 0.2019805908203125, 0.257537841796875, 0.3130950927734375, 0.36865234375, 0.4242095947265625, 0.479766845703125, 0.5353240966796875, 0.59088134765625, 0.6464385986328125, 0.701995849609375, 0.7575531005859375, 0.8131103515625, 0.8686676025390625, 0.924224853515625, 0.9797821044921875, 1.03533935546875, 1.0908966064453125, 1.146453857421875, 1.2020111083984375, 1.257568359375, 1.3131256103515625, 1.368682861328125, 1.4242401123046875, 1.47979736328125, 1.5353546142578125, 1.590911865234375, 1.6464691162109375, 1.7020263671875, 1.7575836181640625, 1.813140869140625, 1.8686981201171875, 1.92425537109375, 1.9798126220703125, 2.035369873046875, 2.0909271240234375, 2.146484375]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 4.0, 6.0, 9.0, 8.0, 12.0, 18.0, 19.0, 42.0, 39.0, 69.0, 99.0, 146.0, 219.0, 355.0, 693.0, 1294.0, 2999.0, 8023.0, 28874.0, 172304.0, 3103084.0, 782579.0, 68522.0, 15508.0, 4996.0, 2028.0, 981.0, 529.0, 251.0, 186.0, 95.0, 71.0, 45.0, 41.0, 33.0, 29.0, 16.0, 17.0, 13.0, 6.0, 7.0, 7.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-1.798828125, -1.74853515625, -1.6982421875, -1.64794921875, -1.59765625, -1.54736328125, -1.4970703125, -1.44677734375, -1.396484375, -1.34619140625, -1.2958984375, -1.24560546875, -1.1953125, -1.14501953125, -1.0947265625, -1.04443359375, -0.994140625, -0.94384765625, -0.8935546875, -0.84326171875, -0.79296875, -0.74267578125, -0.6923828125, -0.64208984375, -0.591796875, -0.54150390625, -0.4912109375, -0.44091796875, -0.390625, -0.34033203125, -0.2900390625, -0.23974609375, -0.189453125, -0.13916015625, -0.0888671875, -0.03857421875, 0.01171875, 0.06201171875, 0.1123046875, 0.16259765625, 0.212890625, 0.26318359375, 0.3134765625, 0.36376953125, 0.4140625, 0.46435546875, 0.5146484375, 0.56494140625, 0.615234375, 0.66552734375, 0.7158203125, 0.76611328125, 0.81640625, 0.86669921875, 0.9169921875, 0.96728515625, 1.017578125, 1.06787109375, 1.1181640625, 1.16845703125, 1.21875, 1.26904296875, 1.3193359375, 1.36962890625, 1.419921875]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 3.0, 2.0, 3.0, 3.0, 2.0, 9.0, 14.0, 13.0, 17.0, 17.0, 19.0, 37.0, 49.0, 58.0, 68.0, 107.0, 135.0, 242.0, 340.0, 500.0, 613.0, 582.0, 346.0, 275.0, 166.0, 107.0, 87.0, 62.0, 54.0, 40.0, 26.0, 19.0, 11.0, 10.0, 4.0, 7.0, 5.0, 3.0, 6.0, 3.0, 5.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.343505859375, -0.3318939208984375, -0.320281982421875, -0.3086700439453125, -0.29705810546875, -0.2854461669921875, -0.273834228515625, -0.2622222900390625, -0.2506103515625, -0.2389984130859375, -0.227386474609375, -0.2157745361328125, -0.20416259765625, -0.1925506591796875, -0.180938720703125, -0.1693267822265625, -0.15771484375, -0.1461029052734375, -0.134490966796875, -0.1228790283203125, -0.11126708984375, -0.0996551513671875, -0.088043212890625, -0.0764312744140625, -0.0648193359375, -0.0532073974609375, -0.041595458984375, -0.0299835205078125, -0.01837158203125, -0.0067596435546875, 0.004852294921875, 0.0164642333984375, 0.028076171875, 0.0396881103515625, 0.051300048828125, 0.0629119873046875, 0.07452392578125, 0.0861358642578125, 0.097747802734375, 0.1093597412109375, 0.1209716796875, 0.1325836181640625, 0.144195556640625, 0.1558074951171875, 0.16741943359375, 0.1790313720703125, 0.190643310546875, 0.2022552490234375, 0.2138671875, 0.2254791259765625, 0.237091064453125, 0.2487030029296875, 0.26031494140625, 0.2719268798828125, 0.283538818359375, 0.2951507568359375, 0.3067626953125, 0.3183746337890625, 0.329986572265625, 0.3415985107421875, 0.35321044921875, 0.3648223876953125, 0.376434326171875, 0.3880462646484375, 0.399658203125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 8.0, 8.0, 11.0, 22.0, 41.0, 64.0, 175.0, 222.0, 186.0, 107.0, 73.0, 30.0, 24.0, 11.0, 7.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.782784461975098, -4.655999183654785, -4.529213905334473, -4.402428150177002, -4.2756428718566895, -4.148857593536377, -4.022071838378906, -3.8952865600585938, -3.7685012817382812, -3.6417160034179688, -3.514930486679077, -3.3881449699401855, -3.261359691619873, -3.1345744132995605, -3.007788896560669, -2.8810033798217773, -2.754218101501465, -2.6274328231811523, -2.5006473064422607, -2.373861789703369, -2.2470765113830566, -2.120291233062744, -1.9935057163238525, -1.8667203187942505, -1.7399349212646484, -1.6131495237350464, -1.4863641262054443, -1.3595787286758423, -1.2327933311462402, -1.1060079336166382, -0.9792225360870361, -0.8524371385574341, -0.7256519794464111, -0.5988665819168091, -0.47208118438720703, -0.345295786857605, -0.21851038932800293, -0.09172499179840088, 0.03506040573120117, 0.16184580326080322, 0.2886312007904053, 0.4154165983200073, 0.5422019958496094, 0.6689873933792114, 0.7957727909088135, 0.9225581884384155, 1.0493435859680176, 1.1761289834976196, 1.3029143810272217, 1.4296997785568237, 1.5564851760864258, 1.6832705736160278, 1.8100559711456299, 1.936841368675232, 2.063626766204834, 2.1904120445251465, 2.317197561264038, 2.4439830780029297, 2.570768356323242, 2.6975536346435547, 2.8243391513824463, 2.951124668121338, 3.0779099464416504, 3.204695224761963, 3.3314807415008545]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 3.0, 6.0, 2.0, 10.0, 12.0, 12.0, 22.0, 25.0, 33.0, 50.0, 47.0, 50.0, 59.0, 66.0, 82.0, 48.0, 66.0, 58.0, 68.0, 53.0, 35.0, 37.0, 32.0, 39.0, 22.0, 15.0, 20.0, 9.0, 9.0, 2.0, 3.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3661792278289795, -1.3155618906021118, -1.2649445533752441, -1.2143272161483765, -1.1637098789215088, -1.1130926609039307, -1.062475323677063, -1.0118579864501953, -0.9612406492233276, -0.91062331199646, -0.8600059747695923, -0.8093886971473694, -0.7587713599205017, -0.708154022693634, -0.6575367450714111, -0.6069194078445435, -0.5563020706176758, -0.5056847333908081, -0.4550674259662628, -0.40445011854171753, -0.35383278131484985, -0.3032154440879822, -0.2525981366634369, -0.2019808292388916, -0.15136349201202393, -0.10074616968631744, -0.05012884736061096, 0.00048847496509552, 0.051105797290802, 0.10172313451766968, 0.15234044194221497, 0.20295774936676025, 0.25357508659362793, 0.3041924238204956, 0.3548097312450409, 0.4054270386695862, 0.45604437589645386, 0.5066617131233215, 0.5572789907455444, 0.6078963279724121, 0.6585136651992798, 0.7091310024261475, 0.7597483396530151, 0.810365617275238, 0.8609829545021057, 0.9116002917289734, 0.9622175693511963, 1.012834906578064, 1.0634522438049316, 1.1140695810317993, 1.164686918258667, 1.2153042554855347, 1.2659215927124023, 1.3165388107299805, 1.3671561479568481, 1.4177734851837158, 1.4683908224105835, 1.5190081596374512, 1.5696254968643188, 1.6202428340911865, 1.6708600521087646, 1.7214775085449219, 1.7720947265625, 1.8227120637893677, 1.8733294010162354]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 1.0, 1.0, 9.0, 12.0, 16.0, 21.0, 32.0, 51.0, 65.0, 135.0, 208.0, 400.0, 676.0, 1251.0, 2526.0, 5535.0, 13063.0, 33421.0, 104267.0, 388087.0, 353473.0, 92753.0, 30238.0, 11904.0, 5221.0, 2458.0, 1241.0, 646.0, 325.0, 190.0, 134.0, 68.0, 51.0, 29.0, 20.0, 14.0, 6.0, 4.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.25244140625, -0.24500656127929688, -0.23757171630859375, -0.23013687133789062, -0.2227020263671875, -0.21526718139648438, -0.20783233642578125, -0.20039749145507812, -0.192962646484375, -0.18552780151367188, -0.17809295654296875, -0.17065811157226562, -0.1632232666015625, -0.15578842163085938, -0.14835357666015625, -0.14091873168945312, -0.13348388671875, -0.12604904174804688, -0.11861419677734375, -0.11117935180664062, -0.1037445068359375, -0.09630966186523438, -0.08887481689453125, -0.08143997192382812, -0.074005126953125, -0.06657028198242188, -0.05913543701171875, -0.051700592041015625, -0.0442657470703125, -0.036830902099609375, -0.02939605712890625, -0.021961212158203125, -0.0145263671875, -0.007091522216796875, 0.00034332275390625, 0.007778167724609375, 0.0152130126953125, 0.022647857666015625, 0.03008270263671875, 0.037517547607421875, 0.044952392578125, 0.052387237548828125, 0.05982208251953125, 0.06725692749023438, 0.0746917724609375, 0.08212661743164062, 0.08956146240234375, 0.09699630737304688, 0.10443115234375, 0.11186599731445312, 0.11930084228515625, 0.12673568725585938, 0.1341705322265625, 0.14160537719726562, 0.14904022216796875, 0.15647506713867188, 0.163909912109375, 0.17134475708007812, 0.17877960205078125, 0.18621444702148438, 0.1936492919921875, 0.20108413696289062, 0.20851898193359375, 0.21595382690429688, 0.223388671875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 10.0, 1.0, 9.0, 12.0, 19.0, 19.0, 37.0, 56.0, 61.0, 73.0, 77.0, 75.0, 94.0, 83.0, 76.0, 79.0, 51.0, 42.0, 27.0, 34.0, 22.0, 16.0, 8.0, 7.0, 7.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.23046875, -1.1873931884765625, -1.144317626953125, -1.1012420654296875, -1.05816650390625, -1.0150909423828125, -0.972015380859375, -0.9289398193359375, -0.8858642578125, -0.8427886962890625, -0.799713134765625, -0.7566375732421875, -0.71356201171875, -0.6704864501953125, -0.627410888671875, -0.5843353271484375, -0.541259765625, -0.4981842041015625, -0.455108642578125, -0.4120330810546875, -0.36895751953125, -0.3258819580078125, -0.282806396484375, -0.2397308349609375, -0.1966552734375, -0.1535797119140625, -0.110504150390625, -0.0674285888671875, -0.02435302734375, 0.0187225341796875, 0.061798095703125, 0.1048736572265625, 0.14794921875, 0.1910247802734375, 0.234100341796875, 0.2771759033203125, 0.32025146484375, 0.3633270263671875, 0.406402587890625, 0.4494781494140625, 0.4925537109375, 0.5356292724609375, 0.578704833984375, 0.6217803955078125, 0.66485595703125, 0.7079315185546875, 0.751007080078125, 0.7940826416015625, 0.837158203125, 0.8802337646484375, 0.923309326171875, 0.9663848876953125, 1.00946044921875, 1.0525360107421875, 1.095611572265625, 1.1386871337890625, 1.1817626953125, 1.2248382568359375, 1.267913818359375, 1.3109893798828125, 1.35406494140625, 1.3971405029296875, 1.440216064453125, 1.4832916259765625, 1.5263671875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 4.0, 5.0, 10.0, 9.0, 20.0, 22.0, 29.0, 38.0, 60.0, 77.0, 115.0, 228.0, 369.0, 698.0, 1697.0, 4915.0, 17908.0, 90890.0, 540675.0, 324848.0, 48922.0, 11043.0, 3341.0, 1225.0, 581.0, 267.0, 168.0, 117.0, 81.0, 57.0, 33.0, 28.0, 22.0, 8.0, 15.0, 9.0, 9.0, 4.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.321533203125, -0.3123016357421875, -0.303070068359375, -0.2938385009765625, -0.28460693359375, -0.2753753662109375, -0.266143798828125, -0.2569122314453125, -0.2476806640625, -0.2384490966796875, -0.229217529296875, -0.2199859619140625, -0.21075439453125, -0.2015228271484375, -0.192291259765625, -0.1830596923828125, -0.173828125, -0.1645965576171875, -0.155364990234375, -0.1461334228515625, -0.13690185546875, -0.1276702880859375, -0.118438720703125, -0.1092071533203125, -0.0999755859375, -0.0907440185546875, -0.081512451171875, -0.0722808837890625, -0.06304931640625, -0.0538177490234375, -0.044586181640625, -0.0353546142578125, -0.026123046875, -0.0168914794921875, -0.007659912109375, 0.0015716552734375, 0.01080322265625, 0.0200347900390625, 0.029266357421875, 0.0384979248046875, 0.0477294921875, 0.0569610595703125, 0.066192626953125, 0.0754241943359375, 0.08465576171875, 0.0938873291015625, 0.103118896484375, 0.1123504638671875, 0.12158203125, 0.1308135986328125, 0.140045166015625, 0.1492767333984375, 0.15850830078125, 0.1677398681640625, 0.176971435546875, 0.1862030029296875, 0.1954345703125, 0.2046661376953125, 0.213897705078125, 0.2231292724609375, 0.23236083984375, 0.2415924072265625, 0.250823974609375, 0.2600555419921875, 0.269287109375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 7.0, 7.0, 6.0, 12.0, 10.0, 16.0, 24.0, 30.0, 32.0, 43.0, 30.0, 60.0, 62.0, 60.0, 57.0, 46.0, 50.0, 65.0, 64.0, 69.0, 55.0, 46.0, 38.0, 27.0, 21.0, 18.0, 20.0, 11.0, 4.0, 7.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.224609375, -2.1589508056640625, -2.093292236328125, -2.0276336669921875, -1.96197509765625, -1.8963165283203125, -1.830657958984375, -1.7649993896484375, -1.6993408203125, -1.6336822509765625, -1.568023681640625, -1.5023651123046875, -1.43670654296875, -1.3710479736328125, -1.305389404296875, -1.2397308349609375, -1.174072265625, -1.1084136962890625, -1.042755126953125, -0.9770965576171875, -0.91143798828125, -0.8457794189453125, -0.780120849609375, -0.7144622802734375, -0.6488037109375, -0.5831451416015625, -0.517486572265625, -0.4518280029296875, -0.38616943359375, -0.3205108642578125, -0.254852294921875, -0.1891937255859375, -0.12353515625, -0.0578765869140625, 0.007781982421875, 0.0734405517578125, 0.13909912109375, 0.2047576904296875, 0.270416259765625, 0.3360748291015625, 0.4017333984375, 0.4673919677734375, 0.533050537109375, 0.5987091064453125, 0.66436767578125, 0.7300262451171875, 0.795684814453125, 0.8613433837890625, 0.927001953125, 0.9926605224609375, 1.058319091796875, 1.1239776611328125, 1.18963623046875, 1.2552947998046875, 1.320953369140625, 1.3866119384765625, 1.4522705078125, 1.5179290771484375, 1.583587646484375, 1.6492462158203125, 1.71490478515625, 1.7805633544921875, 1.846221923828125, 1.9118804931640625, 1.9775390625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 7.0, 2.0, 6.0, 6.0, 8.0, 17.0, 22.0, 27.0, 56.0, 49.0, 125.0, 162.0, 313.0, 588.0, 1266.0, 2887.0, 8247.0, 31203.0, 182272.0, 668116.0, 118171.0, 23474.0, 6713.0, 2481.0, 1133.0, 515.0, 272.0, 149.0, 88.0, 59.0, 38.0, 21.0, 18.0, 9.0, 12.0, 10.0, 6.0, 6.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.13330078125, -0.12953472137451172, -0.12576866149902344, -0.12200260162353516, -0.11823654174804688, -0.1144704818725586, -0.11070442199707031, -0.10693836212158203, -0.10317230224609375, -0.09940624237060547, -0.09564018249511719, -0.0918741226196289, -0.08810806274414062, -0.08434200286865234, -0.08057594299316406, -0.07680988311767578, -0.0730438232421875, -0.06927776336669922, -0.06551170349121094, -0.061745643615722656, -0.057979583740234375, -0.054213523864746094, -0.05044746398925781, -0.04668140411376953, -0.04291534423828125, -0.03914928436279297, -0.03538322448730469, -0.031617164611816406, -0.027851104736328125, -0.024085044860839844, -0.020318984985351562, -0.01655292510986328, -0.012786865234375, -0.009020805358886719, -0.0052547454833984375, -0.0014886856079101562, 0.002277374267578125, 0.006043434143066406, 0.009809494018554688, 0.013575553894042969, 0.01734161376953125, 0.02110767364501953, 0.024873733520507812, 0.028639793395996094, 0.032405853271484375, 0.036171913146972656, 0.03993797302246094, 0.04370403289794922, 0.0474700927734375, 0.05123615264892578, 0.05500221252441406, 0.058768272399902344, 0.06253433227539062, 0.0663003921508789, 0.07006645202636719, 0.07383251190185547, 0.07759857177734375, 0.08136463165283203, 0.08513069152832031, 0.0888967514038086, 0.09266281127929688, 0.09642887115478516, 0.10019493103027344, 0.10396099090576172, 0.10772705078125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 1.0, 8.0, 6.0, 9.0, 6.0, 23.0, 41.0, 51.0, 93.0, 115.0, 147.0, 149.0, 118.0, 88.0, 58.0, 28.0, 24.0, 13.0, 9.0, 3.0, 6.0, 5.0, 0.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.738040924072266e-05, -8.519552648067474e-05, -8.301064372062683e-05, -8.082576096057892e-05, -7.8640878200531e-05, -7.64559954404831e-05, -7.427111268043518e-05, -7.208622992038727e-05, -6.990134716033936e-05, -6.771646440029144e-05, -6.553158164024353e-05, -6.334669888019562e-05, -6.11618161201477e-05, -5.897693336009979e-05, -5.679205060005188e-05, -5.460716784000397e-05, -5.2422285079956055e-05, -5.023740231990814e-05, -4.805251955986023e-05, -4.586763679981232e-05, -4.3682754039764404e-05, -4.149787127971649e-05, -3.931298851966858e-05, -3.7128105759620667e-05, -3.4943222999572754e-05, -3.275834023952484e-05, -3.057345747947693e-05, -2.8388574719429016e-05, -2.6203691959381104e-05, -2.401880919933319e-05, -2.183392643928528e-05, -1.9649043679237366e-05, -1.7464160919189453e-05, -1.527927815914154e-05, -1.3094395399093628e-05, -1.0909512639045715e-05, -8.724629878997803e-06, -6.53974711894989e-06, -4.3548643589019775e-06, -2.169981598854065e-06, 1.4901161193847656e-08, 2.1997839212417603e-06, 4.384666681289673e-06, 6.5695494413375854e-06, 8.754432201385498e-06, 1.093931496143341e-05, 1.3124197721481323e-05, 1.5309080481529236e-05, 1.749396324157715e-05, 1.967884600162506e-05, 2.1863728761672974e-05, 2.4048611521720886e-05, 2.62334942817688e-05, 2.841837704181671e-05, 3.0603259801864624e-05, 3.278814256191254e-05, 3.497302532196045e-05, 3.715790808200836e-05, 3.9342790842056274e-05, 4.152767360210419e-05, 4.37125563621521e-05, 4.589743912220001e-05, 4.8082321882247925e-05, 5.026720464229584e-05, 5.245208740234375e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 5.0, 6.0, 11.0, 8.0, 15.0, 18.0, 22.0, 62.0, 64.0, 114.0, 253.0, 497.0, 1038.0, 2345.0, 6203.0, 19232.0, 71509.0, 354624.0, 460201.0, 95056.0, 24468.0, 7537.0, 2796.0, 1258.0, 537.0, 257.0, 147.0, 90.0, 53.0, 38.0, 18.0, 20.0, 15.0, 12.0, 10.0, 9.0, 0.0, 4.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10736083984375, -0.10390853881835938, -0.10045623779296875, -0.09700393676757812, -0.0935516357421875, -0.09009933471679688, -0.08664703369140625, -0.08319473266601562, -0.079742431640625, -0.07629013061523438, -0.07283782958984375, -0.06938552856445312, -0.0659332275390625, -0.062480926513671875, -0.05902862548828125, -0.055576324462890625, -0.0521240234375, -0.048671722412109375, -0.04521942138671875, -0.041767120361328125, -0.0383148193359375, -0.034862518310546875, -0.03141021728515625, -0.027957916259765625, -0.024505615234375, -0.021053314208984375, -0.01760101318359375, -0.014148712158203125, -0.0106964111328125, -0.007244110107421875, -0.00379180908203125, -0.000339508056640625, 0.00311279296875, 0.006565093994140625, 0.01001739501953125, 0.013469696044921875, 0.0169219970703125, 0.020374298095703125, 0.02382659912109375, 0.027278900146484375, 0.030731201171875, 0.034183502197265625, 0.03763580322265625, 0.041088104248046875, 0.0445404052734375, 0.047992706298828125, 0.05144500732421875, 0.054897308349609375, 0.058349609375, 0.061801910400390625, 0.06525421142578125, 0.06870651245117188, 0.0721588134765625, 0.07561111450195312, 0.07906341552734375, 0.08251571655273438, 0.085968017578125, 0.08942031860351562, 0.09287261962890625, 0.09632492065429688, 0.0997772216796875, 0.10322952270507812, 0.10668182373046875, 0.11013412475585938, 0.11358642578125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 3.0, 0.0, 5.0, 5.0, 5.0, 8.0, 7.0, 12.0, 13.0, 13.0, 10.0, 24.0, 18.0, 25.0, 22.0, 34.0, 41.0, 50.0, 65.0, 83.0, 86.0, 78.0, 67.0, 59.0, 55.0, 33.0, 29.0, 23.0, 26.0, 17.0, 17.0, 10.0, 12.0, 6.0, 11.0, 8.0, 5.0, 3.0, 5.0, 8.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.022125244140625, -0.021451950073242188, -0.020778656005859375, -0.020105361938476562, -0.01943206787109375, -0.018758773803710938, -0.018085479736328125, -0.017412185668945312, -0.0167388916015625, -0.016065597534179688, -0.015392303466796875, -0.014719009399414062, -0.01404571533203125, -0.013372421264648438, -0.012699127197265625, -0.012025833129882812, -0.0113525390625, -0.010679244995117188, -0.010005950927734375, -0.009332656860351562, -0.00865936279296875, -0.007986068725585938, -0.007312774658203125, -0.0066394805908203125, -0.0059661865234375, -0.0052928924560546875, -0.004619598388671875, -0.0039463043212890625, -0.00327301025390625, -0.0025997161865234375, -0.001926422119140625, -0.0012531280517578125, -0.000579833984375, 9.34600830078125e-05, 0.000766754150390625, 0.0014400482177734375, 0.00211334228515625, 0.0027866363525390625, 0.003459930419921875, 0.0041332244873046875, 0.0048065185546875, 0.0054798126220703125, 0.006153106689453125, 0.0068264007568359375, 0.00749969482421875, 0.008172988891601562, 0.008846282958984375, 0.009519577026367188, 0.01019287109375, 0.010866165161132812, 0.011539459228515625, 0.012212753295898438, 0.01288604736328125, 0.013559341430664062, 0.014232635498046875, 0.014905929565429688, 0.0155792236328125, 0.016252517700195312, 0.016925811767578125, 0.017599105834960938, 0.01827239990234375, 0.018945693969726562, 0.019618988037109375, 0.020292282104492188, 0.020965576171875]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 6.0, 14.0, 13.0, 46.0, 95.0, 257.0, 291.0, 146.0, 68.0, 30.0, 15.0, 6.0, 4.0, 8.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.301478385925293, -4.194454669952393, -4.087430953979492, -3.980407476425171, -3.8733839988708496, -3.766360282897949, -3.659336566925049, -3.5523130893707275, -3.445289373397827, -3.3382656574249268, -3.2312421798706055, -3.124218463897705, -3.017194986343384, -2.9101712703704834, -2.803147792816162, -2.6961240768432617, -2.5891003608703613, -2.482076644897461, -2.3750531673431396, -2.2680294513702393, -2.161005973815918, -2.0539822578430176, -1.9469586610794067, -1.839935064315796, -1.7329115867614746, -1.6258879899978638, -1.518864393234253, -1.4118406772613525, -1.3048170804977417, -1.1977934837341309, -1.09076988697052, -0.9837462306022644, -0.8767225742340088, -0.769698977470398, -0.6626753211021423, -0.5556517243385315, -0.44862809777259827, -0.34160447120666504, -0.2345808744430542, -0.12755721807479858, -0.020533621311187744, 0.08648999780416489, 0.19351361691951752, 0.30053722858428955, 0.4075608551502228, 0.514584481716156, 0.6216080784797668, 0.7286317348480225, 0.8356553316116333, 0.9426789283752441, 1.049702525138855, 1.1567261219024658, 1.2637498378753662, 1.370773434638977, 1.477797031402588, 1.5848207473754883, 1.6918442249298096, 1.7988678216934204, 1.9058914184570312, 2.0129151344299316, 2.119938611984253, 2.2269623279571533, 2.3339858055114746, 2.441009521484375, 2.5480332374572754]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 6.0, 2.0, 4.0, 7.0, 7.0, 14.0, 14.0, 8.0, 28.0, 33.0, 52.0, 52.0, 58.0, 74.0, 87.0, 67.0, 81.0, 68.0, 66.0, 59.0, 50.0, 34.0, 34.0, 27.0, 22.0, 20.0, 10.0, 11.0, 6.0, 3.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9372439384460449, -0.9011213779449463, -0.8649988174438477, -0.8288761973381042, -0.7927536368370056, -0.756631076335907, -0.7205084562301636, -0.6843858957290649, -0.6482633352279663, -0.6121407747268677, -0.576018214225769, -0.5398955941200256, -0.503773033618927, -0.46765047311782837, -0.43152788281440735, -0.39540529251098633, -0.3592827320098877, -0.32316017150878906, -0.28703758120536804, -0.250914990901947, -0.2147924304008484, -0.17866985499858856, -0.14254727959632874, -0.10642468929290771, -0.07030212879180908, -0.034179553389549255, 0.0019430220127105713, 0.0380655974149704, 0.07418817281723022, 0.11031074821949005, 0.14643332362174988, 0.1825559139251709, 0.21867847442626953, 0.25480103492736816, 0.2909236252307892, 0.3270462155342102, 0.36316877603530884, 0.39929133653640747, 0.4354139268398285, 0.4715365171432495, 0.5076590776443481, 0.5437816381454468, 0.5799041986465454, 0.6160268187522888, 0.6521493792533875, 0.6882719397544861, 0.7243945598602295, 0.7605171203613281, 0.7966396808624268, 0.8327622413635254, 0.868884801864624, 0.9050074219703674, 0.9411299824714661, 0.9772525429725647, 1.013375163078308, 1.0494977235794067, 1.0856202840805054, 1.121742844581604, 1.1578654050827026, 1.1939879655838013, 1.2301106452941895, 1.266233205795288, 1.3023557662963867, 1.3384783267974854, 1.374600887298584]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 8.0, 8.0, 7.0, 15.0, 27.0, 26.0, 33.0, 53.0, 81.0, 126.0, 141.0, 278.0, 404.0, 650.0, 1143.0, 2134.0, 4446.0, 10891.0, 31739.0, 132908.0, 563056.0, 227582.0, 46576.0, 14261.0, 5692.0, 2663.0, 1487.0, 772.0, 468.0, 281.0, 181.0, 125.0, 87.0, 62.0, 37.0, 39.0, 22.0, 10.0, 8.0, 17.0, 6.0, 5.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.82373046875, -0.7928237915039062, -0.7619171142578125, -0.7310104370117188, -0.700103759765625, -0.6691970825195312, -0.6382904052734375, -0.6073837280273438, -0.57647705078125, -0.5455703735351562, -0.5146636962890625, -0.48375701904296875, -0.452850341796875, -0.42194366455078125, -0.3910369873046875, -0.36013031005859375, -0.3292236328125, -0.29831695556640625, -0.2674102783203125, -0.23650360107421875, -0.205596923828125, -0.17469024658203125, -0.1437835693359375, -0.11287689208984375, -0.08197021484375, -0.05106353759765625, -0.0201568603515625, 0.01074981689453125, 0.041656494140625, 0.07256317138671875, 0.1034698486328125, 0.13437652587890625, 0.165283203125, 0.19618988037109375, 0.2270965576171875, 0.25800323486328125, 0.288909912109375, 0.31981658935546875, 0.3507232666015625, 0.38162994384765625, 0.41253662109375, 0.44344329833984375, 0.4743499755859375, 0.5052566528320312, 0.536163330078125, 0.5670700073242188, 0.5979766845703125, 0.6288833618164062, 0.6597900390625, 0.6906967163085938, 0.7216033935546875, 0.7525100708007812, 0.783416748046875, 0.8143234252929688, 0.8452301025390625, 0.8761367797851562, 0.90704345703125, 0.9379501342773438, 0.9688568115234375, 0.9997634887695312, 1.030670166015625, 1.0615768432617188, 1.0924835205078125, 1.1233901977539062, 1.154296875]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 4.0, 6.0, 9.0, 13.0, 14.0, 20.0, 25.0, 37.0, 56.0, 55.0, 61.0, 87.0, 74.0, 79.0, 73.0, 66.0, 70.0, 46.0, 42.0, 35.0, 32.0, 25.0, 25.0, 14.0, 10.0, 7.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-2.580078125, -2.492919921875, -2.40576171875, -2.318603515625, -2.2314453125, -2.144287109375, -2.05712890625, -1.969970703125, -1.8828125, -1.795654296875, -1.70849609375, -1.621337890625, -1.5341796875, -1.447021484375, -1.35986328125, -1.272705078125, -1.185546875, -1.098388671875, -1.01123046875, -0.924072265625, -0.8369140625, -0.749755859375, -0.66259765625, -0.575439453125, -0.48828125, -0.401123046875, -0.31396484375, -0.226806640625, -0.1396484375, -0.052490234375, 0.03466796875, 0.121826171875, 0.208984375, 0.296142578125, 0.38330078125, 0.470458984375, 0.5576171875, 0.644775390625, 0.73193359375, 0.819091796875, 0.90625, 0.993408203125, 1.08056640625, 1.167724609375, 1.2548828125, 1.342041015625, 1.42919921875, 1.516357421875, 1.603515625, 1.690673828125, 1.77783203125, 1.864990234375, 1.9521484375, 2.039306640625, 2.12646484375, 2.213623046875, 2.30078125, 2.387939453125, 2.47509765625, 2.562255859375, 2.6494140625, 2.736572265625, 2.82373046875, 2.910888671875, 2.998046875]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 6.0, 0.0, 9.0, 9.0, 13.0, 18.0, 24.0, 35.0, 51.0, 69.0, 79.0, 136.0, 191.0, 350.0, 600.0, 1245.0, 3255.0, 12187.0, 69934.0, 602175.0, 311006.0, 35367.0, 7192.0, 2308.0, 956.0, 480.0, 294.0, 151.0, 123.0, 83.0, 47.0, 40.0, 27.0, 25.0, 18.0, 8.0, 9.0, 12.0, 6.0, 7.0, 4.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 4.0], "bins": [-1.1806640625, -1.147705078125, -1.11474609375, -1.081787109375, -1.048828125, -1.015869140625, -0.98291015625, -0.949951171875, -0.9169921875, -0.884033203125, -0.85107421875, -0.818115234375, -0.78515625, -0.752197265625, -0.71923828125, -0.686279296875, -0.6533203125, -0.620361328125, -0.58740234375, -0.554443359375, -0.521484375, -0.488525390625, -0.45556640625, -0.422607421875, -0.3896484375, -0.356689453125, -0.32373046875, -0.290771484375, -0.2578125, -0.224853515625, -0.19189453125, -0.158935546875, -0.1259765625, -0.093017578125, -0.06005859375, -0.027099609375, 0.005859375, 0.038818359375, 0.07177734375, 0.104736328125, 0.1376953125, 0.170654296875, 0.20361328125, 0.236572265625, 0.26953125, 0.302490234375, 0.33544921875, 0.368408203125, 0.4013671875, 0.434326171875, 0.46728515625, 0.500244140625, 0.533203125, 0.566162109375, 0.59912109375, 0.632080078125, 0.6650390625, 0.697998046875, 0.73095703125, 0.763916015625, 0.796875, 0.829833984375, 0.86279296875, 0.895751953125, 0.9287109375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 3.0, 7.0, 10.0, 5.0, 8.0, 6.0, 18.0, 18.0, 13.0, 22.0, 15.0, 17.0, 13.0, 19.0, 32.0, 29.0, 27.0, 27.0, 32.0, 35.0, 47.0, 36.0, 50.0, 40.0, 47.0, 31.0, 48.0, 32.0, 35.0, 33.0, 28.0, 27.0, 32.0, 21.0, 26.0, 13.0, 14.0, 18.0, 15.0, 11.0, 8.0, 6.0, 6.0, 7.0, 3.0, 4.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.8251953125, -1.7656707763671875, -1.706146240234375, -1.6466217041015625, -1.58709716796875, -1.5275726318359375, -1.468048095703125, -1.4085235595703125, -1.3489990234375, -1.2894744873046875, -1.229949951171875, -1.1704254150390625, -1.11090087890625, -1.0513763427734375, -0.991851806640625, -0.9323272705078125, -0.872802734375, -0.8132781982421875, -0.753753662109375, -0.6942291259765625, -0.63470458984375, -0.5751800537109375, -0.515655517578125, -0.4561309814453125, -0.3966064453125, -0.3370819091796875, -0.277557373046875, -0.2180328369140625, -0.15850830078125, -0.0989837646484375, -0.039459228515625, 0.0200653076171875, 0.07958984375, 0.1391143798828125, 0.198638916015625, 0.2581634521484375, 0.31768798828125, 0.3772125244140625, 0.436737060546875, 0.4962615966796875, 0.5557861328125, 0.6153106689453125, 0.674835205078125, 0.7343597412109375, 0.79388427734375, 0.8534088134765625, 0.912933349609375, 0.9724578857421875, 1.031982421875, 1.0915069580078125, 1.151031494140625, 1.2105560302734375, 1.27008056640625, 1.3296051025390625, 1.389129638671875, 1.4486541748046875, 1.5081787109375, 1.5677032470703125, 1.627227783203125, 1.6867523193359375, 1.74627685546875, 1.8058013916015625, 1.865325927734375, 1.9248504638671875, 1.984375]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 4.0, 2.0, 3.0, 4.0, 10.0, 13.0, 14.0, 16.0, 27.0, 36.0, 64.0, 63.0, 140.0, 198.0, 297.0, 536.0, 922.0, 1892.0, 4647.0, 13747.0, 54763.0, 331401.0, 518909.0, 89868.0, 19598.0, 6183.0, 2428.0, 1153.0, 600.0, 354.0, 219.0, 144.0, 78.0, 61.0, 37.0, 30.0, 17.0, 15.0, 11.0, 8.0, 8.0, 7.0, 10.0, 7.0, 8.0, 5.0, 1.0, 0.0, 2.0], "bins": [-0.34619140625, -0.3368721008300781, -0.32755279541015625, -0.3182334899902344, -0.3089141845703125, -0.2995948791503906, -0.29027557373046875, -0.2809562683105469, -0.271636962890625, -0.2623176574707031, -0.25299835205078125, -0.24367904663085938, -0.2343597412109375, -0.22504043579101562, -0.21572113037109375, -0.20640182495117188, -0.19708251953125, -0.18776321411132812, -0.17844390869140625, -0.16912460327148438, -0.1598052978515625, -0.15048599243164062, -0.14116668701171875, -0.13184738159179688, -0.122528076171875, -0.11320877075195312, -0.10388946533203125, -0.09457015991210938, -0.0852508544921875, -0.07593154907226562, -0.06661224365234375, -0.057292938232421875, -0.0479736328125, -0.038654327392578125, -0.02933502197265625, -0.020015716552734375, -0.0106964111328125, -0.001377105712890625, 0.00794219970703125, 0.017261505126953125, 0.026580810546875, 0.035900115966796875, 0.04521942138671875, 0.054538726806640625, 0.0638580322265625, 0.07317733764648438, 0.08249664306640625, 0.09181594848632812, 0.10113525390625, 0.11045455932617188, 0.11977386474609375, 0.12909317016601562, 0.1384124755859375, 0.14773178100585938, 0.15705108642578125, 0.16637039184570312, 0.175689697265625, 0.18500900268554688, 0.19432830810546875, 0.20364761352539062, 0.2129669189453125, 0.22228622436523438, 0.23160552978515625, 0.24092483520507812, 0.250244140625]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 6.0, 6.0, 10.0, 6.0, 10.0, 15.0, 17.0, 19.0, 35.0, 34.0, 60.0, 80.0, 86.0, 116.0, 89.0, 91.0, 72.0, 67.0, 54.0, 32.0, 28.0, 12.0, 12.0, 16.0, 6.0, 8.0, 2.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.131959915161133e-05, -4.955567419528961e-05, -4.7791749238967896e-05, -4.602782428264618e-05, -4.426389932632446e-05, -4.2499974370002747e-05, -4.073604941368103e-05, -3.8972124457359314e-05, -3.72081995010376e-05, -3.544427454471588e-05, -3.3680349588394165e-05, -3.191642463207245e-05, -3.0152499675750732e-05, -2.8388574719429016e-05, -2.66246497631073e-05, -2.4860724806785583e-05, -2.3096799850463867e-05, -2.133287489414215e-05, -1.9568949937820435e-05, -1.7805024981498718e-05, -1.6041100025177002e-05, -1.4277175068855286e-05, -1.251325011253357e-05, -1.0749325156211853e-05, -8.985400199890137e-06, -7.22147524356842e-06, -5.457550287246704e-06, -3.693625330924988e-06, -1.9297003746032715e-06, -1.6577541828155518e-07, 1.5981495380401611e-06, 3.3620744943618774e-06, 5.125999450683594e-06, 6.88992440700531e-06, 8.653849363327026e-06, 1.0417774319648743e-05, 1.2181699275970459e-05, 1.3945624232292175e-05, 1.570954918861389e-05, 1.7473474144935608e-05, 1.9237399101257324e-05, 2.100132405757904e-05, 2.2765249013900757e-05, 2.4529173970222473e-05, 2.629309892654419e-05, 2.8057023882865906e-05, 2.9820948839187622e-05, 3.158487379550934e-05, 3.3348798751831055e-05, 3.511272370815277e-05, 3.687664866447449e-05, 3.8640573620796204e-05, 4.040449857711792e-05, 4.2168423533439636e-05, 4.393234848976135e-05, 4.569627344608307e-05, 4.7460198402404785e-05, 4.92241233587265e-05, 5.098804831504822e-05, 5.2751973271369934e-05, 5.451589822769165e-05, 5.627982318401337e-05, 5.804374814033508e-05, 5.98076730966568e-05, 6.157159805297852e-05]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 4.0, 8.0, 4.0, 7.0, 6.0, 12.0, 11.0, 16.0, 23.0, 28.0, 41.0, 60.0, 73.0, 131.0, 198.0, 296.0, 531.0, 978.0, 2004.0, 4330.0, 10913.0, 33298.0, 135723.0, 555163.0, 228335.0, 49822.0, 15354.0, 5826.0, 2457.0, 1243.0, 653.0, 333.0, 223.0, 136.0, 89.0, 65.0, 42.0, 24.0, 28.0, 13.0, 11.0, 13.0, 9.0, 3.0, 8.0, 3.0, 2.0, 6.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.267578125, -0.25885009765625, -0.2501220703125, -0.24139404296875, -0.232666015625, -0.22393798828125, -0.2152099609375, -0.20648193359375, -0.19775390625, -0.18902587890625, -0.1802978515625, -0.17156982421875, -0.162841796875, -0.15411376953125, -0.1453857421875, -0.13665771484375, -0.1279296875, -0.11920166015625, -0.1104736328125, -0.10174560546875, -0.093017578125, -0.08428955078125, -0.0755615234375, -0.06683349609375, -0.05810546875, -0.04937744140625, -0.0406494140625, -0.03192138671875, -0.023193359375, -0.01446533203125, -0.0057373046875, 0.00299072265625, 0.01171875, 0.02044677734375, 0.0291748046875, 0.03790283203125, 0.046630859375, 0.05535888671875, 0.0640869140625, 0.07281494140625, 0.08154296875, 0.09027099609375, 0.0989990234375, 0.10772705078125, 0.116455078125, 0.12518310546875, 0.1339111328125, 0.14263916015625, 0.1513671875, 0.16009521484375, 0.1688232421875, 0.17755126953125, 0.186279296875, 0.19500732421875, 0.2037353515625, 0.21246337890625, 0.22119140625, 0.22991943359375, 0.2386474609375, 0.24737548828125, 0.256103515625, 0.26483154296875, 0.2735595703125, 0.28228759765625, 0.291015625]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 8.0, 8.0, 5.0, 2.0, 9.0, 24.0, 12.0, 18.0, 22.0, 33.0, 37.0, 51.0, 62.0, 81.0, 70.0, 79.0, 86.0, 82.0, 59.0, 38.0, 46.0, 34.0, 35.0, 20.0, 15.0, 11.0, 12.0, 9.0, 8.0, 4.0, 6.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.148193359375, -0.1434917449951172, -0.13879013061523438, -0.13408851623535156, -0.12938690185546875, -0.12468528747558594, -0.11998367309570312, -0.11528205871582031, -0.1105804443359375, -0.10587882995605469, -0.10117721557617188, -0.09647560119628906, -0.09177398681640625, -0.08707237243652344, -0.08237075805664062, -0.07766914367675781, -0.072967529296875, -0.06826591491699219, -0.06356430053710938, -0.05886268615722656, -0.05416107177734375, -0.04945945739746094, -0.044757843017578125, -0.04005622863769531, -0.0353546142578125, -0.030652999877929688, -0.025951385498046875, -0.021249771118164062, -0.01654815673828125, -0.011846542358398438, -0.007144927978515625, -0.0024433135986328125, 0.00225830078125, 0.0069599151611328125, 0.011661529541015625, 0.016363143920898438, 0.02106475830078125, 0.025766372680664062, 0.030467987060546875, 0.03516960144042969, 0.0398712158203125, 0.04457283020019531, 0.049274444580078125, 0.05397605895996094, 0.05867767333984375, 0.06337928771972656, 0.06808090209960938, 0.07278251647949219, 0.077484130859375, 0.08218574523925781, 0.08688735961914062, 0.09158897399902344, 0.09629058837890625, 0.10099220275878906, 0.10569381713867188, 0.11039543151855469, 0.1150970458984375, 0.11979866027832031, 0.12450027465820312, 0.12920188903808594, 0.13390350341796875, 0.13860511779785156, 0.14330673217773438, 0.1480083465576172, 0.1527099609375]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 7.0, 10.0, 19.0, 16.0, 48.0, 113.0, 218.0, 251.0, 160.0, 67.0, 44.0, 24.0, 7.0, 7.0, 2.0, 5.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.223835468292236, -7.044222354888916, -6.864609241485596, -6.684996128082275, -6.505383014678955, -6.325769901275635, -6.146156311035156, -5.966543197631836, -5.786930084228516, -5.607316970825195, -5.427703857421875, -5.248090744018555, -5.068477630615234, -4.888864517211914, -4.709251403808594, -4.529638290405273, -4.350025177001953, -4.170412063598633, -3.9907989501953125, -3.811185836791992, -3.631572723388672, -3.4519596099853516, -3.272346258163452, -3.092733144760132, -2.9131200313568115, -2.733506917953491, -2.553893804550171, -2.3742804527282715, -2.194667339324951, -2.015054225921631, -1.8354411125183105, -1.6558279991149902, -1.47621488571167, -1.2966017723083496, -1.1169886589050293, -0.9373754262924194, -0.7577623128890991, -0.5781491994857788, -0.39853596687316895, -0.21892285346984863, -0.03930974006652832, 0.14030340313911438, 0.3199165463447571, 0.49952971935272217, 0.6791428327560425, 0.8587559461593628, 1.0383691787719727, 1.217982292175293, 1.3975954055786133, 1.5772085189819336, 1.756821632385254, 1.9364348649978638, 2.1160478591918945, 2.295660972595215, 2.4752743244171143, 2.6548874378204346, 2.834500551223755, 3.014113664627075, 3.1937267780303955, 3.373340129852295, 3.5529532432556152, 3.7325663566589355, 3.912179470062256, 4.091792583465576, 4.2714056968688965]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 5.0, 5.0, 4.0, 3.0, 9.0, 1.0, 6.0, 12.0, 12.0, 18.0, 13.0, 14.0, 25.0, 27.0, 27.0, 28.0, 36.0, 32.0, 41.0, 33.0, 38.0, 37.0, 51.0, 52.0, 40.0, 47.0, 40.0, 50.0, 41.0, 28.0, 34.0, 29.0, 22.0, 19.0, 18.0, 24.0, 18.0, 13.0, 13.0, 7.0, 7.0, 11.0, 6.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.6714460849761963, -3.5509238243103027, -3.4304018020629883, -3.3098795413970947, -3.189357280731201, -3.0688352584838867, -2.948312997817993, -2.8277907371520996, -2.707268714904785, -2.5867464542388916, -2.466224431991577, -2.3457021713256836, -2.22517991065979, -2.1046576499938965, -1.984135627746582, -1.8636133670806885, -1.743091106414795, -1.622568964958191, -1.5020467042922974, -1.3815245628356934, -1.2610023021697998, -1.1404801607131958, -1.0199580192565918, -0.899435818195343, -0.7789136171340942, -0.6583914160728455, -0.5378692150115967, -0.4173470735549927, -0.2968248724937439, -0.17630267143249512, -0.05578052997589111, 0.06474167108535767, 0.18526411056518555, 0.3057863116264343, 0.4263084828853607, 0.5468306541442871, 0.6673528552055359, 0.7878750562667847, 0.9083971977233887, 1.0289194583892822, 1.1494415998458862, 1.2699637413024902, 1.3904860019683838, 1.5110081434249878, 1.6315302848815918, 1.7520525455474854, 1.8725746870040894, 1.9930968284606934, 2.113619089126587, 2.2341413497924805, 2.354663372039795, 2.4751856327056885, 2.595707893371582, 2.7162299156188965, 2.83675217628479, 2.9572744369506836, 3.077796459197998, 3.1983187198638916, 3.318840742111206, 3.4393630027770996, 3.559885263442993, 3.6804075241088867, 3.800929546356201, 3.9214518070220947, 4.041974067687988]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 5.0, 6.0, 3.0, 8.0, 11.0, 8.0, 26.0, 30.0, 78.0, 122.0, 189.0, 389.0, 756.0, 1629.0, 3943.0, 12757.0, 64885.0, 1006183.0, 2937306.0, 136726.0, 19702.0, 5435.0, 2006.0, 966.0, 480.0, 248.0, 144.0, 82.0, 60.0, 35.0, 18.0, 15.0, 13.0, 9.0, 5.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.75, -1.683135986328125, -1.61627197265625, -1.549407958984375, -1.4825439453125, -1.415679931640625, -1.34881591796875, -1.281951904296875, -1.215087890625, -1.148223876953125, -1.08135986328125, -1.014495849609375, -0.9476318359375, -0.880767822265625, -0.81390380859375, -0.747039794921875, -0.68017578125, -0.613311767578125, -0.54644775390625, -0.479583740234375, -0.4127197265625, -0.345855712890625, -0.27899169921875, -0.212127685546875, -0.145263671875, -0.078399658203125, -0.01153564453125, 0.055328369140625, 0.1221923828125, 0.189056396484375, 0.25592041015625, 0.322784423828125, 0.3896484375, 0.456512451171875, 0.52337646484375, 0.590240478515625, 0.6571044921875, 0.723968505859375, 0.79083251953125, 0.857696533203125, 0.924560546875, 0.991424560546875, 1.05828857421875, 1.125152587890625, 1.1920166015625, 1.258880615234375, 1.32574462890625, 1.392608642578125, 1.45947265625, 1.526336669921875, 1.59320068359375, 1.660064697265625, 1.7269287109375, 1.793792724609375, 1.86065673828125, 1.927520751953125, 1.994384765625, 2.061248779296875, 2.12811279296875, 2.194976806640625, 2.2618408203125, 2.328704833984375, 2.39556884765625, 2.462432861328125, 2.529296875]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 2.0, 1.0, 8.0, 5.0, 10.0, 11.0, 14.0, 18.0, 32.0, 34.0, 31.0, 43.0, 44.0, 64.0, 67.0, 90.0, 67.0, 64.0, 66.0, 76.0, 55.0, 46.0, 33.0, 26.0, 20.0, 19.0, 15.0, 9.0, 6.0, 9.0, 6.0, 7.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.1435546875, -1.1021575927734375, -1.060760498046875, -1.0193634033203125, -0.97796630859375, -0.9365692138671875, -0.895172119140625, -0.8537750244140625, -0.8123779296875, -0.7709808349609375, -0.729583740234375, -0.6881866455078125, -0.64678955078125, -0.6053924560546875, -0.563995361328125, -0.5225982666015625, -0.481201171875, -0.4398040771484375, -0.398406982421875, -0.3570098876953125, -0.31561279296875, -0.2742156982421875, -0.232818603515625, -0.1914215087890625, -0.1500244140625, -0.1086273193359375, -0.067230224609375, -0.0258331298828125, 0.01556396484375, 0.0569610595703125, 0.098358154296875, 0.1397552490234375, 0.18115234375, 0.2225494384765625, 0.263946533203125, 0.3053436279296875, 0.34674072265625, 0.3881378173828125, 0.429534912109375, 0.4709320068359375, 0.5123291015625, 0.5537261962890625, 0.595123291015625, 0.6365203857421875, 0.67791748046875, 0.7193145751953125, 0.760711669921875, 0.8021087646484375, 0.843505859375, 0.8849029541015625, 0.926300048828125, 0.9676971435546875, 1.00909423828125, 1.0504913330078125, 1.091888427734375, 1.1332855224609375, 1.1746826171875, 1.2160797119140625, 1.257476806640625, 1.2988739013671875, 1.34027099609375, 1.3816680908203125, 1.423065185546875, 1.4644622802734375, 1.505859375]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 6.0, 3.0, 5.0, 6.0, 10.0, 9.0, 16.0, 27.0, 34.0, 54.0, 83.0, 142.0, 200.0, 392.0, 772.0, 1771.0, 5173.0, 18818.0, 108228.0, 2450300.0, 1503458.0, 82276.0, 14924.0, 4293.0, 1618.0, 708.0, 344.0, 218.0, 126.0, 85.0, 64.0, 47.0, 26.0, 15.0, 9.0, 4.0, 8.0, 9.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5400390625, -1.48681640625, -1.43359375, -1.38037109375, -1.3271484375, -1.27392578125, -1.220703125, -1.16748046875, -1.1142578125, -1.06103515625, -1.0078125, -0.95458984375, -0.9013671875, -0.84814453125, -0.794921875, -0.74169921875, -0.6884765625, -0.63525390625, -0.58203125, -0.52880859375, -0.4755859375, -0.42236328125, -0.369140625, -0.31591796875, -0.2626953125, -0.20947265625, -0.15625, -0.10302734375, -0.0498046875, 0.00341796875, 0.056640625, 0.10986328125, 0.1630859375, 0.21630859375, 0.26953125, 0.32275390625, 0.3759765625, 0.42919921875, 0.482421875, 0.53564453125, 0.5888671875, 0.64208984375, 0.6953125, 0.74853515625, 0.8017578125, 0.85498046875, 0.908203125, 0.96142578125, 1.0146484375, 1.06787109375, 1.12109375, 1.17431640625, 1.2275390625, 1.28076171875, 1.333984375, 1.38720703125, 1.4404296875, 1.49365234375, 1.546875, 1.60009765625, 1.6533203125, 1.70654296875, 1.759765625, 1.81298828125, 1.8662109375]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 7.0, 8.0, 10.0, 11.0, 8.0, 8.0, 21.0, 32.0, 32.0, 45.0, 50.0, 89.0, 90.0, 143.0, 197.0, 292.0, 432.0, 554.0, 557.0, 417.0, 296.0, 192.0, 134.0, 97.0, 72.0, 66.0, 48.0, 32.0, 26.0, 26.0, 24.0, 10.0, 17.0, 5.0, 5.0, 7.0, 4.0, 5.0, 4.0, 0.0, 2.0, 1.0, 2.0, 2.0], "bins": [-0.402099609375, -0.3914947509765625, -0.380889892578125, -0.3702850341796875, -0.35968017578125, -0.3490753173828125, -0.338470458984375, -0.3278656005859375, -0.3172607421875, -0.3066558837890625, -0.296051025390625, -0.2854461669921875, -0.27484130859375, -0.2642364501953125, -0.253631591796875, -0.2430267333984375, -0.232421875, -0.2218170166015625, -0.211212158203125, -0.2006072998046875, -0.19000244140625, -0.1793975830078125, -0.168792724609375, -0.1581878662109375, -0.1475830078125, -0.1369781494140625, -0.126373291015625, -0.1157684326171875, -0.10516357421875, -0.0945587158203125, -0.083953857421875, -0.0733489990234375, -0.062744140625, -0.0521392822265625, -0.041534423828125, -0.0309295654296875, -0.02032470703125, -0.0097198486328125, 0.000885009765625, 0.0114898681640625, 0.0220947265625, 0.0326995849609375, 0.043304443359375, 0.0539093017578125, 0.06451416015625, 0.0751190185546875, 0.085723876953125, 0.0963287353515625, 0.10693359375, 0.1175384521484375, 0.128143310546875, 0.1387481689453125, 0.14935302734375, 0.1599578857421875, 0.170562744140625, 0.1811676025390625, 0.1917724609375, 0.2023773193359375, 0.212982177734375, 0.2235870361328125, 0.23419189453125, 0.2447967529296875, 0.255401611328125, 0.2660064697265625, 0.276611328125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 5.0, 8.0, 16.0, 25.0, 47.0, 150.0, 211.0, 246.0, 141.0, 66.0, 31.0, 25.0, 10.0, 11.0, 5.0, 6.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.414216995239258, -5.285703182220459, -5.157188892364502, -5.028675079345703, -4.900161266326904, -4.7716474533081055, -4.643133163452148, -4.51461935043335, -4.386105537414551, -4.257591724395752, -4.129077434539795, -4.000563621520996, -3.8720498085021973, -3.7435357570648193, -3.6150217056274414, -3.4865078926086426, -3.3579938411712646, -3.2294797897338867, -3.100965976715088, -2.97245192527771, -2.843938112258911, -2.715424060821533, -2.5869102478027344, -2.4583961963653564, -2.3298821449279785, -2.2013680934906006, -2.0728542804718018, -1.9443402290344238, -1.815826416015625, -1.687312364578247, -1.5587984323501587, -1.4302845001220703, -1.3017704486846924, -1.173256516456604, -1.0447425842285156, -0.9162285923957825, -0.7877146601676941, -0.6592007279396057, -0.5306867361068726, -0.4021728038787842, -0.2736588716506958, -0.14514492452144623, -0.016630977392196655, 0.11188298463821411, 0.2403969168663025, 0.36891084909439087, 0.497424840927124, 0.6259387731552124, 0.7544527053833008, 0.8829666376113892, 1.0114805698394775, 1.1399946212768555, 1.2685084342956543, 1.3970224857330322, 1.5255364179611206, 1.654050350189209, 1.7825642824172974, 1.9110782146453857, 2.0395922660827637, 2.1681060791015625, 2.2966201305389404, 2.4251339435577393, 2.553647994995117, 2.682161808013916, 2.810675859451294]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 3.0, 3.0, 4.0, 6.0, 9.0, 8.0, 10.0, 18.0, 24.0, 21.0, 30.0, 28.0, 40.0, 51.0, 44.0, 58.0, 66.0, 41.0, 57.0, 57.0, 50.0, 48.0, 47.0, 56.0, 32.0, 38.0, 34.0, 21.0, 29.0, 18.0, 16.0, 10.0, 10.0, 5.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0576013326644897, -1.0165938138961792, -0.9755864143371582, -0.9345789551734924, -0.8935714960098267, -0.8525639772415161, -0.8115565180778503, -0.7705490589141846, -0.7295415997505188, -0.688534140586853, -0.6475266814231873, -0.6065192222595215, -0.5655117034912109, -0.5245043039321899, -0.4834967851638794, -0.4424893260002136, -0.40148186683654785, -0.3604744076728821, -0.3194669485092163, -0.27845945954322815, -0.23745200037956238, -0.1964445412158966, -0.15543706715106964, -0.11442959308624268, -0.0734221339225769, -0.032414667308330536, 0.008592799305915833, 0.0496002659201622, 0.09060773253440857, 0.13161519169807434, 0.1726226657629013, 0.21363013982772827, 0.25463759899139404, 0.2956450581550598, 0.3366525173187256, 0.37766000628471375, 0.4186674654483795, 0.4596749246120453, 0.5006824135780334, 0.5416898727416992, 0.582697331905365, 0.6237047910690308, 0.6647122502326965, 0.7057197093963623, 0.7467272281646729, 0.7877346277236938, 0.8287421464920044, 0.8697496056556702, 0.9107570648193359, 0.9517645239830017, 0.9927719831466675, 1.033779501914978, 1.074786901473999, 1.1157944202423096, 1.1568018198013306, 1.1978093385696411, 1.238816738128662, 1.2798242568969727, 1.3208316564559937, 1.3618391752243042, 1.4028465747833252, 1.4438540935516357, 1.4848614931106567, 1.5258690118789673, 1.5668765306472778]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 9.0, 8.0, 26.0, 22.0, 34.0, 60.0, 82.0, 146.0, 211.0, 360.0, 642.0, 1158.0, 2235.0, 5017.0, 11168.0, 28423.0, 84893.0, 305735.0, 415439.0, 126216.0, 39455.0, 14603.0, 6277.0, 2868.0, 1504.0, 784.0, 476.0, 248.0, 150.0, 111.0, 72.0, 35.0, 27.0, 21.0, 13.0, 4.0, 12.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2071533203125, -0.2002849578857422, -0.19341659545898438, -0.18654823303222656, -0.17967987060546875, -0.17281150817871094, -0.16594314575195312, -0.1590747833251953, -0.1522064208984375, -0.1453380584716797, -0.13846969604492188, -0.13160133361816406, -0.12473297119140625, -0.11786460876464844, -0.11099624633789062, -0.10412788391113281, -0.097259521484375, -0.09039115905761719, -0.08352279663085938, -0.07665443420410156, -0.06978607177734375, -0.06291770935058594, -0.056049346923828125, -0.04918098449707031, -0.0423126220703125, -0.03544425964355469, -0.028575897216796875, -0.021707534790039062, -0.01483917236328125, -0.007970809936523438, -0.001102447509765625, 0.0057659149169921875, 0.01263427734375, 0.019502639770507812, 0.026371002197265625, 0.03323936462402344, 0.04010772705078125, 0.04697608947753906, 0.053844451904296875, 0.06071281433105469, 0.0675811767578125, 0.07444953918457031, 0.08131790161132812, 0.08818626403808594, 0.09505462646484375, 0.10192298889160156, 0.10879135131835938, 0.11565971374511719, 0.122528076171875, 0.1293964385986328, 0.13626480102539062, 0.14313316345214844, 0.15000152587890625, 0.15686988830566406, 0.16373825073242188, 0.1706066131591797, 0.1774749755859375, 0.1843433380126953, 0.19121170043945312, 0.19808006286621094, 0.20494842529296875, 0.21181678771972656, 0.21868515014648438, 0.2255535125732422, 0.232421875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 3.0, 5.0, 4.0, 6.0, 2.0, 3.0, 6.0, 13.0, 6.0, 10.0, 13.0, 27.0, 42.0, 47.0, 49.0, 48.0, 59.0, 63.0, 64.0, 56.0, 56.0, 63.0, 56.0, 60.0, 49.0, 49.0, 21.0, 30.0, 22.0, 19.0, 12.0, 19.0, 2.0, 5.0, 7.0, 4.0, 4.0, 5.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.763671875, -0.7315826416015625, -0.699493408203125, -0.6674041748046875, -0.63531494140625, -0.6032257080078125, -0.571136474609375, -0.5390472412109375, -0.5069580078125, -0.4748687744140625, -0.442779541015625, -0.4106903076171875, -0.37860107421875, -0.3465118408203125, -0.314422607421875, -0.2823333740234375, -0.250244140625, -0.2181549072265625, -0.186065673828125, -0.1539764404296875, -0.12188720703125, -0.0897979736328125, -0.057708740234375, -0.0256195068359375, 0.0064697265625, 0.0385589599609375, 0.070648193359375, 0.1027374267578125, 0.13482666015625, 0.1669158935546875, 0.199005126953125, 0.2310943603515625, 0.26318359375, 0.2952728271484375, 0.327362060546875, 0.3594512939453125, 0.39154052734375, 0.4236297607421875, 0.455718994140625, 0.4878082275390625, 0.5198974609375, 0.5519866943359375, 0.584075927734375, 0.6161651611328125, 0.64825439453125, 0.6803436279296875, 0.712432861328125, 0.7445220947265625, 0.776611328125, 0.8087005615234375, 0.840789794921875, 0.8728790283203125, 0.90496826171875, 0.9370574951171875, 0.969146728515625, 1.0012359619140625, 1.0333251953125, 1.0654144287109375, 1.097503662109375, 1.1295928955078125, 1.16168212890625, 1.1937713623046875, 1.225860595703125, 1.2579498291015625, 1.2900390625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 6.0, 10.0, 4.0, 13.0, 17.0, 13.0, 19.0, 35.0, 39.0, 68.0, 82.0, 128.0, 207.0, 343.0, 688.0, 1457.0, 3916.0, 13127.0, 61639.0, 359856.0, 484996.0, 94319.0, 18370.0, 5276.0, 1993.0, 816.0, 435.0, 232.0, 129.0, 87.0, 71.0, 41.0, 29.0, 26.0, 18.0, 16.0, 4.0, 7.0, 4.0, 6.0, 5.0, 1.0, 6.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2369384765625, -0.2293262481689453, -0.22171401977539062, -0.21410179138183594, -0.20648956298828125, -0.19887733459472656, -0.19126510620117188, -0.1836528778076172, -0.1760406494140625, -0.1684284210205078, -0.16081619262695312, -0.15320396423339844, -0.14559173583984375, -0.13797950744628906, -0.13036727905273438, -0.12275505065917969, -0.115142822265625, -0.10753059387207031, -0.09991836547851562, -0.09230613708496094, -0.08469390869140625, -0.07708168029785156, -0.06946945190429688, -0.06185722351074219, -0.0542449951171875, -0.04663276672363281, -0.039020538330078125, -0.03140830993652344, -0.02379608154296875, -0.016183853149414062, -0.008571624755859375, -0.0009593963623046875, 0.00665283203125, 0.014265060424804688, 0.021877288818359375, 0.029489517211914062, 0.03710174560546875, 0.04471397399902344, 0.052326202392578125, 0.05993843078613281, 0.0675506591796875, 0.07516288757324219, 0.08277511596679688, 0.09038734436035156, 0.09799957275390625, 0.10561180114746094, 0.11322402954101562, 0.12083625793457031, 0.128448486328125, 0.1360607147216797, 0.14367294311523438, 0.15128517150878906, 0.15889739990234375, 0.16650962829589844, 0.17412185668945312, 0.1817340850830078, 0.1893463134765625, 0.1969585418701172, 0.20457077026367188, 0.21218299865722656, 0.21979522705078125, 0.22740745544433594, 0.23501968383789062, 0.2426319122314453, 0.250244140625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 7.0, 7.0, 6.0, 9.0, 11.0, 14.0, 10.0, 18.0, 17.0, 19.0, 25.0, 22.0, 21.0, 32.0, 53.0, 33.0, 40.0, 44.0, 54.0, 47.0, 60.0, 48.0, 47.0, 40.0, 34.0, 38.0, 42.0, 31.0, 25.0, 33.0, 24.0, 13.0, 18.0, 11.0, 8.0, 6.0, 13.0, 6.0, 4.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 3.0, 2.0], "bins": [-1.767578125, -1.71893310546875, -1.6702880859375, -1.62164306640625, -1.572998046875, -1.52435302734375, -1.4757080078125, -1.42706298828125, -1.37841796875, -1.32977294921875, -1.2811279296875, -1.23248291015625, -1.183837890625, -1.13519287109375, -1.0865478515625, -1.03790283203125, -0.9892578125, -0.94061279296875, -0.8919677734375, -0.84332275390625, -0.794677734375, -0.74603271484375, -0.6973876953125, -0.64874267578125, -0.60009765625, -0.55145263671875, -0.5028076171875, -0.45416259765625, -0.405517578125, -0.35687255859375, -0.3082275390625, -0.25958251953125, -0.2109375, -0.16229248046875, -0.1136474609375, -0.06500244140625, -0.016357421875, 0.03228759765625, 0.0809326171875, 0.12957763671875, 0.17822265625, 0.22686767578125, 0.2755126953125, 0.32415771484375, 0.372802734375, 0.42144775390625, 0.4700927734375, 0.51873779296875, 0.5673828125, 0.61602783203125, 0.6646728515625, 0.71331787109375, 0.761962890625, 0.81060791015625, 0.8592529296875, 0.90789794921875, 0.95654296875, 1.00518798828125, 1.0538330078125, 1.10247802734375, 1.151123046875, 1.19976806640625, 1.2484130859375, 1.29705810546875, 1.345703125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 7.0, 13.0, 10.0, 35.0, 46.0, 58.0, 130.0, 212.0, 481.0, 1153.0, 3369.0, 13475.0, 101145.0, 720448.0, 180374.0, 20403.0, 4599.0, 1388.0, 577.0, 276.0, 138.0, 77.0, 47.0, 33.0, 15.0, 15.0, 9.0, 5.0, 9.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1768798828125, -0.17229938507080078, -0.16771888732910156, -0.16313838958740234, -0.15855789184570312, -0.1539773941040039, -0.1493968963623047, -0.14481639862060547, -0.14023590087890625, -0.13565540313720703, -0.1310749053955078, -0.1264944076538086, -0.12191390991210938, -0.11733341217041016, -0.11275291442871094, -0.10817241668701172, -0.1035919189453125, -0.09901142120361328, -0.09443092346191406, -0.08985042572021484, -0.08526992797851562, -0.0806894302368164, -0.07610893249511719, -0.07152843475341797, -0.06694793701171875, -0.06236743927001953, -0.05778694152832031, -0.053206443786621094, -0.048625946044921875, -0.044045448303222656, -0.03946495056152344, -0.03488445281982422, -0.030303955078125, -0.02572345733642578, -0.021142959594726562, -0.016562461853027344, -0.011981964111328125, -0.007401466369628906, -0.0028209686279296875, 0.0017595291137695312, 0.00634002685546875, 0.010920524597167969, 0.015501022338867188, 0.020081520080566406, 0.024662017822265625, 0.029242515563964844, 0.03382301330566406, 0.03840351104736328, 0.0429840087890625, 0.04756450653076172, 0.05214500427246094, 0.056725502014160156, 0.061305999755859375, 0.0658864974975586, 0.07046699523925781, 0.07504749298095703, 0.07962799072265625, 0.08420848846435547, 0.08878898620605469, 0.0933694839477539, 0.09794998168945312, 0.10253047943115234, 0.10711097717285156, 0.11169147491455078, 0.11627197265625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 6.0, 6.0, 19.0, 25.0, 56.0, 76.0, 90.0, 136.0, 153.0, 126.0, 129.0, 54.0, 50.0, 28.0, 20.0, 13.0, 5.0, 7.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9696693420410156e-05, -3.730412572622299e-05, -3.491155803203583e-05, -3.251899033784866e-05, -3.01264226436615e-05, -2.7733854949474335e-05, -2.534128725528717e-05, -2.2948719561100006e-05, -2.0556151866912842e-05, -1.8163584172725677e-05, -1.5771016478538513e-05, -1.3378448784351349e-05, -1.0985881090164185e-05, -8.59331339597702e-06, -6.200745701789856e-06, -3.8081780076026917e-06, -1.4156103134155273e-06, 9.76957380771637e-07, 3.3695250749588013e-06, 5.7620927691459656e-06, 8.15466046333313e-06, 1.0547228157520294e-05, 1.2939795851707458e-05, 1.5332363545894623e-05, 1.7724931240081787e-05, 2.011749893426895e-05, 2.2510066628456116e-05, 2.490263432264328e-05, 2.7295202016830444e-05, 2.968776971101761e-05, 3.208033740520477e-05, 3.447290509939194e-05, 3.68654727935791e-05, 3.9258040487766266e-05, 4.165060818195343e-05, 4.4043175876140594e-05, 4.643574357032776e-05, 4.882831126451492e-05, 5.122087895870209e-05, 5.361344665288925e-05, 5.6006014347076416e-05, 5.839858204126358e-05, 6.0791149735450745e-05, 6.318371742963791e-05, 6.557628512382507e-05, 6.796885281801224e-05, 7.03614205121994e-05, 7.275398820638657e-05, 7.514655590057373e-05, 7.75391235947609e-05, 7.993169128894806e-05, 8.232425898313522e-05, 8.471682667732239e-05, 8.710939437150955e-05, 8.950196206569672e-05, 9.189452975988388e-05, 9.428709745407104e-05, 9.667966514825821e-05, 9.907223284244537e-05, 0.00010146480053663254, 0.0001038573682308197, 0.00010624993592500687, 0.00010864250361919403, 0.0001110350713133812, 0.00011342763900756836]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 13.0, 8.0, 24.0, 28.0, 37.0, 77.0, 108.0, 246.0, 609.0, 1421.0, 4764.0, 22052.0, 143379.0, 639067.0, 198711.0, 28821.0, 6109.0, 1718.0, 676.0, 310.0, 158.0, 79.0, 41.0, 32.0, 24.0, 13.0, 8.0, 9.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11334228515625, -0.10923290252685547, -0.10512351989746094, -0.1010141372680664, -0.09690475463867188, -0.09279537200927734, -0.08868598937988281, -0.08457660675048828, -0.08046722412109375, -0.07635784149169922, -0.07224845886230469, -0.06813907623291016, -0.06402969360351562, -0.059920310974121094, -0.05581092834472656, -0.05170154571533203, -0.0475921630859375, -0.04348278045654297, -0.03937339782714844, -0.035264015197753906, -0.031154632568359375, -0.027045249938964844, -0.022935867309570312, -0.01882648468017578, -0.01471710205078125, -0.010607719421386719, -0.0064983367919921875, -0.0023889541625976562, 0.001720428466796875, 0.005829811096191406, 0.009939193725585938, 0.014048576354980469, 0.018157958984375, 0.02226734161376953, 0.026376724243164062, 0.030486106872558594, 0.034595489501953125, 0.038704872131347656, 0.04281425476074219, 0.04692363739013672, 0.05103302001953125, 0.05514240264892578, 0.05925178527832031, 0.06336116790771484, 0.06747055053710938, 0.0715799331665039, 0.07568931579589844, 0.07979869842529297, 0.0839080810546875, 0.08801746368408203, 0.09212684631347656, 0.0962362289428711, 0.10034561157226562, 0.10445499420166016, 0.10856437683105469, 0.11267375946044922, 0.11678314208984375, 0.12089252471923828, 0.1250019073486328, 0.12911128997802734, 0.13322067260742188, 0.1373300552368164, 0.14143943786621094, 0.14554882049560547, 0.149658203125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 1.0, 4.0, 7.0, 6.0, 14.0, 19.0, 23.0, 33.0, 48.0, 76.0, 75.0, 98.0, 119.0, 106.0, 104.0, 72.0, 60.0, 47.0, 34.0, 22.0, 12.0, 14.0, 8.0, 3.0, 7.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.017669677734375, -0.016624927520751953, -0.015580177307128906, -0.01453542709350586, -0.013490676879882812, -0.012445926666259766, -0.011401176452636719, -0.010356426239013672, -0.009311676025390625, -0.008266925811767578, -0.007222175598144531, -0.006177425384521484, -0.0051326751708984375, -0.004087924957275391, -0.0030431747436523438, -0.001998424530029297, -0.00095367431640625, 9.107589721679688e-05, 0.0011358261108398438, 0.0021805763244628906, 0.0032253265380859375, 0.004270076751708984, 0.005314826965332031, 0.006359577178955078, 0.007404327392578125, 0.008449077606201172, 0.009493827819824219, 0.010538578033447266, 0.011583328247070312, 0.01262807846069336, 0.013672828674316406, 0.014717578887939453, 0.0157623291015625, 0.016807079315185547, 0.017851829528808594, 0.01889657974243164, 0.019941329956054688, 0.020986080169677734, 0.02203083038330078, 0.023075580596923828, 0.024120330810546875, 0.025165081024169922, 0.02620983123779297, 0.027254581451416016, 0.028299331665039062, 0.02934408187866211, 0.030388832092285156, 0.0314335823059082, 0.03247833251953125, 0.0335230827331543, 0.034567832946777344, 0.03561258316040039, 0.03665733337402344, 0.037702083587646484, 0.03874683380126953, 0.03979158401489258, 0.040836334228515625, 0.04188108444213867, 0.04292583465576172, 0.043970584869384766, 0.04501533508300781, 0.04606008529663086, 0.047104835510253906, 0.04814958572387695, 0.0491943359375]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 7.0, 16.0, 28.0, 53.0, 150.0, 262.0, 247.0, 125.0, 43.0, 30.0, 13.0, 7.0, 12.0, 6.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-4.1519951820373535, -4.057504653930664, -3.963014602661133, -3.8685240745544434, -3.774033784866333, -3.6795434951782227, -3.5850532054901123, -3.490562915802002, -3.3960726261138916, -3.3015823364257812, -3.207092046737671, -3.1126017570495605, -3.018111228942871, -2.9236209392547607, -2.8291306495666504, -2.73464035987854, -2.6401500701904297, -2.5456597805023193, -2.451169490814209, -2.3566789627075195, -2.262188673019409, -2.167698383331299, -2.0732080936431885, -1.9787178039550781, -1.8842272758483887, -1.7897369861602783, -1.6952465772628784, -1.600756287574768, -1.5062659978866577, -1.4117755889892578, -1.3172852993011475, -1.222795009613037, -1.1283048391342163, -1.033814549446106, -0.9393242001533508, -0.8448338508605957, -0.7503435611724854, -0.6558532118797302, -0.5613628625869751, -0.46687257289886475, -0.3723822236061096, -0.2778919041156769, -0.18340156972408295, -0.08891123533248901, 0.005579084157943726, 0.10006940364837646, 0.1945597529411316, 0.28905004262924194, 0.38354039192199707, 0.4780307114124298, 0.5725210309028625, 0.6670113801956177, 0.761501669883728, 0.8559920191764832, 0.9504823684692383, 1.0449726581573486, 1.139462947845459, 1.2339532375335693, 1.3284436464309692, 1.4229339361190796, 1.51742422580719, 1.6119146347045898, 1.7064049243927002, 1.8008952140808105, 1.8953856229782104]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 5.0, 8.0, 4.0, 5.0, 12.0, 18.0, 21.0, 29.0, 32.0, 37.0, 50.0, 52.0, 52.0, 70.0, 62.0, 71.0, 57.0, 62.0, 61.0, 46.0, 46.0, 35.0, 39.0, 26.0, 26.0, 20.0, 12.0, 10.0, 12.0, 3.0, 8.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.75704425573349, -0.7262541651725769, -0.6954640746116638, -0.6646739840507507, -0.6338839530944824, -0.6030938625335693, -0.5723037719726562, -0.5415136814117432, -0.5107235908508301, -0.479933500289917, -0.4491434097290039, -0.4183533489704132, -0.3875632584095001, -0.35677316784858704, -0.32598310708999634, -0.29519301652908325, -0.26440292596817017, -0.23361283540725708, -0.2028227597475052, -0.1720326840877533, -0.1412425935268402, -0.11045250296592712, -0.07966242730617523, -0.04887235164642334, -0.018082261085510254, 0.012707822024822235, 0.043497905135154724, 0.07428798824548721, 0.1050780713558197, 0.1358681619167328, 0.16665823757648468, 0.19744831323623657, 0.22823834419250488, 0.25902843475341797, 0.28981852531433105, 0.32060858607292175, 0.35139867663383484, 0.3821887671947479, 0.4129788279533386, 0.4437689185142517, 0.4745590090751648, 0.5053490996360779, 0.536139190196991, 0.566929280757904, 0.5977193117141724, 0.6285094022750854, 0.6592994928359985, 0.6900895833969116, 0.7208796739578247, 0.7516697645187378, 0.7824598550796509, 0.813249945640564, 0.844040036201477, 0.8748301267623901, 0.9056201577186584, 0.9364102482795715, 0.9672003388404846, 0.9979904294013977, 1.028780460357666, 1.059570550918579, 1.0903606414794922, 1.1211507320404053, 1.1519408226013184, 1.1827309131622314, 1.2135210037231445]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 7.0, 17.0, 21.0, 26.0, 26.0, 48.0, 64.0, 151.0, 205.0, 377.0, 677.0, 1268.0, 2683.0, 6337.0, 17433.0, 65289.0, 424713.0, 433118.0, 66522.0, 17692.0, 6286.0, 2674.0, 1308.0, 607.0, 394.0, 224.0, 135.0, 94.0, 53.0, 33.0, 32.0, 13.0, 11.0, 5.0, 8.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.68505859375, -0.6587142944335938, -0.6323699951171875, -0.6060256958007812, -0.579681396484375, -0.5533370971679688, -0.5269927978515625, -0.5006484985351562, -0.47430419921875, -0.44795989990234375, -0.4216156005859375, -0.39527130126953125, -0.368927001953125, -0.34258270263671875, -0.3162384033203125, -0.28989410400390625, -0.2635498046875, -0.23720550537109375, -0.2108612060546875, -0.18451690673828125, -0.158172607421875, -0.13182830810546875, -0.1054840087890625, -0.07913970947265625, -0.05279541015625, -0.02645111083984375, -0.0001068115234375, 0.02623748779296875, 0.052581787109375, 0.07892608642578125, 0.1052703857421875, 0.13161468505859375, 0.157958984375, 0.18430328369140625, 0.2106475830078125, 0.23699188232421875, 0.263336181640625, 0.28968048095703125, 0.3160247802734375, 0.34236907958984375, 0.36871337890625, 0.39505767822265625, 0.4214019775390625, 0.44774627685546875, 0.474090576171875, 0.5004348754882812, 0.5267791748046875, 0.5531234741210938, 0.5794677734375, 0.6058120727539062, 0.6321563720703125, 0.6585006713867188, 0.684844970703125, 0.7111892700195312, 0.7375335693359375, 0.7638778686523438, 0.79022216796875, 0.8165664672851562, 0.8429107666015625, 0.8692550659179688, 0.895599365234375, 0.9219436645507812, 0.9482879638671875, 0.9746322631835938, 1.0009765625]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 4.0, 4.0, 1.0, 7.0, 4.0, 9.0, 12.0, 17.0, 20.0, 18.0, 36.0, 42.0, 40.0, 54.0, 64.0, 60.0, 63.0, 68.0, 82.0, 66.0, 55.0, 51.0, 52.0, 40.0, 39.0, 23.0, 21.0, 15.0, 10.0, 7.0, 7.0, 2.0, 5.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8671875, -1.79437255859375, -1.7215576171875, -1.64874267578125, -1.575927734375, -1.50311279296875, -1.4302978515625, -1.35748291015625, -1.28466796875, -1.21185302734375, -1.1390380859375, -1.06622314453125, -0.993408203125, -0.92059326171875, -0.8477783203125, -0.77496337890625, -0.7021484375, -0.62933349609375, -0.5565185546875, -0.48370361328125, -0.410888671875, -0.33807373046875, -0.2652587890625, -0.19244384765625, -0.11962890625, -0.04681396484375, 0.0260009765625, 0.09881591796875, 0.171630859375, 0.24444580078125, 0.3172607421875, 0.39007568359375, 0.462890625, 0.53570556640625, 0.6085205078125, 0.68133544921875, 0.754150390625, 0.82696533203125, 0.8997802734375, 0.97259521484375, 1.04541015625, 1.11822509765625, 1.1910400390625, 1.26385498046875, 1.336669921875, 1.40948486328125, 1.4822998046875, 1.55511474609375, 1.6279296875, 1.70074462890625, 1.7735595703125, 1.84637451171875, 1.919189453125, 1.99200439453125, 2.0648193359375, 2.13763427734375, 2.21044921875, 2.28326416015625, 2.3560791015625, 2.42889404296875, 2.501708984375, 2.57452392578125, 2.6473388671875, 2.72015380859375, 2.79296875]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 5.0, 4.0, 7.0, 12.0, 10.0, 12.0, 15.0, 18.0, 18.0, 34.0, 41.0, 56.0, 83.0, 160.0, 228.0, 377.0, 693.0, 1634.0, 5607.0, 31382.0, 454905.0, 509717.0, 34290.0, 5884.0, 1592.0, 706.0, 370.0, 223.0, 136.0, 92.0, 57.0, 59.0, 33.0, 23.0, 15.0, 17.0, 11.0, 11.0, 4.0, 8.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.041015625, -1.0084991455078125, -0.975982666015625, -0.9434661865234375, -0.91094970703125, -0.8784332275390625, -0.845916748046875, -0.8134002685546875, -0.7808837890625, -0.7483673095703125, -0.715850830078125, -0.6833343505859375, -0.65081787109375, -0.6183013916015625, -0.585784912109375, -0.5532684326171875, -0.520751953125, -0.4882354736328125, -0.455718994140625, -0.4232025146484375, -0.39068603515625, -0.3581695556640625, -0.325653076171875, -0.2931365966796875, -0.2606201171875, -0.2281036376953125, -0.195587158203125, -0.1630706787109375, -0.13055419921875, -0.0980377197265625, -0.065521240234375, -0.0330047607421875, -0.00048828125, 0.0320281982421875, 0.064544677734375, 0.0970611572265625, 0.12957763671875, 0.1620941162109375, 0.194610595703125, 0.2271270751953125, 0.2596435546875, 0.2921600341796875, 0.324676513671875, 0.3571929931640625, 0.38970947265625, 0.4222259521484375, 0.454742431640625, 0.4872589111328125, 0.519775390625, 0.5522918701171875, 0.584808349609375, 0.6173248291015625, 0.64984130859375, 0.6823577880859375, 0.714874267578125, 0.7473907470703125, 0.7799072265625, 0.8124237060546875, 0.844940185546875, 0.8774566650390625, 0.90997314453125, 0.9424896240234375, 0.975006103515625, 1.0075225830078125, 1.0400390625]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 5.0, 2.0, 8.0, 16.0, 9.0, 19.0, 24.0, 20.0, 18.0, 23.0, 23.0, 31.0, 31.0, 47.0, 32.0, 55.0, 60.0, 60.0, 48.0, 43.0, 41.0, 37.0, 40.0, 38.0, 47.0, 34.0, 30.0, 16.0, 25.0, 17.0, 22.0, 18.0, 5.0, 16.0, 9.0, 6.0, 9.0, 6.0, 4.0, 3.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0078125, -1.94097900390625, -1.8741455078125, -1.80731201171875, -1.740478515625, -1.67364501953125, -1.6068115234375, -1.53997802734375, -1.47314453125, -1.40631103515625, -1.3394775390625, -1.27264404296875, -1.205810546875, -1.13897705078125, -1.0721435546875, -1.00531005859375, -0.9384765625, -0.87164306640625, -0.8048095703125, -0.73797607421875, -0.671142578125, -0.60430908203125, -0.5374755859375, -0.47064208984375, -0.40380859375, -0.33697509765625, -0.2701416015625, -0.20330810546875, -0.136474609375, -0.06964111328125, -0.0028076171875, 0.06402587890625, 0.130859375, 0.19769287109375, 0.2645263671875, 0.33135986328125, 0.398193359375, 0.46502685546875, 0.5318603515625, 0.59869384765625, 0.66552734375, 0.73236083984375, 0.7991943359375, 0.86602783203125, 0.932861328125, 0.99969482421875, 1.0665283203125, 1.13336181640625, 1.2001953125, 1.26702880859375, 1.3338623046875, 1.40069580078125, 1.467529296875, 1.53436279296875, 1.6011962890625, 1.66802978515625, 1.73486328125, 1.80169677734375, 1.8685302734375, 1.93536376953125, 2.002197265625, 2.06903076171875, 2.1358642578125, 2.20269775390625, 2.26953125]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 9.0, 8.0, 7.0, 16.0, 18.0, 30.0, 42.0, 63.0, 87.0, 145.0, 265.0, 439.0, 888.0, 1994.0, 5998.0, 26378.0, 176667.0, 703228.0, 106981.0, 17590.0, 4336.0, 1642.0, 725.0, 399.0, 178.0, 136.0, 86.0, 57.0, 44.0, 20.0, 28.0, 17.0, 7.0, 8.0, 6.0, 5.0, 0.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.287841796875, -0.2776985168457031, -0.26755523681640625, -0.2574119567871094, -0.2472686767578125, -0.23712539672851562, -0.22698211669921875, -0.21683883666992188, -0.206695556640625, -0.19655227661132812, -0.18640899658203125, -0.17626571655273438, -0.1661224365234375, -0.15597915649414062, -0.14583587646484375, -0.13569259643554688, -0.12554931640625, -0.11540603637695312, -0.10526275634765625, -0.09511947631835938, -0.0849761962890625, -0.07483291625976562, -0.06468963623046875, -0.054546356201171875, -0.044403076171875, -0.034259796142578125, -0.02411651611328125, -0.013973236083984375, -0.0038299560546875, 0.006313323974609375, 0.01645660400390625, 0.026599884033203125, 0.0367431640625, 0.046886444091796875, 0.05702972412109375, 0.06717300415039062, 0.0773162841796875, 0.08745956420898438, 0.09760284423828125, 0.10774612426757812, 0.117889404296875, 0.12803268432617188, 0.13817596435546875, 0.14831924438476562, 0.1584625244140625, 0.16860580444335938, 0.17874908447265625, 0.18889236450195312, 0.19903564453125, 0.20917892456054688, 0.21932220458984375, 0.22946548461914062, 0.2396087646484375, 0.24975204467773438, 0.25989532470703125, 0.2700386047363281, 0.280181884765625, 0.2903251647949219, 0.30046844482421875, 0.3106117248535156, 0.3207550048828125, 0.3308982849121094, 0.34104156494140625, 0.3511848449707031, 0.361328125]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 8.0, 7.0, 8.0, 12.0, 21.0, 21.0, 42.0, 75.0, 78.0, 169.0, 239.0, 118.0, 58.0, 51.0, 30.0, 29.0, 13.0, 7.0, 7.0, 5.0, 4.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.00010657310485839844, -0.00010426435619592667, -0.0001019556075334549, -9.964685887098312e-05, -9.733811020851135e-05, -9.502936154603958e-05, -9.272061288356781e-05, -9.041186422109604e-05, -8.810311555862427e-05, -8.57943668961525e-05, -8.348561823368073e-05, -8.117686957120895e-05, -7.886812090873718e-05, -7.655937224626541e-05, -7.425062358379364e-05, -7.194187492132187e-05, -6.96331262588501e-05, -6.732437759637833e-05, -6.501562893390656e-05, -6.270688027143478e-05, -6.039813160896301e-05, -5.808938294649124e-05, -5.578063428401947e-05, -5.34718856215477e-05, -5.116313695907593e-05, -4.8854388296604156e-05, -4.6545639634132385e-05, -4.4236890971660614e-05, -4.192814230918884e-05, -3.961939364671707e-05, -3.73106449842453e-05, -3.500189632177353e-05, -3.269314765930176e-05, -3.0384398996829987e-05, -2.8075650334358215e-05, -2.5766901671886444e-05, -2.3458153009414673e-05, -2.11494043469429e-05, -1.884065568447113e-05, -1.653190702199936e-05, -1.4223158359527588e-05, -1.1914409697055817e-05, -9.605661034584045e-06, -7.296912372112274e-06, -4.988163709640503e-06, -2.6794150471687317e-06, -3.7066638469696045e-07, 1.938082277774811e-06, 4.246830940246582e-06, 6.555579602718353e-06, 8.864328265190125e-06, 1.1173076927661896e-05, 1.3481825590133667e-05, 1.5790574252605438e-05, 1.809932291507721e-05, 2.040807157754898e-05, 2.2716820240020752e-05, 2.5025568902492523e-05, 2.7334317564964294e-05, 2.9643066227436066e-05, 3.195181488990784e-05, 3.426056355237961e-05, 3.656931221485138e-05, 3.887806087732315e-05, 4.118680953979492e-05]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 4.0, 3.0, 2.0, 9.0, 10.0, 24.0, 25.0, 30.0, 57.0, 67.0, 106.0, 156.0, 268.0, 432.0, 765.0, 1401.0, 2792.0, 6349.0, 16972.0, 58540.0, 267817.0, 558526.0, 93499.0, 24528.0, 8619.0, 3573.0, 1675.0, 904.0, 486.0, 323.0, 187.0, 125.0, 75.0, 66.0, 32.0, 30.0, 19.0, 18.0, 18.0, 7.0, 2.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.271728515625, -0.2637748718261719, -0.25582122802734375, -0.24786758422851562, -0.2399139404296875, -0.23196029663085938, -0.22400665283203125, -0.21605300903320312, -0.208099365234375, -0.20014572143554688, -0.19219207763671875, -0.18423843383789062, -0.1762847900390625, -0.16833114624023438, -0.16037750244140625, -0.15242385864257812, -0.14447021484375, -0.13651657104492188, -0.12856292724609375, -0.12060928344726562, -0.1126556396484375, -0.10470199584960938, -0.09674835205078125, -0.08879470825195312, -0.080841064453125, -0.07288742065429688, -0.06493377685546875, -0.056980133056640625, -0.0490264892578125, -0.041072845458984375, -0.03311920166015625, -0.025165557861328125, -0.0172119140625, -0.009258270263671875, -0.00130462646484375, 0.006649017333984375, 0.0146026611328125, 0.022556304931640625, 0.03050994873046875, 0.038463592529296875, 0.046417236328125, 0.054370880126953125, 0.06232452392578125, 0.07027816772460938, 0.0782318115234375, 0.08618545532226562, 0.09413909912109375, 0.10209274291992188, 0.11004638671875, 0.11800003051757812, 0.12595367431640625, 0.13390731811523438, 0.1418609619140625, 0.14981460571289062, 0.15776824951171875, 0.16572189331054688, 0.173675537109375, 0.18162918090820312, 0.18958282470703125, 0.19753646850585938, 0.2054901123046875, 0.21344375610351562, 0.22139739990234375, 0.22935104370117188, 0.2373046875]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 6.0, 6.0, 8.0, 6.0, 6.0, 19.0, 22.0, 16.0, 15.0, 21.0, 27.0, 33.0, 43.0, 50.0, 73.0, 103.0, 144.0, 84.0, 64.0, 47.0, 29.0, 34.0, 28.0, 18.0, 22.0, 12.0, 9.0, 18.0, 10.0, 8.0, 4.0, 6.0, 2.0, 7.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10382080078125, -0.10013675689697266, -0.09645271301269531, -0.09276866912841797, -0.08908462524414062, -0.08540058135986328, -0.08171653747558594, -0.0780324935913086, -0.07434844970703125, -0.0706644058227539, -0.06698036193847656, -0.06329631805419922, -0.059612274169921875, -0.05592823028564453, -0.05224418640136719, -0.048560142517089844, -0.0448760986328125, -0.041192054748535156, -0.03750801086425781, -0.03382396697998047, -0.030139923095703125, -0.02645587921142578, -0.022771835327148438, -0.019087791442871094, -0.01540374755859375, -0.011719703674316406, -0.008035659790039062, -0.004351615905761719, -0.000667572021484375, 0.0030164718627929688, 0.0067005157470703125, 0.010384559631347656, 0.014068603515625, 0.017752647399902344, 0.021436691284179688, 0.02512073516845703, 0.028804779052734375, 0.03248882293701172, 0.03617286682128906, 0.039856910705566406, 0.04354095458984375, 0.047224998474121094, 0.05090904235839844, 0.05459308624267578, 0.058277130126953125, 0.06196117401123047, 0.06564521789550781, 0.06932926177978516, 0.0730133056640625, 0.07669734954833984, 0.08038139343261719, 0.08406543731689453, 0.08774948120117188, 0.09143352508544922, 0.09511756896972656, 0.0988016128540039, 0.10248565673828125, 0.1061697006225586, 0.10985374450683594, 0.11353778839111328, 0.11722183227539062, 0.12090587615966797, 0.12458992004394531, 0.12827396392822266, 0.1319580078125]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 16.0, 19.0, 85.0, 193.0, 333.0, 209.0, 76.0, 26.0, 15.0, 12.0, 8.0, 6.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.60097074508667, -7.3677473068237305, -7.134523868560791, -6.901300430297852, -6.668076992034912, -6.434853553771973, -6.201630592346191, -5.968406677246094, -5.7351837158203125, -5.501960277557373, -5.268736839294434, -5.035513401031494, -4.802289962768555, -4.569066524505615, -4.335843086242676, -4.1026201248168945, -3.869396209716797, -3.6361727714538574, -3.402949333190918, -3.1697258949279785, -2.936502456665039, -2.7032790184020996, -2.4700558185577393, -2.2368323802948, -2.0036089420318604, -1.770385503768921, -1.5371620655059814, -1.3039387464523315, -1.070715308189392, -0.8374918699264526, -0.6042685508728027, -0.3710451126098633, -0.13782167434692383, 0.09540173411369324, 0.3286251425743103, 0.561848521232605, 0.7950719594955444, 1.0282953977584839, 1.2615187168121338, 1.4947421550750732, 1.7279655933380127, 1.9611890316009521, 2.1944124698638916, 2.427635669708252, 2.6608591079711914, 2.894082546234131, 3.1273059844970703, 3.3605294227600098, 3.593752861022949, 3.8269762992858887, 4.060199737548828, 4.293423175811768, 4.526646614074707, 4.7598700523376465, 4.993093490600586, 5.226316452026367, 5.459540367126465, 5.692763805389404, 5.925987243652344, 6.159210681915283, 6.392434120178223, 6.625657558441162, 6.858880996704102, 7.092103958129883, 7.325327396392822]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 3.0, 1.0, 6.0, 2.0, 7.0, 8.0, 13.0, 9.0, 13.0, 16.0, 22.0, 21.0, 14.0, 21.0, 26.0, 38.0, 39.0, 38.0, 41.0, 25.0, 52.0, 33.0, 39.0, 49.0, 43.0, 53.0, 38.0, 38.0, 38.0, 30.0, 27.0, 35.0, 21.0, 22.0, 20.0, 25.0, 19.0, 12.0, 8.0, 6.0, 6.0, 6.0, 6.0, 9.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.5884580612182617, -3.4799041748046875, -3.371350049972534, -3.26279616355896, -3.1542420387268066, -3.0456881523132324, -2.937134265899658, -2.828580379486084, -2.7200262546539307, -2.6114723682403564, -2.502918243408203, -2.394364356994629, -2.2858104705810547, -2.1772563457489014, -2.068702459335327, -1.9601484537124634, -1.8515944480895996, -1.7430404424667358, -1.634486436843872, -1.5259325504302979, -1.417378544807434, -1.3088245391845703, -1.200270652770996, -1.0917166471481323, -0.9831626415252686, -0.8746086359024048, -0.7660546898841858, -0.6575007438659668, -0.548946738243103, -0.44039273262023926, -0.33183878660202026, -0.22328484058380127, -0.1147305965423584, -0.006176620721817017, 0.10237735509872437, 0.21093133091926575, 0.31948530673980713, 0.4280393123626709, 0.5365932583808899, 0.6451472043991089, 0.7537012100219727, 0.8622552156448364, 0.9708091616630554, 1.0793631076812744, 1.1879171133041382, 1.296471118927002, 1.4050250053405762, 1.51357901096344, 1.6221330165863037, 1.7306870222091675, 1.8392410278320312, 1.9477949142456055, 2.0563488006591797, 2.164902925491333, 2.2734568119049072, 2.3820109367370605, 2.4905648231506348, 2.599118709564209, 2.7076728343963623, 2.8162267208099365, 2.92478084564209, 3.033334732055664, 3.1418886184692383, 3.2504425048828125, 3.358996629714966]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 8.0, 7.0, 8.0, 9.0, 8.0, 21.0, 19.0, 33.0, 61.0, 56.0, 87.0, 156.0, 205.0, 350.0, 538.0, 1013.0, 2205.0, 5587.0, 17494.0, 74599.0, 688908.0, 3068684.0, 275081.0, 40637.0, 10649.0, 3918.0, 1686.0, 890.0, 502.0, 276.0, 189.0, 120.0, 83.0, 70.0, 33.0, 24.0, 22.0, 15.0, 13.0, 7.0, 5.0, 2.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-1.765625, -1.712646484375, -1.65966796875, -1.606689453125, -1.5537109375, -1.500732421875, -1.44775390625, -1.394775390625, -1.341796875, -1.288818359375, -1.23583984375, -1.182861328125, -1.1298828125, -1.076904296875, -1.02392578125, -0.970947265625, -0.91796875, -0.864990234375, -0.81201171875, -0.759033203125, -0.7060546875, -0.653076171875, -0.60009765625, -0.547119140625, -0.494140625, -0.441162109375, -0.38818359375, -0.335205078125, -0.2822265625, -0.229248046875, -0.17626953125, -0.123291015625, -0.0703125, -0.017333984375, 0.03564453125, 0.088623046875, 0.1416015625, 0.194580078125, 0.24755859375, 0.300537109375, 0.353515625, 0.406494140625, 0.45947265625, 0.512451171875, 0.5654296875, 0.618408203125, 0.67138671875, 0.724365234375, 0.77734375, 0.830322265625, 0.88330078125, 0.936279296875, 0.9892578125, 1.042236328125, 1.09521484375, 1.148193359375, 1.201171875, 1.254150390625, 1.30712890625, 1.360107421875, 1.4130859375, 1.466064453125, 1.51904296875, 1.572021484375, 1.625]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 3.0, 7.0, 5.0, 14.0, 9.0, 16.0, 23.0, 26.0, 33.0, 38.0, 52.0, 66.0, 79.0, 76.0, 92.0, 83.0, 70.0, 61.0, 56.0, 42.0, 42.0, 26.0, 16.0, 13.0, 10.0, 7.0, 6.0, 15.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.146484375, -1.104827880859375, -1.06317138671875, -1.021514892578125, -0.9798583984375, -0.938201904296875, -0.89654541015625, -0.854888916015625, -0.813232421875, -0.771575927734375, -0.72991943359375, -0.688262939453125, -0.6466064453125, -0.604949951171875, -0.56329345703125, -0.521636962890625, -0.47998046875, -0.438323974609375, -0.39666748046875, -0.355010986328125, -0.3133544921875, -0.271697998046875, -0.23004150390625, -0.188385009765625, -0.146728515625, -0.105072021484375, -0.06341552734375, -0.021759033203125, 0.0198974609375, 0.061553955078125, 0.10321044921875, 0.144866943359375, 0.1865234375, 0.228179931640625, 0.26983642578125, 0.311492919921875, 0.3531494140625, 0.394805908203125, 0.43646240234375, 0.478118896484375, 0.519775390625, 0.561431884765625, 0.60308837890625, 0.644744873046875, 0.6864013671875, 0.728057861328125, 0.76971435546875, 0.811370849609375, 0.85302734375, 0.894683837890625, 0.93634033203125, 0.977996826171875, 1.0196533203125, 1.061309814453125, 1.10296630859375, 1.144622802734375, 1.186279296875, 1.227935791015625, 1.26959228515625, 1.311248779296875, 1.3529052734375, 1.394561767578125, 1.43621826171875, 1.477874755859375, 1.51953125]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 3.0, 6.0, 7.0, 9.0, 17.0, 21.0, 27.0, 59.0, 84.0, 149.0, 305.0, 616.0, 1485.0, 5291.0, 28453.0, 529804.0, 3524906.0, 87749.0, 10743.0, 2652.0, 951.0, 426.0, 222.0, 106.0, 64.0, 22.0, 28.0, 24.0, 16.0, 11.0, 9.0, 10.0, 5.0, 6.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.265625, -2.188140869140625, -2.11065673828125, -2.033172607421875, -1.9556884765625, -1.878204345703125, -1.80072021484375, -1.723236083984375, -1.645751953125, -1.568267822265625, -1.49078369140625, -1.413299560546875, -1.3358154296875, -1.258331298828125, -1.18084716796875, -1.103363037109375, -1.02587890625, -0.948394775390625, -0.87091064453125, -0.793426513671875, -0.7159423828125, -0.638458251953125, -0.56097412109375, -0.483489990234375, -0.406005859375, -0.328521728515625, -0.25103759765625, -0.173553466796875, -0.0960693359375, -0.018585205078125, 0.05889892578125, 0.136383056640625, 0.2138671875, 0.291351318359375, 0.36883544921875, 0.446319580078125, 0.5238037109375, 0.601287841796875, 0.67877197265625, 0.756256103515625, 0.833740234375, 0.911224365234375, 0.98870849609375, 1.066192626953125, 1.1436767578125, 1.221160888671875, 1.29864501953125, 1.376129150390625, 1.45361328125, 1.531097412109375, 1.60858154296875, 1.686065673828125, 1.7635498046875, 1.841033935546875, 1.91851806640625, 1.996002197265625, 2.073486328125, 2.150970458984375, 2.22845458984375, 2.305938720703125, 2.3834228515625, 2.460906982421875, 2.53839111328125, 2.615875244140625, 2.693359375]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 7.0, 5.0, 13.0, 6.0, 22.0, 31.0, 33.0, 51.0, 77.0, 118.0, 170.0, 274.0, 508.0, 805.0, 723.0, 445.0, 253.0, 180.0, 118.0, 61.0, 51.0, 34.0, 23.0, 17.0, 16.0, 8.0, 6.0, 2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.59912109375, -0.5836982727050781, -0.5682754516601562, -0.5528526306152344, -0.5374298095703125, -0.5220069885253906, -0.5065841674804688, -0.4911613464355469, -0.475738525390625, -0.4603157043457031, -0.44489288330078125, -0.4294700622558594, -0.4140472412109375, -0.3986244201660156, -0.38320159912109375, -0.3677787780761719, -0.35235595703125, -0.3369331359863281, -0.32151031494140625, -0.3060874938964844, -0.2906646728515625, -0.2752418518066406, -0.25981903076171875, -0.24439620971679688, -0.228973388671875, -0.21355056762695312, -0.19812774658203125, -0.18270492553710938, -0.1672821044921875, -0.15185928344726562, -0.13643646240234375, -0.12101364135742188, -0.1055908203125, -0.09016799926757812, -0.07474517822265625, -0.059322357177734375, -0.0438995361328125, -0.028476715087890625, -0.01305389404296875, 0.002368927001953125, 0.017791748046875, 0.033214569091796875, 0.04863739013671875, 0.06406021118164062, 0.0794830322265625, 0.09490585327148438, 0.11032867431640625, 0.12575149536132812, 0.14117431640625, 0.15659713745117188, 0.17201995849609375, 0.18744277954101562, 0.2028656005859375, 0.21828842163085938, 0.23371124267578125, 0.24913406372070312, 0.264556884765625, 0.2799797058105469, 0.29540252685546875, 0.3108253479003906, 0.3262481689453125, 0.3416709899902344, 0.35709381103515625, 0.3725166320800781, 0.387939453125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 5.0, 5.0, 14.0, 14.0, 35.0, 78.0, 159.0, 210.0, 189.0, 129.0, 63.0, 41.0, 32.0, 10.0, 11.0, 2.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.754863262176514, -4.636016368865967, -4.517168998718262, -4.398322105407715, -4.279475212097168, -4.160628318786621, -4.041780948638916, -3.922934055328369, -3.8040871620178223, -3.6852400302886963, -3.5663931369781494, -3.4475460052490234, -3.3286991119384766, -3.2098519802093506, -3.0910050868988037, -2.9721579551696777, -2.853311061859131, -2.734463930130005, -2.615617036819458, -2.496769905090332, -2.377923011779785, -2.259075880050659, -2.1402289867401123, -2.0213818550109863, -1.9025347232818604, -1.783687710762024, -1.6648406982421875, -1.545993685722351, -1.4271466732025146, -1.3082995414733887, -1.1894526481628418, -1.0706055164337158, -0.951758623123169, -0.8329116106033325, -0.7140645980834961, -0.5952175855636597, -0.47637054324150085, -0.35752350091934204, -0.23867648839950562, -0.11982947587966919, -0.0009824633598327637, 0.11786455661058426, 0.23671157658100128, 0.3555586040019989, 0.4744056165218353, 0.5932526588439941, 0.7120996713638306, 0.830946683883667, 0.9497936964035034, 1.0686407089233398, 1.1874877214431763, 1.3063347339630127, 1.4251817464828491, 1.5440287590026855, 1.6628758907318115, 1.7817227840423584, 1.9005699157714844, 2.0194170475006104, 2.1382639408111572, 2.257111072540283, 2.37595796585083, 2.494805097579956, 2.613651990890503, 2.732499122619629, 2.851346015930176]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 6.0, 3.0, 3.0, 13.0, 8.0, 10.0, 13.0, 16.0, 20.0, 29.0, 26.0, 33.0, 38.0, 44.0, 46.0, 53.0, 42.0, 37.0, 57.0, 49.0, 43.0, 44.0, 42.0, 47.0, 54.0, 41.0, 39.0, 32.0, 26.0, 14.0, 14.0, 11.0, 13.0, 13.0, 5.0, 5.0, 1.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9125967621803284, -0.8759400844573975, -0.8392834067344666, -0.8026267290115356, -0.76596999168396, -0.7293133735656738, -0.6926566362380981, -0.6559999585151672, -0.6193432807922363, -0.5826866030693054, -0.5460299253463745, -0.5093732476234436, -0.4727165400981903, -0.4360598623752594, -0.3994031548500061, -0.3627464771270752, -0.3260897994041443, -0.2894331216812134, -0.25277644395828247, -0.21611973643302917, -0.17946305871009827, -0.14280638098716736, -0.10614968836307526, -0.06949299573898315, -0.032836318016052246, 0.003820367157459259, 0.040477052330970764, 0.07713373750448227, 0.11379042267799377, 0.15044710040092468, 0.18710379302501678, 0.2237604856491089, 0.260417103767395, 0.2970737814903259, 0.33373045921325684, 0.37038716673851013, 0.40704384446144104, 0.44370052218437195, 0.48035722970962524, 0.5170139074325562, 0.5536705851554871, 0.590327262878418, 0.6269839406013489, 0.6636406183242798, 0.7002973556518555, 0.7369539737701416, 0.7736107110977173, 0.8102673888206482, 0.8469240665435791, 0.88358074426651, 0.9202374219894409, 0.9568940997123718, 0.9935507774353027, 1.0302075147628784, 1.0668641328811646, 1.1035208702087402, 1.1401774883270264, 1.176834225654602, 1.2134908437728882, 1.2501475811004639, 1.28680419921875, 1.3234609365463257, 1.3601175546646118, 1.3967742919921875, 1.4334310293197632]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 4.0, 6.0, 4.0, 14.0, 12.0, 15.0, 22.0, 38.0, 49.0, 91.0, 136.0, 198.0, 335.0, 551.0, 1116.0, 2105.0, 4432.0, 10464.0, 39698.0, 401206.0, 514172.0, 51878.0, 11791.0, 4915.0, 2402.0, 1206.0, 674.0, 369.0, 247.0, 128.0, 108.0, 42.0, 40.0, 26.0, 20.0, 7.0, 11.0, 5.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.400634765625, -0.388519287109375, -0.37640380859375, -0.364288330078125, -0.3521728515625, -0.340057373046875, -0.32794189453125, -0.315826416015625, -0.3037109375, -0.291595458984375, -0.27947998046875, -0.267364501953125, -0.2552490234375, -0.243133544921875, -0.23101806640625, -0.218902587890625, -0.206787109375, -0.194671630859375, -0.18255615234375, -0.170440673828125, -0.1583251953125, -0.146209716796875, -0.13409423828125, -0.121978759765625, -0.10986328125, -0.097747802734375, -0.08563232421875, -0.073516845703125, -0.0614013671875, -0.049285888671875, -0.03717041015625, -0.025054931640625, -0.012939453125, -0.000823974609375, 0.01129150390625, 0.023406982421875, 0.0355224609375, 0.047637939453125, 0.05975341796875, 0.071868896484375, 0.083984375, 0.096099853515625, 0.10821533203125, 0.120330810546875, 0.1324462890625, 0.144561767578125, 0.15667724609375, 0.168792724609375, 0.180908203125, 0.193023681640625, 0.20513916015625, 0.217254638671875, 0.2293701171875, 0.241485595703125, 0.25360107421875, 0.265716552734375, 0.27783203125, 0.289947509765625, 0.30206298828125, 0.314178466796875, 0.3262939453125, 0.338409423828125, 0.35052490234375, 0.362640380859375, 0.374755859375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 4.0, 4.0, 11.0, 9.0, 8.0, 19.0, 23.0, 19.0, 25.0, 31.0, 38.0, 46.0, 66.0, 57.0, 67.0, 55.0, 64.0, 55.0, 58.0, 60.0, 58.0, 45.0, 43.0, 32.0, 26.0, 15.0, 14.0, 11.0, 6.0, 9.0, 8.0, 3.0, 3.0, 4.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.72216796875, -0.6925125122070312, -0.6628570556640625, -0.6332015991210938, -0.603546142578125, -0.5738906860351562, -0.5442352294921875, -0.5145797729492188, -0.48492431640625, -0.45526885986328125, -0.4256134033203125, -0.39595794677734375, -0.366302490234375, -0.33664703369140625, -0.3069915771484375, -0.27733612060546875, -0.2476806640625, -0.21802520751953125, -0.1883697509765625, -0.15871429443359375, -0.129058837890625, -0.09940338134765625, -0.0697479248046875, -0.04009246826171875, -0.01043701171875, 0.01921844482421875, 0.0488739013671875, 0.07852935791015625, 0.108184814453125, 0.13784027099609375, 0.1674957275390625, 0.19715118408203125, 0.226806640625, 0.25646209716796875, 0.2861175537109375, 0.31577301025390625, 0.345428466796875, 0.37508392333984375, 0.4047393798828125, 0.43439483642578125, 0.46405029296875, 0.49370574951171875, 0.5233612060546875, 0.5530166625976562, 0.582672119140625, 0.6123275756835938, 0.6419830322265625, 0.6716384887695312, 0.7012939453125, 0.7309494018554688, 0.7606048583984375, 0.7902603149414062, 0.819915771484375, 0.8495712280273438, 0.8792266845703125, 0.9088821411132812, 0.93853759765625, 0.9681930541992188, 0.9978485107421875, 1.0275039672851562, 1.057159423828125, 1.0868148803710938, 1.1164703369140625, 1.1461257934570312, 1.17578125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 8.0, 6.0, 6.0, 9.0, 15.0, 22.0, 19.0, 37.0, 68.0, 91.0, 146.0, 266.0, 489.0, 903.0, 2073.0, 4641.0, 13488.0, 121793.0, 782627.0, 101242.0, 12392.0, 4268.0, 1938.0, 882.0, 459.0, 243.0, 143.0, 95.0, 64.0, 31.0, 25.0, 13.0, 12.0, 15.0, 7.0, 4.0, 3.0, 4.0, 1.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.40771484375, -0.3958854675292969, -0.38405609130859375, -0.3722267150878906, -0.3603973388671875, -0.3485679626464844, -0.33673858642578125, -0.3249092102050781, -0.313079833984375, -0.3012504577636719, -0.28942108154296875, -0.2775917053222656, -0.2657623291015625, -0.2539329528808594, -0.24210357666015625, -0.23027420043945312, -0.21844482421875, -0.20661544799804688, -0.19478607177734375, -0.18295669555664062, -0.1711273193359375, -0.15929794311523438, -0.14746856689453125, -0.13563919067382812, -0.123809814453125, -0.11198043823242188, -0.10015106201171875, -0.08832168579101562, -0.0764923095703125, -0.06466293334960938, -0.05283355712890625, -0.041004180908203125, -0.0291748046875, -0.017345428466796875, -0.00551605224609375, 0.006313323974609375, 0.0181427001953125, 0.029972076416015625, 0.04180145263671875, 0.053630828857421875, 0.065460205078125, 0.07728958129882812, 0.08911895751953125, 0.10094833374023438, 0.1127777099609375, 0.12460708618164062, 0.13643646240234375, 0.14826583862304688, 0.16009521484375, 0.17192459106445312, 0.18375396728515625, 0.19558334350585938, 0.2074127197265625, 0.21924209594726562, 0.23107147216796875, 0.24290084838867188, 0.254730224609375, 0.2665596008300781, 0.27838897705078125, 0.2902183532714844, 0.3020477294921875, 0.3138771057128906, 0.32570648193359375, 0.3375358581542969, 0.349365234375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 5.0, 2.0, 4.0, 3.0, 12.0, 15.0, 15.0, 14.0, 22.0, 24.0, 29.0, 21.0, 36.0, 44.0, 56.0, 45.0, 42.0, 62.0, 60.0, 66.0, 41.0, 51.0, 63.0, 44.0, 34.0, 33.0, 25.0, 31.0, 19.0, 23.0, 19.0, 9.0, 10.0, 6.0, 6.0, 3.0, 5.0, 3.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7490234375, -1.6984405517578125, -1.647857666015625, -1.5972747802734375, -1.54669189453125, -1.4961090087890625, -1.445526123046875, -1.3949432373046875, -1.3443603515625, -1.2937774658203125, -1.243194580078125, -1.1926116943359375, -1.14202880859375, -1.0914459228515625, -1.040863037109375, -0.9902801513671875, -0.939697265625, -0.8891143798828125, -0.838531494140625, -0.7879486083984375, -0.73736572265625, -0.6867828369140625, -0.636199951171875, -0.5856170654296875, -0.5350341796875, -0.4844512939453125, -0.433868408203125, -0.3832855224609375, -0.33270263671875, -0.2821197509765625, -0.231536865234375, -0.1809539794921875, -0.13037109375, -0.0797882080078125, -0.029205322265625, 0.0213775634765625, 0.07196044921875, 0.1225433349609375, 0.173126220703125, 0.2237091064453125, 0.2742919921875, 0.3248748779296875, 0.375457763671875, 0.4260406494140625, 0.47662353515625, 0.5272064208984375, 0.577789306640625, 0.6283721923828125, 0.678955078125, 0.7295379638671875, 0.780120849609375, 0.8307037353515625, 0.88128662109375, 0.9318695068359375, 0.982452392578125, 1.0330352783203125, 1.0836181640625, 1.1342010498046875, 1.184783935546875, 1.2353668212890625, 1.28594970703125, 1.3365325927734375, 1.387115478515625, 1.4376983642578125, 1.48828125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 4.0, 7.0, 11.0, 11.0, 17.0, 29.0, 44.0, 57.0, 88.0, 168.0, 252.0, 551.0, 1085.0, 2554.0, 7153.0, 27147.0, 250859.0, 667565.0, 70424.0, 13032.0, 4099.0, 1621.0, 806.0, 391.0, 199.0, 116.0, 77.0, 47.0, 51.0, 24.0, 9.0, 12.0, 9.0, 14.0, 7.0, 4.0, 0.0, 1.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1475830078125, -0.14339637756347656, -0.13920974731445312, -0.1350231170654297, -0.13083648681640625, -0.1266498565673828, -0.12246322631835938, -0.11827659606933594, -0.1140899658203125, -0.10990333557128906, -0.10571670532226562, -0.10153007507324219, -0.09734344482421875, -0.09315681457519531, -0.08897018432617188, -0.08478355407714844, -0.080596923828125, -0.07641029357910156, -0.07222366333007812, -0.06803703308105469, -0.06385040283203125, -0.05966377258300781, -0.055477142333984375, -0.05129051208496094, -0.0471038818359375, -0.04291725158691406, -0.038730621337890625, -0.03454399108886719, -0.03035736083984375, -0.026170730590820312, -0.021984100341796875, -0.017797470092773438, -0.01361083984375, -0.009424209594726562, -0.005237579345703125, -0.0010509490966796875, 0.00313568115234375, 0.0073223114013671875, 0.011508941650390625, 0.015695571899414062, 0.0198822021484375, 0.024068832397460938, 0.028255462646484375, 0.03244209289550781, 0.03662872314453125, 0.04081535339355469, 0.045001983642578125, 0.04918861389160156, 0.053375244140625, 0.05756187438964844, 0.061748504638671875, 0.06593513488769531, 0.07012176513671875, 0.07430839538574219, 0.07849502563476562, 0.08268165588378906, 0.0868682861328125, 0.09105491638183594, 0.09524154663085938, 0.09942817687988281, 0.10361480712890625, 0.10780143737792969, 0.11198806762695312, 0.11617469787597656, 0.120361328125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 1.0, 0.0, 2.0, 4.0, 4.0, 8.0, 8.0, 9.0, 27.0, 39.0, 65.0, 99.0, 132.0, 168.0, 130.0, 111.0, 68.0, 42.0, 41.0, 13.0, 8.0, 3.0, 6.0, 6.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-9.08970832824707e-05, -8.871406316757202e-05, -8.653104305267334e-05, -8.434802293777466e-05, -8.216500282287598e-05, -7.99819827079773e-05, -7.779896259307861e-05, -7.561594247817993e-05, -7.343292236328125e-05, -7.124990224838257e-05, -6.906688213348389e-05, -6.68838620185852e-05, -6.470084190368652e-05, -6.251782178878784e-05, -6.033480167388916e-05, -5.815178155899048e-05, -5.59687614440918e-05, -5.3785741329193115e-05, -5.1602721214294434e-05, -4.941970109939575e-05, -4.723668098449707e-05, -4.505366086959839e-05, -4.287064075469971e-05, -4.0687620639801025e-05, -3.8504600524902344e-05, -3.632158041000366e-05, -3.413856029510498e-05, -3.19555401802063e-05, -2.9772520065307617e-05, -2.7589499950408936e-05, -2.5406479835510254e-05, -2.3223459720611572e-05, -2.104043960571289e-05, -1.885741949081421e-05, -1.6674399375915527e-05, -1.4491379261016846e-05, -1.2308359146118164e-05, -1.0125339031219482e-05, -7.9423189163208e-06, -5.759298801422119e-06, -3.5762786865234375e-06, -1.3932585716247559e-06, 7.897615432739258e-07, 2.9727816581726074e-06, 5.155801773071289e-06, 7.338821887969971e-06, 9.521842002868652e-06, 1.1704862117767334e-05, 1.3887882232666016e-05, 1.6070902347564697e-05, 1.825392246246338e-05, 2.043694257736206e-05, 2.2619962692260742e-05, 2.4802982807159424e-05, 2.6986002922058105e-05, 2.9169023036956787e-05, 3.135204315185547e-05, 3.353506326675415e-05, 3.571808338165283e-05, 3.7901103496551514e-05, 4.0084123611450195e-05, 4.226714372634888e-05, 4.445016384124756e-05, 4.663318395614624e-05, 4.881620407104492e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 10.0, 7.0, 16.0, 29.0, 33.0, 49.0, 70.0, 120.0, 175.0, 244.0, 397.0, 617.0, 1047.0, 1844.0, 3488.0, 7197.0, 17759.0, 58792.0, 257105.0, 488485.0, 149502.0, 36910.0, 12445.0, 5396.0, 2785.0, 1539.0, 865.0, 611.0, 337.0, 218.0, 146.0, 98.0, 62.0, 44.0, 31.0, 19.0, 13.0, 10.0, 11.0, 4.0, 1.0, 3.0, 6.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.09552001953125, -0.09265327453613281, -0.08978652954101562, -0.08691978454589844, -0.08405303955078125, -0.08118629455566406, -0.07831954956054688, -0.07545280456542969, -0.0725860595703125, -0.06971931457519531, -0.06685256958007812, -0.06398582458496094, -0.06111907958984375, -0.05825233459472656, -0.055385589599609375, -0.05251884460449219, -0.049652099609375, -0.04678535461425781, -0.043918609619140625, -0.04105186462402344, -0.03818511962890625, -0.03531837463378906, -0.032451629638671875, -0.029584884643554688, -0.0267181396484375, -0.023851394653320312, -0.020984649658203125, -0.018117904663085938, -0.01525115966796875, -0.012384414672851562, -0.009517669677734375, -0.0066509246826171875, -0.0037841796875, -0.0009174346923828125, 0.001949310302734375, 0.0048160552978515625, 0.00768280029296875, 0.010549545288085938, 0.013416290283203125, 0.016283035278320312, 0.0191497802734375, 0.022016525268554688, 0.024883270263671875, 0.027750015258789062, 0.03061676025390625, 0.03348350524902344, 0.036350250244140625, 0.03921699523925781, 0.042083740234375, 0.04495048522949219, 0.047817230224609375, 0.05068397521972656, 0.05355072021484375, 0.05641746520996094, 0.059284210205078125, 0.06215095520019531, 0.0650177001953125, 0.06788444519042969, 0.07075119018554688, 0.07361793518066406, 0.07648468017578125, 0.07935142517089844, 0.08221817016601562, 0.08508491516113281, 0.08795166015625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 1.0, 4.0, 3.0, 13.0, 12.0, 23.0, 26.0, 43.0, 74.0, 84.0, 94.0, 132.0, 117.0, 108.0, 68.0, 63.0, 44.0, 30.0, 19.0, 11.0, 12.0, 9.0, 2.0, 4.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.03240966796875, -0.03139448165893555, -0.030379295349121094, -0.02936410903930664, -0.028348922729492188, -0.027333736419677734, -0.02631855010986328, -0.025303363800048828, -0.024288177490234375, -0.023272991180419922, -0.02225780487060547, -0.021242618560791016, -0.020227432250976562, -0.01921224594116211, -0.018197059631347656, -0.017181873321533203, -0.01616668701171875, -0.015151500701904297, -0.014136314392089844, -0.01312112808227539, -0.012105941772460938, -0.011090755462646484, -0.010075569152832031, -0.009060382843017578, -0.008045196533203125, -0.007030010223388672, -0.006014823913574219, -0.004999637603759766, -0.0039844512939453125, -0.0029692649841308594, -0.0019540786743164062, -0.0009388923645019531, 7.62939453125e-05, 0.0010914802551269531, 0.0021066665649414062, 0.0031218528747558594, 0.0041370391845703125, 0.005152225494384766, 0.006167411804199219, 0.007182598114013672, 0.008197784423828125, 0.009212970733642578, 0.010228157043457031, 0.011243343353271484, 0.012258529663085938, 0.01327371597290039, 0.014288902282714844, 0.015304088592529297, 0.01631927490234375, 0.017334461212158203, 0.018349647521972656, 0.01936483383178711, 0.020380020141601562, 0.021395206451416016, 0.02241039276123047, 0.023425579071044922, 0.024440765380859375, 0.025455951690673828, 0.02647113800048828, 0.027486324310302734, 0.028501510620117188, 0.02951669692993164, 0.030531883239746094, 0.03154706954956055, 0.032562255859375]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 7.0, 11.0, 12.0, 45.0, 88.0, 181.0, 260.0, 185.0, 97.0, 54.0, 26.0, 17.0, 8.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.796365737915039, -3.7112984657287598, -3.6262314319610596, -3.5411643981933594, -3.45609712600708, -3.371029853820801, -3.2859628200531006, -3.2008957862854004, -3.115828514099121, -3.030761241912842, -2.9456942081451416, -2.8606271743774414, -2.775559902191162, -2.690492630004883, -2.6054255962371826, -2.5203585624694824, -2.435291290283203, -2.350224018096924, -2.2651569843292236, -2.1800899505615234, -2.095022678375244, -2.009955406188965, -1.9248883724212646, -1.839821219444275, -1.7547540664672852, -1.6696869134902954, -1.5846197605133057, -1.499552607536316, -1.4144854545593262, -1.3294183015823364, -1.2443511486053467, -1.159283995628357, -1.074216604232788, -0.9891494512557983, -0.9040822982788086, -0.8190151453018188, -0.7339479923248291, -0.6488808393478394, -0.5638136863708496, -0.47874653339385986, -0.3936793804168701, -0.30861222743988037, -0.22354507446289062, -0.13847792148590088, -0.05341076850891113, 0.03165638446807861, 0.11672353744506836, 0.2017906904220581, 0.28685784339904785, 0.3719249963760376, 0.45699214935302734, 0.5420593023300171, 0.6271264553070068, 0.7121936082839966, 0.7972607612609863, 0.8823279142379761, 0.9673950672149658, 1.0524622201919556, 1.1375293731689453, 1.222596526145935, 1.3076636791229248, 1.3927308320999146, 1.4777979850769043, 1.562865138053894, 1.6479322910308838]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 3.0, 10.0, 9.0, 11.0, 17.0, 18.0, 26.0, 36.0, 37.0, 47.0, 51.0, 62.0, 63.0, 59.0, 74.0, 60.0, 60.0, 61.0, 52.0, 62.0, 52.0, 25.0, 28.0, 22.0, 12.0, 12.0, 12.0, 6.0, 1.0, 3.0, 2.0, 5.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7505624890327454, -0.7202178835868835, -0.689873218536377, -0.6595286130905151, -0.6291840076446533, -0.5988394021987915, -0.5684947967529297, -0.5381501317024231, -0.5078055262565613, -0.47746092081069946, -0.44711628556251526, -0.41677165031433105, -0.38642704486846924, -0.3560824394226074, -0.3257378041744232, -0.295393168926239, -0.2650485634803772, -0.2347039431333542, -0.20435932278633118, -0.17401470243930817, -0.14367008209228516, -0.11332546174526215, -0.08298084139823914, -0.052636221051216125, -0.022291600704193115, 0.008053019642829895, 0.038397639989852905, 0.06874226033687592, 0.09908688068389893, 0.12943150103092194, 0.15977612137794495, 0.19012074172496796, 0.22046542167663574, 0.25081002712249756, 0.28115466237068176, 0.31149929761886597, 0.3418439030647278, 0.3721885085105896, 0.4025331437587738, 0.432877779006958, 0.4632223844528198, 0.49356698989868164, 0.5239115953445435, 0.55425626039505, 0.5846008658409119, 0.6149454712867737, 0.6452901363372803, 0.6756347417831421, 0.7059793472290039, 0.7363239526748657, 0.7666685581207275, 0.7970132231712341, 0.827357828617096, 0.8577024340629578, 0.8880470991134644, 0.9183917045593262, 0.948736310005188, 0.9790809154510498, 1.0094255208969116, 1.0397701263427734, 1.0701148509979248, 1.1004594564437866, 1.1308040618896484, 1.1611486673355103, 1.191493272781372]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 6.0, 12.0, 19.0, 55.0, 65.0, 187.0, 568.0, 2188.0, 12771.0, 146049.0, 834062.0, 45243.0, 5613.0, 1100.0, 350.0, 138.0, 56.0, 30.0, 24.0, 8.0, 6.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3388671875, -1.29315185546875, -1.2474365234375, -1.20172119140625, -1.156005859375, -1.11029052734375, -1.0645751953125, -1.01885986328125, -0.97314453125, -0.92742919921875, -0.8817138671875, -0.83599853515625, -0.790283203125, -0.74456787109375, -0.6988525390625, -0.65313720703125, -0.607421875, -0.56170654296875, -0.5159912109375, -0.47027587890625, -0.424560546875, -0.37884521484375, -0.3331298828125, -0.28741455078125, -0.24169921875, -0.19598388671875, -0.1502685546875, -0.10455322265625, -0.058837890625, -0.01312255859375, 0.0325927734375, 0.07830810546875, 0.1240234375, 0.16973876953125, 0.2154541015625, 0.26116943359375, 0.306884765625, 0.35260009765625, 0.3983154296875, 0.44403076171875, 0.48974609375, 0.53546142578125, 0.5811767578125, 0.62689208984375, 0.672607421875, 0.71832275390625, 0.7640380859375, 0.80975341796875, 0.85546875, 0.90118408203125, 0.9468994140625, 0.99261474609375, 1.038330078125, 1.08404541015625, 1.1297607421875, 1.17547607421875, 1.22119140625, 1.26690673828125, 1.3126220703125, 1.35833740234375, 1.404052734375, 1.44976806640625, 1.4954833984375, 1.54119873046875, 1.5869140625]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 12.0, 16.0, 28.0, 32.0, 46.0, 72.0, 87.0, 109.0, 110.0, 111.0, 101.0, 82.0, 70.0, 40.0, 33.0, 19.0, 19.0, 3.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.072265625, -1.968170166015625, -1.86407470703125, -1.759979248046875, -1.6558837890625, -1.551788330078125, -1.44769287109375, -1.343597412109375, -1.239501953125, -1.135406494140625, -1.03131103515625, -0.927215576171875, -0.8231201171875, -0.719024658203125, -0.61492919921875, -0.510833740234375, -0.40673828125, -0.302642822265625, -0.19854736328125, -0.094451904296875, 0.0096435546875, 0.113739013671875, 0.21783447265625, 0.321929931640625, 0.426025390625, 0.530120849609375, 0.63421630859375, 0.738311767578125, 0.8424072265625, 0.946502685546875, 1.05059814453125, 1.154693603515625, 1.2587890625, 1.362884521484375, 1.46697998046875, 1.571075439453125, 1.6751708984375, 1.779266357421875, 1.88336181640625, 1.987457275390625, 2.091552734375, 2.195648193359375, 2.29974365234375, 2.403839111328125, 2.5079345703125, 2.612030029296875, 2.71612548828125, 2.820220947265625, 2.92431640625, 3.028411865234375, 3.13250732421875, 3.236602783203125, 3.3406982421875, 3.444793701171875, 3.54888916015625, 3.652984619140625, 3.757080078125, 3.861175537109375, 3.96527099609375, 4.069366455078125, 4.1734619140625, 4.277557373046875, 4.38165283203125, 4.485748291015625, 4.58984375]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 4.0, 5.0, 2.0, 9.0, 12.0, 10.0, 11.0, 12.0, 19.0, 26.0, 42.0, 43.0, 69.0, 111.0, 179.0, 371.0, 1002.0, 8103.0, 640670.0, 389650.0, 6449.0, 886.0, 329.0, 166.0, 112.0, 70.0, 42.0, 47.0, 27.0, 14.0, 13.0, 10.0, 4.0, 8.0, 8.0, 9.0, 3.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-2.306640625, -2.245880126953125, -2.18511962890625, -2.124359130859375, -2.0635986328125, -2.002838134765625, -1.94207763671875, -1.881317138671875, -1.820556640625, -1.759796142578125, -1.69903564453125, -1.638275146484375, -1.5775146484375, -1.516754150390625, -1.45599365234375, -1.395233154296875, -1.33447265625, -1.273712158203125, -1.21295166015625, -1.152191162109375, -1.0914306640625, -1.030670166015625, -0.96990966796875, -0.909149169921875, -0.848388671875, -0.787628173828125, -0.72686767578125, -0.666107177734375, -0.6053466796875, -0.544586181640625, -0.48382568359375, -0.423065185546875, -0.3623046875, -0.301544189453125, -0.24078369140625, -0.180023193359375, -0.1192626953125, -0.058502197265625, 0.00225830078125, 0.063018798828125, 0.123779296875, 0.184539794921875, 0.24530029296875, 0.306060791015625, 0.3668212890625, 0.427581787109375, 0.48834228515625, 0.549102783203125, 0.60986328125, 0.670623779296875, 0.73138427734375, 0.792144775390625, 0.8529052734375, 0.913665771484375, 0.97442626953125, 1.035186767578125, 1.095947265625, 1.156707763671875, 1.21746826171875, 1.278228759765625, 1.3389892578125, 1.399749755859375, 1.46051025390625, 1.521270751953125, 1.58203125]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 4.0, 12.0, 12.0, 11.0, 15.0, 9.0, 12.0, 14.0, 20.0, 35.0, 24.0, 31.0, 32.0, 47.0, 44.0, 50.0, 58.0, 52.0, 61.0, 37.0, 62.0, 57.0, 38.0, 36.0, 42.0, 35.0, 29.0, 19.0, 17.0, 6.0, 18.0, 8.0, 10.0, 10.0, 12.0, 8.0, 2.0, 3.0, 8.0, 0.0, 1.0, 1.0, 3.0], "bins": [-2.46484375, -2.4021453857421875, -2.339447021484375, -2.2767486572265625, -2.21405029296875, -2.1513519287109375, -2.088653564453125, -2.0259552001953125, -1.9632568359375, -1.9005584716796875, -1.837860107421875, -1.7751617431640625, -1.71246337890625, -1.6497650146484375, -1.587066650390625, -1.5243682861328125, -1.461669921875, -1.3989715576171875, -1.336273193359375, -1.2735748291015625, -1.21087646484375, -1.1481781005859375, -1.085479736328125, -1.0227813720703125, -0.9600830078125, -0.8973846435546875, -0.834686279296875, -0.7719879150390625, -0.70928955078125, -0.6465911865234375, -0.583892822265625, -0.5211944580078125, -0.45849609375, -0.3957977294921875, -0.333099365234375, -0.2704010009765625, -0.20770263671875, -0.1450042724609375, -0.082305908203125, -0.0196075439453125, 0.0430908203125, 0.1057891845703125, 0.168487548828125, 0.2311859130859375, 0.29388427734375, 0.3565826416015625, 0.419281005859375, 0.4819793701171875, 0.544677734375, 0.6073760986328125, 0.670074462890625, 0.7327728271484375, 0.79547119140625, 0.8581695556640625, 0.920867919921875, 0.9835662841796875, 1.0462646484375, 1.1089630126953125, 1.171661376953125, 1.2343597412109375, 1.29705810546875, 1.3597564697265625, 1.422454833984375, 1.4851531982421875, 1.5478515625]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 6.0, 5.0, 5.0, 2.0, 13.0, 20.0, 16.0, 21.0, 29.0, 32.0, 64.0, 106.0, 126.0, 192.0, 323.0, 476.0, 915.0, 1785.0, 4936.0, 17772.0, 100401.0, 764268.0, 126117.0, 20766.0, 5581.0, 2118.0, 988.0, 532.0, 313.0, 196.0, 116.0, 81.0, 63.0, 41.0, 34.0, 27.0, 15.0, 4.0, 16.0, 6.0, 6.0, 4.0, 2.0, 4.0, 5.0, 1.0, 0.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.26708984375, -0.2580528259277344, -0.24901580810546875, -0.23997879028320312, -0.2309417724609375, -0.22190475463867188, -0.21286773681640625, -0.20383071899414062, -0.194793701171875, -0.18575668334960938, -0.17671966552734375, -0.16768264770507812, -0.1586456298828125, -0.14960861206054688, -0.14057159423828125, -0.13153457641601562, -0.12249755859375, -0.11346054077148438, -0.10442352294921875, -0.09538650512695312, -0.0863494873046875, -0.07731246948242188, -0.06827545166015625, -0.059238433837890625, -0.050201416015625, -0.041164398193359375, -0.03212738037109375, -0.023090362548828125, -0.0140533447265625, -0.005016326904296875, 0.00402069091796875, 0.013057708740234375, 0.0220947265625, 0.031131744384765625, 0.04016876220703125, 0.049205780029296875, 0.0582427978515625, 0.06727981567382812, 0.07631683349609375, 0.08535385131835938, 0.094390869140625, 0.10342788696289062, 0.11246490478515625, 0.12150192260742188, 0.1305389404296875, 0.13957595825195312, 0.14861297607421875, 0.15764999389648438, 0.16668701171875, 0.17572402954101562, 0.18476104736328125, 0.19379806518554688, 0.2028350830078125, 0.21187210083007812, 0.22090911865234375, 0.22994613647460938, 0.238983154296875, 0.24802017211914062, 0.25705718994140625, 0.2660942077636719, 0.2751312255859375, 0.2841682434082031, 0.29320526123046875, 0.3022422790527344, 0.311279296875]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 7.0, 2.0, 7.0, 6.0, 9.0, 19.0, 16.0, 25.0, 29.0, 52.0, 64.0, 118.0, 236.0, 154.0, 71.0, 52.0, 34.0, 25.0, 17.0, 15.0, 12.0, 12.0, 6.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.458427429199219e-05, -4.3079257011413574e-05, -4.157423973083496e-05, -4.006922245025635e-05, -3.8564205169677734e-05, -3.705918788909912e-05, -3.555417060852051e-05, -3.4049153327941895e-05, -3.254413604736328e-05, -3.103911876678467e-05, -2.9534101486206055e-05, -2.802908420562744e-05, -2.6524066925048828e-05, -2.5019049644470215e-05, -2.35140323638916e-05, -2.2009015083312988e-05, -2.0503997802734375e-05, -1.8998980522155762e-05, -1.749396324157715e-05, -1.5988945960998535e-05, -1.4483928680419922e-05, -1.2978911399841309e-05, -1.1473894119262695e-05, -9.968876838684082e-06, -8.463859558105469e-06, -6.9588422775268555e-06, -5.453824996948242e-06, -3.948807716369629e-06, -2.4437904357910156e-06, -9.387731552124023e-07, 5.662441253662109e-07, 2.0712614059448242e-06, 3.5762786865234375e-06, 5.081295967102051e-06, 6.586313247680664e-06, 8.091330528259277e-06, 9.59634780883789e-06, 1.1101365089416504e-05, 1.2606382369995117e-05, 1.411139965057373e-05, 1.5616416931152344e-05, 1.7121434211730957e-05, 1.862645149230957e-05, 2.0131468772888184e-05, 2.1636486053466797e-05, 2.314150333404541e-05, 2.4646520614624023e-05, 2.6151537895202637e-05, 2.765655517578125e-05, 2.9161572456359863e-05, 3.0666589736938477e-05, 3.217160701751709e-05, 3.36766242980957e-05, 3.5181641578674316e-05, 3.668665885925293e-05, 3.819167613983154e-05, 3.9696693420410156e-05, 4.120171070098877e-05, 4.270672798156738e-05, 4.4211745262145996e-05, 4.571676254272461e-05, 4.722177982330322e-05, 4.8726797103881836e-05, 5.023181438446045e-05, 5.173683166503906e-05]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 2.0, 3.0, 5.0, 14.0, 10.0, 14.0, 16.0, 25.0, 30.0, 39.0, 74.0, 82.0, 108.0, 141.0, 228.0, 348.0, 606.0, 1135.0, 2401.0, 6219.0, 22032.0, 135103.0, 775155.0, 79947.0, 15459.0, 4779.0, 2011.0, 972.0, 498.0, 339.0, 229.0, 129.0, 118.0, 77.0, 47.0, 41.0, 28.0, 21.0, 18.0, 14.0, 6.0, 15.0, 6.0, 5.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.358154296875, -0.34803009033203125, -0.3379058837890625, -0.32778167724609375, -0.317657470703125, -0.30753326416015625, -0.2974090576171875, -0.28728485107421875, -0.27716064453125, -0.26703643798828125, -0.2569122314453125, -0.24678802490234375, -0.236663818359375, -0.22653961181640625, -0.2164154052734375, -0.20629119873046875, -0.1961669921875, -0.18604278564453125, -0.1759185791015625, -0.16579437255859375, -0.155670166015625, -0.14554595947265625, -0.1354217529296875, -0.12529754638671875, -0.11517333984375, -0.10504913330078125, -0.0949249267578125, -0.08480072021484375, -0.074676513671875, -0.06455230712890625, -0.0544281005859375, -0.04430389404296875, -0.0341796875, -0.02405548095703125, -0.0139312744140625, -0.00380706787109375, 0.006317138671875, 0.01644134521484375, 0.0265655517578125, 0.03668975830078125, 0.04681396484375, 0.05693817138671875, 0.0670623779296875, 0.07718658447265625, 0.087310791015625, 0.09743499755859375, 0.1075592041015625, 0.11768341064453125, 0.1278076171875, 0.13793182373046875, 0.1480560302734375, 0.15818023681640625, 0.168304443359375, 0.17842864990234375, 0.1885528564453125, 0.19867706298828125, 0.20880126953125, 0.21892547607421875, 0.2290496826171875, 0.23917388916015625, 0.249298095703125, 0.25942230224609375, 0.2695465087890625, 0.27967071533203125, 0.289794921875]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 7.0, 7.0, 13.0, 6.0, 17.0, 19.0, 26.0, 36.0, 49.0, 48.0, 69.0, 158.0, 227.0, 87.0, 64.0, 37.0, 33.0, 28.0, 19.0, 9.0, 8.0, 5.0, 5.0, 5.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08941650390625, -0.08554553985595703, -0.08167457580566406, -0.0778036117553711, -0.07393264770507812, -0.07006168365478516, -0.06619071960449219, -0.06231975555419922, -0.05844879150390625, -0.05457782745361328, -0.05070686340332031, -0.046835899353027344, -0.042964935302734375, -0.039093971252441406, -0.03522300720214844, -0.03135204315185547, -0.0274810791015625, -0.02361011505126953, -0.019739151000976562, -0.015868186950683594, -0.011997222900390625, -0.008126258850097656, -0.0042552947998046875, -0.00038433074951171875, 0.00348663330078125, 0.007357597351074219, 0.011228561401367188, 0.015099525451660156, 0.018970489501953125, 0.022841453552246094, 0.026712417602539062, 0.03058338165283203, 0.034454345703125, 0.03832530975341797, 0.04219627380371094, 0.046067237854003906, 0.049938201904296875, 0.053809165954589844, 0.05768013000488281, 0.06155109405517578, 0.06542205810546875, 0.06929302215576172, 0.07316398620605469, 0.07703495025634766, 0.08090591430664062, 0.0847768783569336, 0.08864784240722656, 0.09251880645751953, 0.0963897705078125, 0.10026073455810547, 0.10413169860839844, 0.1080026626586914, 0.11187362670898438, 0.11574459075927734, 0.11961555480957031, 0.12348651885986328, 0.12735748291015625, 0.13122844696044922, 0.1350994110107422, 0.13897037506103516, 0.14284133911132812, 0.1467123031616211, 0.15058326721191406, 0.15445423126220703, 0.1583251953125]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 9.0, 39.0, 283.0, 508.0, 135.0, 21.0, 8.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.52910041809082, -20.085853576660156, -19.64260482788086, -19.199357986450195, -18.75611114501953, -18.312862396240234, -17.86961555480957, -17.426366806030273, -16.98311996459961, -16.539873123168945, -16.09662437438965, -15.653377532958984, -15.210129737854004, -14.766881942749023, -14.32363510131836, -13.880387306213379, -13.437139511108398, -12.993891716003418, -12.550643920898438, -12.107397079467773, -11.664149284362793, -11.220901489257812, -10.777654647827148, -10.334406852722168, -9.891159057617188, -9.447911262512207, -9.004663467407227, -8.561416625976562, -8.118168830871582, -7.674921035766602, -7.231673717498779, -6.788426399230957, -6.345178127288818, -5.901930809020996, -5.458683013916016, -5.015435218811035, -4.572187900543213, -4.128940582275391, -3.68569278717041, -3.242445230484009, -2.7991976737976074, -2.355950117111206, -1.9127025604248047, -1.4694550037384033, -1.026207447052002, -0.5829598903656006, -0.13971233367919922, 0.30353522300720215, 0.7467827796936035, 1.1900303363800049, 1.6332778930664062, 2.0765254497528076, 2.519773006439209, 2.9630205631256104, 3.4062681198120117, 3.849515676498413, 4.2927632331848145, 4.736010551452637, 5.179258346557617, 5.622506141662598, 6.06575345993042, 6.509000778198242, 6.952248573303223, 7.395496368408203, 7.838743686676025]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 6.0, 2.0, 6.0, 5.0, 8.0, 21.0, 9.0, 16.0, 15.0, 16.0, 22.0, 25.0, 36.0, 41.0, 36.0, 41.0, 36.0, 48.0, 42.0, 47.0, 44.0, 42.0, 48.0, 33.0, 38.0, 46.0, 38.0, 20.0, 43.0, 33.0, 21.0, 22.0, 17.0, 9.0, 21.0, 12.0, 9.0, 12.0, 6.0, 4.0, 2.0, 2.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.5643696784973145, -2.4683492183685303, -2.372328996658325, -2.276308536529541, -2.180288314819336, -2.0842678546905518, -1.9882475137710571, -1.8922271728515625, -1.7962067127227783, -1.7001863718032837, -1.604166030883789, -1.5081455707550049, -1.4121252298355103, -1.3161048889160156, -1.220084547996521, -1.1240642070770264, -1.0280438661575317, -0.9320235252380371, -0.8360031247138977, -0.7399827837944031, -0.6439623832702637, -0.547942042350769, -0.4519217014312744, -0.355901300907135, -0.2598809599876404, -0.16386058926582336, -0.06784023344516754, 0.02818012237548828, 0.1242004930973053, 0.22022086381912231, 0.31624120473861694, 0.41226160526275635, 0.508281946182251, 0.6043022871017456, 0.700322687625885, 0.7963430285453796, 0.892363429069519, 0.9883837699890137, 1.0844041109085083, 1.180424451828003, 1.276444911956787, 1.3724652528762817, 1.4684855937957764, 1.5645060539245605, 1.6605263948440552, 1.7565467357635498, 1.8525670766830444, 1.948587417602539, 2.044607639312744, 2.1406280994415283, 2.2366483211517334, 2.3326687812805176, 2.4286890029907227, 2.524709463119507, 2.620729923248291, 2.716750144958496, 2.8127706050872803, 2.9087910652160645, 3.0048112869262695, 3.1008317470550537, 3.196851968765259, 3.292872428894043, 3.388892650604248, 3.4849131107330322, 3.5809335708618164]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 8.0, 9.0, 10.0, 9.0, 14.0, 22.0, 23.0, 27.0, 45.0, 49.0, 89.0, 122.0, 184.0, 378.0, 737.0, 1677.0, 5219.0, 22892.0, 271755.0, 3649240.0, 214668.0, 18959.0, 4673.0, 1718.0, 720.0, 363.0, 209.0, 148.0, 77.0, 63.0, 49.0, 28.0, 26.0, 19.0, 16.0, 5.0, 4.0, 10.0, 5.0, 4.0, 1.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.099609375, -2.028350830078125, -1.95709228515625, -1.885833740234375, -1.8145751953125, -1.743316650390625, -1.67205810546875, -1.600799560546875, -1.529541015625, -1.458282470703125, -1.38702392578125, -1.315765380859375, -1.2445068359375, -1.173248291015625, -1.10198974609375, -1.030731201171875, -0.95947265625, -0.888214111328125, -0.81695556640625, -0.745697021484375, -0.6744384765625, -0.603179931640625, -0.53192138671875, -0.460662841796875, -0.389404296875, -0.318145751953125, -0.24688720703125, -0.175628662109375, -0.1043701171875, -0.033111572265625, 0.03814697265625, 0.109405517578125, 0.1806640625, 0.251922607421875, 0.32318115234375, 0.394439697265625, 0.4656982421875, 0.536956787109375, 0.60821533203125, 0.679473876953125, 0.750732421875, 0.821990966796875, 0.89324951171875, 0.964508056640625, 1.0357666015625, 1.107025146484375, 1.17828369140625, 1.249542236328125, 1.32080078125, 1.392059326171875, 1.46331787109375, 1.534576416015625, 1.6058349609375, 1.677093505859375, 1.74835205078125, 1.819610595703125, 1.890869140625, 1.962127685546875, 2.03338623046875, 2.104644775390625, 2.1759033203125, 2.247161865234375, 2.31842041015625, 2.389678955078125, 2.4609375]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 9.0, 4.0, 9.0, 8.0, 12.0, 12.0, 20.0, 20.0, 26.0, 35.0, 41.0, 57.0, 53.0, 62.0, 63.0, 59.0, 78.0, 62.0, 65.0, 67.0, 48.0, 37.0, 37.0, 24.0, 15.0, 16.0, 12.0, 16.0, 10.0, 6.0, 5.0, 3.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8818359375, -0.849151611328125, -0.81646728515625, -0.783782958984375, -0.7510986328125, -0.718414306640625, -0.68572998046875, -0.653045654296875, -0.620361328125, -0.587677001953125, -0.55499267578125, -0.522308349609375, -0.4896240234375, -0.456939697265625, -0.42425537109375, -0.391571044921875, -0.35888671875, -0.326202392578125, -0.29351806640625, -0.260833740234375, -0.2281494140625, -0.195465087890625, -0.16278076171875, -0.130096435546875, -0.097412109375, -0.064727783203125, -0.03204345703125, 0.000640869140625, 0.0333251953125, 0.066009521484375, 0.09869384765625, 0.131378173828125, 0.1640625, 0.196746826171875, 0.22943115234375, 0.262115478515625, 0.2947998046875, 0.327484130859375, 0.36016845703125, 0.392852783203125, 0.425537109375, 0.458221435546875, 0.49090576171875, 0.523590087890625, 0.5562744140625, 0.588958740234375, 0.62164306640625, 0.654327392578125, 0.68701171875, 0.719696044921875, 0.75238037109375, 0.785064697265625, 0.8177490234375, 0.850433349609375, 0.88311767578125, 0.915802001953125, 0.948486328125, 0.981170654296875, 1.01385498046875, 1.046539306640625, 1.0792236328125, 1.111907958984375, 1.14459228515625, 1.177276611328125, 1.2099609375]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 1.0, 6.0, 4.0, 6.0, 4.0, 13.0, 13.0, 14.0, 20.0, 35.0, 45.0, 72.0, 128.0, 160.0, 299.0, 644.0, 1445.0, 3874.0, 12716.0, 55749.0, 598414.0, 3298031.0, 181171.0, 28824.0, 7749.0, 2654.0, 1016.0, 491.0, 277.0, 119.0, 93.0, 58.0, 36.0, 24.0, 26.0, 15.0, 14.0, 6.0, 9.0, 4.0, 2.0, 2.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.041015625, -1.983184814453125, -1.92535400390625, -1.867523193359375, -1.8096923828125, -1.751861572265625, -1.69403076171875, -1.636199951171875, -1.578369140625, -1.520538330078125, -1.46270751953125, -1.404876708984375, -1.3470458984375, -1.289215087890625, -1.23138427734375, -1.173553466796875, -1.11572265625, -1.057891845703125, -1.00006103515625, -0.942230224609375, -0.8843994140625, -0.826568603515625, -0.76873779296875, -0.710906982421875, -0.653076171875, -0.595245361328125, -0.53741455078125, -0.479583740234375, -0.4217529296875, -0.363922119140625, -0.30609130859375, -0.248260498046875, -0.1904296875, -0.132598876953125, -0.07476806640625, -0.016937255859375, 0.0408935546875, 0.098724365234375, 0.15655517578125, 0.214385986328125, 0.272216796875, 0.330047607421875, 0.38787841796875, 0.445709228515625, 0.5035400390625, 0.561370849609375, 0.61920166015625, 0.677032470703125, 0.73486328125, 0.792694091796875, 0.85052490234375, 0.908355712890625, 0.9661865234375, 1.024017333984375, 1.08184814453125, 1.139678955078125, 1.197509765625, 1.255340576171875, 1.31317138671875, 1.371002197265625, 1.4288330078125, 1.486663818359375, 1.54449462890625, 1.602325439453125, 1.66015625]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 2.0, 0.0, 6.0, 6.0, 9.0, 6.0, 5.0, 14.0, 17.0, 27.0, 16.0, 25.0, 45.0, 57.0, 83.0, 112.0, 172.0, 216.0, 361.0, 527.0, 688.0, 528.0, 334.0, 235.0, 147.0, 111.0, 93.0, 50.0, 45.0, 31.0, 28.0, 17.0, 14.0, 12.0, 10.0, 6.0, 8.0, 2.0, 4.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3974609375, -0.3848457336425781, -0.37223052978515625, -0.3596153259277344, -0.3470001220703125, -0.3343849182128906, -0.32176971435546875, -0.3091545104980469, -0.296539306640625, -0.2839241027832031, -0.27130889892578125, -0.2586936950683594, -0.2460784912109375, -0.23346328735351562, -0.22084808349609375, -0.20823287963867188, -0.19561767578125, -0.18300247192382812, -0.17038726806640625, -0.15777206420898438, -0.1451568603515625, -0.13254165649414062, -0.11992645263671875, -0.10731124877929688, -0.094696044921875, -0.08208084106445312, -0.06946563720703125, -0.056850433349609375, -0.0442352294921875, -0.031620025634765625, -0.01900482177734375, -0.006389617919921875, 0.0062255859375, 0.018840789794921875, 0.03145599365234375, 0.044071197509765625, 0.0566864013671875, 0.06930160522460938, 0.08191680908203125, 0.09453201293945312, 0.107147216796875, 0.11976242065429688, 0.13237762451171875, 0.14499282836914062, 0.1576080322265625, 0.17022323608398438, 0.18283843994140625, 0.19545364379882812, 0.20806884765625, 0.22068405151367188, 0.23329925537109375, 0.24591445922851562, 0.2585296630859375, 0.2711448669433594, 0.28376007080078125, 0.2963752746582031, 0.308990478515625, 0.3216056823730469, 0.33422088623046875, 0.3468360900878906, 0.3594512939453125, 0.3720664978027344, 0.38468170166015625, 0.3972969055175781, 0.409912109375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 7.0, 14.0, 35.0, 45.0, 95.0, 159.0, 213.0, 192.0, 114.0, 51.0, 37.0, 13.0, 13.0, 8.0, 1.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.717185020446777, -4.598300933837891, -4.479416370391846, -4.360532283782959, -4.241647720336914, -4.122763633728027, -4.003879547119141, -3.884995222091675, -3.766110897064209, -3.647226572036743, -3.5283422470092773, -3.4094581604003906, -3.290573835372925, -3.171689510345459, -3.0528054237365723, -2.9339210987091064, -2.8150367736816406, -2.696152448654175, -2.577268123626709, -2.4583840370178223, -2.3394997119903564, -2.2206153869628906, -2.101731300354004, -1.982846975326538, -1.8639626502990723, -1.7450783252716064, -1.6261941194534302, -1.507309913635254, -1.388425588607788, -1.2695412635803223, -1.150657057762146, -1.0317728519439697, -0.912888765335083, -0.794004499912262, -0.6751202344894409, -0.5562359690666199, -0.43735170364379883, -0.3184674382209778, -0.19958317279815674, -0.0806989073753357, 0.03818535804748535, 0.1570696234703064, 0.27595388889312744, 0.3948381543159485, 0.5137224197387695, 0.6326066851615906, 0.7514909505844116, 0.8703752160072327, 0.9892594814300537, 1.1081438064575195, 1.2270280122756958, 1.345912218093872, 1.464796543121338, 1.5836808681488037, 1.70256507396698, 1.8214492797851562, 1.940333604812622, 2.059217929840088, 2.1781020164489746, 2.2969863414764404, 2.4158706665039062, 2.534754991531372, 2.653639316558838, 2.7725234031677246, 2.8914077281951904]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 5.0, 11.0, 11.0, 11.0, 16.0, 16.0, 20.0, 20.0, 28.0, 20.0, 43.0, 38.0, 41.0, 40.0, 45.0, 57.0, 46.0, 47.0, 37.0, 46.0, 48.0, 44.0, 53.0, 36.0, 32.0, 31.0, 25.0, 20.0, 15.0, 21.0, 18.0, 11.0, 9.0, 9.0, 5.0, 3.0, 4.0, 8.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9616534113883972, -0.9267609119415283, -0.8918684124946594, -0.8569759130477905, -0.8220833539962769, -0.7871909141540527, -0.7522983551025391, -0.7174058556556702, -0.6825133562088013, -0.6476208567619324, -0.6127283573150635, -0.5778358578681946, -0.5429433584213257, -0.508050799369812, -0.4731582999229431, -0.4382658004760742, -0.4033733010292053, -0.3684808015823364, -0.33358830213546753, -0.29869577288627625, -0.26380327343940735, -0.22891077399253845, -0.19401825964450836, -0.15912574529647827, -0.12423324584960938, -0.08934073895215988, -0.05444823205471039, -0.019555725157260895, 0.015336781740188599, 0.050229281187057495, 0.08512179553508759, 0.12001430988311768, 0.1549067497253418, 0.1897992491722107, 0.22469176352024078, 0.2595842778682709, 0.29447677731513977, 0.32936927676200867, 0.36426180601119995, 0.39915430545806885, 0.43404680490493774, 0.46893930435180664, 0.5038318037986755, 0.5387243032455444, 0.5736168622970581, 0.6085093021392822, 0.6434018611907959, 0.6782943606376648, 0.7131868600845337, 0.7480793595314026, 0.7829718589782715, 0.8178643584251404, 0.8527568578720093, 0.887649416923523, 0.9225419163703918, 0.9574344158172607, 0.9923269152641296, 1.0272194147109985, 1.0621119737625122, 1.0970044136047363, 1.13189697265625, 1.1667894124984741, 1.2016819715499878, 1.236574411392212, 1.2714669704437256]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 1.0, 5.0, 12.0, 12.0, 17.0, 23.0, 31.0, 45.0, 93.0, 118.0, 202.0, 355.0, 543.0, 974.0, 1570.0, 2911.0, 5058.0, 10924.0, 49221.0, 606356.0, 322477.0, 29101.0, 8334.0, 4211.0, 2425.0, 1447.0, 825.0, 487.0, 271.0, 176.0, 111.0, 75.0, 35.0, 25.0, 21.0, 19.0, 11.0, 9.0, 8.0, 2.0, 6.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53857421875, -0.5199127197265625, -0.501251220703125, -0.4825897216796875, -0.46392822265625, -0.4452667236328125, -0.426605224609375, -0.4079437255859375, -0.3892822265625, -0.3706207275390625, -0.351959228515625, -0.3332977294921875, -0.31463623046875, -0.2959747314453125, -0.277313232421875, -0.2586517333984375, -0.239990234375, -0.2213287353515625, -0.202667236328125, -0.1840057373046875, -0.16534423828125, -0.1466827392578125, -0.128021240234375, -0.1093597412109375, -0.0906982421875, -0.0720367431640625, -0.053375244140625, -0.0347137451171875, -0.01605224609375, 0.0026092529296875, 0.021270751953125, 0.0399322509765625, 0.05859375, 0.0772552490234375, 0.095916748046875, 0.1145782470703125, 0.13323974609375, 0.1519012451171875, 0.170562744140625, 0.1892242431640625, 0.2078857421875, 0.2265472412109375, 0.245208740234375, 0.2638702392578125, 0.28253173828125, 0.3011932373046875, 0.319854736328125, 0.3385162353515625, 0.357177734375, 0.3758392333984375, 0.394500732421875, 0.4131622314453125, 0.43182373046875, 0.4504852294921875, 0.469146728515625, 0.4878082275390625, 0.5064697265625, 0.5251312255859375, 0.543792724609375, 0.5624542236328125, 0.58111572265625, 0.5997772216796875, 0.618438720703125, 0.6371002197265625, 0.65576171875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 5.0, 6.0, 12.0, 15.0, 18.0, 31.0, 24.0, 30.0, 40.0, 47.0, 62.0, 54.0, 62.0, 58.0, 61.0, 53.0, 66.0, 52.0, 67.0, 39.0, 30.0, 40.0, 29.0, 20.0, 20.0, 9.0, 12.0, 7.0, 13.0, 2.0, 6.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7666015625, -0.7341461181640625, -0.701690673828125, -0.6692352294921875, -0.63677978515625, -0.6043243408203125, -0.571868896484375, -0.5394134521484375, -0.5069580078125, -0.4745025634765625, -0.442047119140625, -0.4095916748046875, -0.37713623046875, -0.3446807861328125, -0.312225341796875, -0.2797698974609375, -0.247314453125, -0.2148590087890625, -0.182403564453125, -0.1499481201171875, -0.11749267578125, -0.0850372314453125, -0.052581787109375, -0.0201263427734375, 0.0123291015625, 0.0447845458984375, 0.077239990234375, 0.1096954345703125, 0.14215087890625, 0.1746063232421875, 0.207061767578125, 0.2395172119140625, 0.27197265625, 0.3044281005859375, 0.336883544921875, 0.3693389892578125, 0.40179443359375, 0.4342498779296875, 0.466705322265625, 0.4991607666015625, 0.5316162109375, 0.5640716552734375, 0.596527099609375, 0.6289825439453125, 0.66143798828125, 0.6938934326171875, 0.726348876953125, 0.7588043212890625, 0.791259765625, 0.8237152099609375, 0.856170654296875, 0.8886260986328125, 0.92108154296875, 0.9535369873046875, 0.985992431640625, 1.0184478759765625, 1.0509033203125, 1.0833587646484375, 1.115814208984375, 1.1482696533203125, 1.18072509765625, 1.2131805419921875, 1.245635986328125, 1.2780914306640625, 1.310546875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 3.0, 2.0, 4.0, 10.0, 10.0, 7.0, 9.0, 16.0, 26.0, 56.0, 89.0, 162.0, 379.0, 928.0, 2383.0, 6532.0, 46285.0, 914393.0, 65330.0, 7694.0, 2408.0, 987.0, 409.0, 185.0, 108.0, 43.0, 35.0, 18.0, 9.0, 8.0, 10.0, 4.0, 5.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.68505859375, -0.660186767578125, -0.63531494140625, -0.610443115234375, -0.5855712890625, -0.560699462890625, -0.53582763671875, -0.510955810546875, -0.486083984375, -0.461212158203125, -0.43634033203125, -0.411468505859375, -0.3865966796875, -0.361724853515625, -0.33685302734375, -0.311981201171875, -0.287109375, -0.262237548828125, -0.23736572265625, -0.212493896484375, -0.1876220703125, -0.162750244140625, -0.13787841796875, -0.113006591796875, -0.088134765625, -0.063262939453125, -0.03839111328125, -0.013519287109375, 0.0113525390625, 0.036224365234375, 0.06109619140625, 0.085968017578125, 0.11083984375, 0.135711669921875, 0.16058349609375, 0.185455322265625, 0.2103271484375, 0.235198974609375, 0.26007080078125, 0.284942626953125, 0.309814453125, 0.334686279296875, 0.35955810546875, 0.384429931640625, 0.4093017578125, 0.434173583984375, 0.45904541015625, 0.483917236328125, 0.5087890625, 0.533660888671875, 0.55853271484375, 0.583404541015625, 0.6082763671875, 0.633148193359375, 0.65802001953125, 0.682891845703125, 0.707763671875, 0.732635498046875, 0.75750732421875, 0.782379150390625, 0.8072509765625, 0.832122802734375, 0.85699462890625, 0.881866455078125, 0.90673828125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 5.0, 6.0, 3.0, 5.0, 8.0, 8.0, 9.0, 14.0, 13.0, 19.0, 24.0, 19.0, 24.0, 30.0, 34.0, 30.0, 36.0, 35.0, 38.0, 37.0, 57.0, 37.0, 57.0, 41.0, 46.0, 46.0, 37.0, 31.0, 28.0, 29.0, 20.0, 25.0, 28.0, 17.0, 18.0, 17.0, 12.0, 17.0, 12.0, 5.0, 5.0, 7.0, 2.0, 4.0, 3.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4638671875, -1.41510009765625, -1.3663330078125, -1.31756591796875, -1.268798828125, -1.22003173828125, -1.1712646484375, -1.12249755859375, -1.07373046875, -1.02496337890625, -0.9761962890625, -0.92742919921875, -0.878662109375, -0.82989501953125, -0.7811279296875, -0.73236083984375, -0.68359375, -0.63482666015625, -0.5860595703125, -0.53729248046875, -0.488525390625, -0.43975830078125, -0.3909912109375, -0.34222412109375, -0.29345703125, -0.24468994140625, -0.1959228515625, -0.14715576171875, -0.098388671875, -0.04962158203125, -0.0008544921875, 0.04791259765625, 0.0966796875, 0.14544677734375, 0.1942138671875, 0.24298095703125, 0.291748046875, 0.34051513671875, 0.3892822265625, 0.43804931640625, 0.48681640625, 0.53558349609375, 0.5843505859375, 0.63311767578125, 0.681884765625, 0.73065185546875, 0.7794189453125, 0.82818603515625, 0.876953125, 0.92572021484375, 0.9744873046875, 1.02325439453125, 1.072021484375, 1.12078857421875, 1.1695556640625, 1.21832275390625, 1.26708984375, 1.31585693359375, 1.3646240234375, 1.41339111328125, 1.462158203125, 1.51092529296875, 1.5596923828125, 1.60845947265625, 1.6572265625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 2.0, 6.0, 8.0, 7.0, 4.0, 4.0, 12.0, 12.0, 18.0, 25.0, 33.0, 45.0, 63.0, 80.0, 124.0, 163.0, 234.0, 339.0, 536.0, 876.0, 1463.0, 2579.0, 4827.0, 10043.0, 24766.0, 85196.0, 455732.0, 353641.0, 67335.0, 20865.0, 9052.0, 4348.0, 2332.0, 1345.0, 775.0, 513.0, 345.0, 227.0, 144.0, 109.0, 97.0, 55.0, 58.0, 27.0, 23.0, 15.0, 13.0, 11.0, 12.0, 10.0, 4.0, 3.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1031494140625, -0.0997018814086914, -0.09625434875488281, -0.09280681610107422, -0.08935928344726562, -0.08591175079345703, -0.08246421813964844, -0.07901668548583984, -0.07556915283203125, -0.07212162017822266, -0.06867408752441406, -0.06522655487060547, -0.061779022216796875, -0.05833148956298828, -0.05488395690917969, -0.051436424255371094, -0.0479888916015625, -0.044541358947753906, -0.04109382629394531, -0.03764629364013672, -0.034198760986328125, -0.03075122833251953, -0.027303695678710938, -0.023856163024902344, -0.02040863037109375, -0.016961097717285156, -0.013513565063476562, -0.010066032409667969, -0.006618499755859375, -0.0031709671020507812, 0.0002765655517578125, 0.0037240982055664062, 0.007171630859375, 0.010619163513183594, 0.014066696166992188, 0.01751422882080078, 0.020961761474609375, 0.02440929412841797, 0.027856826782226562, 0.031304359436035156, 0.03475189208984375, 0.038199424743652344, 0.04164695739746094, 0.04509449005126953, 0.048542022705078125, 0.05198955535888672, 0.05543708801269531, 0.058884620666503906, 0.0623321533203125, 0.0657796859741211, 0.06922721862792969, 0.07267475128173828, 0.07612228393554688, 0.07956981658935547, 0.08301734924316406, 0.08646488189697266, 0.08991241455078125, 0.09335994720458984, 0.09680747985839844, 0.10025501251220703, 0.10370254516601562, 0.10715007781982422, 0.11059761047363281, 0.1140451431274414, 0.11749267578125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 5.0, 10.0, 20.0, 18.0, 15.0, 41.0, 84.0, 116.0, 170.0, 162.0, 129.0, 82.0, 38.0, 30.0, 18.0, 17.0, 10.0, 4.0, 4.0, 7.0, 2.0, 4.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.00011211633682250977, -0.0001090075820684433, -0.00010589882731437683, -0.00010279007256031036, -9.96813178062439e-05, -9.657256305217743e-05, -9.346380829811096e-05, -9.03550535440445e-05, -8.724629878997803e-05, -8.413754403591156e-05, -8.102878928184509e-05, -7.792003452777863e-05, -7.481127977371216e-05, -7.170252501964569e-05, -6.859377026557922e-05, -6.548501551151276e-05, -6.237626075744629e-05, -5.926750600337982e-05, -5.6158751249313354e-05, -5.304999649524689e-05, -4.994124174118042e-05, -4.683248698711395e-05, -4.3723732233047485e-05, -4.061497747898102e-05, -3.750622272491455e-05, -3.4397467970848083e-05, -3.1288713216781616e-05, -2.817995846271515e-05, -2.507120370864868e-05, -2.1962448954582214e-05, -1.8853694200515747e-05, -1.574493944644928e-05, -1.2636184692382812e-05, -9.527429938316345e-06, -6.418675184249878e-06, -3.3099204301834106e-06, -2.0116567611694336e-07, 2.907589077949524e-06, 6.016343832015991e-06, 9.125098586082458e-06, 1.2233853340148926e-05, 1.5342608094215393e-05, 1.845136284828186e-05, 2.1560117602348328e-05, 2.4668872356414795e-05, 2.7777627110481262e-05, 3.088638186454773e-05, 3.39951366186142e-05, 3.7103891372680664e-05, 4.021264612674713e-05, 4.33214008808136e-05, 4.6430155634880066e-05, 4.953891038894653e-05, 5.2647665143013e-05, 5.575641989707947e-05, 5.8865174651145935e-05, 6.19739294052124e-05, 6.508268415927887e-05, 6.819143891334534e-05, 7.13001936674118e-05, 7.440894842147827e-05, 7.751770317554474e-05, 8.06264579296112e-05, 8.373521268367767e-05, 8.684396743774414e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 6.0, 3.0, 3.0, 11.0, 6.0, 6.0, 14.0, 19.0, 25.0, 36.0, 55.0, 72.0, 134.0, 226.0, 385.0, 615.0, 1275.0, 2506.0, 5081.0, 11587.0, 30740.0, 109993.0, 515758.0, 275774.0, 59258.0, 19098.0, 8062.0, 3736.0, 1835.0, 966.0, 504.0, 293.0, 162.0, 112.0, 53.0, 47.0, 31.0, 15.0, 17.0, 12.0, 6.0, 10.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.1416015625, -0.1372814178466797, -0.13296127319335938, -0.12864112854003906, -0.12432098388671875, -0.12000083923339844, -0.11568069458007812, -0.11136054992675781, -0.1070404052734375, -0.10272026062011719, -0.09840011596679688, -0.09407997131347656, -0.08975982666015625, -0.08543968200683594, -0.08111953735351562, -0.07679939270019531, -0.072479248046875, -0.06815910339355469, -0.06383895874023438, -0.05951881408691406, -0.05519866943359375, -0.05087852478027344, -0.046558380126953125, -0.04223823547363281, -0.0379180908203125, -0.03359794616699219, -0.029277801513671875, -0.024957656860351562, -0.02063751220703125, -0.016317367553710938, -0.011997222900390625, -0.0076770782470703125, -0.00335693359375, 0.0009632110595703125, 0.005283355712890625, 0.009603500366210938, 0.01392364501953125, 0.018243789672851562, 0.022563934326171875, 0.026884078979492188, 0.0312042236328125, 0.03552436828613281, 0.039844512939453125, 0.04416465759277344, 0.04848480224609375, 0.05280494689941406, 0.057125091552734375, 0.06144523620605469, 0.065765380859375, 0.07008552551269531, 0.07440567016601562, 0.07872581481933594, 0.08304595947265625, 0.08736610412597656, 0.09168624877929688, 0.09600639343261719, 0.1003265380859375, 0.10464668273925781, 0.10896682739257812, 0.11328697204589844, 0.11760711669921875, 0.12192726135253906, 0.12624740600585938, 0.1305675506591797, 0.1348876953125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 6.0, 3.0, 1.0, 2.0, 10.0, 7.0, 4.0, 13.0, 10.0, 18.0, 25.0, 32.0, 39.0, 57.0, 81.0, 128.0, 142.0, 127.0, 75.0, 60.0, 36.0, 34.0, 23.0, 16.0, 11.0, 11.0, 6.0, 3.0, 8.0, 4.0, 1.0, 4.0, 4.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.036346435546875, -0.03496408462524414, -0.03358173370361328, -0.03219938278198242, -0.030817031860351562, -0.029434680938720703, -0.028052330017089844, -0.026669979095458984, -0.025287628173828125, -0.023905277252197266, -0.022522926330566406, -0.021140575408935547, -0.019758224487304688, -0.018375873565673828, -0.01699352264404297, -0.01561117172241211, -0.01422882080078125, -0.01284646987915039, -0.011464118957519531, -0.010081768035888672, -0.008699417114257812, -0.007317066192626953, -0.005934715270996094, -0.004552364349365234, -0.003170013427734375, -0.0017876625061035156, -0.00040531158447265625, 0.0009770393371582031, 0.0023593902587890625, 0.003741741180419922, 0.005124092102050781, 0.006506443023681641, 0.0078887939453125, 0.00927114486694336, 0.010653495788574219, 0.012035846710205078, 0.013418197631835938, 0.014800548553466797, 0.016182899475097656, 0.017565250396728516, 0.018947601318359375, 0.020329952239990234, 0.021712303161621094, 0.023094654083251953, 0.024477005004882812, 0.025859355926513672, 0.02724170684814453, 0.02862405776977539, 0.03000640869140625, 0.03138875961303711, 0.03277111053466797, 0.03415346145629883, 0.03553581237792969, 0.03691816329956055, 0.038300514221191406, 0.039682865142822266, 0.041065216064453125, 0.042447566986083984, 0.043829917907714844, 0.0452122688293457, 0.04659461975097656, 0.04797697067260742, 0.04935932159423828, 0.05074167251586914, 0.0521240234375]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 8.0, 6.0, 13.0, 30.0, 47.0, 83.0, 136.0, 188.0, 176.0, 142.0, 81.0, 36.0, 22.0, 15.0, 8.0, 6.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1702020168304443, -3.0946621894836426, -3.019122362136841, -2.943582773208618, -2.8680429458618164, -2.7925031185150146, -2.716963291168213, -2.6414237022399902, -2.5658838748931885, -2.4903440475463867, -2.414804220199585, -2.3392646312713623, -2.2637248039245605, -2.188184976577759, -2.112645149230957, -2.0371055603027344, -1.961565613746643, -1.8860257863998413, -1.810486078262329, -1.7349462509155273, -1.6594065427780151, -1.5838667154312134, -1.5083270072937012, -1.4327871799468994, -1.3572473526000977, -1.281707525253296, -1.2061678171157837, -1.130627989768982, -1.0550882816314697, -0.979548454284668, -0.904008686542511, -0.828468918800354, -0.7529290914535522, -0.6773893237113953, -0.6018495559692383, -0.5263097286224365, -0.45076999068260193, -0.37523022294044495, -0.2996904253959656, -0.2241506576538086, -0.1486108899116516, -0.07307111471891403, 0.0024686604738235474, 0.07800844311714172, 0.1535482108592987, 0.2290879786014557, 0.30462777614593506, 0.38016754388809204, 0.455707311630249, 0.531247079372406, 0.606786847114563, 0.6823266744613647, 0.757866382598877, 0.8334062099456787, 0.9089459776878357, 0.9844857454299927, 1.0600254535675049, 1.1355652809143066, 1.2111049890518188, 1.2866448163986206, 1.3621845245361328, 1.4377243518829346, 1.5132641792297363, 1.5888038873672485, 1.6643437147140503]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 2.0, 4.0, 13.0, 9.0, 8.0, 11.0, 28.0, 14.0, 23.0, 23.0, 26.0, 47.0, 35.0, 45.0, 51.0, 47.0, 52.0, 59.0, 53.0, 45.0, 56.0, 46.0, 47.0, 45.0, 37.0, 29.0, 22.0, 24.0, 26.0, 13.0, 12.0, 15.0, 5.0, 7.0, 6.0, 5.0, 2.0, 3.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7240344285964966, -0.6975588798522949, -0.6710832715034485, -0.6446077227592468, -0.6181321144104004, -0.5916565656661987, -0.5651810169219971, -0.5387054085731506, -0.5122298002243042, -0.48575422167778015, -0.4592786431312561, -0.43280309438705444, -0.406327486038208, -0.37985193729400635, -0.3533763587474823, -0.32690078020095825, -0.3004252314567566, -0.27394965291023254, -0.2474740743637085, -0.22099851071834564, -0.1945229321718216, -0.16804735362529755, -0.1415717899799347, -0.11509621143341064, -0.0886206328868866, -0.06214505806565285, -0.0356694832444191, -0.009193912148475647, 0.0172816663980484, 0.04375724494457245, 0.0702328085899353, 0.09670838713645935, 0.12318390607833862, 0.14965948462486267, 0.17613506317138672, 0.20261062681674957, 0.22908620536327362, 0.2555617690086365, 0.2820373475551605, 0.30851292610168457, 0.3349885046482086, 0.36146408319473267, 0.3879396617412567, 0.41441524028778076, 0.4408907890319824, 0.46736639738082886, 0.4938419461250305, 0.520317554473877, 0.5467931032180786, 0.5732686519622803, 0.5997442603111267, 0.6262198090553284, 0.6526954174041748, 0.6791709661483765, 0.7056465148925781, 0.7321221232414246, 0.758597731590271, 0.7850732803344727, 0.8115488886833191, 0.8380244374275208, 0.8645000457763672, 0.8909755945205688, 0.9174511432647705, 0.9439267516136169, 0.9704023003578186]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 2.0, 8.0, 6.0, 7.0, 5.0, 27.0, 26.0, 45.0, 63.0, 110.0, 200.0, 336.0, 690.0, 1577.0, 3756.0, 10123.0, 33544.0, 141711.0, 649507.0, 153674.0, 35302.0, 10747.0, 3952.0, 1589.0, 711.0, 369.0, 174.0, 107.0, 67.0, 36.0, 27.0, 17.0, 13.0, 10.0, 1.0, 1.0, 9.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7099609375, -0.6821441650390625, -0.654327392578125, -0.6265106201171875, -0.59869384765625, -0.5708770751953125, -0.543060302734375, -0.5152435302734375, -0.4874267578125, -0.4596099853515625, -0.431793212890625, -0.4039764404296875, -0.37615966796875, -0.3483428955078125, -0.320526123046875, -0.2927093505859375, -0.264892578125, -0.2370758056640625, -0.209259033203125, -0.1814422607421875, -0.15362548828125, -0.1258087158203125, -0.097991943359375, -0.0701751708984375, -0.0423583984375, -0.0145416259765625, 0.013275146484375, 0.0410919189453125, 0.06890869140625, 0.0967254638671875, 0.124542236328125, 0.1523590087890625, 0.18017578125, 0.2079925537109375, 0.235809326171875, 0.2636260986328125, 0.29144287109375, 0.3192596435546875, 0.347076416015625, 0.3748931884765625, 0.4027099609375, 0.4305267333984375, 0.458343505859375, 0.4861602783203125, 0.51397705078125, 0.5417938232421875, 0.569610595703125, 0.5974273681640625, 0.625244140625, 0.6530609130859375, 0.680877685546875, 0.7086944580078125, 0.73651123046875, 0.7643280029296875, 0.792144775390625, 0.8199615478515625, 0.8477783203125, 0.8755950927734375, 0.903411865234375, 0.9312286376953125, 0.95904541015625, 0.9868621826171875, 1.014678955078125, 1.0424957275390625, 1.0703125]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 4.0, 16.0, 10.0, 18.0, 18.0, 23.0, 26.0, 46.0, 58.0, 63.0, 68.0, 68.0, 65.0, 76.0, 72.0, 72.0, 68.0, 50.0, 43.0, 41.0, 35.0, 19.0, 12.0, 10.0, 9.0, 5.0, 5.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5068359375, -1.4322662353515625, -1.357696533203125, -1.2831268310546875, -1.20855712890625, -1.1339874267578125, -1.059417724609375, -0.9848480224609375, -0.9102783203125, -0.8357086181640625, -0.761138916015625, -0.6865692138671875, -0.61199951171875, -0.5374298095703125, -0.462860107421875, -0.3882904052734375, -0.313720703125, -0.2391510009765625, -0.164581298828125, -0.0900115966796875, -0.01544189453125, 0.0591278076171875, 0.133697509765625, 0.2082672119140625, 0.2828369140625, 0.3574066162109375, 0.431976318359375, 0.5065460205078125, 0.58111572265625, 0.6556854248046875, 0.730255126953125, 0.8048248291015625, 0.87939453125, 0.9539642333984375, 1.028533935546875, 1.1031036376953125, 1.17767333984375, 1.2522430419921875, 1.326812744140625, 1.4013824462890625, 1.4759521484375, 1.5505218505859375, 1.625091552734375, 1.6996612548828125, 1.77423095703125, 1.8488006591796875, 1.923370361328125, 1.9979400634765625, 2.072509765625, 2.1470794677734375, 2.221649169921875, 2.2962188720703125, 2.37078857421875, 2.4453582763671875, 2.519927978515625, 2.5944976806640625, 2.6690673828125, 2.7436370849609375, 2.818206787109375, 2.8927764892578125, 2.96734619140625, 3.0419158935546875, 3.116485595703125, 3.1910552978515625, 3.265625]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 3.0, 5.0, 3.0, 2.0, 5.0, 5.0, 7.0, 14.0, 12.0, 12.0, 15.0, 24.0, 27.0, 38.0, 41.0, 68.0, 102.0, 179.0, 348.0, 1449.0, 62978.0, 971819.0, 9772.0, 840.0, 272.0, 152.0, 100.0, 66.0, 34.0, 27.0, 26.0, 17.0, 13.0, 16.0, 12.0, 13.0, 7.0, 6.0, 10.0, 7.0, 3.0, 1.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.4609375, -3.357025146484375, -3.25311279296875, -3.149200439453125, -3.0452880859375, -2.941375732421875, -2.83746337890625, -2.733551025390625, -2.629638671875, -2.525726318359375, -2.42181396484375, -2.317901611328125, -2.2139892578125, -2.110076904296875, -2.00616455078125, -1.902252197265625, -1.79833984375, -1.694427490234375, -1.59051513671875, -1.486602783203125, -1.3826904296875, -1.278778076171875, -1.17486572265625, -1.070953369140625, -0.967041015625, -0.863128662109375, -0.75921630859375, -0.655303955078125, -0.5513916015625, -0.447479248046875, -0.34356689453125, -0.239654541015625, -0.1357421875, -0.031829833984375, 0.07208251953125, 0.175994873046875, 0.2799072265625, 0.383819580078125, 0.48773193359375, 0.591644287109375, 0.695556640625, 0.799468994140625, 0.90338134765625, 1.007293701171875, 1.1112060546875, 1.215118408203125, 1.31903076171875, 1.422943115234375, 1.52685546875, 1.630767822265625, 1.73468017578125, 1.838592529296875, 1.9425048828125, 2.046417236328125, 2.15032958984375, 2.254241943359375, 2.358154296875, 2.462066650390625, 2.56597900390625, 2.669891357421875, 2.7738037109375, 2.877716064453125, 2.98162841796875, 3.085540771484375, 3.189453125]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 8.0, 6.0, 3.0, 5.0, 6.0, 10.0, 6.0, 20.0, 17.0, 25.0, 29.0, 17.0, 24.0, 26.0, 41.0, 35.0, 42.0, 43.0, 44.0, 35.0, 57.0, 52.0, 42.0, 49.0, 51.0, 49.0, 44.0, 28.0, 19.0, 31.0, 18.0, 16.0, 19.0, 21.0, 13.0, 5.0, 10.0, 8.0, 6.0, 10.0, 6.0, 4.0, 1.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.041015625, -1.9801025390625, -1.919189453125, -1.8582763671875, -1.79736328125, -1.7364501953125, -1.675537109375, -1.6146240234375, -1.5537109375, -1.4927978515625, -1.431884765625, -1.3709716796875, -1.31005859375, -1.2491455078125, -1.188232421875, -1.1273193359375, -1.06640625, -1.0054931640625, -0.944580078125, -0.8836669921875, -0.82275390625, -0.7618408203125, -0.700927734375, -0.6400146484375, -0.5791015625, -0.5181884765625, -0.457275390625, -0.3963623046875, -0.33544921875, -0.2745361328125, -0.213623046875, -0.1527099609375, -0.091796875, -0.0308837890625, 0.030029296875, 0.0909423828125, 0.15185546875, 0.2127685546875, 0.273681640625, 0.3345947265625, 0.3955078125, 0.4564208984375, 0.517333984375, 0.5782470703125, 0.63916015625, 0.7000732421875, 0.760986328125, 0.8218994140625, 0.8828125, 0.9437255859375, 1.004638671875, 1.0655517578125, 1.12646484375, 1.1873779296875, 1.248291015625, 1.3092041015625, 1.3701171875, 1.4310302734375, 1.491943359375, 1.5528564453125, 1.61376953125, 1.6746826171875, 1.735595703125, 1.7965087890625, 1.857421875]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 7.0, 5.0, 7.0, 14.0, 15.0, 21.0, 30.0, 39.0, 57.0, 87.0, 126.0, 228.0, 424.0, 1051.0, 3098.0, 13088.0, 101338.0, 812668.0, 98320.0, 12799.0, 3047.0, 1055.0, 402.0, 222.0, 112.0, 89.0, 57.0, 44.0, 26.0, 20.0, 18.0, 12.0, 2.0, 8.0, 8.0, 3.0, 3.0, 5.0, 1.0, 2.0, 1.0, 2.0, 2.0], "bins": [-0.5, -0.4870109558105469, -0.47402191162109375, -0.4610328674316406, -0.4480438232421875, -0.4350547790527344, -0.42206573486328125, -0.4090766906738281, -0.396087646484375, -0.3830986022949219, -0.37010955810546875, -0.3571205139160156, -0.3441314697265625, -0.3311424255371094, -0.31815338134765625, -0.3051643371582031, -0.29217529296875, -0.2791862487792969, -0.26619720458984375, -0.2532081604003906, -0.2402191162109375, -0.22723007202148438, -0.21424102783203125, -0.20125198364257812, -0.188262939453125, -0.17527389526367188, -0.16228485107421875, -0.14929580688476562, -0.1363067626953125, -0.12331771850585938, -0.11032867431640625, -0.09733963012695312, -0.0843505859375, -0.07136154174804688, -0.05837249755859375, -0.045383453369140625, -0.0323944091796875, -0.019405364990234375, -0.00641632080078125, 0.006572723388671875, 0.019561767578125, 0.032550811767578125, 0.04553985595703125, 0.058528900146484375, 0.0715179443359375, 0.08450698852539062, 0.09749603271484375, 0.11048507690429688, 0.12347412109375, 0.13646316528320312, 0.14945220947265625, 0.16244125366210938, 0.1754302978515625, 0.18841934204101562, 0.20140838623046875, 0.21439743041992188, 0.227386474609375, 0.24037551879882812, 0.25336456298828125, 0.2663536071777344, 0.2793426513671875, 0.2923316955566406, 0.30532073974609375, 0.3183097839355469, 0.331298828125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 1.0, 2.0, 5.0, 6.0, 6.0, 6.0, 4.0, 9.0, 15.0, 25.0, 38.0, 55.0, 54.0, 93.0, 176.0, 168.0, 101.0, 70.0, 44.0, 42.0, 27.0, 11.0, 19.0, 11.0, 11.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.27501106262207e-05, -5.110912024974823e-05, -4.946812987327576e-05, -4.7827139496803284e-05, -4.618614912033081e-05, -4.454515874385834e-05, -4.2904168367385864e-05, -4.126317799091339e-05, -3.962218761444092e-05, -3.7981197237968445e-05, -3.634020686149597e-05, -3.46992164850235e-05, -3.3058226108551025e-05, -3.141723573207855e-05, -2.977624535560608e-05, -2.8135254979133606e-05, -2.6494264602661133e-05, -2.485327422618866e-05, -2.3212283849716187e-05, -2.1571293473243713e-05, -1.993030309677124e-05, -1.8289312720298767e-05, -1.6648322343826294e-05, -1.500733196735382e-05, -1.3366341590881348e-05, -1.1725351214408875e-05, -1.0084360837936401e-05, -8.443370461463928e-06, -6.802380084991455e-06, -5.161389708518982e-06, -3.520399332046509e-06, -1.8794089555740356e-06, -2.384185791015625e-07, 1.4025717973709106e-06, 3.043562173843384e-06, 4.684552550315857e-06, 6.32554292678833e-06, 7.966533303260803e-06, 9.607523679733276e-06, 1.124851405620575e-05, 1.2889504432678223e-05, 1.4530494809150696e-05, 1.617148518562317e-05, 1.7812475562095642e-05, 1.9453465938568115e-05, 2.109445631504059e-05, 2.273544669151306e-05, 2.4376437067985535e-05, 2.6017427444458008e-05, 2.765841782093048e-05, 2.9299408197402954e-05, 3.094039857387543e-05, 3.25813889503479e-05, 3.4222379326820374e-05, 3.586336970329285e-05, 3.750436007976532e-05, 3.914535045623779e-05, 4.0786340832710266e-05, 4.242733120918274e-05, 4.406832158565521e-05, 4.5709311962127686e-05, 4.735030233860016e-05, 4.899129271507263e-05, 5.0632283091545105e-05, 5.227327346801758e-05]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 7.0, 3.0, 9.0, 8.0, 7.0, 21.0, 29.0, 46.0, 72.0, 139.0, 261.0, 498.0, 1116.0, 2872.0, 8265.0, 36688.0, 349201.0, 587197.0, 46429.0, 9958.0, 3229.0, 1325.0, 584.0, 266.0, 133.0, 76.0, 57.0, 20.0, 17.0, 7.0, 10.0, 7.0, 0.0, 0.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.481201171875, -0.46855926513671875, -0.4559173583984375, -0.44327545166015625, -0.430633544921875, -0.41799163818359375, -0.4053497314453125, -0.39270782470703125, -0.38006591796875, -0.36742401123046875, -0.3547821044921875, -0.34214019775390625, -0.329498291015625, -0.31685638427734375, -0.3042144775390625, -0.29157257080078125, -0.2789306640625, -0.26628875732421875, -0.2536468505859375, -0.24100494384765625, -0.228363037109375, -0.21572113037109375, -0.2030792236328125, -0.19043731689453125, -0.17779541015625, -0.16515350341796875, -0.1525115966796875, -0.13986968994140625, -0.127227783203125, -0.11458587646484375, -0.1019439697265625, -0.08930206298828125, -0.07666015625, -0.06401824951171875, -0.0513763427734375, -0.03873443603515625, -0.026092529296875, -0.01345062255859375, -0.0008087158203125, 0.01183319091796875, 0.02447509765625, 0.03711700439453125, 0.0497589111328125, 0.06240081787109375, 0.075042724609375, 0.08768463134765625, 0.1003265380859375, 0.11296844482421875, 0.1256103515625, 0.13825225830078125, 0.1508941650390625, 0.16353607177734375, 0.176177978515625, 0.18881988525390625, 0.2014617919921875, 0.21410369873046875, 0.22674560546875, 0.23938751220703125, 0.2520294189453125, 0.26467132568359375, 0.277313232421875, 0.28995513916015625, 0.3025970458984375, 0.31523895263671875, 0.327880859375]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 6.0, 1.0, 5.0, 7.0, 11.0, 10.0, 11.0, 14.0, 19.0, 32.0, 41.0, 52.0, 57.0, 124.0, 227.0, 118.0, 76.0, 42.0, 26.0, 24.0, 25.0, 12.0, 22.0, 12.0, 1.0, 7.0, 7.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.1710205078125, -0.16592788696289062, -0.16083526611328125, -0.15574264526367188, -0.1506500244140625, -0.14555740356445312, -0.14046478271484375, -0.13537216186523438, -0.130279541015625, -0.12518692016601562, -0.12009429931640625, -0.11500167846679688, -0.1099090576171875, -0.10481643676757812, -0.09972381591796875, -0.09463119506835938, -0.08953857421875, -0.08444595336914062, -0.07935333251953125, -0.07426071166992188, -0.0691680908203125, -0.06407546997070312, -0.05898284912109375, -0.053890228271484375, -0.048797607421875, -0.043704986572265625, -0.03861236572265625, -0.033519744873046875, -0.0284271240234375, -0.023334503173828125, -0.01824188232421875, -0.013149261474609375, -0.008056640625, -0.002964019775390625, 0.00212860107421875, 0.007221221923828125, 0.0123138427734375, 0.017406463623046875, 0.02249908447265625, 0.027591705322265625, 0.032684326171875, 0.037776947021484375, 0.04286956787109375, 0.047962188720703125, 0.0530548095703125, 0.058147430419921875, 0.06324005126953125, 0.06833267211914062, 0.07342529296875, 0.07851791381835938, 0.08361053466796875, 0.08870315551757812, 0.0937957763671875, 0.09888839721679688, 0.10398101806640625, 0.10907363891601562, 0.114166259765625, 0.11925888061523438, 0.12435150146484375, 0.12944412231445312, 0.1345367431640625, 0.13962936401367188, 0.14472198486328125, 0.14981460571289062, 0.1549072265625]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 12.0, 25.0, 63.0, 177.0, 299.0, 251.0, 107.0, 44.0, 16.0, 7.0, 1.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.379422187805176, -6.131861686706543, -5.88430118560791, -5.636740684509277, -5.3891801834106445, -5.141619682312012, -4.894059181213379, -4.646498203277588, -4.398937702178955, -4.151377201080322, -3.9038166999816895, -3.6562561988830566, -3.4086954593658447, -3.161134958267212, -2.913574457168579, -2.666013717651367, -2.4184534549713135, -2.1708929538726807, -1.9233323335647583, -1.6757718324661255, -1.4282112121582031, -1.1806507110595703, -0.9330902099609375, -0.6855295896530151, -0.4379690885543823, -0.19040854275226593, 0.057152003049850464, 0.30471253395080566, 0.5522730946540833, 0.7998336553573608, 1.0473941564559937, 1.294954776763916, 1.5425152778625488, 1.7900757789611816, 2.0376362800598145, 2.2851967811584473, 2.532757520675659, 2.780318021774292, 3.027878522872925, 3.2754392623901367, 3.5229997634887695, 3.7705602645874023, 4.018120765686035, 4.265681266784668, 4.513241767883301, 4.760802268981934, 5.008362770080566, 5.255923748016357, 5.503483772277832, 5.751044273376465, 5.998604774475098, 6.2461652755737305, 6.493725776672363, 6.741286277770996, 6.988846778869629, 7.23640775680542, 7.483968257904053, 7.7315287590026855, 7.979089260101318, 8.22665023803711, 8.474210739135742, 8.721771240234375, 8.969331741333008, 9.21689224243164, 9.464452743530273]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 7.0, 4.0, 7.0, 9.0, 20.0, 16.0, 17.0, 20.0, 24.0, 20.0, 22.0, 26.0, 28.0, 27.0, 25.0, 32.0, 43.0, 39.0, 46.0, 39.0, 47.0, 46.0, 32.0, 45.0, 32.0, 30.0, 43.0, 34.0, 23.0, 25.0, 25.0, 18.0, 24.0, 23.0, 26.0, 14.0, 10.0, 7.0, 7.0, 7.0, 2.0, 3.0, 6.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.488837242126465, -2.3934450149536133, -2.298053026199341, -2.2026607990264893, -2.107268810272217, -2.0118765830993652, -1.9164844751358032, -1.8210923671722412, -1.7257002592086792, -1.6303081512451172, -1.5349160432815552, -1.4395239353179932, -1.3441317081451416, -1.2487397193908691, -1.1533474922180176, -1.0579553842544556, -0.9625632762908936, -0.8671711683273315, -0.7717790603637695, -0.6763868927955627, -0.5809947848320007, -0.4856026768684387, -0.39021050930023193, -0.2948184013366699, -0.1994262933731079, -0.1040341705083847, -0.008642047643661499, 0.0867500901222229, 0.1821421980857849, 0.2775343060493469, 0.3729264736175537, 0.4683185815811157, 0.5637104511260986, 0.6591025590896606, 0.7544946670532227, 0.8498868346214294, 0.9452789425849915, 1.0406711101531982, 1.1360632181167603, 1.2314553260803223, 1.3268474340438843, 1.4222395420074463, 1.5176316499710083, 1.6130237579345703, 1.7084159851074219, 1.8038079738616943, 1.899200201034546, 1.994592308998108, 2.08998441696167, 2.1853766441345215, 2.280768632888794, 2.3761608600616455, 2.471552848815918, 2.5669450759887695, 2.662337303161621, 2.7577292919158936, 2.853121280670166, 2.9485135078430176, 3.04390549659729, 3.1392977237701416, 3.234689712524414, 3.3300819396972656, 3.425474166870117, 3.5208661556243896, 3.616258382797241]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 3.0, 10.0, 9.0, 19.0, 29.0, 35.0, 62.0, 61.0, 89.0, 131.0, 209.0, 349.0, 671.0, 1414.0, 3626.0, 12506.0, 79791.0, 2409531.0, 1614004.0, 55342.0, 9921.0, 3197.0, 1387.0, 697.0, 405.0, 246.0, 173.0, 110.0, 87.0, 46.0, 42.0, 25.0, 16.0, 12.0, 9.0, 8.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8798828125, -1.8101043701171875, -1.740325927734375, -1.6705474853515625, -1.60076904296875, -1.5309906005859375, -1.461212158203125, -1.3914337158203125, -1.3216552734375, -1.2518768310546875, -1.182098388671875, -1.1123199462890625, -1.04254150390625, -0.9727630615234375, -0.902984619140625, -0.8332061767578125, -0.763427734375, -0.6936492919921875, -0.623870849609375, -0.5540924072265625, -0.48431396484375, -0.4145355224609375, -0.344757080078125, -0.2749786376953125, -0.2052001953125, -0.1354217529296875, -0.065643310546875, 0.0041351318359375, 0.07391357421875, 0.1436920166015625, 0.213470458984375, 0.2832489013671875, 0.35302734375, 0.4228057861328125, 0.492584228515625, 0.5623626708984375, 0.63214111328125, 0.7019195556640625, 0.771697998046875, 0.8414764404296875, 0.9112548828125, 0.9810333251953125, 1.050811767578125, 1.1205902099609375, 1.19036865234375, 1.2601470947265625, 1.329925537109375, 1.3997039794921875, 1.469482421875, 1.5392608642578125, 1.609039306640625, 1.6788177490234375, 1.74859619140625, 1.8183746337890625, 1.888153076171875, 1.9579315185546875, 2.0277099609375, 2.0974884033203125, 2.167266845703125, 2.2370452880859375, 2.30682373046875, 2.3766021728515625, 2.446380615234375, 2.5161590576171875, 2.5859375]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 7.0, 8.0, 6.0, 8.0, 8.0, 15.0, 11.0, 18.0, 26.0, 24.0, 27.0, 32.0, 38.0, 50.0, 55.0, 53.0, 51.0, 61.0, 52.0, 59.0, 47.0, 62.0, 44.0, 38.0, 27.0, 25.0, 29.0, 22.0, 18.0, 19.0, 14.0, 8.0, 8.0, 6.0, 5.0, 3.0, 4.0, 4.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.7734375, -0.7469863891601562, -0.7205352783203125, -0.6940841674804688, -0.667633056640625, -0.6411819458007812, -0.6147308349609375, -0.5882797241210938, -0.56182861328125, -0.5353775024414062, -0.5089263916015625, -0.48247528076171875, -0.456024169921875, -0.42957305908203125, -0.4031219482421875, -0.37667083740234375, -0.3502197265625, -0.32376861572265625, -0.2973175048828125, -0.27086639404296875, -0.244415283203125, -0.21796417236328125, -0.1915130615234375, -0.16506195068359375, -0.13861083984375, -0.11215972900390625, -0.0857086181640625, -0.05925750732421875, -0.032806396484375, -0.00635528564453125, 0.0200958251953125, 0.04654693603515625, 0.072998046875, 0.09944915771484375, 0.1259002685546875, 0.15235137939453125, 0.178802490234375, 0.20525360107421875, 0.2317047119140625, 0.25815582275390625, 0.28460693359375, 0.31105804443359375, 0.3375091552734375, 0.36396026611328125, 0.390411376953125, 0.41686248779296875, 0.4433135986328125, 0.46976470947265625, 0.4962158203125, 0.5226669311523438, 0.5491180419921875, 0.5755691528320312, 0.602020263671875, 0.6284713745117188, 0.6549224853515625, 0.6813735961914062, 0.70782470703125, 0.7342758178710938, 0.7607269287109375, 0.7871780395507812, 0.813629150390625, 0.8400802612304688, 0.8665313720703125, 0.8929824829101562, 0.91943359375]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 9.0, 3.0, 8.0, 7.0, 17.0, 20.0, 32.0, 49.0, 76.0, 118.0, 217.0, 419.0, 912.0, 2536.0, 8230.0, 38220.0, 369612.0, 3483675.0, 248621.0, 30618.0, 6985.0, 2112.0, 865.0, 407.0, 202.0, 99.0, 65.0, 49.0, 23.0, 24.0, 18.0, 9.0, 7.0, 9.0, 6.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.189453125, -2.1219482421875, -2.054443359375, -1.9869384765625, -1.91943359375, -1.8519287109375, -1.784423828125, -1.7169189453125, -1.6494140625, -1.5819091796875, -1.514404296875, -1.4468994140625, -1.37939453125, -1.3118896484375, -1.244384765625, -1.1768798828125, -1.109375, -1.0418701171875, -0.974365234375, -0.9068603515625, -0.83935546875, -0.7718505859375, -0.704345703125, -0.6368408203125, -0.5693359375, -0.5018310546875, -0.434326171875, -0.3668212890625, -0.29931640625, -0.2318115234375, -0.164306640625, -0.0968017578125, -0.029296875, 0.0382080078125, 0.105712890625, 0.1732177734375, 0.24072265625, 0.3082275390625, 0.375732421875, 0.4432373046875, 0.5107421875, 0.5782470703125, 0.645751953125, 0.7132568359375, 0.78076171875, 0.8482666015625, 0.915771484375, 0.9832763671875, 1.05078125, 1.1182861328125, 1.185791015625, 1.2532958984375, 1.32080078125, 1.3883056640625, 1.455810546875, 1.5233154296875, 1.5908203125, 1.6583251953125, 1.725830078125, 1.7933349609375, 1.86083984375, 1.9283447265625, 1.995849609375, 2.0633544921875, 2.130859375]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 6.0, 3.0, 6.0, 8.0, 13.0, 14.0, 21.0, 37.0, 57.0, 76.0, 92.0, 180.0, 338.0, 646.0, 851.0, 697.0, 439.0, 247.0, 123.0, 71.0, 53.0, 26.0, 28.0, 15.0, 14.0, 9.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.60107421875, -0.5800857543945312, -0.5590972900390625, -0.5381088256835938, -0.517120361328125, -0.49613189697265625, -0.4751434326171875, -0.45415496826171875, -0.43316650390625, -0.41217803955078125, -0.3911895751953125, -0.37020111083984375, -0.349212646484375, -0.32822418212890625, -0.3072357177734375, -0.28624725341796875, -0.2652587890625, -0.24427032470703125, -0.2232818603515625, -0.20229339599609375, -0.181304931640625, -0.16031646728515625, -0.1393280029296875, -0.11833953857421875, -0.09735107421875, -0.07636260986328125, -0.0553741455078125, -0.03438568115234375, -0.013397216796875, 0.00759124755859375, 0.0285797119140625, 0.04956817626953125, 0.070556640625, 0.09154510498046875, 0.1125335693359375, 0.13352203369140625, 0.154510498046875, 0.17549896240234375, 0.1964874267578125, 0.21747589111328125, 0.23846435546875, 0.25945281982421875, 0.2804412841796875, 0.30142974853515625, 0.322418212890625, 0.34340667724609375, 0.3643951416015625, 0.38538360595703125, 0.4063720703125, 0.42736053466796875, 0.4483489990234375, 0.46933746337890625, 0.490325927734375, 0.5113143920898438, 0.5323028564453125, 0.5532913208007812, 0.57427978515625, 0.5952682495117188, 0.6162567138671875, 0.6372451782226562, 0.658233642578125, 0.6792221069335938, 0.7002105712890625, 0.7211990356445312, 0.7421875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 8.0, 11.0, 16.0, 30.0, 39.0, 55.0, 61.0, 80.0, 109.0, 116.0, 125.0, 85.0, 75.0, 64.0, 40.0, 27.0, 24.0, 12.0, 12.0, 5.0, 5.0, 5.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.662935733795166, -2.590834856033325, -2.5187339782714844, -2.4466331005096436, -2.3745322227478027, -2.302431344985962, -2.230330467224121, -2.1582295894622803, -2.0861287117004395, -2.0140278339385986, -1.9419269561767578, -1.869826078414917, -1.7977252006530762, -1.7256243228912354, -1.6535234451293945, -1.5814225673675537, -1.5093215703964233, -1.4372206926345825, -1.3651198148727417, -1.2930189371109009, -1.22091805934906, -1.1488171815872192, -1.0767161846160889, -1.004615306854248, -0.932514488697052, -0.8604136109352112, -0.7883127331733704, -0.7162117958068848, -0.644110918045044, -0.5720100402832031, -0.4999091625213623, -0.4278082847595215, -0.3557075262069702, -0.2836066484451294, -0.21150575578212738, -0.13940486311912537, -0.06730398535728455, 0.004796892404556274, 0.07689779996871948, 0.1489986777305603, 0.22109955549240112, 0.29320043325424194, 0.36530131101608276, 0.43740221858024597, 0.5095031261444092, 0.58160400390625, 0.6537048816680908, 0.7258057594299316, 0.7979066371917725, 0.8700075149536133, 0.9421083927154541, 1.014209270477295, 1.0863101482391357, 1.1584110260009766, 1.2305119037628174, 1.3026127815246582, 1.374713659286499, 1.4468145370483398, 1.5189154148101807, 1.5910162925720215, 1.6631171703338623, 1.7352180480957031, 1.807318925857544, 1.8794198036193848, 1.9515208005905151]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [6.0, 2.0, 1.0, 3.0, 4.0, 3.0, 2.0, 7.0, 6.0, 4.0, 7.0, 9.0, 19.0, 25.0, 24.0, 30.0, 22.0, 26.0, 27.0, 37.0, 25.0, 48.0, 41.0, 40.0, 32.0, 49.0, 44.0, 47.0, 41.0, 29.0, 36.0, 41.0, 33.0, 34.0, 31.0, 25.0, 20.0, 18.0, 20.0, 15.0, 15.0, 7.0, 12.0, 11.0, 6.0, 5.0, 2.0, 7.0, 6.0, 2.0, 4.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8608332276344299, -0.8293626308441162, -0.7978919744491577, -0.766421377658844, -0.7349507808685303, -0.7034801244735718, -0.6720095276832581, -0.6405389308929443, -0.6090682744979858, -0.5775976777076721, -0.5461270213127136, -0.5146564245223999, -0.4831857979297638, -0.4517151713371277, -0.42024457454681396, -0.38877394795417786, -0.35730332136154175, -0.32583269476890564, -0.29436206817626953, -0.2628914713859558, -0.2314208447933197, -0.1999502182006836, -0.16847960650920868, -0.13700899481773376, -0.10553836822509766, -0.07406774908304214, -0.04259712994098663, -0.011126510798931122, 0.02034410834312439, 0.0518147349357605, 0.08328534662723541, 0.11475595831871033, 0.1462266445159912, 0.17769727110862732, 0.20916788280010223, 0.24063849449157715, 0.27210912108421326, 0.30357974767684937, 0.3350503444671631, 0.3665209710597992, 0.3979915976524353, 0.4294622242450714, 0.4609328508377075, 0.49240344762802124, 0.523874044418335, 0.5553447008132935, 0.5868152976036072, 0.6182858943939209, 0.6497565507888794, 0.6812271475791931, 0.7126978039741516, 0.7441684007644653, 0.7756390571594238, 0.8071096539497375, 0.8385802507400513, 0.8700509071350098, 0.9015215039253235, 0.9329921007156372, 0.9644627571105957, 0.9959333539009094, 1.0274039506912231, 1.0588746070861816, 1.0903452634811401, 1.121815800666809, 1.1532864570617676]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 12.0, 12.0, 13.0, 14.0, 29.0, 34.0, 79.0, 89.0, 163.0, 238.0, 348.0, 597.0, 970.0, 1746.0, 3273.0, 6646.0, 15230.0, 41501.0, 142606.0, 400905.0, 297755.0, 87128.0, 27372.0, 10684.0, 4911.0, 2630.0, 1428.0, 770.0, 502.0, 274.0, 182.0, 112.0, 81.0, 58.0, 43.0, 29.0, 16.0, 20.0, 16.0, 8.0, 9.0, 2.0, 7.0, 3.0, 5.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.239501953125, -0.23056793212890625, -0.2216339111328125, -0.21269989013671875, -0.203765869140625, -0.19483184814453125, -0.1858978271484375, -0.17696380615234375, -0.16802978515625, -0.15909576416015625, -0.1501617431640625, -0.14122772216796875, -0.132293701171875, -0.12335968017578125, -0.1144256591796875, -0.10549163818359375, -0.0965576171875, -0.08762359619140625, -0.0786895751953125, -0.06975555419921875, -0.060821533203125, -0.05188751220703125, -0.0429534912109375, -0.03401947021484375, -0.02508544921875, -0.01615142822265625, -0.0072174072265625, 0.00171661376953125, 0.010650634765625, 0.01958465576171875, 0.0285186767578125, 0.03745269775390625, 0.04638671875, 0.05532073974609375, 0.0642547607421875, 0.07318878173828125, 0.082122802734375, 0.09105682373046875, 0.0999908447265625, 0.10892486572265625, 0.11785888671875, 0.12679290771484375, 0.1357269287109375, 0.14466094970703125, 0.153594970703125, 0.16252899169921875, 0.1714630126953125, 0.18039703369140625, 0.1893310546875, 0.19826507568359375, 0.2071990966796875, 0.21613311767578125, 0.225067138671875, 0.23400115966796875, 0.2429351806640625, 0.25186920166015625, 0.26080322265625, 0.26973724365234375, 0.2786712646484375, 0.28760528564453125, 0.296539306640625, 0.30547332763671875, 0.3144073486328125, 0.32334136962890625, 0.332275390625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 4.0, 4.0, 2.0, 4.0, 1.0, 3.0, 7.0, 11.0, 12.0, 12.0, 20.0, 34.0, 18.0, 32.0, 26.0, 30.0, 37.0, 47.0, 44.0, 38.0, 48.0, 50.0, 59.0, 53.0, 50.0, 39.0, 47.0, 44.0, 40.0, 32.0, 24.0, 21.0, 24.0, 15.0, 12.0, 13.0, 10.0, 9.0, 6.0, 7.0, 8.0, 1.0, 4.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.54150390625, -0.5185775756835938, -0.4956512451171875, -0.47272491455078125, -0.449798583984375, -0.42687225341796875, -0.4039459228515625, -0.38101959228515625, -0.35809326171875, -0.33516693115234375, -0.3122406005859375, -0.28931427001953125, -0.266387939453125, -0.24346160888671875, -0.2205352783203125, -0.19760894775390625, -0.1746826171875, -0.15175628662109375, -0.1288299560546875, -0.10590362548828125, -0.082977294921875, -0.06005096435546875, -0.0371246337890625, -0.01419830322265625, 0.00872802734375, 0.03165435791015625, 0.0545806884765625, 0.07750701904296875, 0.100433349609375, 0.12335968017578125, 0.1462860107421875, 0.16921234130859375, 0.192138671875, 0.21506500244140625, 0.2379913330078125, 0.26091766357421875, 0.283843994140625, 0.30677032470703125, 0.3296966552734375, 0.35262298583984375, 0.37554931640625, 0.39847564697265625, 0.4214019775390625, 0.44432830810546875, 0.467254638671875, 0.49018096923828125, 0.5131072998046875, 0.5360336303710938, 0.5589599609375, 0.5818862915039062, 0.6048126220703125, 0.6277389526367188, 0.650665283203125, 0.6735916137695312, 0.6965179443359375, 0.7194442749023438, 0.74237060546875, 0.7652969360351562, 0.7882232666015625, 0.8111495971679688, 0.834075927734375, 0.8570022583007812, 0.8799285888671875, 0.9028549194335938, 0.92578125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 6.0, 5.0, 5.0, 10.0, 14.0, 18.0, 20.0, 33.0, 40.0, 58.0, 76.0, 101.0, 186.0, 342.0, 521.0, 1015.0, 2200.0, 5354.0, 17169.0, 83928.0, 465929.0, 384422.0, 63828.0, 14351.0, 4623.0, 2019.0, 891.0, 494.0, 300.0, 176.0, 128.0, 76.0, 49.0, 43.0, 34.0, 22.0, 16.0, 16.0, 10.0, 6.0, 9.0, 0.0, 3.0, 5.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.29736328125, -0.2874259948730469, -0.27748870849609375, -0.2675514221191406, -0.2576141357421875, -0.24767684936523438, -0.23773956298828125, -0.22780227661132812, -0.217864990234375, -0.20792770385742188, -0.19799041748046875, -0.18805313110351562, -0.1781158447265625, -0.16817855834960938, -0.15824127197265625, -0.14830398559570312, -0.13836669921875, -0.12842941284179688, -0.11849212646484375, -0.10855484008789062, -0.0986175537109375, -0.08868026733398438, -0.07874298095703125, -0.06880569458007812, -0.058868408203125, -0.048931121826171875, -0.03899383544921875, -0.029056549072265625, -0.0191192626953125, -0.009181976318359375, 0.00075531005859375, 0.010692596435546875, 0.0206298828125, 0.030567169189453125, 0.04050445556640625, 0.050441741943359375, 0.0603790283203125, 0.07031631469726562, 0.08025360107421875, 0.09019088745117188, 0.100128173828125, 0.11006546020507812, 0.12000274658203125, 0.12994003295898438, 0.1398773193359375, 0.14981460571289062, 0.15975189208984375, 0.16968917846679688, 0.17962646484375, 0.18956375122070312, 0.19950103759765625, 0.20943832397460938, 0.2193756103515625, 0.22931289672851562, 0.23925018310546875, 0.24918746948242188, 0.259124755859375, 0.2690620422363281, 0.27899932861328125, 0.2889366149902344, 0.2988739013671875, 0.3088111877441406, 0.31874847412109375, 0.3286857604980469, 0.338623046875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 4.0, 3.0, 2.0, 6.0, 11.0, 7.0, 11.0, 13.0, 11.0, 17.0, 17.0, 17.0, 21.0, 28.0, 28.0, 35.0, 24.0, 39.0, 28.0, 32.0, 50.0, 37.0, 45.0, 48.0, 49.0, 46.0, 38.0, 31.0, 41.0, 41.0, 33.0, 24.0, 26.0, 23.0, 17.0, 19.0, 9.0, 17.0, 5.0, 13.0, 5.0, 11.0, 5.0, 4.0, 5.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.3642578125, -1.3227081298828125, -1.281158447265625, -1.2396087646484375, -1.19805908203125, -1.1565093994140625, -1.114959716796875, -1.0734100341796875, -1.0318603515625, -0.9903106689453125, -0.948760986328125, -0.9072113037109375, -0.86566162109375, -0.8241119384765625, -0.782562255859375, -0.7410125732421875, -0.699462890625, -0.6579132080078125, -0.616363525390625, -0.5748138427734375, -0.53326416015625, -0.4917144775390625, -0.450164794921875, -0.4086151123046875, -0.3670654296875, -0.3255157470703125, -0.283966064453125, -0.2424163818359375, -0.20086669921875, -0.1593170166015625, -0.117767333984375, -0.0762176513671875, -0.03466796875, 0.0068817138671875, 0.048431396484375, 0.0899810791015625, 0.13153076171875, 0.1730804443359375, 0.214630126953125, 0.2561798095703125, 0.2977294921875, 0.3392791748046875, 0.380828857421875, 0.4223785400390625, 0.46392822265625, 0.5054779052734375, 0.547027587890625, 0.5885772705078125, 0.630126953125, 0.6716766357421875, 0.713226318359375, 0.7547760009765625, 0.79632568359375, 0.8378753662109375, 0.879425048828125, 0.9209747314453125, 0.9625244140625, 1.0040740966796875, 1.045623779296875, 1.0871734619140625, 1.12872314453125, 1.1702728271484375, 1.211822509765625, 1.2533721923828125, 1.294921875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 5.0, 4.0, 2.0, 2.0, 12.0, 8.0, 19.0, 23.0, 31.0, 56.0, 68.0, 146.0, 222.0, 339.0, 668.0, 1399.0, 3243.0, 8585.0, 29390.0, 152246.0, 614275.0, 186883.0, 34442.0, 9673.0, 3534.0, 1519.0, 743.0, 388.0, 217.0, 136.0, 95.0, 53.0, 42.0, 25.0, 21.0, 18.0, 4.0, 5.0, 4.0, 3.0, 5.0, 2.0, 3.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.157470703125, -0.15231704711914062, -0.14716339111328125, -0.14200973510742188, -0.1368560791015625, -0.13170242309570312, -0.12654876708984375, -0.12139511108398438, -0.116241455078125, -0.11108779907226562, -0.10593414306640625, -0.10078048706054688, -0.0956268310546875, -0.09047317504882812, -0.08531951904296875, -0.08016586303710938, -0.07501220703125, -0.06985855102539062, -0.06470489501953125, -0.059551239013671875, -0.0543975830078125, -0.049243927001953125, -0.04409027099609375, -0.038936614990234375, -0.033782958984375, -0.028629302978515625, -0.02347564697265625, -0.018321990966796875, -0.0131683349609375, -0.008014678955078125, -0.00286102294921875, 0.002292633056640625, 0.0074462890625, 0.012599945068359375, 0.01775360107421875, 0.022907257080078125, 0.0280609130859375, 0.033214569091796875, 0.03836822509765625, 0.043521881103515625, 0.048675537109375, 0.053829193115234375, 0.05898284912109375, 0.06413650512695312, 0.0692901611328125, 0.07444381713867188, 0.07959747314453125, 0.08475112915039062, 0.08990478515625, 0.09505844116210938, 0.10021209716796875, 0.10536575317382812, 0.1105194091796875, 0.11567306518554688, 0.12082672119140625, 0.12598037719726562, 0.131134033203125, 0.13628768920898438, 0.14144134521484375, 0.14659500122070312, 0.1517486572265625, 0.15690231323242188, 0.16205596923828125, 0.16720962524414062, 0.17236328125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 3.0, 5.0, 12.0, 4.0, 18.0, 18.0, 43.0, 47.0, 40.0, 79.0, 95.0, 141.0, 128.0, 103.0, 79.0, 54.0, 38.0, 28.0, 25.0, 9.0, 6.0, 4.0, 7.0, 3.0, 4.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.881092071533203e-05, -8.602533489465714e-05, -8.323974907398224e-05, -8.045416325330734e-05, -7.766857743263245e-05, -7.488299161195755e-05, -7.209740579128265e-05, -6.931181997060776e-05, -6.652623414993286e-05, -6.374064832925797e-05, -6.095506250858307e-05, -5.816947668790817e-05, -5.5383890867233276e-05, -5.259830504655838e-05, -4.9812719225883484e-05, -4.702713340520859e-05, -4.424154758453369e-05, -4.1455961763858795e-05, -3.86703759431839e-05, -3.5884790122509e-05, -3.3099204301834106e-05, -3.031361848115921e-05, -2.7528032660484314e-05, -2.4742446839809418e-05, -2.195686101913452e-05, -1.9171275198459625e-05, -1.638568937778473e-05, -1.3600103557109833e-05, -1.0814517736434937e-05, -8.02893191576004e-06, -5.243346095085144e-06, -2.457760274410248e-06, 3.2782554626464844e-07, 3.1134113669395447e-06, 5.898997187614441e-06, 8.684583008289337e-06, 1.1470168828964233e-05, 1.425575464963913e-05, 1.7041340470314026e-05, 1.9826926290988922e-05, 2.261251211166382e-05, 2.5398097932338715e-05, 2.818368375301361e-05, 3.096926957368851e-05, 3.37548553943634e-05, 3.65404412150383e-05, 3.9326027035713196e-05, 4.211161285638809e-05, 4.489719867706299e-05, 4.7682784497737885e-05, 5.046837031841278e-05, 5.325395613908768e-05, 5.603954195976257e-05, 5.882512778043747e-05, 6.161071360111237e-05, 6.439629942178726e-05, 6.718188524246216e-05, 6.996747106313705e-05, 7.275305688381195e-05, 7.553864270448685e-05, 7.832422852516174e-05, 8.110981434583664e-05, 8.389540016651154e-05, 8.668098598718643e-05, 8.946657180786133e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 8.0, 3.0, 7.0, 9.0, 18.0, 24.0, 33.0, 53.0, 107.0, 156.0, 332.0, 527.0, 1026.0, 2042.0, 4215.0, 9365.0, 21958.0, 60656.0, 191737.0, 437775.0, 209615.0, 66369.0, 23692.0, 9778.0, 4488.0, 2131.0, 1096.0, 585.0, 317.0, 171.0, 91.0, 63.0, 39.0, 24.0, 18.0, 10.0, 5.0, 7.0, 1.0, 2.0, 10.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.156005859375, -0.1514892578125, -0.14697265625, -0.1424560546875, -0.137939453125, -0.1334228515625, -0.12890625, -0.1243896484375, -0.119873046875, -0.1153564453125, -0.11083984375, -0.1063232421875, -0.101806640625, -0.0972900390625, -0.0927734375, -0.0882568359375, -0.083740234375, -0.0792236328125, -0.07470703125, -0.0701904296875, -0.065673828125, -0.0611572265625, -0.056640625, -0.0521240234375, -0.047607421875, -0.0430908203125, -0.03857421875, -0.0340576171875, -0.029541015625, -0.0250244140625, -0.0205078125, -0.0159912109375, -0.011474609375, -0.0069580078125, -0.00244140625, 0.0020751953125, 0.006591796875, 0.0111083984375, 0.015625, 0.0201416015625, 0.024658203125, 0.0291748046875, 0.03369140625, 0.0382080078125, 0.042724609375, 0.0472412109375, 0.0517578125, 0.0562744140625, 0.060791015625, 0.0653076171875, 0.06982421875, 0.0743408203125, 0.078857421875, 0.0833740234375, 0.087890625, 0.0924072265625, 0.096923828125, 0.1014404296875, 0.10595703125, 0.1104736328125, 0.114990234375, 0.1195068359375, 0.1240234375, 0.1285400390625, 0.133056640625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 6.0, 4.0, 5.0, 11.0, 9.0, 6.0, 18.0, 17.0, 34.0, 29.0, 44.0, 47.0, 58.0, 82.0, 101.0, 105.0, 88.0, 70.0, 55.0, 49.0, 34.0, 30.0, 21.0, 21.0, 14.0, 13.0, 7.0, 4.0, 15.0, 3.0, 1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03411865234375, -0.032857418060302734, -0.03159618377685547, -0.030334949493408203, -0.029073715209960938, -0.027812480926513672, -0.026551246643066406, -0.02529001235961914, -0.024028778076171875, -0.02276754379272461, -0.021506309509277344, -0.020245075225830078, -0.018983840942382812, -0.017722606658935547, -0.01646137237548828, -0.015200138092041016, -0.01393890380859375, -0.012677669525146484, -0.011416435241699219, -0.010155200958251953, -0.008893966674804688, -0.007632732391357422, -0.006371498107910156, -0.005110263824462891, -0.003849029541015625, -0.0025877952575683594, -0.0013265609741210938, -6.532669067382812e-05, 0.0011959075927734375, 0.002457141876220703, 0.0037183761596679688, 0.004979610443115234, 0.0062408447265625, 0.007502079010009766, 0.008763313293457031, 0.010024547576904297, 0.011285781860351562, 0.012547016143798828, 0.013808250427246094, 0.01506948471069336, 0.016330718994140625, 0.01759195327758789, 0.018853187561035156, 0.020114421844482422, 0.021375656127929688, 0.022636890411376953, 0.02389812469482422, 0.025159358978271484, 0.02642059326171875, 0.027681827545166016, 0.02894306182861328, 0.030204296112060547, 0.03146553039550781, 0.03272676467895508, 0.033987998962402344, 0.03524923324584961, 0.036510467529296875, 0.03777170181274414, 0.039032936096191406, 0.04029417037963867, 0.04155540466308594, 0.0428166389465332, 0.04407787322998047, 0.045339107513427734, 0.046600341796875]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 6.0, 12.0, 19.0, 32.0, 56.0, 62.0, 87.0, 106.0, 145.0, 157.0, 94.0, 73.0, 56.0, 37.0, 30.0, 7.0, 13.0, 7.0, 5.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0202512741088867, -1.96947181224823, -1.9186922311782837, -1.867912769317627, -1.8171331882476807, -1.766353726387024, -1.7155742645263672, -1.664794683456421, -1.6140152215957642, -1.5632357597351074, -1.5124561786651611, -1.4616767168045044, -1.4108972549438477, -1.3601176738739014, -1.3093382120132446, -1.258558750152588, -1.2077791690826416, -1.1569997072219849, -1.1062201261520386, -1.0554406642913818, -1.0046610832214355, -0.9538816213607788, -0.9031021595001221, -0.8523226380348206, -0.801543116569519, -0.7507635951042175, -0.699984073638916, -0.6492046117782593, -0.5984250903129578, -0.5476455688476562, -0.4968660771846771, -0.446086585521698, -0.39530718326568604, -0.3445276618003845, -0.2937481701374054, -0.24296866357326508, -0.19218915700912476, -0.14140963554382324, -0.09063014388084412, -0.03985065221786499, 0.010928869247436523, 0.06170837581157684, 0.11248788237571716, 0.16326738893985748, 0.2140468955039978, 0.2648264169692993, 0.31560590863227844, 0.36638540029525757, 0.4171649217605591, 0.4679444432258606, 0.5187239646911621, 0.5695034265518188, 0.6202829480171204, 0.6710624694824219, 0.7218419313430786, 0.7726214528083801, 0.8234009742736816, 0.8741804957389832, 0.9249600172042847, 0.9757394790649414, 1.0265190601348877, 1.0772985219955444, 1.1280779838562012, 1.1788575649261475, 1.2296370267868042]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 1.0, 3.0, 5.0, 4.0, 4.0, 2.0, 4.0, 7.0, 5.0, 5.0, 12.0, 15.0, 18.0, 27.0, 41.0, 31.0, 36.0, 44.0, 34.0, 40.0, 35.0, 49.0, 38.0, 57.0, 44.0, 49.0, 46.0, 47.0, 42.0, 41.0, 30.0, 28.0, 23.0, 30.0, 15.0, 16.0, 16.0, 14.0, 7.0, 9.0, 7.0, 5.0, 8.0, 3.0, 2.0, 0.0, 3.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.5690981149673462, -0.5480918884277344, -0.5270857214927673, -0.5060795545578003, -0.4850733280181885, -0.46406713128089905, -0.4430609345436096, -0.4220547378063202, -0.40104854106903076, -0.38004234433174133, -0.3590361475944519, -0.3380299508571625, -0.31702375411987305, -0.2960175573825836, -0.2750113606452942, -0.25400516390800476, -0.23299896717071533, -0.2119927704334259, -0.19098657369613647, -0.16998037695884705, -0.14897418022155762, -0.1279679834842682, -0.10696178674697876, -0.08595559000968933, -0.0649493932723999, -0.043943196535110474, -0.022936999797821045, -0.0019308030605316162, 0.019075393676757812, 0.04008159041404724, 0.06108778715133667, 0.0820939838886261, 0.1031002402305603, 0.12410643696784973, 0.14511263370513916, 0.1661188304424286, 0.18712502717971802, 0.20813122391700745, 0.22913742065429688, 0.2501436173915863, 0.27114981412887573, 0.29215601086616516, 0.3131622076034546, 0.334168404340744, 0.35517460107803345, 0.3761807978153229, 0.3971869945526123, 0.41819319128990173, 0.43919938802719116, 0.4602055847644806, 0.48121178150177, 0.5022180080413818, 0.5232241749763489, 0.5442303419113159, 0.5652365684509277, 0.5862427949905396, 0.6072489619255066, 0.6282551288604736, 0.6492613554000854, 0.6702675819396973, 0.6912737488746643, 0.7122799158096313, 0.7332861423492432, 0.754292368888855, 0.775298535823822]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 4.0, 5.0, 8.0, 14.0, 16.0, 14.0, 42.0, 58.0, 107.0, 185.0, 306.0, 508.0, 948.0, 1839.0, 3689.0, 8167.0, 19835.0, 56937.0, 273310.0, 527430.0, 101896.0, 30924.0, 11753.0, 5154.0, 2479.0, 1238.0, 670.0, 410.0, 224.0, 145.0, 100.0, 51.0, 34.0, 17.0, 13.0, 10.0, 5.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1357421875, -1.0981597900390625, -1.060577392578125, -1.0229949951171875, -0.98541259765625, -0.9478302001953125, -0.910247802734375, -0.8726654052734375, -0.8350830078125, -0.7975006103515625, -0.759918212890625, -0.7223358154296875, -0.68475341796875, -0.6471710205078125, -0.609588623046875, -0.5720062255859375, -0.534423828125, -0.4968414306640625, -0.459259033203125, -0.4216766357421875, -0.38409423828125, -0.3465118408203125, -0.308929443359375, -0.2713470458984375, -0.2337646484375, -0.1961822509765625, -0.158599853515625, -0.1210174560546875, -0.08343505859375, -0.0458526611328125, -0.008270263671875, 0.0293121337890625, 0.06689453125, 0.1044769287109375, 0.142059326171875, 0.1796417236328125, 0.21722412109375, 0.2548065185546875, 0.292388916015625, 0.3299713134765625, 0.3675537109375, 0.4051361083984375, 0.442718505859375, 0.4803009033203125, 0.51788330078125, 0.5554656982421875, 0.593048095703125, 0.6306304931640625, 0.668212890625, 0.7057952880859375, 0.743377685546875, 0.7809600830078125, 0.81854248046875, 0.8561248779296875, 0.893707275390625, 0.9312896728515625, 0.9688720703125, 1.0064544677734375, 1.044036865234375, 1.0816192626953125, 1.11920166015625, 1.1567840576171875, 1.194366455078125, 1.2319488525390625, 1.26953125]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 4.0, 1.0, 3.0, 4.0, 1.0, 3.0, 9.0, 11.0, 15.0, 17.0, 21.0, 37.0, 37.0, 32.0, 47.0, 41.0, 38.0, 47.0, 45.0, 53.0, 55.0, 45.0, 56.0, 54.0, 45.0, 45.0, 32.0, 19.0, 34.0, 26.0, 22.0, 17.0, 17.0, 19.0, 3.0, 11.0, 10.0, 7.0, 8.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.38671875, -1.338653564453125, -1.29058837890625, -1.242523193359375, -1.1944580078125, -1.146392822265625, -1.09832763671875, -1.050262451171875, -1.002197265625, -0.954132080078125, -0.90606689453125, -0.858001708984375, -0.8099365234375, -0.761871337890625, -0.71380615234375, -0.665740966796875, -0.61767578125, -0.569610595703125, -0.52154541015625, -0.473480224609375, -0.4254150390625, -0.377349853515625, -0.32928466796875, -0.281219482421875, -0.233154296875, -0.185089111328125, -0.13702392578125, -0.088958740234375, -0.0408935546875, 0.007171630859375, 0.05523681640625, 0.103302001953125, 0.1513671875, 0.199432373046875, 0.24749755859375, 0.295562744140625, 0.3436279296875, 0.391693115234375, 0.43975830078125, 0.487823486328125, 0.535888671875, 0.583953857421875, 0.63201904296875, 0.680084228515625, 0.7281494140625, 0.776214599609375, 0.82427978515625, 0.872344970703125, 0.92041015625, 0.968475341796875, 1.01654052734375, 1.064605712890625, 1.1126708984375, 1.160736083984375, 1.20880126953125, 1.256866455078125, 1.304931640625, 1.352996826171875, 1.40106201171875, 1.449127197265625, 1.4971923828125, 1.545257568359375, 1.59332275390625, 1.641387939453125, 1.689453125]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 7.0, 4.0, 7.0, 14.0, 16.0, 24.0, 52.0, 65.0, 126.0, 251.0, 445.0, 1066.0, 3180.0, 13227.0, 73126.0, 748673.0, 176918.0, 23309.0, 5235.0, 1582.0, 595.0, 264.0, 160.0, 71.0, 44.0, 49.0, 18.0, 7.0, 10.0, 4.0, 7.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8974609375, -1.8375701904296875, -1.777679443359375, -1.7177886962890625, -1.65789794921875, -1.5980072021484375, -1.538116455078125, -1.4782257080078125, -1.4183349609375, -1.3584442138671875, -1.298553466796875, -1.2386627197265625, -1.17877197265625, -1.1188812255859375, -1.058990478515625, -0.9990997314453125, -0.939208984375, -0.8793182373046875, -0.819427490234375, -0.7595367431640625, -0.69964599609375, -0.6397552490234375, -0.579864501953125, -0.5199737548828125, -0.4600830078125, -0.4001922607421875, -0.340301513671875, -0.2804107666015625, -0.22052001953125, -0.1606292724609375, -0.100738525390625, -0.0408477783203125, 0.01904296875, 0.0789337158203125, 0.138824462890625, 0.1987152099609375, 0.25860595703125, 0.3184967041015625, 0.378387451171875, 0.4382781982421875, 0.4981689453125, 0.5580596923828125, 0.617950439453125, 0.6778411865234375, 0.73773193359375, 0.7976226806640625, 0.857513427734375, 0.9174041748046875, 0.977294921875, 1.0371856689453125, 1.097076416015625, 1.1569671630859375, 1.21685791015625, 1.2767486572265625, 1.336639404296875, 1.3965301513671875, 1.4564208984375, 1.5163116455078125, 1.576202392578125, 1.6360931396484375, 1.69598388671875, 1.7558746337890625, 1.815765380859375, 1.8756561279296875, 1.935546875]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 9.0, 4.0, 8.0, 13.0, 13.0, 10.0, 16.0, 17.0, 16.0, 28.0, 32.0, 43.0, 43.0, 44.0, 37.0, 62.0, 50.0, 53.0, 60.0, 55.0, 44.0, 46.0, 47.0, 35.0, 42.0, 31.0, 27.0, 23.0, 32.0, 13.0, 9.0, 12.0, 10.0, 5.0, 5.0, 6.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8984375, -1.837982177734375, -1.77752685546875, -1.717071533203125, -1.6566162109375, -1.596160888671875, -1.53570556640625, -1.475250244140625, -1.414794921875, -1.354339599609375, -1.29388427734375, -1.233428955078125, -1.1729736328125, -1.112518310546875, -1.05206298828125, -0.991607666015625, -0.93115234375, -0.870697021484375, -0.81024169921875, -0.749786376953125, -0.6893310546875, -0.628875732421875, -0.56842041015625, -0.507965087890625, -0.447509765625, -0.387054443359375, -0.32659912109375, -0.266143798828125, -0.2056884765625, -0.145233154296875, -0.08477783203125, -0.024322509765625, 0.0361328125, 0.096588134765625, 0.15704345703125, 0.217498779296875, 0.2779541015625, 0.338409423828125, 0.39886474609375, 0.459320068359375, 0.519775390625, 0.580230712890625, 0.64068603515625, 0.701141357421875, 0.7615966796875, 0.822052001953125, 0.88250732421875, 0.942962646484375, 1.00341796875, 1.063873291015625, 1.12432861328125, 1.184783935546875, 1.2452392578125, 1.305694580078125, 1.36614990234375, 1.426605224609375, 1.487060546875, 1.547515869140625, 1.60797119140625, 1.668426513671875, 1.7288818359375, 1.789337158203125, 1.84979248046875, 1.910247802734375, 1.970703125]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 8.0, 7.0, 14.0, 20.0, 29.0, 41.0, 68.0, 105.0, 191.0, 339.0, 725.0, 1512.0, 3731.0, 10888.0, 44741.0, 266995.0, 566686.0, 118541.0, 22592.0, 6620.0, 2452.0, 1074.0, 505.0, 280.0, 156.0, 85.0, 52.0, 27.0, 12.0, 12.0, 13.0, 3.0, 4.0, 8.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0], "bins": [-0.306640625, -0.29683685302734375, -0.2870330810546875, -0.27722930908203125, -0.267425537109375, -0.25762176513671875, -0.2478179931640625, -0.23801422119140625, -0.22821044921875, -0.21840667724609375, -0.2086029052734375, -0.19879913330078125, -0.188995361328125, -0.17919158935546875, -0.1693878173828125, -0.15958404541015625, -0.1497802734375, -0.13997650146484375, -0.1301727294921875, -0.12036895751953125, -0.110565185546875, -0.10076141357421875, -0.0909576416015625, -0.08115386962890625, -0.07135009765625, -0.06154632568359375, -0.0517425537109375, -0.04193878173828125, -0.032135009765625, -0.02233123779296875, -0.0125274658203125, -0.00272369384765625, 0.007080078125, 0.01688385009765625, 0.0266876220703125, 0.03649139404296875, 0.046295166015625, 0.05609893798828125, 0.0659027099609375, 0.07570648193359375, 0.08551025390625, 0.09531402587890625, 0.1051177978515625, 0.11492156982421875, 0.124725341796875, 0.13452911376953125, 0.1443328857421875, 0.15413665771484375, 0.1639404296875, 0.17374420166015625, 0.1835479736328125, 0.19335174560546875, 0.203155517578125, 0.21295928955078125, 0.2227630615234375, 0.23256683349609375, 0.24237060546875, 0.25217437744140625, 0.2619781494140625, 0.27178192138671875, 0.281585693359375, 0.29138946533203125, 0.3011932373046875, 0.31099700927734375, 0.32080078125]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 3.0, 5.0, 3.0, 5.0, 7.0, 8.0, 19.0, 26.0, 35.0, 67.0, 73.0, 117.0, 133.0, 149.0, 101.0, 82.0, 51.0, 28.0, 25.0, 17.0, 13.0, 8.0, 8.0, 6.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.461143493652344e-05, -6.258673965930939e-05, -6.056204438209534e-05, -5.853734910488129e-05, -5.6512653827667236e-05, -5.4487958550453186e-05, -5.2463263273239136e-05, -5.0438567996025085e-05, -4.8413872718811035e-05, -4.6389177441596985e-05, -4.4364482164382935e-05, -4.2339786887168884e-05, -4.0315091609954834e-05, -3.8290396332740784e-05, -3.6265701055526733e-05, -3.424100577831268e-05, -3.221631050109863e-05, -3.0191615223884583e-05, -2.8166919946670532e-05, -2.6142224669456482e-05, -2.411752939224243e-05, -2.209283411502838e-05, -2.006813883781433e-05, -1.804344356060028e-05, -1.601874828338623e-05, -1.399405300617218e-05, -1.196935772895813e-05, -9.94466245174408e-06, -7.91996717453003e-06, -5.895271897315979e-06, -3.870576620101929e-06, -1.8458813428878784e-06, 1.7881393432617188e-07, 2.203509211540222e-06, 4.2282044887542725e-06, 6.252899765968323e-06, 8.277595043182373e-06, 1.0302290320396423e-05, 1.2326985597610474e-05, 1.4351680874824524e-05, 1.6376376152038574e-05, 1.8401071429252625e-05, 2.0425766706466675e-05, 2.2450461983680725e-05, 2.4475157260894775e-05, 2.6499852538108826e-05, 2.8524547815322876e-05, 3.0549243092536926e-05, 3.2573938369750977e-05, 3.459863364696503e-05, 3.662332892417908e-05, 3.864802420139313e-05, 4.067271947860718e-05, 4.269741475582123e-05, 4.472211003303528e-05, 4.674680531024933e-05, 4.877150058746338e-05, 5.079619586467743e-05, 5.282089114189148e-05, 5.484558641910553e-05, 5.687028169631958e-05, 5.889497697353363e-05, 6.091967225074768e-05, 6.294436752796173e-05, 6.496906280517578e-05]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 4.0, 4.0, 4.0, 6.0, 14.0, 24.0, 22.0, 41.0, 78.0, 112.0, 161.0, 275.0, 589.0, 1248.0, 3160.0, 8645.0, 33921.0, 206386.0, 611240.0, 145181.0, 25465.0, 7084.0, 2574.0, 1104.0, 478.0, 277.0, 178.0, 107.0, 46.0, 47.0, 28.0, 23.0, 7.0, 8.0, 5.0, 0.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.356689453125, -0.3449592590332031, -0.33322906494140625, -0.3214988708496094, -0.3097686767578125, -0.2980384826660156, -0.28630828857421875, -0.2745780944824219, -0.262847900390625, -0.2511177062988281, -0.23938751220703125, -0.22765731811523438, -0.2159271240234375, -0.20419692993164062, -0.19246673583984375, -0.18073654174804688, -0.16900634765625, -0.15727615356445312, -0.14554595947265625, -0.13381576538085938, -0.1220855712890625, -0.11035537719726562, -0.09862518310546875, -0.08689498901367188, -0.075164794921875, -0.06343460083007812, -0.05170440673828125, -0.039974212646484375, -0.0282440185546875, -0.016513824462890625, -0.00478363037109375, 0.006946563720703125, 0.0186767578125, 0.030406951904296875, 0.04213714599609375, 0.053867340087890625, 0.0655975341796875, 0.07732772827148438, 0.08905792236328125, 0.10078811645507812, 0.112518310546875, 0.12424850463867188, 0.13597869873046875, 0.14770889282226562, 0.1594390869140625, 0.17116928100585938, 0.18289947509765625, 0.19462966918945312, 0.20635986328125, 0.21809005737304688, 0.22982025146484375, 0.24155044555664062, 0.2532806396484375, 0.2650108337402344, 0.27674102783203125, 0.2884712219238281, 0.300201416015625, 0.3119316101074219, 0.32366180419921875, 0.3353919982910156, 0.3471221923828125, 0.3588523864746094, 0.37058258056640625, 0.3823127746582031, 0.39404296875]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 8.0, 9.0, 12.0, 12.0, 25.0, 18.0, 36.0, 49.0, 56.0, 77.0, 76.0, 105.0, 122.0, 82.0, 74.0, 52.0, 47.0, 29.0, 30.0, 9.0, 10.0, 9.0, 9.0, 7.0, 9.0, 7.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.1773681640625, -0.17200279235839844, -0.16663742065429688, -0.1612720489501953, -0.15590667724609375, -0.1505413055419922, -0.14517593383789062, -0.13981056213378906, -0.1344451904296875, -0.12907981872558594, -0.12371444702148438, -0.11834907531738281, -0.11298370361328125, -0.10761833190917969, -0.10225296020507812, -0.09688758850097656, -0.091522216796875, -0.08615684509277344, -0.08079147338867188, -0.07542610168457031, -0.07006072998046875, -0.06469535827636719, -0.059329986572265625, -0.05396461486816406, -0.0485992431640625, -0.04323387145996094, -0.037868499755859375, -0.03250312805175781, -0.02713775634765625, -0.021772384643554688, -0.016407012939453125, -0.011041641235351562, -0.00567626953125, -0.0003108978271484375, 0.005054473876953125, 0.010419845581054688, 0.01578521728515625, 0.021150588989257812, 0.026515960693359375, 0.03188133239746094, 0.0372467041015625, 0.04261207580566406, 0.047977447509765625, 0.05334281921386719, 0.05870819091796875, 0.06407356262207031, 0.06943893432617188, 0.07480430603027344, 0.080169677734375, 0.08553504943847656, 0.09090042114257812, 0.09626579284667969, 0.10163116455078125, 0.10699653625488281, 0.11236190795898438, 0.11772727966308594, 0.1230926513671875, 0.12845802307128906, 0.13382339477539062, 0.1391887664794922, 0.14455413818359375, 0.1499195098876953, 0.15528488159179688, 0.16065025329589844, 0.166015625]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 13.0, 35.0, 88.0, 131.0, 214.0, 212.0, 153.0, 82.0, 50.0, 20.0, 7.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.637090682983398, -9.452507972717285, -9.267924308776855, -9.083341598510742, -8.898757934570312, -8.7141752243042, -8.52959156036377, -8.345008850097656, -8.160425186157227, -7.975841999053955, -7.791258811950684, -7.606675624847412, -7.422092437744141, -7.237509727478027, -7.052926540374756, -6.868343353271484, -6.683760643005371, -6.4991774559021, -6.314594268798828, -6.130011081695557, -5.945427894592285, -5.760845184326172, -5.5762619972229, -5.391678810119629, -5.207095623016357, -5.022512435913086, -4.8379292488098145, -4.653346061706543, -4.46876335144043, -4.284180164337158, -4.099596977233887, -3.9150137901306152, -3.730431079864502, -3.5458478927612305, -3.361264705657959, -3.1766817569732666, -2.992098569869995, -2.8075153827667236, -2.6229324340820312, -2.4383492469787598, -2.2537660598754883, -2.069182872772217, -1.8845998048782349, -1.700016736984253, -1.5154335498809814, -1.33085036277771, -1.146267294883728, -0.9616842269897461, -0.7771010398864746, -0.5925179123878479, -0.4079347848892212, -0.22335165739059448, -0.03876852989196777, 0.14581459760665894, 0.33039772510528564, 0.5149807929992676, 0.6995639801025391, 0.8841471076011658, 1.0687302350997925, 1.2533133029937744, 1.437896490097046, 1.6224796772003174, 1.8070627450942993, 1.9916458129882812, 2.1762290000915527]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 2.0, 6.0, 6.0, 5.0, 11.0, 16.0, 13.0, 14.0, 8.0, 26.0, 19.0, 26.0, 22.0, 35.0, 24.0, 30.0, 31.0, 40.0, 46.0, 44.0, 37.0, 41.0, 42.0, 51.0, 42.0, 37.0, 37.0, 37.0, 30.0, 33.0, 23.0, 28.0, 28.0, 20.0, 21.0, 13.0, 8.0, 6.0, 10.0, 6.0, 5.0, 6.0, 6.0, 7.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3803629875183105, -2.297638416290283, -2.214913845062256, -2.1321890354156494, -2.049464464187622, -1.9667398929595947, -1.8840152025222778, -1.801290512084961, -1.7185659408569336, -1.6358413696289062, -1.5531166791915894, -1.4703919887542725, -1.3876674175262451, -1.3049428462982178, -1.2222181558609009, -1.139493465423584, -1.0567688941955566, -0.9740442633628845, -0.8913196325302124, -0.8085950016975403, -0.7258703708648682, -0.643145740032196, -0.5604211091995239, -0.4776964783668518, -0.3949718475341797, -0.31224721670150757, -0.22952258586883545, -0.14679795503616333, -0.06407332420349121, 0.018651306629180908, 0.10137593746185303, 0.18410056829452515, 0.26682519912719727, 0.3495498299598694, 0.4322744607925415, 0.5149990916252136, 0.5977237224578857, 0.6804483532905579, 0.76317298412323, 0.8458976149559021, 0.9286222457885742, 1.0113468170166016, 1.0940715074539185, 1.1767961978912354, 1.2595207691192627, 1.34224534034729, 1.424970030784607, 1.5076947212219238, 1.5904192924499512, 1.6731438636779785, 1.7558685541152954, 1.8385932445526123, 1.9213178157806396, 2.004042387008667, 2.0867671966552734, 2.169491767883301, 2.252216339111328, 2.3349409103393555, 2.417665481567383, 2.5003902912139893, 2.5831148624420166, 2.665839433670044, 2.7485642433166504, 2.8312888145446777, 2.914013385772705]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 2.0, 4.0, 5.0, 5.0, 8.0, 12.0, 19.0, 17.0, 13.0, 17.0, 30.0, 32.0, 81.0, 99.0, 168.0, 298.0, 632.0, 1453.0, 3588.0, 11515.0, 56863.0, 1070486.0, 2893819.0, 126041.0, 19240.0, 5589.0, 2114.0, 941.0, 468.0, 234.0, 165.0, 99.0, 47.0, 44.0, 37.0, 19.0, 25.0, 23.0, 9.0, 7.0, 3.0, 3.0, 5.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.0625, -1.9984130859375, -1.934326171875, -1.8702392578125, -1.80615234375, -1.7420654296875, -1.677978515625, -1.6138916015625, -1.5498046875, -1.4857177734375, -1.421630859375, -1.3575439453125, -1.29345703125, -1.2293701171875, -1.165283203125, -1.1011962890625, -1.037109375, -0.9730224609375, -0.908935546875, -0.8448486328125, -0.78076171875, -0.7166748046875, -0.652587890625, -0.5885009765625, -0.5244140625, -0.4603271484375, -0.396240234375, -0.3321533203125, -0.26806640625, -0.2039794921875, -0.139892578125, -0.0758056640625, -0.01171875, 0.0523681640625, 0.116455078125, 0.1805419921875, 0.24462890625, 0.3087158203125, 0.372802734375, 0.4368896484375, 0.5009765625, 0.5650634765625, 0.629150390625, 0.6932373046875, 0.75732421875, 0.8214111328125, 0.885498046875, 0.9495849609375, 1.013671875, 1.0777587890625, 1.141845703125, 1.2059326171875, 1.27001953125, 1.3341064453125, 1.398193359375, 1.4622802734375, 1.5263671875, 1.5904541015625, 1.654541015625, 1.7186279296875, 1.78271484375, 1.8468017578125, 1.910888671875, 1.9749755859375, 2.0390625]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 8.0, 9.0, 4.0, 12.0, 19.0, 20.0, 29.0, 41.0, 48.0, 51.0, 70.0, 78.0, 88.0, 82.0, 70.0, 63.0, 53.0, 59.0, 35.0, 49.0, 23.0, 23.0, 15.0, 9.0, 13.0, 10.0, 8.0, 7.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1015625, -1.06964111328125, -1.0377197265625, -1.00579833984375, -0.973876953125, -0.94195556640625, -0.9100341796875, -0.87811279296875, -0.84619140625, -0.81427001953125, -0.7823486328125, -0.75042724609375, -0.718505859375, -0.68658447265625, -0.6546630859375, -0.62274169921875, -0.5908203125, -0.55889892578125, -0.5269775390625, -0.49505615234375, -0.463134765625, -0.43121337890625, -0.3992919921875, -0.36737060546875, -0.33544921875, -0.30352783203125, -0.2716064453125, -0.23968505859375, -0.207763671875, -0.17584228515625, -0.1439208984375, -0.11199951171875, -0.080078125, -0.04815673828125, -0.0162353515625, 0.01568603515625, 0.047607421875, 0.07952880859375, 0.1114501953125, 0.14337158203125, 0.17529296875, 0.20721435546875, 0.2391357421875, 0.27105712890625, 0.302978515625, 0.33489990234375, 0.3668212890625, 0.39874267578125, 0.4306640625, 0.46258544921875, 0.4945068359375, 0.52642822265625, 0.558349609375, 0.59027099609375, 0.6221923828125, 0.65411376953125, 0.68603515625, 0.71795654296875, 0.7498779296875, 0.78179931640625, 0.813720703125, 0.84564208984375, 0.8775634765625, 0.90948486328125, 0.94140625]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 6.0, 3.0, 3.0, 1.0, 5.0, 6.0, 7.0, 5.0, 18.0, 13.0, 33.0, 33.0, 54.0, 99.0, 109.0, 265.0, 520.0, 1282.0, 3771.0, 13771.0, 79797.0, 1588321.0, 2375454.0, 106667.0, 16810.0, 4365.0, 1447.0, 652.0, 324.0, 158.0, 86.0, 58.0, 41.0, 29.0, 19.0, 14.0, 6.0, 7.0, 6.0, 9.0, 4.0, 4.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.94140625, -1.8768310546875, -1.812255859375, -1.7476806640625, -1.68310546875, -1.6185302734375, -1.553955078125, -1.4893798828125, -1.4248046875, -1.3602294921875, -1.295654296875, -1.2310791015625, -1.16650390625, -1.1019287109375, -1.037353515625, -0.9727783203125, -0.908203125, -0.8436279296875, -0.779052734375, -0.7144775390625, -0.64990234375, -0.5853271484375, -0.520751953125, -0.4561767578125, -0.3916015625, -0.3270263671875, -0.262451171875, -0.1978759765625, -0.13330078125, -0.0687255859375, -0.004150390625, 0.0604248046875, 0.125, 0.1895751953125, 0.254150390625, 0.3187255859375, 0.38330078125, 0.4478759765625, 0.512451171875, 0.5770263671875, 0.6416015625, 0.7061767578125, 0.770751953125, 0.8353271484375, 0.89990234375, 0.9644775390625, 1.029052734375, 1.0936279296875, 1.158203125, 1.2227783203125, 1.287353515625, 1.3519287109375, 1.41650390625, 1.4810791015625, 1.545654296875, 1.6102294921875, 1.6748046875, 1.7393798828125, 1.803955078125, 1.8685302734375, 1.93310546875, 1.9976806640625, 2.062255859375, 2.1268310546875, 2.19140625]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 2.0, 6.0, 7.0, 1.0, 11.0, 16.0, 14.0, 24.0, 30.0, 33.0, 52.0, 83.0, 107.0, 156.0, 259.0, 380.0, 499.0, 533.0, 543.0, 403.0, 291.0, 195.0, 133.0, 78.0, 60.0, 37.0, 39.0, 18.0, 15.0, 5.0, 10.0, 7.0, 6.0, 7.0, 3.0, 1.0, 1.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.53857421875, -0.523468017578125, -0.50836181640625, -0.493255615234375, -0.4781494140625, -0.463043212890625, -0.44793701171875, -0.432830810546875, -0.417724609375, -0.402618408203125, -0.38751220703125, -0.372406005859375, -0.3572998046875, -0.342193603515625, -0.32708740234375, -0.311981201171875, -0.296875, -0.281768798828125, -0.26666259765625, -0.251556396484375, -0.2364501953125, -0.221343994140625, -0.20623779296875, -0.191131591796875, -0.176025390625, -0.160919189453125, -0.14581298828125, -0.130706787109375, -0.1156005859375, -0.100494384765625, -0.08538818359375, -0.070281982421875, -0.05517578125, -0.040069580078125, -0.02496337890625, -0.009857177734375, 0.0052490234375, 0.020355224609375, 0.03546142578125, 0.050567626953125, 0.065673828125, 0.080780029296875, 0.09588623046875, 0.110992431640625, 0.1260986328125, 0.141204833984375, 0.15631103515625, 0.171417236328125, 0.1865234375, 0.201629638671875, 0.21673583984375, 0.231842041015625, 0.2469482421875, 0.262054443359375, 0.27716064453125, 0.292266845703125, 0.307373046875, 0.322479248046875, 0.33758544921875, 0.352691650390625, 0.3677978515625, 0.382904052734375, 0.39801025390625, 0.413116455078125, 0.42822265625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 6.0, 4.0, 9.0, 6.0, 13.0, 14.0, 16.0, 25.0, 26.0, 34.0, 50.0, 35.0, 39.0, 50.0, 40.0, 47.0, 59.0, 57.0, 56.0, 53.0, 46.0, 52.0, 40.0, 38.0, 33.0, 18.0, 35.0, 25.0, 15.0, 14.0, 7.0, 7.0, 14.0, 5.0, 4.0, 3.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0383001565933228, -1.001896619796753, -0.9654932022094727, -0.9290897250175476, -0.8926862478256226, -0.8562827110290527, -0.8198792338371277, -0.7834757566452026, -0.7470722794532776, -0.7106688022613525, -0.6742653250694275, -0.6378618478775024, -0.6014583110809326, -0.5650548934936523, -0.5286513566970825, -0.49224787950515747, -0.4558444023132324, -0.4194409251213074, -0.3830374479293823, -0.3466339409351349, -0.31023046374320984, -0.2738269865512848, -0.23742349445819855, -0.2010200023651123, -0.16461652517318726, -0.1282130479812622, -0.09180955588817596, -0.05540607124567032, -0.019002586603164673, 0.017400890588760376, 0.05380438268184662, 0.09020787477493286, 0.12661147117614746, 0.1630149483680725, 0.19941844046115875, 0.235821932554245, 0.27222540974617004, 0.3086288869380951, 0.34503239393234253, 0.3814358711242676, 0.4178393483161926, 0.4542428255081177, 0.4906463027000427, 0.5270497798919678, 0.5634533166885376, 0.5998567342758179, 0.6362602710723877, 0.6726637482643127, 0.7090672254562378, 0.7454707026481628, 0.7818741798400879, 0.8182776570320129, 0.854681134223938, 0.8910846710205078, 0.9274881482124329, 0.9638916254043579, 1.0002951622009277, 1.0366986989974976, 1.0731021165847778, 1.1095056533813477, 1.145909070968628, 1.1823126077651978, 1.218716025352478, 1.2551195621490479, 1.2915229797363281]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 6.0, 9.0, 5.0, 10.0, 19.0, 14.0, 10.0, 19.0, 25.0, 20.0, 29.0, 31.0, 39.0, 36.0, 31.0, 45.0, 35.0, 49.0, 50.0, 27.0, 42.0, 61.0, 45.0, 35.0, 34.0, 40.0, 30.0, 28.0, 22.0, 22.0, 16.0, 22.0, 16.0, 18.0, 12.0, 7.0, 4.0, 8.0, 12.0, 7.0, 0.0, 7.0, 3.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9534391164779663, -0.921132504940033, -0.8888258934020996, -0.8565192222595215, -0.8242126107215881, -0.7919059991836548, -0.7595993280410767, -0.7272927165031433, -0.69498610496521, -0.6626794934272766, -0.6303728818893433, -0.5980662107467651, -0.5657595992088318, -0.5334529876708984, -0.5011463165283203, -0.46883970499038696, -0.4365330934524536, -0.40422648191452026, -0.3719198405742645, -0.3396131992340088, -0.30730658769607544, -0.2749999761581421, -0.24269333481788635, -0.2103867083787918, -0.17808008193969727, -0.14577345550060272, -0.11346682906150818, -0.08116020262241364, -0.04885357618331909, -0.01654694974422455, 0.015759676694869995, 0.04806630313396454, 0.08037281036376953, 0.11267943680286407, 0.14498606324195862, 0.17729268968105316, 0.2095993161201477, 0.24190594255924225, 0.2742125689983368, 0.30651921033859253, 0.3388258218765259, 0.37113243341445923, 0.40343907475471497, 0.4357457160949707, 0.46805232763290405, 0.5003589391708374, 0.5326656103134155, 0.5649722218513489, 0.5972788333892822, 0.6295854449272156, 0.6618920564651489, 0.694198727607727, 0.7265053391456604, 0.7588119506835938, 0.7911186218261719, 0.8234252333641052, 0.8557318449020386, 0.8880384564399719, 0.9203450679779053, 0.9526517391204834, 0.9849583506584167, 1.01726496219635, 1.0495716333389282, 1.0818781852722168, 1.114184856414795]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 6.0, 2.0, 7.0, 10.0, 11.0, 3.0, 20.0, 20.0, 36.0, 36.0, 78.0, 91.0, 155.0, 218.0, 299.0, 478.0, 779.0, 1390.0, 2344.0, 4234.0, 8385.0, 21327.0, 165151.0, 684633.0, 122914.0, 18583.0, 7664.0, 3969.0, 2347.0, 1255.0, 712.0, 493.0, 292.0, 185.0, 145.0, 111.0, 64.0, 39.0, 22.0, 11.0, 18.0, 8.0, 5.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.460205078125, -0.44791412353515625, -0.4356231689453125, -0.42333221435546875, -0.411041259765625, -0.39875030517578125, -0.3864593505859375, -0.37416839599609375, -0.36187744140625, -0.34958648681640625, -0.3372955322265625, -0.32500457763671875, -0.312713623046875, -0.30042266845703125, -0.2881317138671875, -0.27584075927734375, -0.2635498046875, -0.25125885009765625, -0.2389678955078125, -0.22667694091796875, -0.214385986328125, -0.20209503173828125, -0.1898040771484375, -0.17751312255859375, -0.16522216796875, -0.15293121337890625, -0.1406402587890625, -0.12834930419921875, -0.116058349609375, -0.10376739501953125, -0.0914764404296875, -0.07918548583984375, -0.06689453125, -0.05460357666015625, -0.0423126220703125, -0.03002166748046875, -0.017730712890625, -0.00543975830078125, 0.0068511962890625, 0.01914215087890625, 0.03143310546875, 0.04372406005859375, 0.0560150146484375, 0.06830596923828125, 0.080596923828125, 0.09288787841796875, 0.1051788330078125, 0.11746978759765625, 0.1297607421875, 0.14205169677734375, 0.1543426513671875, 0.16663360595703125, 0.178924560546875, 0.19121551513671875, 0.2035064697265625, 0.21579742431640625, 0.22808837890625, 0.24037933349609375, 0.2526702880859375, 0.26496124267578125, 0.277252197265625, 0.28954315185546875, 0.3018341064453125, 0.31412506103515625, 0.326416015625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 7.0, 11.0, 5.0, 10.0, 12.0, 18.0, 20.0, 20.0, 29.0, 30.0, 32.0, 40.0, 46.0, 38.0, 47.0, 51.0, 46.0, 49.0, 47.0, 38.0, 50.0, 42.0, 46.0, 35.0, 29.0, 28.0, 35.0, 19.0, 21.0, 17.0, 16.0, 11.0, 10.0, 11.0, 9.0, 4.0, 4.0, 7.0, 5.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6181640625, -0.5950927734375, -0.572021484375, -0.5489501953125, -0.52587890625, -0.5028076171875, -0.479736328125, -0.4566650390625, -0.43359375, -0.4105224609375, -0.387451171875, -0.3643798828125, -0.34130859375, -0.3182373046875, -0.295166015625, -0.2720947265625, -0.2490234375, -0.2259521484375, -0.202880859375, -0.1798095703125, -0.15673828125, -0.1336669921875, -0.110595703125, -0.0875244140625, -0.064453125, -0.0413818359375, -0.018310546875, 0.0047607421875, 0.02783203125, 0.0509033203125, 0.073974609375, 0.0970458984375, 0.1201171875, 0.1431884765625, 0.166259765625, 0.1893310546875, 0.21240234375, 0.2354736328125, 0.258544921875, 0.2816162109375, 0.3046875, 0.3277587890625, 0.350830078125, 0.3739013671875, 0.39697265625, 0.4200439453125, 0.443115234375, 0.4661865234375, 0.4892578125, 0.5123291015625, 0.535400390625, 0.5584716796875, 0.58154296875, 0.6046142578125, 0.627685546875, 0.6507568359375, 0.673828125, 0.6968994140625, 0.719970703125, 0.7430419921875, 0.76611328125, 0.7891845703125, 0.812255859375, 0.8353271484375, 0.8583984375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 9.0, 4.0, 11.0, 6.0, 9.0, 11.0, 13.0, 21.0, 37.0, 51.0, 60.0, 133.0, 277.0, 574.0, 1554.0, 4474.0, 19774.0, 554453.0, 443628.0, 16735.0, 4144.0, 1376.0, 578.0, 247.0, 136.0, 73.0, 62.0, 30.0, 16.0, 15.0, 10.0, 9.0, 5.0, 5.0, 6.0, 3.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.6337890625, -0.61566162109375, -0.5975341796875, -0.57940673828125, -0.561279296875, -0.54315185546875, -0.5250244140625, -0.50689697265625, -0.48876953125, -0.47064208984375, -0.4525146484375, -0.43438720703125, -0.416259765625, -0.39813232421875, -0.3800048828125, -0.36187744140625, -0.34375, -0.32562255859375, -0.3074951171875, -0.28936767578125, -0.271240234375, -0.25311279296875, -0.2349853515625, -0.21685791015625, -0.19873046875, -0.18060302734375, -0.1624755859375, -0.14434814453125, -0.126220703125, -0.10809326171875, -0.0899658203125, -0.07183837890625, -0.0537109375, -0.03558349609375, -0.0174560546875, 0.00067138671875, 0.018798828125, 0.03692626953125, 0.0550537109375, 0.07318115234375, 0.09130859375, 0.10943603515625, 0.1275634765625, 0.14569091796875, 0.163818359375, 0.18194580078125, 0.2000732421875, 0.21820068359375, 0.236328125, 0.25445556640625, 0.2725830078125, 0.29071044921875, 0.308837890625, 0.32696533203125, 0.3450927734375, 0.36322021484375, 0.38134765625, 0.39947509765625, 0.4176025390625, 0.43572998046875, 0.453857421875, 0.47198486328125, 0.4901123046875, 0.50823974609375, 0.5263671875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 2.0, 4.0, 3.0, 4.0, 4.0, 1.0, 3.0, 10.0, 6.0, 6.0, 12.0, 11.0, 15.0, 22.0, 21.0, 17.0, 21.0, 21.0, 33.0, 31.0, 31.0, 22.0, 38.0, 24.0, 38.0, 57.0, 33.0, 51.0, 53.0, 40.0, 36.0, 39.0, 37.0, 35.0, 25.0, 26.0, 26.0, 20.0, 24.0, 18.0, 15.0, 15.0, 16.0, 10.0, 3.0, 6.0, 7.0, 4.0, 4.0, 2.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.455078125, -1.40606689453125, -1.3570556640625, -1.30804443359375, -1.259033203125, -1.21002197265625, -1.1610107421875, -1.11199951171875, -1.06298828125, -1.01397705078125, -0.9649658203125, -0.91595458984375, -0.866943359375, -0.81793212890625, -0.7689208984375, -0.71990966796875, -0.6708984375, -0.62188720703125, -0.5728759765625, -0.52386474609375, -0.474853515625, -0.42584228515625, -0.3768310546875, -0.32781982421875, -0.27880859375, -0.22979736328125, -0.1807861328125, -0.13177490234375, -0.082763671875, -0.03375244140625, 0.0152587890625, 0.06427001953125, 0.11328125, 0.16229248046875, 0.2113037109375, 0.26031494140625, 0.309326171875, 0.35833740234375, 0.4073486328125, 0.45635986328125, 0.50537109375, 0.55438232421875, 0.6033935546875, 0.65240478515625, 0.701416015625, 0.75042724609375, 0.7994384765625, 0.84844970703125, 0.8974609375, 0.94647216796875, 0.9954833984375, 1.04449462890625, 1.093505859375, 1.14251708984375, 1.1915283203125, 1.24053955078125, 1.28955078125, 1.33856201171875, 1.3875732421875, 1.43658447265625, 1.485595703125, 1.53460693359375, 1.5836181640625, 1.63262939453125, 1.681640625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 2.0, 5.0, 11.0, 11.0, 10.0, 10.0, 25.0, 30.0, 55.0, 104.0, 171.0, 261.0, 520.0, 1108.0, 2457.0, 6438.0, 23859.0, 443915.0, 531399.0, 26309.0, 6858.0, 2543.0, 1151.0, 549.0, 296.0, 169.0, 94.0, 71.0, 35.0, 28.0, 17.0, 11.0, 11.0, 5.0, 6.0, 4.0, 1.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.356201171875, -0.34603118896484375, -0.3358612060546875, -0.32569122314453125, -0.315521240234375, -0.30535125732421875, -0.2951812744140625, -0.28501129150390625, -0.27484130859375, -0.26467132568359375, -0.2545013427734375, -0.24433135986328125, -0.234161376953125, -0.22399139404296875, -0.2138214111328125, -0.20365142822265625, -0.1934814453125, -0.18331146240234375, -0.1731414794921875, -0.16297149658203125, -0.152801513671875, -0.14263153076171875, -0.1324615478515625, -0.12229156494140625, -0.11212158203125, -0.10195159912109375, -0.0917816162109375, -0.08161163330078125, -0.071441650390625, -0.06127166748046875, -0.0511016845703125, -0.04093170166015625, -0.03076171875, -0.02059173583984375, -0.0104217529296875, -0.00025177001953125, 0.009918212890625, 0.02008819580078125, 0.0302581787109375, 0.04042816162109375, 0.05059814453125, 0.06076812744140625, 0.0709381103515625, 0.08110809326171875, 0.091278076171875, 0.10144805908203125, 0.1116180419921875, 0.12178802490234375, 0.1319580078125, 0.14212799072265625, 0.1522979736328125, 0.16246795654296875, 0.172637939453125, 0.18280792236328125, 0.1929779052734375, 0.20314788818359375, 0.21331787109375, 0.22348785400390625, 0.2336578369140625, 0.24382781982421875, 0.253997802734375, 0.26416778564453125, 0.2743377685546875, 0.28450775146484375, 0.294677734375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 6.0, 1.0, 7.0, 6.0, 15.0, 25.0, 38.0, 80.0, 126.0, 210.0, 206.0, 104.0, 55.0, 33.0, 22.0, 12.0, 12.0, 11.0, 5.0, 7.0, 1.0, 6.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001494884490966797, -0.0001454213634133339, -0.0001413542777299881, -0.0001372871920466423, -0.0001332201063632965, -0.00012915302067995071, -0.00012508593499660492, -0.00012101884931325912, -0.00011695176362991333, -0.00011288467794656754, -0.00010881759226322174, -0.00010475050657987595, -0.00010068342089653015, -9.661633521318436e-05, -9.254924952983856e-05, -8.848216384649277e-05, -8.441507816314697e-05, -8.034799247980118e-05, -7.628090679645538e-05, -7.221382111310959e-05, -6.81467354297638e-05, -6.4079649746418e-05, -6.0012564063072205e-05, -5.594547837972641e-05, -5.1878392696380615e-05, -4.781130701303482e-05, -4.3744221329689026e-05, -3.967713564634323e-05, -3.5610049962997437e-05, -3.154296427965164e-05, -2.7475878596305847e-05, -2.3408792912960052e-05, -1.9341707229614258e-05, -1.5274621546268463e-05, -1.1207535862922668e-05, -7.140450179576874e-06, -3.073364496231079e-06, 9.937211871147156e-07, 5.06080687046051e-06, 9.127892553806305e-06, 1.31949782371521e-05, 1.7262063920497894e-05, 2.132914960384369e-05, 2.5396235287189484e-05, 2.946332097053528e-05, 3.353040665388107e-05, 3.759749233722687e-05, 4.166457802057266e-05, 4.573166370391846e-05, 4.979874938726425e-05, 5.3865835070610046e-05, 5.793292075395584e-05, 6.200000643730164e-05, 6.606709212064743e-05, 7.013417780399323e-05, 7.420126348733902e-05, 7.826834917068481e-05, 8.233543485403061e-05, 8.64025205373764e-05, 9.04696062207222e-05, 9.453669190406799e-05, 9.860377758741379e-05, 0.00010267086327075958, 0.00010673794895410538, 0.00011080503463745117]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 5.0, 3.0, 3.0, 5.0, 4.0, 11.0, 12.0, 8.0, 27.0, 31.0, 50.0, 79.0, 98.0, 135.0, 221.0, 297.0, 406.0, 582.0, 851.0, 1283.0, 2017.0, 3159.0, 5400.0, 10254.0, 24393.0, 91949.0, 450114.0, 349704.0, 65946.0, 19405.0, 8837.0, 4762.0, 2814.0, 1761.0, 1191.0, 828.0, 521.0, 373.0, 280.0, 181.0, 166.0, 92.0, 81.0, 59.0, 41.0, 32.0, 25.0, 25.0, 12.0, 11.0, 7.0, 3.0, 5.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.1610107421875, -0.15579986572265625, -0.1505889892578125, -0.14537811279296875, -0.140167236328125, -0.13495635986328125, -0.1297454833984375, -0.12453460693359375, -0.11932373046875, -0.11411285400390625, -0.1089019775390625, -0.10369110107421875, -0.098480224609375, -0.09326934814453125, -0.0880584716796875, -0.08284759521484375, -0.07763671875, -0.07242584228515625, -0.0672149658203125, -0.06200408935546875, -0.056793212890625, -0.05158233642578125, -0.0463714599609375, -0.04116058349609375, -0.03594970703125, -0.03073883056640625, -0.0255279541015625, -0.02031707763671875, -0.015106201171875, -0.00989532470703125, -0.0046844482421875, 0.00052642822265625, 0.0057373046875, 0.01094818115234375, 0.0161590576171875, 0.02136993408203125, 0.026580810546875, 0.03179168701171875, 0.0370025634765625, 0.04221343994140625, 0.04742431640625, 0.05263519287109375, 0.0578460693359375, 0.06305694580078125, 0.068267822265625, 0.07347869873046875, 0.0786895751953125, 0.08390045166015625, 0.089111328125, 0.09432220458984375, 0.0995330810546875, 0.10474395751953125, 0.109954833984375, 0.11516571044921875, 0.1203765869140625, 0.12558746337890625, 0.13079833984375, 0.13600921630859375, 0.1412200927734375, 0.14643096923828125, 0.151641845703125, 0.15685272216796875, 0.1620635986328125, 0.16727447509765625, 0.1724853515625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 2.0, 5.0, 4.0, 8.0, 13.0, 10.0, 18.0, 31.0, 47.0, 68.0, 105.0, 127.0, 134.0, 134.0, 92.0, 71.0, 38.0, 27.0, 16.0, 6.0, 7.0, 10.0, 5.0, 0.0, 5.0, 1.0, 3.0, 0.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.050537109375, -0.0486297607421875, -0.046722412109375, -0.0448150634765625, -0.04290771484375, -0.0410003662109375, -0.039093017578125, -0.0371856689453125, -0.0352783203125, -0.0333709716796875, -0.031463623046875, -0.0295562744140625, -0.02764892578125, -0.0257415771484375, -0.023834228515625, -0.0219268798828125, -0.02001953125, -0.0181121826171875, -0.016204833984375, -0.0142974853515625, -0.01239013671875, -0.0104827880859375, -0.008575439453125, -0.0066680908203125, -0.0047607421875, -0.0028533935546875, -0.000946044921875, 0.0009613037109375, 0.00286865234375, 0.0047760009765625, 0.006683349609375, 0.0085906982421875, 0.010498046875, 0.0124053955078125, 0.014312744140625, 0.0162200927734375, 0.01812744140625, 0.0200347900390625, 0.021942138671875, 0.0238494873046875, 0.0257568359375, 0.0276641845703125, 0.029571533203125, 0.0314788818359375, 0.03338623046875, 0.0352935791015625, 0.037200927734375, 0.0391082763671875, 0.041015625, 0.0429229736328125, 0.044830322265625, 0.0467376708984375, 0.04864501953125, 0.0505523681640625, 0.052459716796875, 0.0543670654296875, 0.0562744140625, 0.0581817626953125, 0.060089111328125, 0.0619964599609375, 0.06390380859375, 0.0658111572265625, 0.067718505859375, 0.0696258544921875, 0.071533203125]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 3.0, 4.0, 3.0, 6.0, 11.0, 12.0, 23.0, 28.0, 24.0, 26.0, 38.0, 46.0, 42.0, 46.0, 66.0, 52.0, 67.0, 59.0, 61.0, 47.0, 46.0, 54.0, 45.0, 45.0, 29.0, 29.0, 25.0, 13.0, 12.0, 6.0, 10.0, 5.0, 9.0, 6.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6278553009033203, -0.6019745469093323, -0.5760937333106995, -0.5502129793167114, -0.5243321657180786, -0.4984514117240906, -0.47257062792778015, -0.4466898441314697, -0.4208090901374817, -0.39492830634117126, -0.36904752254486084, -0.3431667685508728, -0.3172859847545624, -0.29140520095825195, -0.26552441716194153, -0.2396436482667923, -0.21376284956932068, -0.18788206577301025, -0.16200129687786102, -0.1361205130815506, -0.11023973673582077, -0.08435896039009094, -0.05847817659378052, -0.03259740769863129, -0.006716623902320862, 0.019164154306054115, 0.04504493251442909, 0.07092571258544922, 0.09680648893117905, 0.12268726527690887, 0.1485680490732193, 0.17444881796836853, 0.20032960176467896, 0.22621038556098938, 0.2520911693572998, 0.27797192335128784, 0.30385270714759827, 0.3297334909439087, 0.3556142747402191, 0.38149505853652954, 0.4073758125305176, 0.433256596326828, 0.4591373801231384, 0.48501813411712646, 0.5108989477157593, 0.5367797017097473, 0.5626604557037354, 0.5885412693023682, 0.614422082901001, 0.640302836894989, 0.6661836504936218, 0.6920644044876099, 0.7179452180862427, 0.7438259720802307, 0.7697067260742188, 0.7955875396728516, 0.8214682936668396, 0.8473490476608276, 0.8732298612594604, 0.8991106152534485, 0.9249914288520813, 0.9508721828460693, 0.9767529964447021, 1.0026336908340454, 1.0285145044326782]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 5.0, 0.0, 1.0, 0.0, 4.0, 5.0, 1.0, 7.0, 3.0, 12.0, 7.0, 10.0, 13.0, 9.0, 20.0, 25.0, 28.0, 21.0, 32.0, 33.0, 27.0, 34.0, 28.0, 53.0, 44.0, 40.0, 36.0, 49.0, 50.0, 40.0, 36.0, 44.0, 24.0, 36.0, 32.0, 31.0, 19.0, 24.0, 23.0, 14.0, 22.0, 14.0, 7.0, 11.0, 5.0, 6.0, 7.0, 5.0, 5.0, 5.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5633696913719177, -0.5433587431907654, -0.523347795009613, -0.5033368468284607, -0.48332586884498596, -0.4633149206638336, -0.4433039426803589, -0.42329299449920654, -0.4032820463180542, -0.38327109813690186, -0.3632601499557495, -0.3432491719722748, -0.32323822379112244, -0.3032272756099701, -0.28321629762649536, -0.263205349445343, -0.24319440126419067, -0.22318345308303833, -0.2031724900007248, -0.18316152691841125, -0.1631505787372589, -0.14313963055610657, -0.12312866747379303, -0.10311770439147949, -0.08310675621032715, -0.06309580057859421, -0.04308484494686127, -0.023073889315128326, -0.0030629336833953857, 0.016948021948337555, 0.036958977580070496, 0.05696994066238403, 0.07698094844818115, 0.09699190407991409, 0.11700285971164703, 0.13701382279396057, 0.15702477097511292, 0.17703571915626526, 0.1970466822385788, 0.21705764532089233, 0.23706859350204468, 0.257079541683197, 0.27709048986434937, 0.2971014678478241, 0.31711241602897644, 0.3371233642101288, 0.3571343421936035, 0.37714529037475586, 0.3971562385559082, 0.41716718673706055, 0.4371781349182129, 0.4571891129016876, 0.47720006108283997, 0.4972110092639923, 0.517221987247467, 0.5372329354286194, 0.5572438836097717, 0.5772548317909241, 0.5972657799720764, 0.6172767281532288, 0.6372877359390259, 0.6572986841201782, 0.6773096323013306, 0.6973205804824829, 0.7173315286636353]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 7.0, 7.0, 8.0, 6.0, 22.0, 20.0, 23.0, 41.0, 47.0, 66.0, 100.0, 148.0, 225.0, 383.0, 634.0, 1051.0, 1798.0, 3184.0, 5635.0, 10661.0, 20299.0, 40975.0, 100036.0, 309676.0, 346113.0, 114014.0, 45376.0, 22112.0, 11555.0, 6169.0, 3351.0, 1888.0, 1097.0, 663.0, 413.0, 254.0, 157.0, 115.0, 72.0, 33.0, 36.0, 26.0, 26.0, 11.0, 7.0, 3.0, 8.0, 1.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.880859375, -0.8525009155273438, -0.8241424560546875, -0.7957839965820312, -0.767425537109375, -0.7390670776367188, -0.7107086181640625, -0.6823501586914062, -0.65399169921875, -0.6256332397460938, -0.5972747802734375, -0.5689163208007812, -0.540557861328125, -0.5121994018554688, -0.4838409423828125, -0.45548248291015625, -0.4271240234375, -0.39876556396484375, -0.3704071044921875, -0.34204864501953125, -0.313690185546875, -0.28533172607421875, -0.2569732666015625, -0.22861480712890625, -0.20025634765625, -0.17189788818359375, -0.1435394287109375, -0.11518096923828125, -0.086822509765625, -0.05846405029296875, -0.0301055908203125, -0.00174713134765625, 0.026611328125, 0.05496978759765625, 0.0833282470703125, 0.11168670654296875, 0.140045166015625, 0.16840362548828125, 0.1967620849609375, 0.22512054443359375, 0.25347900390625, 0.28183746337890625, 0.3101959228515625, 0.33855438232421875, 0.366912841796875, 0.39527130126953125, 0.4236297607421875, 0.45198822021484375, 0.4803466796875, 0.5087051391601562, 0.5370635986328125, 0.5654220581054688, 0.593780517578125, 0.6221389770507812, 0.6504974365234375, 0.6788558959960938, 0.70721435546875, 0.7355728149414062, 0.7639312744140625, 0.7922897338867188, 0.820648193359375, 0.8490066528320312, 0.8773651123046875, 0.9057235717773438, 0.93408203125]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 4.0, 2.0, 8.0, 11.0, 7.0, 16.0, 9.0, 10.0, 20.0, 30.0, 33.0, 32.0, 29.0, 32.0, 42.0, 22.0, 41.0, 36.0, 49.0, 45.0, 53.0, 53.0, 34.0, 43.0, 42.0, 38.0, 37.0, 34.0, 29.0, 22.0, 15.0, 21.0, 21.0, 14.0, 6.0, 13.0, 16.0, 5.0, 6.0, 3.0, 2.0, 5.0, 2.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.087890625, -1.0493316650390625, -1.010772705078125, -0.9722137451171875, -0.93365478515625, -0.8950958251953125, -0.856536865234375, -0.8179779052734375, -0.7794189453125, -0.7408599853515625, -0.702301025390625, -0.6637420654296875, -0.62518310546875, -0.5866241455078125, -0.548065185546875, -0.5095062255859375, -0.470947265625, -0.4323883056640625, -0.393829345703125, -0.3552703857421875, -0.31671142578125, -0.2781524658203125, -0.239593505859375, -0.2010345458984375, -0.1624755859375, -0.1239166259765625, -0.085357666015625, -0.0467987060546875, -0.00823974609375, 0.0303192138671875, 0.068878173828125, 0.1074371337890625, 0.14599609375, 0.1845550537109375, 0.223114013671875, 0.2616729736328125, 0.30023193359375, 0.3387908935546875, 0.377349853515625, 0.4159088134765625, 0.4544677734375, 0.4930267333984375, 0.531585693359375, 0.5701446533203125, 0.60870361328125, 0.6472625732421875, 0.685821533203125, 0.7243804931640625, 0.762939453125, 0.8014984130859375, 0.840057373046875, 0.8786163330078125, 0.91717529296875, 0.9557342529296875, 0.994293212890625, 1.0328521728515625, 1.0714111328125, 1.1099700927734375, 1.148529052734375, 1.1870880126953125, 1.22564697265625, 1.2642059326171875, 1.302764892578125, 1.3413238525390625, 1.3798828125]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 6.0, 12.0, 15.0, 17.0, 34.0, 59.0, 85.0, 147.0, 212.0, 349.0, 717.0, 1501.0, 3843.0, 10649.0, 33629.0, 132113.0, 616209.0, 185690.0, 41930.0, 13044.0, 4576.0, 1841.0, 828.0, 454.0, 214.0, 137.0, 89.0, 60.0, 37.0, 20.0, 17.0, 11.0, 5.0, 7.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.7666015625, -1.71832275390625, -1.6700439453125, -1.62176513671875, -1.573486328125, -1.52520751953125, -1.4769287109375, -1.42864990234375, -1.38037109375, -1.33209228515625, -1.2838134765625, -1.23553466796875, -1.187255859375, -1.13897705078125, -1.0906982421875, -1.04241943359375, -0.994140625, -0.94586181640625, -0.8975830078125, -0.84930419921875, -0.801025390625, -0.75274658203125, -0.7044677734375, -0.65618896484375, -0.60791015625, -0.55963134765625, -0.5113525390625, -0.46307373046875, -0.414794921875, -0.36651611328125, -0.3182373046875, -0.26995849609375, -0.2216796875, -0.17340087890625, -0.1251220703125, -0.07684326171875, -0.028564453125, 0.01971435546875, 0.0679931640625, 0.11627197265625, 0.16455078125, 0.21282958984375, 0.2611083984375, 0.30938720703125, 0.357666015625, 0.40594482421875, 0.4542236328125, 0.50250244140625, 0.55078125, 0.59906005859375, 0.6473388671875, 0.69561767578125, 0.743896484375, 0.79217529296875, 0.8404541015625, 0.88873291015625, 0.93701171875, 0.98529052734375, 1.0335693359375, 1.08184814453125, 1.130126953125, 1.17840576171875, 1.2266845703125, 1.27496337890625, 1.3232421875]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 9.0, 10.0, 12.0, 16.0, 17.0, 19.0, 29.0, 26.0, 37.0, 38.0, 38.0, 54.0, 53.0, 55.0, 68.0, 66.0, 53.0, 67.0, 52.0, 44.0, 50.0, 42.0, 26.0, 24.0, 25.0, 17.0, 15.0, 9.0, 8.0, 8.0, 3.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4052734375, -1.3443450927734375, -1.283416748046875, -1.2224884033203125, -1.16156005859375, -1.1006317138671875, -1.039703369140625, -0.9787750244140625, -0.9178466796875, -0.8569183349609375, -0.795989990234375, -0.7350616455078125, -0.67413330078125, -0.6132049560546875, -0.552276611328125, -0.4913482666015625, -0.430419921875, -0.3694915771484375, -0.308563232421875, -0.2476348876953125, -0.18670654296875, -0.1257781982421875, -0.064849853515625, -0.0039215087890625, 0.0570068359375, 0.1179351806640625, 0.178863525390625, 0.2397918701171875, 0.30072021484375, 0.3616485595703125, 0.422576904296875, 0.4835052490234375, 0.54443359375, 0.6053619384765625, 0.666290283203125, 0.7272186279296875, 0.78814697265625, 0.8490753173828125, 0.910003662109375, 0.9709320068359375, 1.0318603515625, 1.0927886962890625, 1.153717041015625, 1.2146453857421875, 1.27557373046875, 1.3365020751953125, 1.397430419921875, 1.4583587646484375, 1.519287109375, 1.5802154541015625, 1.641143798828125, 1.7020721435546875, 1.76300048828125, 1.8239288330078125, 1.884857177734375, 1.9457855224609375, 2.0067138671875, 2.0676422119140625, 2.128570556640625, 2.1894989013671875, 2.25042724609375, 2.3113555908203125, 2.372283935546875, 2.4332122802734375, 2.494140625]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 2.0, 10.0, 5.0, 4.0, 10.0, 15.0, 18.0, 23.0, 33.0, 48.0, 69.0, 93.0, 143.0, 211.0, 346.0, 505.0, 818.0, 1178.0, 1995.0, 3488.0, 6153.0, 11617.0, 24371.0, 59167.0, 174036.0, 442867.0, 199159.0, 66490.0, 26968.0, 12608.0, 6580.0, 3660.0, 2073.0, 1388.0, 805.0, 508.0, 362.0, 241.0, 157.0, 97.0, 72.0, 50.0, 29.0, 26.0, 16.0, 14.0, 14.0, 6.0, 4.0, 6.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.288818359375, -0.28021240234375, -0.2716064453125, -0.26300048828125, -0.25439453125, -0.24578857421875, -0.2371826171875, -0.22857666015625, -0.219970703125, -0.21136474609375, -0.2027587890625, -0.19415283203125, -0.185546875, -0.17694091796875, -0.1683349609375, -0.15972900390625, -0.151123046875, -0.14251708984375, -0.1339111328125, -0.12530517578125, -0.11669921875, -0.10809326171875, -0.0994873046875, -0.09088134765625, -0.082275390625, -0.07366943359375, -0.0650634765625, -0.05645751953125, -0.0478515625, -0.03924560546875, -0.0306396484375, -0.02203369140625, -0.013427734375, -0.00482177734375, 0.0037841796875, 0.01239013671875, 0.02099609375, 0.02960205078125, 0.0382080078125, 0.04681396484375, 0.055419921875, 0.06402587890625, 0.0726318359375, 0.08123779296875, 0.08984375, 0.09844970703125, 0.1070556640625, 0.11566162109375, 0.124267578125, 0.13287353515625, 0.1414794921875, 0.15008544921875, 0.15869140625, 0.16729736328125, 0.1759033203125, 0.18450927734375, 0.193115234375, 0.20172119140625, 0.2103271484375, 0.21893310546875, 0.2275390625, 0.23614501953125, 0.2447509765625, 0.25335693359375, 0.261962890625]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 4.0, 7.0, 8.0, 5.0, 8.0, 19.0, 11.0, 28.0, 43.0, 46.0, 82.0, 96.0, 188.0, 128.0, 84.0, 76.0, 39.0, 33.0, 23.0, 25.0, 15.0, 9.0, 6.0, 4.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.337331771850586e-05, -7.064174860715866e-05, -6.791017949581146e-05, -6.517861038446426e-05, -6.244704127311707e-05, -5.971547216176987e-05, -5.698390305042267e-05, -5.425233393907547e-05, -5.152076482772827e-05, -4.878919571638107e-05, -4.6057626605033875e-05, -4.3326057493686676e-05, -4.059448838233948e-05, -3.786291927099228e-05, -3.513135015964508e-05, -3.239978104829788e-05, -2.9668211936950684e-05, -2.6936642825603485e-05, -2.4205073714256287e-05, -2.1473504602909088e-05, -1.874193549156189e-05, -1.601036638021469e-05, -1.3278797268867493e-05, -1.0547228157520294e-05, -7.815659046173096e-06, -5.084089934825897e-06, -2.3525208234786987e-06, 3.7904828786849976e-07, 3.1106173992156982e-06, 5.842186510562897e-06, 8.573755621910095e-06, 1.1305324733257294e-05, 1.4036893844604492e-05, 1.676846295595169e-05, 1.950003206729889e-05, 2.2231601178646088e-05, 2.4963170289993286e-05, 2.7694739401340485e-05, 3.0426308512687683e-05, 3.315787762403488e-05, 3.588944673538208e-05, 3.862101584672928e-05, 4.135258495807648e-05, 4.4084154069423676e-05, 4.6815723180770874e-05, 4.954729229211807e-05, 5.227886140346527e-05, 5.501043051481247e-05, 5.774199962615967e-05, 6.0473568737506866e-05, 6.320513784885406e-05, 6.593670696020126e-05, 6.866827607154846e-05, 7.139984518289566e-05, 7.413141429424286e-05, 7.686298340559006e-05, 7.959455251693726e-05, 8.232612162828445e-05, 8.505769073963165e-05, 8.778925985097885e-05, 9.052082896232605e-05, 9.325239807367325e-05, 9.598396718502045e-05, 9.871553629636765e-05, 0.00010144710540771484]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 4.0, 10.0, 8.0, 12.0, 21.0, 28.0, 32.0, 70.0, 97.0, 127.0, 187.0, 291.0, 517.0, 881.0, 1489.0, 2511.0, 4698.0, 8924.0, 19274.0, 48413.0, 164426.0, 526766.0, 177938.0, 51173.0, 20061.0, 9283.0, 4838.0, 2673.0, 1549.0, 890.0, 501.0, 299.0, 187.0, 125.0, 93.0, 59.0, 29.0, 25.0, 7.0, 13.0, 7.0, 6.0, 5.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.3984375, -0.3857994079589844, -0.37316131591796875, -0.3605232238769531, -0.3478851318359375, -0.3352470397949219, -0.32260894775390625, -0.3099708557128906, -0.297332763671875, -0.2846946716308594, -0.27205657958984375, -0.2594184875488281, -0.2467803955078125, -0.23414230346679688, -0.22150421142578125, -0.20886611938476562, -0.19622802734375, -0.18358993530273438, -0.17095184326171875, -0.15831375122070312, -0.1456756591796875, -0.13303756713867188, -0.12039947509765625, -0.10776138305664062, -0.095123291015625, -0.08248519897460938, -0.06984710693359375, -0.057209014892578125, -0.0445709228515625, -0.031932830810546875, -0.01929473876953125, -0.006656646728515625, 0.0059814453125, 0.018619537353515625, 0.03125762939453125, 0.043895721435546875, 0.0565338134765625, 0.06917190551757812, 0.08180999755859375, 0.09444808959960938, 0.107086181640625, 0.11972427368164062, 0.13236236572265625, 0.14500045776367188, 0.1576385498046875, 0.17027664184570312, 0.18291473388671875, 0.19555282592773438, 0.20819091796875, 0.22082901000976562, 0.23346710205078125, 0.24610519409179688, 0.2587432861328125, 0.2713813781738281, 0.28401947021484375, 0.2966575622558594, 0.309295654296875, 0.3219337463378906, 0.33457183837890625, 0.3472099304199219, 0.3598480224609375, 0.3724861145019531, 0.38512420654296875, 0.3977622985839844, 0.410400390625]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 4.0, 5.0, 8.0, 12.0, 11.0, 10.0, 25.0, 20.0, 31.0, 42.0, 48.0, 65.0, 88.0, 153.0, 97.0, 85.0, 53.0, 47.0, 38.0, 33.0, 30.0, 18.0, 12.0, 17.0, 5.0, 11.0, 4.0, 4.0, 3.0, 6.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.27978515625, -0.27257537841796875, -0.2653656005859375, -0.25815582275390625, -0.250946044921875, -0.24373626708984375, -0.2365264892578125, -0.22931671142578125, -0.22210693359375, -0.21489715576171875, -0.2076873779296875, -0.20047760009765625, -0.193267822265625, -0.18605804443359375, -0.1788482666015625, -0.17163848876953125, -0.1644287109375, -0.15721893310546875, -0.1500091552734375, -0.14279937744140625, -0.135589599609375, -0.12837982177734375, -0.1211700439453125, -0.11396026611328125, -0.10675048828125, -0.09954071044921875, -0.0923309326171875, -0.08512115478515625, -0.077911376953125, -0.07070159912109375, -0.0634918212890625, -0.05628204345703125, -0.049072265625, -0.04186248779296875, -0.0346527099609375, -0.02744293212890625, -0.020233154296875, -0.01302337646484375, -0.0058135986328125, 0.00139617919921875, 0.00860595703125, 0.01581573486328125, 0.0230255126953125, 0.03023529052734375, 0.037445068359375, 0.04465484619140625, 0.0518646240234375, 0.05907440185546875, 0.0662841796875, 0.07349395751953125, 0.0807037353515625, 0.08791351318359375, 0.095123291015625, 0.10233306884765625, 0.1095428466796875, 0.11675262451171875, 0.12396240234375, 0.13117218017578125, 0.1383819580078125, 0.14559173583984375, 0.152801513671875, 0.16001129150390625, 0.1672210693359375, 0.17443084716796875, 0.181640625]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 2.0, 14.0, 21.0, 32.0, 60.0, 87.0, 146.0, 151.0, 147.0, 121.0, 99.0, 47.0, 39.0, 16.0, 9.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.914153575897217, -5.779911518096924, -5.645669460296631, -5.511427879333496, -5.377185821533203, -5.24294376373291, -5.108701705932617, -4.974459648132324, -4.840217590332031, -4.705975532531738, -4.571733474731445, -4.437491416931152, -4.303249835968018, -4.169007778167725, -4.034765720367432, -3.9005236625671387, -3.766281843185425, -3.632039785385132, -3.497797966003418, -3.363555908203125, -3.229313850402832, -3.095071792602539, -2.960829973220825, -2.8265879154205322, -2.6923460960388184, -2.5581040382385254, -2.4238622188568115, -2.2896201610565186, -2.1553781032562256, -2.0211362838745117, -1.8868942260742188, -1.7526521682739258, -1.6184101104736328, -1.4841681718826294, -1.3499261140823364, -1.215684175491333, -1.08144211769104, -0.9472001791000366, -0.8129582405090332, -0.678716242313385, -0.5444742441177368, -0.4102322459220886, -0.2759902775287628, -0.141748309135437, -0.007506310939788818, 0.12673568725585938, 0.2609776258468628, 0.395219624042511, 0.5294616222381592, 0.6637036204338074, 0.7979456186294556, 0.932187557220459, 1.066429615020752, 1.2006715536117554, 1.3349134922027588, 1.4691555500030518, 1.6033974885940552, 1.7376394271850586, 1.8718814849853516, 2.0061235427856445, 2.1403653621673584, 2.2746074199676514, 2.4088492393493652, 2.543091297149658, 2.677333354949951]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 10.0, 9.0, 7.0, 13.0, 12.0, 17.0, 19.0, 20.0, 17.0, 24.0, 33.0, 36.0, 31.0, 32.0, 36.0, 37.0, 45.0, 45.0, 49.0, 52.0, 52.0, 36.0, 45.0, 34.0, 41.0, 38.0, 37.0, 28.0, 29.0, 26.0, 21.0, 15.0, 14.0, 11.0, 10.0, 9.0, 7.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.1904244422912598, -3.1008658409118652, -3.01130747795105, -2.9217488765716553, -2.83219051361084, -2.7426319122314453, -2.653073310852051, -2.5635149478912354, -2.47395658493042, -2.3843979835510254, -2.29483962059021, -2.2052810192108154, -2.11572265625, -2.0261640548706055, -1.9366055727005005, -1.8470470905303955, -1.757488489151001, -1.667930006980896, -1.578371524810791, -1.4888129234313965, -1.399254560470581, -1.3096959590911865, -1.2201374769210815, -1.1305789947509766, -1.0410205125808716, -0.9514620304107666, -0.8619035482406616, -0.7723450064659119, -0.6827865242958069, -0.5932280421257019, -0.5036695003509521, -0.41411101818084717, -0.3245522975921631, -0.2349938005208969, -0.14543530344963074, -0.05587679147720337, 0.03368169069290161, 0.12324017286300659, 0.21279871463775635, 0.30235719680786133, 0.3919156789779663, 0.4814741611480713, 0.5710326433181763, 0.660591185092926, 0.750149667263031, 0.839708149433136, 0.9292666912078857, 1.0188251733779907, 1.1083836555480957, 1.1979421377182007, 1.2875006198883057, 1.3770592212677002, 1.4666175842285156, 1.5561761856079102, 1.6457346677780151, 1.7352931499481201, 1.824851632118225, 1.91441011428833, 2.0039687156677246, 2.09352707862854, 2.1830856800079346, 2.27264404296875, 2.3622026443481445, 2.451761245727539, 2.5413196086883545]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 3.0, 4.0, 3.0, 8.0, 14.0, 13.0, 26.0, 30.0, 30.0, 45.0, 67.0, 90.0, 136.0, 146.0, 235.0, 266.0, 422.0, 524.0, 863.0, 1194.0, 1701.0, 2738.0, 1035223.0, 2041.0, 1468.0, 910.0, 659.0, 472.0, 338.0, 258.0, 175.0, 128.0, 94.0, 64.0, 60.0, 36.0, 29.0, 19.0, 14.0, 16.0, 18.0, 12.0, 2.0, 3.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.3699378967285156, -3.2652695178985596, -3.1606011390686035, -3.0559327602386475, -2.9512643814086914, -2.8465962409973145, -2.7419278621673584, -2.6372594833374023, -2.5325911045074463, -2.4279227256774902, -2.323254346847534, -2.218585968017578, -2.113917827606201, -2.009249210357666, -1.904581069946289, -1.799912691116333, -1.695244312286377, -1.590575933456421, -1.4859075546264648, -1.3812392950057983, -1.2765709161758423, -1.1719025373458862, -1.0672342777252197, -0.9625658988952637, -0.8578975200653076, -0.7532291412353516, -0.6485608220100403, -0.543892502784729, -0.43922412395477295, -0.3345557451248169, -0.22988742589950562, -0.12521910667419434, -0.02055048942565918, 0.08411785960197449, 0.18878620862960815, 0.2934545576572418, 0.3981229066848755, 0.5027912855148315, 0.6074596047401428, 0.7121279239654541, 0.8167963027954102, 0.9214646816253662, 1.0261330604553223, 1.1308013200759888, 1.2354696989059448, 1.3401380777359009, 1.4448063373565674, 1.5494747161865234, 1.6541430950164795, 1.7588114738464355, 1.8634798526763916, 1.968148112297058, 2.0728163719177246, 2.1774849891662598, 2.2821531295776367, 2.3868215084075928, 2.491489887237549, 2.596158266067505, 2.700826644897461, 2.805495023727417, 2.910163402557373, 3.01483154296875, 3.119499921798706, 3.224168300628662, 3.328836679458618]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 2.0, 5.0, 3.0, 7.0, 26.0, 26.0, 37.0, 86.0, 212.0, 601.0, 1638.0, 4764.0, 14378.0, 51399616.0, 35656.0, 9024.0, 3297.0, 1208.0, 446.0, 155.0, 66.0, 23.0, 11.0, 12.0, 13.0, 9.0, 8.0, 4.0, 2.0, 2.0, 2.0, 0.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.1003999710083, -10.633543968200684, -10.166688919067383, -9.699832916259766, -9.232977867126465, -8.766121864318848, -8.299266815185547, -7.83241081237793, -7.365555286407471, -6.898699760437012, -6.431844234466553, -5.964988708496094, -5.498132705688477, -5.031277656555176, -4.564421653747559, -4.0975661277771, -3.6307106018066406, -3.1638550758361816, -2.6969995498657227, -2.2301437854766846, -1.7632882595062256, -1.2964327335357666, -0.8295769691467285, -0.36272144317626953, 0.10413408279418945, 0.5709896683692932, 1.037845253944397, 1.5047008991241455, 1.9715564250946045, 2.4384119510650635, 2.9052677154541016, 3.3721232414245605, 3.838979721069336, 4.305835247039795, 4.772690773010254, 5.239546775817871, 5.706401824951172, 6.173257827758789, 6.640113353729248, 7.106968879699707, 7.573824405670166, 8.040679931640625, 8.507535934448242, 8.974390983581543, 9.44124698638916, 9.908102035522461, 10.374958038330078, 10.841814041137695, 11.308669090270996, 11.775525093078613, 12.242380142211914, 12.709236145019531, 13.176091194152832, 13.64294719696045, 14.10980224609375, 14.576658248901367, 15.043514251708984, 15.510370254516602, 15.977225303649902, 16.444080352783203, 16.91093635559082, 17.377792358398438, 17.844648361206055, 18.311504364013672, 18.778358459472656]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 6.0, 6.0, 5.0, 6.0, 16.0, 22.0, 32.0, 45.0, 57.0, 90.0, 161.0, 216.0, 356.0, 552.0, 914.0, 1587.0, 2760.0, 5116.0, 9419.0, 18093.0, 35789.0, 75504.0, 163305.0, 355388.0, 870365.0, 3511445.0, 668832.0, 303902.0, 137545.0, 64190.0, 30693.0, 15736.0, 8448.0, 4548.0, 2545.0, 1476.0, 873.0, 519.0, 319.0, 219.0, 133.0, 81.0, 44.0, 28.0, 18.0, 19.0, 8.0, 3.0, 4.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.275390625, -1.23602294921875, -1.1966552734375, -1.15728759765625, -1.117919921875, -1.07855224609375, -1.0391845703125, -0.99981689453125, -0.96044921875, -0.92108154296875, -0.8817138671875, -0.84234619140625, -0.802978515625, -0.76361083984375, -0.7242431640625, -0.68487548828125, -0.6455078125, -0.60614013671875, -0.5667724609375, -0.52740478515625, -0.488037109375, -0.44866943359375, -0.4093017578125, -0.36993408203125, -0.33056640625, -0.29119873046875, -0.2518310546875, -0.21246337890625, -0.173095703125, -0.13372802734375, -0.0943603515625, -0.05499267578125, -0.015625, 0.02374267578125, 0.0631103515625, 0.10247802734375, 0.141845703125, 0.18121337890625, 0.2205810546875, 0.25994873046875, 0.29931640625, 0.33868408203125, 0.3780517578125, 0.41741943359375, 0.456787109375, 0.49615478515625, 0.5355224609375, 0.57489013671875, 0.6142578125, 0.65362548828125, 0.6929931640625, 0.73236083984375, 0.771728515625, 0.81109619140625, 0.8504638671875, 0.88983154296875, 0.92919921875, 0.96856689453125, 1.0079345703125, 1.04730224609375, 1.086669921875, 1.12603759765625, 1.1654052734375, 1.20477294921875, 1.244140625]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 5.0, 4.0, 9.0, 5.0, 12.0, 14.0, 10.0, 14.0, 20.0, 33.0, 37.0, 37.0, 38.0, 57.0, 55.0, 55.0, 164.0, 916.0, 107.0, 59.0, 55.0, 55.0, 38.0, 35.0, 46.0, 33.0, 27.0, 20.0, 17.0, 17.0, 6.0, 10.0, 8.0, 5.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.1484375, -10.7828369140625, -10.417236328125, -10.0516357421875, -9.68603515625, -9.3204345703125, -8.954833984375, -8.5892333984375, -8.2236328125, -7.8580322265625, -7.492431640625, -7.1268310546875, -6.76123046875, -6.3956298828125, -6.030029296875, -5.6644287109375, -5.298828125, -4.9332275390625, -4.567626953125, -4.2020263671875, -3.83642578125, -3.4708251953125, -3.105224609375, -2.7396240234375, -2.3740234375, -2.0084228515625, -1.642822265625, -1.2772216796875, -0.91162109375, -0.5460205078125, -0.180419921875, 0.1851806640625, 0.55078125, 0.9163818359375, 1.281982421875, 1.6475830078125, 2.01318359375, 2.3787841796875, 2.744384765625, 3.1099853515625, 3.4755859375, 3.8411865234375, 4.206787109375, 4.5723876953125, 4.93798828125, 5.3035888671875, 5.669189453125, 6.0347900390625, 6.400390625, 6.7659912109375, 7.131591796875, 7.4971923828125, 7.86279296875, 8.2283935546875, 8.593994140625, 8.9595947265625, 9.3251953125, 9.6907958984375, 10.056396484375, 10.4219970703125, 10.78759765625, 11.1531982421875, 11.518798828125, 11.8843994140625, 12.25]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 5.0, 4.0, 3.0, 2.0, 7.0, 15.0, 18.0, 39.0, 59.0, 111.0, 179.0, 297.0, 498.0, 862.0, 1607.0, 3034.0, 5585.0, 11065.0, 21837.0, 43909.0, 87027.0, 165478.0, 287927.0, 449085.0, 2376595.0, 1816747.0, 427700.0, 272802.0, 155700.0, 81315.0, 40303.0, 19961.0, 10298.0, 5251.0, 2754.0, 1464.0, 805.0, 441.0, 288.0, 140.0, 77.0, 58.0, 34.0, 23.0, 12.0, 6.0, 4.0, 7.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.779296875, -0.7569961547851562, -0.7346954345703125, -0.7123947143554688, -0.690093994140625, -0.6677932739257812, -0.6454925537109375, -0.6231918334960938, -0.60089111328125, -0.5785903930664062, -0.5562896728515625, -0.5339889526367188, -0.511688232421875, -0.48938751220703125, -0.4670867919921875, -0.44478607177734375, -0.4224853515625, -0.40018463134765625, -0.3778839111328125, -0.35558319091796875, -0.333282470703125, -0.31098175048828125, -0.2886810302734375, -0.26638031005859375, -0.24407958984375, -0.22177886962890625, -0.1994781494140625, -0.17717742919921875, -0.154876708984375, -0.13257598876953125, -0.1102752685546875, -0.08797454833984375, -0.065673828125, -0.04337310791015625, -0.0210723876953125, 0.00122833251953125, 0.023529052734375, 0.04582977294921875, 0.0681304931640625, 0.09043121337890625, 0.11273193359375, 0.13503265380859375, 0.1573333740234375, 0.17963409423828125, 0.201934814453125, 0.22423553466796875, 0.2465362548828125, 0.26883697509765625, 0.2911376953125, 0.31343841552734375, 0.3357391357421875, 0.35803985595703125, 0.380340576171875, 0.40264129638671875, 0.4249420166015625, 0.44724273681640625, 0.46954345703125, 0.49184417724609375, 0.5141448974609375, 0.5364456176757812, 0.558746337890625, 0.5810470581054688, 0.6033477783203125, 0.6256484985351562, 0.64794921875]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 4.0, 4.0, 7.0, 3.0, 11.0, 13.0, 5.0, 13.0, 13.0, 15.0, 17.0, 20.0, 23.0, 30.0, 29.0, 37.0, 35.0, 41.0, 36.0, 36.0, 50.0, 91.0, 791.0, 276.0, 47.0, 51.0, 32.0, 30.0, 41.0, 29.0, 38.0, 24.0, 25.0, 19.0, 19.0, 13.0, 10.0, 6.0, 8.0, 11.0, 11.0, 1.0, 7.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-8.390625, -8.149658203125, -7.90869140625, -7.667724609375, -7.4267578125, -7.185791015625, -6.94482421875, -6.703857421875, -6.462890625, -6.221923828125, -5.98095703125, -5.739990234375, -5.4990234375, -5.258056640625, -5.01708984375, -4.776123046875, -4.53515625, -4.294189453125, -4.05322265625, -3.812255859375, -3.5712890625, -3.330322265625, -3.08935546875, -2.848388671875, -2.607421875, -2.366455078125, -2.12548828125, -1.884521484375, -1.6435546875, -1.402587890625, -1.16162109375, -0.920654296875, -0.6796875, -0.438720703125, -0.19775390625, 0.043212890625, 0.2841796875, 0.525146484375, 0.76611328125, 1.007080078125, 1.248046875, 1.489013671875, 1.72998046875, 1.970947265625, 2.2119140625, 2.452880859375, 2.69384765625, 2.934814453125, 3.17578125, 3.416748046875, 3.65771484375, 3.898681640625, 4.1396484375, 4.380615234375, 4.62158203125, 4.862548828125, 5.103515625, 5.344482421875, 5.58544921875, 5.826416015625, 6.0673828125, 6.308349609375, 6.54931640625, 6.790283203125, 7.03125]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 4.0, 10.0, 10.0, 9.0, 11.0, 16.0, 10.0, 23.0, 42.0, 43.0, 57.0, 92.0, 152.0, 184.0, 237.0, 307.0, 449.0, 618.0, 852.0, 1425.0, 2326.0, 4178.0, 7965.0, 16165.0, 36133.0, 86252.0, 209417.0, 469363.0, 2660759.0, 2002382.0, 446462.0, 196859.0, 81345.0, 34122.0, 15290.0, 7189.0, 3885.0, 2293.0, 1403.0, 856.0, 601.0, 401.0, 332.0, 246.0, 187.0, 118.0, 78.0, 71.0, 50.0, 42.0, 29.0, 30.0, 22.0, 23.0, 8.0, 7.0], "bins": [-1.126953125, -1.096466064453125, -1.06597900390625, -1.035491943359375, -1.0050048828125, -0.974517822265625, -0.94403076171875, -0.913543701171875, -0.883056640625, -0.852569580078125, -0.82208251953125, -0.791595458984375, -0.7611083984375, -0.730621337890625, -0.70013427734375, -0.669647216796875, -0.63916015625, -0.608673095703125, -0.57818603515625, -0.547698974609375, -0.5172119140625, -0.486724853515625, -0.45623779296875, -0.425750732421875, -0.395263671875, -0.364776611328125, -0.33428955078125, -0.303802490234375, -0.2733154296875, -0.242828369140625, -0.21234130859375, -0.181854248046875, -0.1513671875, -0.120880126953125, -0.09039306640625, -0.059906005859375, -0.0294189453125, 0.001068115234375, 0.03155517578125, 0.062042236328125, 0.092529296875, 0.123016357421875, 0.15350341796875, 0.183990478515625, 0.2144775390625, 0.244964599609375, 0.27545166015625, 0.305938720703125, 0.33642578125, 0.366912841796875, 0.39739990234375, 0.427886962890625, 0.4583740234375, 0.488861083984375, 0.51934814453125, 0.549835205078125, 0.580322265625, 0.610809326171875, 0.64129638671875, 0.671783447265625, 0.7022705078125, 0.732757568359375, 0.76324462890625, 0.793731689453125, 0.82421875]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 6.0, 1.0, 9.0, 13.0, 11.0, 20.0, 15.0, 18.0, 22.0, 30.0, 36.0, 35.0, 37.0, 36.0, 46.0, 51.0, 31.0, 53.0, 767.0, 327.0, 49.0, 42.0, 55.0, 46.0, 35.0, 31.0, 33.0, 34.0, 34.0, 17.0, 16.0, 11.0, 17.0, 7.0, 11.0, 9.0, 5.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.5234375, -10.22216796875, -9.9208984375, -9.61962890625, -9.318359375, -9.01708984375, -8.7158203125, -8.41455078125, -8.11328125, -7.81201171875, -7.5107421875, -7.20947265625, -6.908203125, -6.60693359375, -6.3056640625, -6.00439453125, -5.703125, -5.40185546875, -5.1005859375, -4.79931640625, -4.498046875, -4.19677734375, -3.8955078125, -3.59423828125, -3.29296875, -2.99169921875, -2.6904296875, -2.38916015625, -2.087890625, -1.78662109375, -1.4853515625, -1.18408203125, -0.8828125, -0.58154296875, -0.2802734375, 0.02099609375, 0.322265625, 0.62353515625, 0.9248046875, 1.22607421875, 1.52734375, 1.82861328125, 2.1298828125, 2.43115234375, 2.732421875, 3.03369140625, 3.3349609375, 3.63623046875, 3.9375, 4.23876953125, 4.5400390625, 4.84130859375, 5.142578125, 5.44384765625, 5.7451171875, 6.04638671875, 6.34765625, 6.64892578125, 6.9501953125, 7.25146484375, 7.552734375, 7.85400390625, 8.1552734375, 8.45654296875, 8.7578125]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 6.0, 13.0, 27.0, 130.0, 396.0, 312.0, 72.0, 28.0, 12.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.443695068359375, -24.878223419189453, -23.31275177001953, -21.74728012084961, -20.181808471679688, -18.616336822509766, -17.050867080688477, -15.485395431518555, -13.919923782348633, -12.354452133178711, -10.788980484008789, -9.223509788513184, -7.658038139343262, -6.09256649017334, -4.527095794677734, -2.9616241455078125, -1.3961524963378906, 0.16931891441345215, 1.734790325164795, 3.3002614974975586, 4.8657331466674805, 6.431204795837402, 7.996675491333008, 9.56214714050293, 11.127618789672852, 12.693090438842773, 14.258562088012695, 15.8240327835083, 17.389503479003906, 18.954975128173828, 20.52044677734375, 22.085918426513672, 23.651390075683594, 25.216861724853516, 26.782333374023438, 28.34780502319336, 29.91327667236328, 31.478748321533203, 33.044219970703125, 34.60968780517578, 36.17516326904297, 37.74063491821289, 39.30610656738281, 40.871578216552734, 42.437049865722656, 44.00252151489258, 45.5679931640625, 47.133460998535156, 48.69893264770508, 50.264404296875, 51.82987594604492, 53.395347595214844, 54.960819244384766, 56.52629089355469, 58.091758728027344, 59.65723419189453, 61.22270202636719, 62.78817367553711, 64.35364532470703, 65.91911315917969, 67.48458862304688, 69.05005645751953, 70.61553192138672, 72.18099975585938, 73.74647521972656]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 5.0, 6.0, 6.0, 12.0, 8.0, 14.0, 19.0, 29.0, 36.0, 54.0, 38.0, 55.0, 71.0, 65.0, 79.0, 66.0, 62.0, 62.0, 50.0, 66.0, 48.0, 32.0, 30.0, 22.0, 19.0, 18.0, 9.0, 9.0, 6.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.49193572998047, -33.27943801879883, -32.06694030761719, -30.85444450378418, -29.64194679260254, -28.42945098876953, -27.21695327758789, -26.00445556640625, -24.79195785522461, -23.57946014404297, -22.36696434020996, -21.15446662902832, -19.94196891784668, -18.729473114013672, -17.51697540283203, -16.30447769165039, -15.091981887817383, -13.879485130310059, -12.666987419128418, -11.454490661621094, -10.241992950439453, -9.029496192932129, -7.816999435424805, -6.604501724243164, -5.39200496673584, -4.179507732391357, -2.967010736465454, -1.7545137405395508, -0.5420165061950684, 0.6704807281494141, 1.8829774856567383, 3.095475196838379, 4.307971954345703, 5.5204691886901855, 6.732966423034668, 7.945463180541992, 9.157960891723633, 10.370457649230957, 11.582954406738281, 12.795452117919922, 14.007948875427246, 15.22044563293457, 16.43294334411621, 17.64543914794922, 18.85793685913086, 20.0704345703125, 21.28293228149414, 22.49542999267578, 23.70792579650879, 24.92042350769043, 26.132919311523438, 27.345417022705078, 28.55791473388672, 29.77041244506836, 30.982908248901367, 32.195404052734375, 33.407901763916016, 34.620399475097656, 35.8328971862793, 37.04539489746094, 38.25788879394531, 39.47038650512695, 40.682884216308594, 41.895381927490234, 43.107879638671875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 3.0, 3.0, 8.0, 10.0, 6.0, 12.0, 16.0, 31.0, 41.0, 70.0, 106.0, 187.0, 463.0, 1428.0, 5645.0, 38844.0, 3965028.0, 169149.0, 10012.0, 1962.0, 621.0, 257.0, 151.0, 82.0, 52.0, 28.0, 22.0, 18.0, 13.0, 6.0, 7.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.61181640625, -0.588897705078125, -0.56597900390625, -0.543060302734375, -0.5201416015625, -0.497222900390625, -0.47430419921875, -0.451385498046875, -0.428466796875, -0.405548095703125, -0.38262939453125, -0.359710693359375, -0.3367919921875, -0.313873291015625, -0.29095458984375, -0.268035888671875, -0.2451171875, -0.222198486328125, -0.19927978515625, -0.176361083984375, -0.1534423828125, -0.130523681640625, -0.10760498046875, -0.084686279296875, -0.061767578125, -0.038848876953125, -0.01593017578125, 0.006988525390625, 0.0299072265625, 0.052825927734375, 0.07574462890625, 0.098663330078125, 0.12158203125, 0.144500732421875, 0.16741943359375, 0.190338134765625, 0.2132568359375, 0.236175537109375, 0.25909423828125, 0.282012939453125, 0.304931640625, 0.327850341796875, 0.35076904296875, 0.373687744140625, 0.3966064453125, 0.419525146484375, 0.44244384765625, 0.465362548828125, 0.48828125, 0.511199951171875, 0.53411865234375, 0.557037353515625, 0.5799560546875, 0.602874755859375, 0.62579345703125, 0.648712158203125, 0.671630859375, 0.694549560546875, 0.71746826171875, 0.740386962890625, 0.7633056640625, 0.786224365234375, 0.80914306640625, 0.832061767578125, 0.85498046875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 7.0, 11.0, 9.0, 14.0, 34.0, 32.0, 52.0, 72.0, 84.0, 76.0, 90.0, 92.0, 101.0, 65.0, 64.0, 64.0, 38.0, 29.0, 23.0, 11.0, 7.0, 9.0, 6.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.150634765625, -0.1450824737548828, -0.13953018188476562, -0.13397789001464844, -0.12842559814453125, -0.12287330627441406, -0.11732101440429688, -0.11176872253417969, -0.1062164306640625, -0.10066413879394531, -0.09511184692382812, -0.08955955505371094, -0.08400726318359375, -0.07845497131347656, -0.07290267944335938, -0.06735038757324219, -0.061798095703125, -0.05624580383300781, -0.050693511962890625, -0.04514122009277344, -0.03958892822265625, -0.03403663635253906, -0.028484344482421875, -0.022932052612304688, -0.0173797607421875, -0.011827468872070312, -0.006275177001953125, -0.0007228851318359375, 0.00482940673828125, 0.010381698608398438, 0.015933990478515625, 0.021486282348632812, 0.02703857421875, 0.03259086608886719, 0.038143157958984375, 0.04369544982910156, 0.04924774169921875, 0.05480003356933594, 0.060352325439453125, 0.06590461730957031, 0.0714569091796875, 0.07700920104980469, 0.08256149291992188, 0.08811378479003906, 0.09366607666015625, 0.09921836853027344, 0.10477066040039062, 0.11032295227050781, 0.115875244140625, 0.12142753601074219, 0.12697982788085938, 0.13253211975097656, 0.13808441162109375, 0.14363670349121094, 0.14918899536132812, 0.1547412872314453, 0.1602935791015625, 0.1658458709716797, 0.17139816284179688, 0.17695045471191406, 0.18250274658203125, 0.18805503845214844, 0.19360733032226562, 0.1991596221923828, 0.2047119140625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 4.0, 3.0, 6.0, 6.0, 11.0, 8.0, 9.0, 6.0, 11.0, 6.0, 14.0, 26.0, 26.0, 84.0, 150.0, 333.0, 1129.0, 14386.0, 4082830.0, 91822.0, 2427.0, 501.0, 206.0, 93.0, 62.0, 18.0, 19.0, 26.0, 12.0, 7.0, 8.0, 10.0, 7.0, 2.0, 1.0, 5.0, 1.0, 0.0, 3.0, 3.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.439208984375, -0.4227561950683594, -0.40630340576171875, -0.3898506164550781, -0.3733978271484375, -0.3569450378417969, -0.34049224853515625, -0.3240394592285156, -0.307586669921875, -0.2911338806152344, -0.27468109130859375, -0.2582283020019531, -0.2417755126953125, -0.22532272338867188, -0.20886993408203125, -0.19241714477539062, -0.17596435546875, -0.15951156616210938, -0.14305877685546875, -0.12660598754882812, -0.1101531982421875, -0.09370040893554688, -0.07724761962890625, -0.060794830322265625, -0.044342041015625, -0.027889251708984375, -0.01143646240234375, 0.005016326904296875, 0.0214691162109375, 0.037921905517578125, 0.05437469482421875, 0.07082748413085938, 0.0872802734375, 0.10373306274414062, 0.12018585205078125, 0.13663864135742188, 0.1530914306640625, 0.16954421997070312, 0.18599700927734375, 0.20244979858398438, 0.218902587890625, 0.23535537719726562, 0.25180816650390625, 0.2682609558105469, 0.2847137451171875, 0.3011665344238281, 0.31761932373046875, 0.3340721130371094, 0.35052490234375, 0.3669776916503906, 0.38343048095703125, 0.3998832702636719, 0.4163360595703125, 0.4327888488769531, 0.44924163818359375, 0.4656944274902344, 0.482147216796875, 0.4986000061035156, 0.5150527954101562, 0.5315055847167969, 0.5479583740234375, 0.5644111633300781, 0.5808639526367188, 0.5973167419433594, 0.61376953125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 7.0, 2.0, 4.0, 7.0, 8.0, 12.0, 16.0, 25.0, 35.0, 71.0, 161.0, 397.0, 852.0, 1381.0, 659.0, 205.0, 82.0, 42.0, 34.0, 18.0, 15.0, 12.0, 9.0, 7.0, 1.0, 7.0, 3.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1900634765625, -0.1828594207763672, -0.17565536499023438, -0.16845130920410156, -0.16124725341796875, -0.15404319763183594, -0.14683914184570312, -0.1396350860595703, -0.1324310302734375, -0.1252269744873047, -0.11802291870117188, -0.11081886291503906, -0.10361480712890625, -0.09641075134277344, -0.08920669555664062, -0.08200263977050781, -0.074798583984375, -0.06759452819824219, -0.060390472412109375, -0.05318641662597656, -0.04598236083984375, -0.03877830505371094, -0.031574249267578125, -0.024370193481445312, -0.0171661376953125, -0.009962081909179688, -0.002758026123046875, 0.0044460296630859375, 0.01165008544921875, 0.018854141235351562, 0.026058197021484375, 0.03326225280761719, 0.04046630859375, 0.04767036437988281, 0.054874420166015625, 0.06207847595214844, 0.06928253173828125, 0.07648658752441406, 0.08369064331054688, 0.09089469909667969, 0.0980987548828125, 0.10530281066894531, 0.11250686645507812, 0.11971092224121094, 0.12691497802734375, 0.13411903381347656, 0.14132308959960938, 0.1485271453857422, 0.155731201171875, 0.1629352569580078, 0.17013931274414062, 0.17734336853027344, 0.18454742431640625, 0.19175148010253906, 0.19895553588867188, 0.2061595916748047, 0.2133636474609375, 0.2205677032470703, 0.22777175903320312, 0.23497581481933594, 0.24217987060546875, 0.24938392639160156, 0.2565879821777344, 0.2637920379638672, 0.27099609375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 8.0, 23.0, 590.0, 395.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.328495025634766, -8.171256065368652, -8.014018058776855, -7.856779098510742, -7.699540615081787, -7.542302131652832, -7.385063171386719, -7.227824687957764, -7.070586204528809, -6.9133477210998535, -6.75610876083374, -6.598870277404785, -6.44163179397583, -6.284393310546875, -6.127154350280762, -5.969915866851807, -5.812677383422852, -5.6554388999938965, -5.498199939727783, -5.340961456298828, -5.183722972869873, -5.026484489440918, -4.869245529174805, -4.71200704574585, -4.554768085479736, -4.397529602050781, -4.240290641784668, -4.083052158355713, -3.925813674926758, -3.7685749530792236, -3.6113362312316895, -3.4540977478027344, -3.2968592643737793, -3.139620542526245, -2.98238205909729, -2.825143337249756, -2.667904853820801, -2.5106661319732666, -2.3534274101257324, -2.1961889266967773, -2.0389504432678223, -1.8817118406295776, -1.724473237991333, -1.5672345161437988, -1.4099960327148438, -1.2527573108673096, -1.095518708229065, -0.9382801055908203, -0.7810413837432861, -0.6238027811050415, -0.4665641486644745, -0.30932551622390747, -0.15208691358566284, 0.005151689052581787, 0.1623903512954712, 0.3196289539337158, 0.47686755657196045, 0.6341061592102051, 0.7913447618484497, 0.9485834240913391, 1.1058220863342285, 1.2630605697631836, 1.4202992916107178, 1.5775378942489624, 1.734776496887207]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 5.0, 13.0, 27.0, 19.0, 23.0, 32.0, 38.0, 41.0, 40.0, 56.0, 61.0, 65.0, 62.0, 70.0, 68.0, 55.0, 53.0, 58.0, 46.0, 34.0, 29.0, 40.0, 13.0, 16.0, 14.0, 9.0, 4.0, 1.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6065807938575745, -0.5849961638450623, -0.56341153383255, -0.5418268442153931, -0.5202422142028809, -0.49865758419036865, -0.47707295417785645, -0.45548832416534424, -0.43390366435050964, -0.41231903433799744, -0.39073437452316284, -0.36914974451065063, -0.3475651144981384, -0.32598045468330383, -0.3043958246707916, -0.28281116485595703, -0.2612265348434448, -0.23964188992977142, -0.21805724501609802, -0.19647261500358582, -0.17488797008991241, -0.153303325176239, -0.1317186951637268, -0.1101340502500534, -0.08854940533638, -0.0669647604227066, -0.0453801229596138, -0.023795485496520996, -0.002210840582847595, 0.019373804330825806, 0.04095843434333801, 0.06254307925701141, 0.08412778377532959, 0.10571242868900299, 0.1272970736026764, 0.1488817036151886, 0.170466348528862, 0.1920509934425354, 0.2136356234550476, 0.235220268368721, 0.2568049132823944, 0.2783895432949066, 0.2999742031097412, 0.3215588331222534, 0.3431434631347656, 0.3647281229496002, 0.3863127529621124, 0.407897412776947, 0.42948204278945923, 0.45106667280197144, 0.47265133261680603, 0.49423596262931824, 0.5158206224441528, 0.537405252456665, 0.5589898824691772, 0.5805745124816895, 0.6021591424942017, 0.6237437725067139, 0.6453284025192261, 0.6669130325317383, 0.6884977221488953, 0.7100823521614075, 0.7316669821739197, 0.7532516121864319, 0.7748363018035889]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 3.0, 5.0, 3.0, 8.0, 14.0, 31.0, 28.0, 47.0, 93.0, 154.0, 260.0, 470.0, 959.0, 2012.0, 5079.0, 19097.0, 755973.0, 243135.0, 13587.0, 4119.0, 1671.0, 777.0, 395.0, 245.0, 135.0, 84.0, 47.0, 41.0, 28.0, 14.0, 13.0, 13.0, 5.0, 1.0, 2.0, 0.0, 4.0, 4.0, 2.0, 0.0, 1.0], "bins": [-0.97216796875, -0.9477996826171875, -0.923431396484375, -0.8990631103515625, -0.87469482421875, -0.8503265380859375, -0.825958251953125, -0.8015899658203125, -0.7772216796875, -0.7528533935546875, -0.728485107421875, -0.7041168212890625, -0.67974853515625, -0.6553802490234375, -0.631011962890625, -0.6066436767578125, -0.582275390625, -0.5579071044921875, -0.533538818359375, -0.5091705322265625, -0.48480224609375, -0.4604339599609375, -0.436065673828125, -0.4116973876953125, -0.3873291015625, -0.3629608154296875, -0.338592529296875, -0.3142242431640625, -0.28985595703125, -0.2654876708984375, -0.241119384765625, -0.2167510986328125, -0.1923828125, -0.1680145263671875, -0.143646240234375, -0.1192779541015625, -0.09490966796875, -0.0705413818359375, -0.046173095703125, -0.0218048095703125, 0.0025634765625, 0.0269317626953125, 0.051300048828125, 0.0756683349609375, 0.10003662109375, 0.1244049072265625, 0.148773193359375, 0.1731414794921875, 0.197509765625, 0.2218780517578125, 0.246246337890625, 0.2706146240234375, 0.29498291015625, 0.3193511962890625, 0.343719482421875, 0.3680877685546875, 0.3924560546875, 0.4168243408203125, 0.441192626953125, 0.4655609130859375, 0.48992919921875, 0.5142974853515625, 0.538665771484375, 0.5630340576171875, 0.58740234375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 6.0, 4.0, 11.0, 8.0, 21.0, 26.0, 34.0, 51.0, 63.0, 86.0, 77.0, 75.0, 94.0, 93.0, 79.0, 58.0, 56.0, 53.0, 32.0, 26.0, 13.0, 9.0, 5.0, 10.0, 2.0, 4.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.135009765625, -0.129669189453125, -0.12432861328125, -0.118988037109375, -0.1136474609375, -0.108306884765625, -0.10296630859375, -0.097625732421875, -0.09228515625, -0.086944580078125, -0.08160400390625, -0.076263427734375, -0.0709228515625, -0.065582275390625, -0.06024169921875, -0.054901123046875, -0.049560546875, -0.044219970703125, -0.03887939453125, -0.033538818359375, -0.0281982421875, -0.022857666015625, -0.01751708984375, -0.012176513671875, -0.0068359375, -0.001495361328125, 0.00384521484375, 0.009185791015625, 0.0145263671875, 0.019866943359375, 0.02520751953125, 0.030548095703125, 0.035888671875, 0.041229248046875, 0.04656982421875, 0.051910400390625, 0.0572509765625, 0.062591552734375, 0.06793212890625, 0.073272705078125, 0.07861328125, 0.083953857421875, 0.08929443359375, 0.094635009765625, 0.0999755859375, 0.105316162109375, 0.11065673828125, 0.115997314453125, 0.121337890625, 0.126678466796875, 0.13201904296875, 0.137359619140625, 0.1427001953125, 0.148040771484375, 0.15338134765625, 0.158721923828125, 0.1640625, 0.169403076171875, 0.17474365234375, 0.180084228515625, 0.1854248046875, 0.190765380859375, 0.19610595703125, 0.201446533203125, 0.206787109375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 7.0, 9.0, 11.0, 11.0, 9.0, 15.0, 21.0, 31.0, 26.0, 45.0, 45.0, 55.0, 76.0, 113.0, 190.0, 395.0, 1196.0, 6958.0, 107970.0, 831184.0, 91585.0, 6478.0, 1102.0, 363.0, 212.0, 103.0, 94.0, 54.0, 33.0, 52.0, 17.0, 25.0, 15.0, 11.0, 13.0, 9.0, 2.0, 5.0, 4.0, 2.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.278076171875, -0.2692413330078125, -0.260406494140625, -0.2515716552734375, -0.24273681640625, -0.2339019775390625, -0.225067138671875, -0.2162322998046875, -0.2073974609375, -0.1985626220703125, -0.189727783203125, -0.1808929443359375, -0.17205810546875, -0.1632232666015625, -0.154388427734375, -0.1455535888671875, -0.13671875, -0.1278839111328125, -0.119049072265625, -0.1102142333984375, -0.10137939453125, -0.0925445556640625, -0.083709716796875, -0.0748748779296875, -0.0660400390625, -0.0572052001953125, -0.048370361328125, -0.0395355224609375, -0.03070068359375, -0.0218658447265625, -0.013031005859375, -0.0041961669921875, 0.004638671875, 0.0134735107421875, 0.022308349609375, 0.0311431884765625, 0.03997802734375, 0.0488128662109375, 0.057647705078125, 0.0664825439453125, 0.0753173828125, 0.0841522216796875, 0.092987060546875, 0.1018218994140625, 0.11065673828125, 0.1194915771484375, 0.128326416015625, 0.1371612548828125, 0.14599609375, 0.1548309326171875, 0.163665771484375, 0.1725006103515625, 0.18133544921875, 0.1901702880859375, 0.199005126953125, 0.2078399658203125, 0.2166748046875, 0.2255096435546875, 0.234344482421875, 0.2431793212890625, 0.25201416015625, 0.2608489990234375, 0.269683837890625, 0.2785186767578125, 0.287353515625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 7.0, 4.0, 6.0, 10.0, 9.0, 11.0, 15.0, 17.0, 10.0, 24.0, 27.0, 20.0, 26.0, 28.0, 43.0, 23.0, 34.0, 46.0, 40.0, 49.0, 45.0, 36.0, 44.0, 48.0, 35.0, 31.0, 33.0, 26.0, 27.0, 32.0, 24.0, 21.0, 16.0, 20.0, 24.0, 13.0, 16.0, 13.0, 14.0, 7.0, 11.0, 2.0, 4.0, 2.0, 3.0, 1.0, 7.0, 1.0, 1.0, 2.0], "bins": [-0.25927734375, -0.2518787384033203, -0.24448013305664062, -0.23708152770996094, -0.22968292236328125, -0.22228431701660156, -0.21488571166992188, -0.2074871063232422, -0.2000885009765625, -0.1926898956298828, -0.18529129028320312, -0.17789268493652344, -0.17049407958984375, -0.16309547424316406, -0.15569686889648438, -0.1482982635498047, -0.140899658203125, -0.1335010528564453, -0.12610244750976562, -0.11870384216308594, -0.11130523681640625, -0.10390663146972656, -0.09650802612304688, -0.08910942077636719, -0.0817108154296875, -0.07431221008300781, -0.06691360473632812, -0.05951499938964844, -0.05211639404296875, -0.04471778869628906, -0.037319183349609375, -0.029920578002929688, -0.02252197265625, -0.015123367309570312, -0.007724761962890625, -0.0003261566162109375, 0.00707244873046875, 0.014471054077148438, 0.021869659423828125, 0.029268264770507812, 0.0366668701171875, 0.04406547546386719, 0.051464080810546875, 0.05886268615722656, 0.06626129150390625, 0.07365989685058594, 0.08105850219726562, 0.08845710754394531, 0.095855712890625, 0.10325431823730469, 0.11065292358398438, 0.11805152893066406, 0.12545013427734375, 0.13284873962402344, 0.14024734497070312, 0.1476459503173828, 0.1550445556640625, 0.1624431610107422, 0.16984176635742188, 0.17724037170410156, 0.18463897705078125, 0.19203758239746094, 0.19943618774414062, 0.2068347930908203, 0.2142333984375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 5.0, 7.0, 8.0, 13.0, 12.0, 11.0, 23.0, 21.0, 39.0, 61.0, 83.0, 138.0, 209.0, 346.0, 696.0, 1814.0, 6615.0, 53304.0, 710829.0, 251116.0, 17701.0, 3194.0, 1084.0, 481.0, 246.0, 149.0, 102.0, 64.0, 49.0, 31.0, 23.0, 14.0, 13.0, 14.0, 9.0, 7.0, 5.0, 3.0, 6.0, 2.0, 2.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.060791015625, -0.058990478515625, -0.05718994140625, -0.055389404296875, -0.0535888671875, -0.051788330078125, -0.04998779296875, -0.048187255859375, -0.04638671875, -0.044586181640625, -0.04278564453125, -0.040985107421875, -0.0391845703125, -0.037384033203125, -0.03558349609375, -0.033782958984375, -0.031982421875, -0.030181884765625, -0.02838134765625, -0.026580810546875, -0.0247802734375, -0.022979736328125, -0.02117919921875, -0.019378662109375, -0.017578125, -0.015777587890625, -0.01397705078125, -0.012176513671875, -0.0103759765625, -0.008575439453125, -0.00677490234375, -0.004974365234375, -0.003173828125, -0.001373291015625, 0.00042724609375, 0.002227783203125, 0.0040283203125, 0.005828857421875, 0.00762939453125, 0.009429931640625, 0.01123046875, 0.013031005859375, 0.01483154296875, 0.016632080078125, 0.0184326171875, 0.020233154296875, 0.02203369140625, 0.023834228515625, 0.025634765625, 0.027435302734375, 0.02923583984375, 0.031036376953125, 0.0328369140625, 0.034637451171875, 0.03643798828125, 0.038238525390625, 0.0400390625, 0.041839599609375, 0.04364013671875, 0.045440673828125, 0.0472412109375, 0.049041748046875, 0.05084228515625, 0.052642822265625, 0.054443359375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 3.0, 1.0, 3.0, 7.0, 8.0, 12.0, 19.0, 18.0, 25.0, 38.0, 34.0, 48.0, 72.0, 79.0, 54.0, 88.0, 79.0, 63.0, 65.0, 52.0, 44.0, 46.0, 33.0, 25.0, 17.0, 13.0, 11.0, 14.0, 6.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.165836334228516e-06, -7.88271427154541e-06, -7.599592208862305e-06, -7.316470146179199e-06, -7.033348083496094e-06, -6.750226020812988e-06, -6.467103958129883e-06, -6.183981895446777e-06, -5.900859832763672e-06, -5.617737770080566e-06, -5.334615707397461e-06, -5.0514936447143555e-06, -4.76837158203125e-06, -4.4852495193481445e-06, -4.202127456665039e-06, -3.919005393981934e-06, -3.635883331298828e-06, -3.3527612686157227e-06, -3.069639205932617e-06, -2.7865171432495117e-06, -2.5033950805664062e-06, -2.2202730178833008e-06, -1.9371509552001953e-06, -1.6540288925170898e-06, -1.3709068298339844e-06, -1.087784767150879e-06, -8.046627044677734e-07, -5.21540641784668e-07, -2.384185791015625e-07, 4.470348358154297e-08, 3.2782554626464844e-07, 6.109476089477539e-07, 8.940696716308594e-07, 1.1771917343139648e-06, 1.4603137969970703e-06, 1.7434358596801758e-06, 2.0265579223632812e-06, 2.3096799850463867e-06, 2.592802047729492e-06, 2.8759241104125977e-06, 3.159046173095703e-06, 3.4421682357788086e-06, 3.725290298461914e-06, 4.0084123611450195e-06, 4.291534423828125e-06, 4.5746564865112305e-06, 4.857778549194336e-06, 5.140900611877441e-06, 5.424022674560547e-06, 5.707144737243652e-06, 5.990266799926758e-06, 6.273388862609863e-06, 6.556510925292969e-06, 6.839632987976074e-06, 7.12275505065918e-06, 7.405877113342285e-06, 7.68899917602539e-06, 7.972121238708496e-06, 8.255243301391602e-06, 8.538365364074707e-06, 8.821487426757812e-06, 9.104609489440918e-06, 9.387731552124023e-06, 9.670853614807129e-06, 9.953975677490234e-06]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 5.0, 7.0, 24.0, 47.0, 76.0, 213.0, 644.0, 2120.0, 7462.0, 298054.0, 726067.0, 10077.0, 2511.0, 791.0, 238.0, 81.0, 50.0, 27.0, 13.0, 9.0, 6.0, 7.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1533203125, -0.14895057678222656, -0.14458084106445312, -0.1402111053466797, -0.13584136962890625, -0.1314716339111328, -0.12710189819335938, -0.12273216247558594, -0.1183624267578125, -0.11399269104003906, -0.10962295532226562, -0.10525321960449219, -0.10088348388671875, -0.09651374816894531, -0.09214401245117188, -0.08777427673339844, -0.083404541015625, -0.07903480529785156, -0.07466506958007812, -0.07029533386230469, -0.06592559814453125, -0.06155586242675781, -0.057186126708984375, -0.05281639099121094, -0.0484466552734375, -0.04407691955566406, -0.039707183837890625, -0.03533744812011719, -0.03096771240234375, -0.026597976684570312, -0.022228240966796875, -0.017858505249023438, -0.01348876953125, -0.009119033813476562, -0.004749298095703125, -0.0003795623779296875, 0.00399017333984375, 0.008359909057617188, 0.012729644775390625, 0.017099380493164062, 0.0214691162109375, 0.025838851928710938, 0.030208587646484375, 0.03457832336425781, 0.03894805908203125, 0.04331779479980469, 0.047687530517578125, 0.05205726623535156, 0.056427001953125, 0.06079673767089844, 0.06516647338867188, 0.06953620910644531, 0.07390594482421875, 0.07827568054199219, 0.08264541625976562, 0.08701515197753906, 0.0913848876953125, 0.09575462341308594, 0.10012435913085938, 0.10449409484863281, 0.10886383056640625, 0.11323356628417969, 0.11760330200195312, 0.12197303771972656, 0.1263427734375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 4.0, 3.0, 5.0, 7.0, 6.0, 6.0, 12.0, 14.0, 14.0, 16.0, 29.0, 41.0, 48.0, 52.0, 83.0, 127.0, 111.0, 102.0, 80.0, 69.0, 40.0, 31.0, 17.0, 18.0, 15.0, 11.0, 7.0, 7.0, 0.0, 4.0, 4.0, 8.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.063232421875, -0.061065673828125, -0.05889892578125, -0.056732177734375, -0.0545654296875, -0.052398681640625, -0.05023193359375, -0.048065185546875, -0.0458984375, -0.043731689453125, -0.04156494140625, -0.039398193359375, -0.0372314453125, -0.035064697265625, -0.03289794921875, -0.030731201171875, -0.028564453125, -0.026397705078125, -0.02423095703125, -0.022064208984375, -0.0198974609375, -0.017730712890625, -0.01556396484375, -0.013397216796875, -0.01123046875, -0.009063720703125, -0.00689697265625, -0.004730224609375, -0.0025634765625, -0.000396728515625, 0.00177001953125, 0.003936767578125, 0.006103515625, 0.008270263671875, 0.01043701171875, 0.012603759765625, 0.0147705078125, 0.016937255859375, 0.01910400390625, 0.021270751953125, 0.0234375, 0.025604248046875, 0.02777099609375, 0.029937744140625, 0.0321044921875, 0.034271240234375, 0.03643798828125, 0.038604736328125, 0.040771484375, 0.042938232421875, 0.04510498046875, 0.047271728515625, 0.0494384765625, 0.051605224609375, 0.05377197265625, 0.055938720703125, 0.05810546875, 0.060272216796875, 0.06243896484375, 0.064605712890625, 0.0667724609375, 0.068939208984375, 0.07110595703125, 0.073272705078125, 0.075439453125]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 57.0, 870.0, 84.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.787382125854492, -9.53990364074707, -9.292424201965332, -9.044944763183594, -8.797466278076172, -8.54998779296875, -8.302508354187012, -8.055028915405273, -7.807550430297852, -7.5600714683532715, -7.312592506408691, -7.065113544464111, -6.817634582519531, -6.570155620574951, -6.322676658630371, -6.075197696685791, -5.827718734741211, -5.580239772796631, -5.332760810852051, -5.085281848907471, -4.837802886962891, -4.5903239250183105, -4.3428449630737305, -4.09536600112915, -3.8478870391845703, -3.6004080772399902, -3.35292911529541, -3.10545015335083, -2.85797119140625, -2.61049222946167, -2.36301326751709, -2.1155343055725098, -1.868055820465088, -1.6205768585205078, -1.3730978965759277, -1.1256189346313477, -0.8781399726867676, -0.6306610107421875, -0.3831820487976074, -0.13570308685302734, 0.11177587509155273, 0.3592548370361328, 0.6067337989807129, 0.854212760925293, 1.101691722869873, 1.3491706848144531, 1.5966496467590332, 1.8441286087036133, 2.0916075706481934, 2.3390865325927734, 2.5865654945373535, 2.8340444564819336, 3.0815234184265137, 3.3290023803710938, 3.576481342315674, 3.823960304260254, 4.071439266204834, 4.318918228149414, 4.566397190093994, 4.813876152038574, 5.061355113983154, 5.308834075927734, 5.5563130378723145, 5.8037919998168945, 6.051270961761475]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 3.0, 5.0, 4.0, 6.0, 9.0, 6.0, 8.0, 7.0, 10.0, 21.0, 23.0, 17.0, 27.0, 29.0, 34.0, 31.0, 26.0, 31.0, 51.0, 45.0, 47.0, 48.0, 44.0, 54.0, 48.0, 49.0, 39.0, 45.0, 32.0, 27.0, 29.0, 34.0, 16.0, 24.0, 17.0, 8.0, 13.0, 9.0, 9.0, 3.0, 8.0, 4.0, 6.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7241535186767578, -1.672405481338501, -1.6206574440002441, -1.5689094066619873, -1.5171613693237305, -1.4654133319854736, -1.4136652946472168, -1.36191725730896, -1.3101692199707031, -1.2584211826324463, -1.2066731452941895, -1.1549251079559326, -1.1031770706176758, -1.051429033279419, -0.9996810555458069, -0.94793301820755, -0.896185040473938, -0.8444370031356812, -0.7926889657974243, -0.7409409284591675, -0.6891928911209106, -0.6374448537826538, -0.5856968760490417, -0.5339488387107849, -0.4822008013725281, -0.43045276403427124, -0.3787047266960144, -0.32695671916007996, -0.2752086818218231, -0.22346064448356628, -0.17171263694763184, -0.119964599609375, -0.06821656227111816, -0.016468532383441925, 0.035279497504234314, 0.08702751994132996, 0.1387755572795868, 0.19052359461784363, 0.24227160215377808, 0.2940196394920349, 0.34576767683029175, 0.3975157141685486, 0.4492637515068054, 0.5010117292404175, 0.5527597665786743, 0.6045078039169312, 0.656255841255188, 0.7080038785934448, 0.7597519159317017, 0.8114999532699585, 0.8632479906082153, 0.9149960279464722, 0.966744065284729, 1.0184921026229858, 1.0702400207519531, 1.12198805809021, 1.1737360954284668, 1.2254841327667236, 1.2772321701049805, 1.3289802074432373, 1.3807282447814941, 1.432476282119751, 1.4842243194580078, 1.5359723567962646, 1.5877203941345215]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 2.0, 7.0, 14.0, 15.0, 12.0, 27.0, 31.0, 64.0, 78.0, 165.0, 921.0, 18958.0, 4170265.0, 3060.0, 321.0, 101.0, 78.0, 44.0, 36.0, 25.0, 17.0, 12.0, 9.0, 6.0, 5.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.576171875, -1.51617431640625, -1.4561767578125, -1.39617919921875, -1.336181640625, -1.27618408203125, -1.2161865234375, -1.15618896484375, -1.09619140625, -1.03619384765625, -0.9761962890625, -0.91619873046875, -0.856201171875, -0.79620361328125, -0.7362060546875, -0.67620849609375, -0.6162109375, -0.55621337890625, -0.4962158203125, -0.43621826171875, -0.376220703125, -0.31622314453125, -0.2562255859375, -0.19622802734375, -0.13623046875, -0.07623291015625, -0.0162353515625, 0.04376220703125, 0.103759765625, 0.16375732421875, 0.2237548828125, 0.28375244140625, 0.34375, 0.40374755859375, 0.4637451171875, 0.52374267578125, 0.583740234375, 0.64373779296875, 0.7037353515625, 0.76373291015625, 0.82373046875, 0.88372802734375, 0.9437255859375, 1.00372314453125, 1.063720703125, 1.12371826171875, 1.1837158203125, 1.24371337890625, 1.3037109375, 1.36370849609375, 1.4237060546875, 1.48370361328125, 1.543701171875, 1.60369873046875, 1.6636962890625, 1.72369384765625, 1.78369140625, 1.84368896484375, 1.9036865234375, 1.96368408203125, 2.023681640625, 2.08367919921875, 2.1436767578125, 2.20367431640625, 2.263671875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 1.0, 6.0, 6.0, 17.0, 17.0, 16.0, 39.0, 48.0, 65.0, 74.0, 81.0, 81.0, 82.0, 82.0, 79.0, 69.0, 74.0, 59.0, 31.0, 25.0, 14.0, 14.0, 9.0, 6.0, 7.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14208984375, -0.1367340087890625, -0.131378173828125, -0.1260223388671875, -0.12066650390625, -0.1153106689453125, -0.109954833984375, -0.1045989990234375, -0.0992431640625, -0.0938873291015625, -0.088531494140625, -0.0831756591796875, -0.07781982421875, -0.0724639892578125, -0.067108154296875, -0.0617523193359375, -0.056396484375, -0.0510406494140625, -0.045684814453125, -0.0403289794921875, -0.03497314453125, -0.0296173095703125, -0.024261474609375, -0.0189056396484375, -0.0135498046875, -0.0081939697265625, -0.002838134765625, 0.0025177001953125, 0.00787353515625, 0.0132293701171875, 0.018585205078125, 0.0239410400390625, 0.029296875, 0.0346527099609375, 0.040008544921875, 0.0453643798828125, 0.05072021484375, 0.0560760498046875, 0.061431884765625, 0.0667877197265625, 0.0721435546875, 0.0774993896484375, 0.082855224609375, 0.0882110595703125, 0.09356689453125, 0.0989227294921875, 0.104278564453125, 0.1096343994140625, 0.114990234375, 0.1203460693359375, 0.125701904296875, 0.1310577392578125, 0.13641357421875, 0.1417694091796875, 0.147125244140625, 0.1524810791015625, 0.1578369140625, 0.1631927490234375, 0.168548583984375, 0.1739044189453125, 0.17926025390625, 0.1846160888671875, 0.189971923828125, 0.1953277587890625, 0.20068359375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 4.0, 11.0, 5.0, 9.0, 12.0, 23.0, 38.0, 40.0, 84.0, 200.0, 454.0, 1421.0, 6607.0, 50296.0, 673023.0, 3137038.0, 294475.0, 25151.0, 3738.0, 963.0, 350.0, 146.0, 75.0, 30.0, 30.0, 17.0, 7.0, 4.0, 9.0, 3.0, 10.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.269287109375, -0.2612133026123047, -0.2531394958496094, -0.24506568908691406, -0.23699188232421875, -0.22891807556152344, -0.22084426879882812, -0.2127704620361328, -0.2046966552734375, -0.1966228485107422, -0.18854904174804688, -0.18047523498535156, -0.17240142822265625, -0.16432762145996094, -0.15625381469726562, -0.1481800079345703, -0.140106201171875, -0.1320323944091797, -0.12395858764648438, -0.11588478088378906, -0.10781097412109375, -0.09973716735839844, -0.09166336059570312, -0.08358955383300781, -0.0755157470703125, -0.06744194030761719, -0.059368133544921875, -0.05129432678222656, -0.04322052001953125, -0.03514671325683594, -0.027072906494140625, -0.018999099731445312, -0.01092529296875, -0.0028514862060546875, 0.005222320556640625, 0.013296127319335938, 0.02136993408203125, 0.029443740844726562, 0.037517547607421875, 0.04559135437011719, 0.0536651611328125, 0.06173896789550781, 0.06981277465820312, 0.07788658142089844, 0.08596038818359375, 0.09403419494628906, 0.10210800170898438, 0.11018180847167969, 0.118255615234375, 0.1263294219970703, 0.13440322875976562, 0.14247703552246094, 0.15055084228515625, 0.15862464904785156, 0.16669845581054688, 0.1747722625732422, 0.1828460693359375, 0.1909198760986328, 0.19899368286132812, 0.20706748962402344, 0.21514129638671875, 0.22321510314941406, 0.23128890991210938, 0.2393627166748047, 0.2474365234375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 19.0, 20.0, 20.0, 42.0, 55.0, 113.0, 165.0, 284.0, 424.0, 687.0, 774.0, 579.0, 289.0, 190.0, 107.0, 103.0, 69.0, 32.0, 30.0, 26.0, 10.0, 9.0, 7.0, 4.0, 6.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1463623046875, -0.1424102783203125, -0.138458251953125, -0.1345062255859375, -0.13055419921875, -0.1266021728515625, -0.122650146484375, -0.1186981201171875, -0.11474609375, -0.1107940673828125, -0.106842041015625, -0.1028900146484375, -0.09893798828125, -0.0949859619140625, -0.091033935546875, -0.0870819091796875, -0.0831298828125, -0.0791778564453125, -0.075225830078125, -0.0712738037109375, -0.06732177734375, -0.0633697509765625, -0.059417724609375, -0.0554656982421875, -0.051513671875, -0.0475616455078125, -0.043609619140625, -0.0396575927734375, -0.03570556640625, -0.0317535400390625, -0.027801513671875, -0.0238494873046875, -0.0198974609375, -0.0159454345703125, -0.011993408203125, -0.0080413818359375, -0.00408935546875, -0.0001373291015625, 0.003814697265625, 0.0077667236328125, 0.01171875, 0.0156707763671875, 0.019622802734375, 0.0235748291015625, 0.02752685546875, 0.0314788818359375, 0.035430908203125, 0.0393829345703125, 0.0433349609375, 0.0472869873046875, 0.051239013671875, 0.0551910400390625, 0.05914306640625, 0.0630950927734375, 0.067047119140625, 0.0709991455078125, 0.074951171875, 0.0789031982421875, 0.082855224609375, 0.0868072509765625, 0.09075927734375, 0.0947113037109375, 0.098663330078125, 0.1026153564453125, 0.1065673828125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 17.0, 110.0, 618.0, 257.0, 6.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3332501649856567, -1.236007809638977, -1.1387654542922974, -1.0415229797363281, -0.9442806839942932, -0.8470383286476135, -0.7497959136962891, -0.6525535583496094, -0.5553112030029297, -0.45806884765625, -0.3608264625072479, -0.26358407735824585, -0.16634172201156616, -0.06909936666488647, 0.02814304828643799, 0.12538540363311768, 0.22262775897979736, 0.31987011432647705, 0.4171124994754791, 0.5143548846244812, 0.6115972399711609, 0.7088395953178406, 0.806082010269165, 0.9033243656158447, 1.0005667209625244, 1.097809076309204, 1.1950514316558838, 1.2922937870025635, 1.3895361423492432, 1.4867784976959229, 1.584020972251892, 1.6812633275985718, 1.778505802154541, 1.8757481575012207, 1.9729905128479004, 2.07023286819458, 2.1674752235412598, 2.2647175788879395, 2.361959934234619, 2.459202289581299, 2.5564446449279785, 2.653687000274658, 2.750929355621338, 2.8481717109680176, 2.9454140663146973, 3.042656421661377, 3.1398987770080566, 3.2371411323547363, 3.334383726119995, 3.431626081466675, 3.5288684368133545, 3.626110792160034, 3.723353147506714, 3.8205955028533936, 3.9178380966186523, 4.015080451965332, 4.112322807312012, 4.209565162658691, 4.306807518005371, 4.404049873352051, 4.5012922286987305, 4.59853458404541, 4.69577693939209, 4.7930192947387695, 4.890261650085449]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 4.0, 3.0, 7.0, 6.0, 6.0, 7.0, 9.0, 18.0, 17.0, 30.0, 20.0, 26.0, 25.0, 28.0, 36.0, 34.0, 58.0, 64.0, 45.0, 58.0, 57.0, 41.0, 38.0, 52.0, 45.0, 38.0, 47.0, 24.0, 42.0, 20.0, 25.0, 16.0, 12.0, 7.0, 12.0, 3.0, 2.0, 9.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.4973805546760559, -0.48275768756866455, -0.4681348502635956, -0.4535120129585266, -0.43888914585113525, -0.4242662787437439, -0.4096434414386749, -0.39502060413360596, -0.3803977370262146, -0.36577486991882324, -0.3511520326137543, -0.3365291953086853, -0.32190632820129395, -0.3072834610939026, -0.2926606237888336, -0.27803778648376465, -0.2634149193763733, -0.24879206717014313, -0.23416921496391296, -0.2195463627576828, -0.20492351055145264, -0.19030065834522247, -0.1756778061389923, -0.16105495393276215, -0.14643210172653198, -0.13180924952030182, -0.11718639731407166, -0.10256354510784149, -0.08794069290161133, -0.07331784069538116, -0.058694988489151, -0.04407213628292084, -0.029449284076690674, -0.01482643187046051, -0.00020357966423034668, 0.014419272541999817, 0.02904212474822998, 0.043664976954460144, 0.05828782916069031, 0.07291068136692047, 0.08753353357315063, 0.1021563857793808, 0.11677923798561096, 0.13140209019184113, 0.1460249423980713, 0.16064779460430145, 0.17527064681053162, 0.18989349901676178, 0.20451635122299194, 0.2191392034292221, 0.23376205563545227, 0.24838490784168243, 0.2630077600479126, 0.27763062715530396, 0.2922534644603729, 0.3068763017654419, 0.32149916887283325, 0.3361220359802246, 0.3507448732852936, 0.36536771059036255, 0.3799905776977539, 0.39461344480514526, 0.40923628211021423, 0.4238591194152832, 0.43848198652267456]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 9.0, 15.0, 13.0, 18.0, 28.0, 43.0, 73.0, 117.0, 135.0, 221.0, 391.0, 644.0, 1265.0, 2634.0, 6224.0, 19204.0, 88528.0, 517163.0, 335509.0, 53846.0, 13336.0, 4533.0, 2068.0, 1057.0, 578.0, 308.0, 217.0, 132.0, 80.0, 45.0, 49.0, 26.0, 19.0, 12.0, 8.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2841796875, -0.27433013916015625, -0.2644805908203125, -0.25463104248046875, -0.244781494140625, -0.23493194580078125, -0.2250823974609375, -0.21523284912109375, -0.20538330078125, -0.19553375244140625, -0.1856842041015625, -0.17583465576171875, -0.165985107421875, -0.15613555908203125, -0.1462860107421875, -0.13643646240234375, -0.1265869140625, -0.11673736572265625, -0.1068878173828125, -0.09703826904296875, -0.087188720703125, -0.07733917236328125, -0.0674896240234375, -0.05764007568359375, -0.04779052734375, -0.03794097900390625, -0.0280914306640625, -0.01824188232421875, -0.008392333984375, 0.00145721435546875, 0.0113067626953125, 0.02115631103515625, 0.031005859375, 0.04085540771484375, 0.0507049560546875, 0.06055450439453125, 0.070404052734375, 0.08025360107421875, 0.0901031494140625, 0.09995269775390625, 0.10980224609375, 0.11965179443359375, 0.1295013427734375, 0.13935089111328125, 0.149200439453125, 0.15904998779296875, 0.1688995361328125, 0.17874908447265625, 0.1885986328125, 0.19844818115234375, 0.2082977294921875, 0.21814727783203125, 0.227996826171875, 0.23784637451171875, 0.2476959228515625, 0.25754547119140625, 0.26739501953125, 0.27724456787109375, 0.2870941162109375, 0.29694366455078125, 0.306793212890625, 0.31664276123046875, 0.3264923095703125, 0.33634185791015625, 0.34619140625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 4.0, 3.0, 4.0, 10.0, 13.0, 13.0, 27.0, 29.0, 43.0, 64.0, 80.0, 76.0, 83.0, 82.0, 84.0, 77.0, 78.0, 58.0, 55.0, 44.0, 27.0, 20.0, 14.0, 9.0, 7.0, 0.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1375732421875, -0.13240432739257812, -0.12723541259765625, -0.12206649780273438, -0.1168975830078125, -0.11172866821289062, -0.10655975341796875, -0.10139083862304688, -0.096221923828125, -0.09105300903320312, -0.08588409423828125, -0.08071517944335938, -0.0755462646484375, -0.07037734985351562, -0.06520843505859375, -0.060039520263671875, -0.05487060546875, -0.049701690673828125, -0.04453277587890625, -0.039363861083984375, -0.0341949462890625, -0.029026031494140625, -0.02385711669921875, -0.018688201904296875, -0.013519287109375, -0.008350372314453125, -0.00318145751953125, 0.001987457275390625, 0.0071563720703125, 0.012325286865234375, 0.01749420166015625, 0.022663116455078125, 0.02783203125, 0.033000946044921875, 0.03816986083984375, 0.043338775634765625, 0.0485076904296875, 0.053676605224609375, 0.05884552001953125, 0.06401443481445312, 0.069183349609375, 0.07435226440429688, 0.07952117919921875, 0.08469009399414062, 0.0898590087890625, 0.09502792358398438, 0.10019683837890625, 0.10536575317382812, 0.11053466796875, 0.11570358276367188, 0.12087249755859375, 0.12604141235351562, 0.1312103271484375, 0.13637924194335938, 0.14154815673828125, 0.14671707153320312, 0.151885986328125, 0.15705490112304688, 0.16222381591796875, 0.16739273071289062, 0.1725616455078125, 0.17773056030273438, 0.18289947509765625, 0.18806838989257812, 0.1932373046875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 3.0, 6.0, 5.0, 13.0, 13.0, 13.0, 17.0, 15.0, 18.0, 15.0, 32.0, 28.0, 37.0, 50.0, 55.0, 91.0, 146.0, 363.0, 1982.0, 53891.0, 911087.0, 77152.0, 2594.0, 404.0, 143.0, 98.0, 60.0, 47.0, 32.0, 28.0, 18.0, 12.0, 18.0, 7.0, 12.0, 9.0, 10.0, 6.0, 8.0, 6.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.61474609375, -0.5964202880859375, -0.578094482421875, -0.5597686767578125, -0.54144287109375, -0.5231170654296875, -0.504791259765625, -0.4864654541015625, -0.4681396484375, -0.4498138427734375, -0.431488037109375, -0.4131622314453125, -0.39483642578125, -0.3765106201171875, -0.358184814453125, -0.3398590087890625, -0.321533203125, -0.3032073974609375, -0.284881591796875, -0.2665557861328125, -0.24822998046875, -0.2299041748046875, -0.211578369140625, -0.1932525634765625, -0.1749267578125, -0.1566009521484375, -0.138275146484375, -0.1199493408203125, -0.10162353515625, -0.0832977294921875, -0.064971923828125, -0.0466461181640625, -0.0283203125, -0.0099945068359375, 0.008331298828125, 0.0266571044921875, 0.04498291015625, 0.0633087158203125, 0.081634521484375, 0.0999603271484375, 0.1182861328125, 0.1366119384765625, 0.154937744140625, 0.1732635498046875, 0.19158935546875, 0.2099151611328125, 0.228240966796875, 0.2465667724609375, 0.264892578125, 0.2832183837890625, 0.301544189453125, 0.3198699951171875, 0.33819580078125, 0.3565216064453125, 0.374847412109375, 0.3931732177734375, 0.4114990234375, 0.4298248291015625, 0.448150634765625, 0.4664764404296875, 0.48480224609375, 0.5031280517578125, 0.521453857421875, 0.5397796630859375, 0.55810546875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 1.0, 7.0, 11.0, 11.0, 10.0, 10.0, 15.0, 6.0, 9.0, 21.0, 19.0, 26.0, 28.0, 37.0, 28.0, 49.0, 39.0, 44.0, 40.0, 44.0, 39.0, 33.0, 32.0, 43.0, 44.0, 38.0, 42.0, 43.0, 34.0, 26.0, 21.0, 26.0, 13.0, 12.0, 18.0, 12.0, 11.0, 10.0, 13.0, 17.0, 8.0, 3.0, 2.0, 1.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1724853515625, -0.1670989990234375, -0.161712646484375, -0.1563262939453125, -0.15093994140625, -0.1455535888671875, -0.140167236328125, -0.1347808837890625, -0.12939453125, -0.1240081787109375, -0.118621826171875, -0.1132354736328125, -0.10784912109375, -0.1024627685546875, -0.097076416015625, -0.0916900634765625, -0.0863037109375, -0.0809173583984375, -0.075531005859375, -0.0701446533203125, -0.06475830078125, -0.0593719482421875, -0.053985595703125, -0.0485992431640625, -0.043212890625, -0.0378265380859375, -0.032440185546875, -0.0270538330078125, -0.02166748046875, -0.0162811279296875, -0.010894775390625, -0.0055084228515625, -0.0001220703125, 0.0052642822265625, 0.010650634765625, 0.0160369873046875, 0.02142333984375, 0.0268096923828125, 0.032196044921875, 0.0375823974609375, 0.04296875, 0.0483551025390625, 0.053741455078125, 0.0591278076171875, 0.06451416015625, 0.0699005126953125, 0.075286865234375, 0.0806732177734375, 0.0860595703125, 0.0914459228515625, 0.096832275390625, 0.1022186279296875, 0.10760498046875, 0.1129913330078125, 0.118377685546875, 0.1237640380859375, 0.129150390625, 0.1345367431640625, 0.139923095703125, 0.1453094482421875, 0.15069580078125, 0.1560821533203125, 0.161468505859375, 0.1668548583984375, 0.1722412109375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 2.0, 5.0, 6.0, 8.0, 23.0, 16.0, 31.0, 44.0, 80.0, 106.0, 199.0, 295.0, 503.0, 948.0, 2040.0, 4279.0, 11259.0, 34922.0, 145914.0, 524055.0, 242840.0, 54022.0, 15800.0, 5816.0, 2594.0, 1220.0, 609.0, 360.0, 207.0, 129.0, 79.0, 51.0, 36.0, 24.0, 13.0, 12.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09271240234375, -0.09011268615722656, -0.08751296997070312, -0.08491325378417969, -0.08231353759765625, -0.07971382141113281, -0.07711410522460938, -0.07451438903808594, -0.0719146728515625, -0.06931495666503906, -0.06671524047851562, -0.06411552429199219, -0.06151580810546875, -0.05891609191894531, -0.056316375732421875, -0.05371665954589844, -0.051116943359375, -0.04851722717285156, -0.045917510986328125, -0.04331779479980469, -0.04071807861328125, -0.03811836242675781, -0.035518646240234375, -0.03291893005371094, -0.0303192138671875, -0.027719497680664062, -0.025119781494140625, -0.022520065307617188, -0.01992034912109375, -0.017320632934570312, -0.014720916748046875, -0.012121200561523438, -0.009521484375, -0.0069217681884765625, -0.004322052001953125, -0.0017223358154296875, 0.00087738037109375, 0.0034770965576171875, 0.006076812744140625, 0.008676528930664062, 0.0112762451171875, 0.013875961303710938, 0.016475677490234375, 0.019075393676757812, 0.02167510986328125, 0.024274826049804688, 0.026874542236328125, 0.029474258422851562, 0.032073974609375, 0.03467369079589844, 0.037273406982421875, 0.03987312316894531, 0.04247283935546875, 0.04507255554199219, 0.047672271728515625, 0.05027198791503906, 0.0528717041015625, 0.05547142028808594, 0.058071136474609375, 0.06067085266113281, 0.06327056884765625, 0.06587028503417969, 0.06847000122070312, 0.07106971740722656, 0.07366943359375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 2.0, 5.0, 10.0, 9.0, 14.0, 16.0, 23.0, 39.0, 37.0, 55.0, 82.0, 71.0, 75.0, 96.0, 103.0, 88.0, 72.0, 45.0, 40.0, 17.0, 25.0, 18.0, 11.0, 15.0, 10.0, 5.0, 5.0, 1.0, 3.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7583370208740234e-05, -1.696404069662094e-05, -1.6344711184501648e-05, -1.5725381672382355e-05, -1.5106052160263062e-05, -1.4486722648143768e-05, -1.3867393136024475e-05, -1.3248063623905182e-05, -1.2628734111785889e-05, -1.2009404599666595e-05, -1.1390075087547302e-05, -1.0770745575428009e-05, -1.0151416063308716e-05, -9.532086551189423e-06, -8.91275703907013e-06, -8.293427526950836e-06, -7.674098014831543e-06, -7.05476850271225e-06, -6.4354389905929565e-06, -5.816109478473663e-06, -5.19677996635437e-06, -4.577450454235077e-06, -3.958120942115784e-06, -3.3387914299964905e-06, -2.7194619178771973e-06, -2.100132405757904e-06, -1.4808028936386108e-06, -8.614733815193176e-07, -2.421438694000244e-07, 3.771856427192688e-07, 9.96515154838562e-07, 1.6158446669578552e-06, 2.2351741790771484e-06, 2.8545036911964417e-06, 3.473833203315735e-06, 4.093162715435028e-06, 4.712492227554321e-06, 5.3318217396736145e-06, 5.951151251792908e-06, 6.570480763912201e-06, 7.189810276031494e-06, 7.809139788150787e-06, 8.42846930027008e-06, 9.047798812389374e-06, 9.667128324508667e-06, 1.028645783662796e-05, 1.0905787348747253e-05, 1.1525116860866547e-05, 1.214444637298584e-05, 1.2763775885105133e-05, 1.3383105397224426e-05, 1.400243490934372e-05, 1.4621764421463013e-05, 1.5241093933582306e-05, 1.58604234457016e-05, 1.6479752957820892e-05, 1.7099082469940186e-05, 1.771841198205948e-05, 1.8337741494178772e-05, 1.8957071006298065e-05, 1.957640051841736e-05, 2.019573003053665e-05, 2.0815059542655945e-05, 2.1434389054775238e-05, 2.205371856689453e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 6.0, 6.0, 9.0, 13.0, 12.0, 22.0, 29.0, 37.0, 54.0, 108.0, 236.0, 1097.0, 13549.0, 445527.0, 568428.0, 17508.0, 1340.0, 280.0, 93.0, 72.0, 26.0, 35.0, 20.0, 7.0, 13.0, 7.0, 6.0, 8.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1708984375, -0.16615676879882812, -0.16141510009765625, -0.15667343139648438, -0.1519317626953125, -0.14719009399414062, -0.14244842529296875, -0.13770675659179688, -0.132965087890625, -0.12822341918945312, -0.12348175048828125, -0.11874008178710938, -0.1139984130859375, -0.10925674438476562, -0.10451507568359375, -0.09977340698242188, -0.09503173828125, -0.09029006958007812, -0.08554840087890625, -0.08080673217773438, -0.0760650634765625, -0.07132339477539062, -0.06658172607421875, -0.061840057373046875, -0.057098388671875, -0.052356719970703125, -0.04761505126953125, -0.042873382568359375, -0.0381317138671875, -0.033390045166015625, -0.02864837646484375, -0.023906707763671875, -0.0191650390625, -0.014423370361328125, -0.00968170166015625, -0.004940032958984375, -0.0001983642578125, 0.004543304443359375, 0.00928497314453125, 0.014026641845703125, 0.018768310546875, 0.023509979248046875, 0.02825164794921875, 0.032993316650390625, 0.0377349853515625, 0.042476654052734375, 0.04721832275390625, 0.051959991455078125, 0.05670166015625, 0.061443328857421875, 0.06618499755859375, 0.07092666625976562, 0.0756683349609375, 0.08041000366210938, 0.08515167236328125, 0.08989334106445312, 0.094635009765625, 0.09937667846679688, 0.10411834716796875, 0.10886001586914062, 0.1136016845703125, 0.11834335327148438, 0.12308502197265625, 0.12782669067382812, 0.132568359375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 7.0, 2.0, 9.0, 15.0, 9.0, 22.0, 27.0, 31.0, 34.0, 56.0, 61.0, 51.0, 82.0, 83.0, 84.0, 68.0, 64.0, 65.0, 55.0, 40.0, 36.0, 25.0, 17.0, 16.0, 12.0, 14.0, 3.0, 10.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.046478271484375, -0.045200347900390625, -0.04392242431640625, -0.042644500732421875, -0.0413665771484375, -0.040088653564453125, -0.03881072998046875, -0.037532806396484375, -0.0362548828125, -0.034976959228515625, -0.03369903564453125, -0.032421112060546875, -0.0311431884765625, -0.029865264892578125, -0.02858734130859375, -0.027309417724609375, -0.026031494140625, -0.024753570556640625, -0.02347564697265625, -0.022197723388671875, -0.0209197998046875, -0.019641876220703125, -0.01836395263671875, -0.017086029052734375, -0.01580810546875, -0.014530181884765625, -0.01325225830078125, -0.011974334716796875, -0.0106964111328125, -0.009418487548828125, -0.00814056396484375, -0.006862640380859375, -0.005584716796875, -0.004306793212890625, -0.00302886962890625, -0.001750946044921875, -0.0004730224609375, 0.000804901123046875, 0.00208282470703125, 0.003360748291015625, 0.004638671875, 0.005916595458984375, 0.00719451904296875, 0.008472442626953125, 0.0097503662109375, 0.011028289794921875, 0.01230621337890625, 0.013584136962890625, 0.014862060546875, 0.016139984130859375, 0.01741790771484375, 0.018695831298828125, 0.0199737548828125, 0.021251678466796875, 0.02252960205078125, 0.023807525634765625, 0.02508544921875, 0.026363372802734375, 0.02764129638671875, 0.028919219970703125, 0.0301971435546875, 0.031475067138671875, 0.03275299072265625, 0.034030914306640625, 0.035308837890625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 7.0, 13.0, 44.0, 249.0, 436.0, 201.0, 47.0, 11.0, 3.0, 2.0, 1.0], "bins": [-3.1108107566833496, -3.0567708015441895, -3.0027308464050293, -2.948690891265869, -2.894651174545288, -2.840611219406128, -2.7865712642669678, -2.7325313091278076, -2.6784913539886475, -2.6244513988494873, -2.570411443710327, -2.516371488571167, -2.462331771850586, -2.408291816711426, -2.3542518615722656, -2.3002119064331055, -2.2461719512939453, -2.192131996154785, -2.138092041015625, -2.084052085876465, -2.030012369155884, -1.9759724140167236, -1.9219324588775635, -1.8678925037384033, -1.8138526678085327, -1.7598127126693726, -1.705772876739502, -1.6517329216003418, -1.5976929664611816, -1.5436530113220215, -1.4896131753921509, -1.4355732202529907, -1.3815332651138306, -1.3274933099746704, -1.2734534740447998, -1.2194135189056396, -1.1653735637664795, -1.1113336086273193, -1.0572937726974487, -1.0032538175582886, -0.9492138624191284, -0.895173966884613, -0.8411340117454529, -0.7870941162109375, -0.7330541610717773, -0.679014265537262, -0.6249743700027466, -0.5709344148635864, -0.516894519329071, -0.4628545939922333, -0.4088146686553955, -0.3547747731208801, -0.30073481798171997, -0.2466949224472046, -0.19265499711036682, -0.13861507177352905, -0.08457514643669128, -0.030535224825143814, 0.023504696786403656, 0.07754461467266083, 0.1315845400094986, 0.18562445044517517, 0.23966437578201294, 0.2937043011188507, 0.3477442264556885]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 5.0, 6.0, 9.0, 6.0, 11.0, 19.0, 16.0, 16.0, 18.0, 15.0, 18.0, 25.0, 31.0, 31.0, 34.0, 42.0, 34.0, 48.0, 42.0, 45.0, 49.0, 37.0, 42.0, 38.0, 52.0, 38.0, 34.0, 26.0, 39.0, 27.0, 30.0, 18.0, 22.0, 13.0, 10.0, 18.0, 3.0, 16.0, 9.0, 5.0, 2.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.7301966547966003, -0.7078040838241577, -0.6854114532470703, -0.6630188822746277, -0.6406263113021851, -0.6182337403297424, -0.5958411693572998, -0.5734485387802124, -0.5510559678077698, -0.5286633968353271, -0.5062707662582397, -0.4838781952857971, -0.4614856243133545, -0.43909305334091187, -0.41670045256614685, -0.39430785179138184, -0.3719152808189392, -0.3495227098464966, -0.32713010907173157, -0.30473750829696655, -0.2823449373245239, -0.2599523663520813, -0.23755976557731628, -0.21516717970371246, -0.19277459383010864, -0.17038200795650482, -0.147989422082901, -0.12559683620929718, -0.10320425033569336, -0.08081166446208954, -0.05841907858848572, -0.0360264927148819, -0.0136338472366333, 0.00875873863697052, 0.03115132451057434, 0.05354391038417816, 0.07593649625778198, 0.0983290821313858, 0.12072166800498962, 0.14311425387859344, 0.16550683975219727, 0.1878994256258011, 0.2102920114994049, 0.23268459737300873, 0.25507718324661255, 0.2774697542190552, 0.2998623549938202, 0.3222549557685852, 0.34464752674102783, 0.36704009771347046, 0.3894326984882355, 0.4118252992630005, 0.4342178702354431, 0.45661044120788574, 0.47900304198265076, 0.5013956427574158, 0.5237882137298584, 0.546180784702301, 0.5685733556747437, 0.590965986251831, 0.6133585572242737, 0.6357511281967163, 0.6581437587738037, 0.6805363297462463, 0.702928900718689]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 7.0, 10.0, 8.0, 21.0, 30.0, 26.0, 69.0, 100.0, 160.0, 276.0, 575.0, 1368.0, 5298.0, 129792.0, 3969895.0, 79789.0, 4500.0, 1175.0, 516.0, 285.0, 140.0, 88.0, 54.0, 36.0, 24.0, 13.0, 12.0, 6.0, 3.0, 7.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41650390625, -0.4007568359375, -0.385009765625, -0.3692626953125, -0.353515625, -0.3377685546875, -0.322021484375, -0.3062744140625, -0.29052734375, -0.2747802734375, -0.259033203125, -0.2432861328125, -0.2275390625, -0.2117919921875, -0.196044921875, -0.1802978515625, -0.16455078125, -0.1488037109375, -0.133056640625, -0.1173095703125, -0.1015625, -0.0858154296875, -0.070068359375, -0.0543212890625, -0.03857421875, -0.0228271484375, -0.007080078125, 0.0086669921875, 0.0244140625, 0.0401611328125, 0.055908203125, 0.0716552734375, 0.08740234375, 0.1031494140625, 0.118896484375, 0.1346435546875, 0.150390625, 0.1661376953125, 0.181884765625, 0.1976318359375, 0.21337890625, 0.2291259765625, 0.244873046875, 0.2606201171875, 0.2763671875, 0.2921142578125, 0.307861328125, 0.3236083984375, 0.33935546875, 0.3551025390625, 0.370849609375, 0.3865966796875, 0.40234375, 0.4180908203125, 0.433837890625, 0.4495849609375, 0.46533203125, 0.4810791015625, 0.496826171875, 0.5125732421875, 0.5283203125, 0.5440673828125, 0.559814453125, 0.5755615234375, 0.59130859375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 6.0, 6.0, 10.0, 14.0, 21.0, 34.0, 48.0, 62.0, 81.0, 89.0, 81.0, 92.0, 81.0, 94.0, 68.0, 70.0, 52.0, 29.0, 28.0, 14.0, 12.0, 7.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1392822265625, -0.13382530212402344, -0.12836837768554688, -0.12291145324707031, -0.11745452880859375, -0.11199760437011719, -0.10654067993164062, -0.10108375549316406, -0.0956268310546875, -0.09016990661621094, -0.08471298217773438, -0.07925605773925781, -0.07379913330078125, -0.06834220886230469, -0.06288528442382812, -0.05742835998535156, -0.051971435546875, -0.04651451110839844, -0.041057586669921875, -0.03560066223144531, -0.03014373779296875, -0.024686813354492188, -0.019229888916015625, -0.013772964477539062, -0.0083160400390625, -0.0028591156005859375, 0.002597808837890625, 0.008054733276367188, 0.01351165771484375, 0.018968582153320312, 0.024425506591796875, 0.029882431030273438, 0.03533935546875, 0.04079627990722656, 0.046253204345703125, 0.05171012878417969, 0.05716705322265625, 0.06262397766113281, 0.06808090209960938, 0.07353782653808594, 0.0789947509765625, 0.08445167541503906, 0.08990859985351562, 0.09536552429199219, 0.10082244873046875, 0.10627937316894531, 0.11173629760742188, 0.11719322204589844, 0.122650146484375, 0.12810707092285156, 0.13356399536132812, 0.1390209197998047, 0.14447784423828125, 0.1499347686767578, 0.15539169311523438, 0.16084861755371094, 0.1663055419921875, 0.17176246643066406, 0.17721939086914062, 0.1826763153076172, 0.18813323974609375, 0.1935901641845703, 0.19904708862304688, 0.20450401306152344, 0.2099609375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 3.0, 5.0, 7.0, 12.0, 10.0, 26.0, 16.0, 36.0, 48.0, 83.0, 132.0, 199.0, 503.0, 1293.0, 4748.0, 27671.0, 252298.0, 2262638.0, 1471709.0, 149697.0, 17863.0, 3419.0, 988.0, 370.0, 179.0, 101.0, 66.0, 49.0, 28.0, 19.0, 19.0, 17.0, 8.0, 7.0, 1.0, 4.0, 4.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.291259765625, -0.2829113006591797, -0.2745628356933594, -0.26621437072753906, -0.25786590576171875, -0.24951744079589844, -0.24116897583007812, -0.2328205108642578, -0.2244720458984375, -0.2161235809326172, -0.20777511596679688, -0.19942665100097656, -0.19107818603515625, -0.18272972106933594, -0.17438125610351562, -0.1660327911376953, -0.157684326171875, -0.1493358612060547, -0.14098739624023438, -0.13263893127441406, -0.12429046630859375, -0.11594200134277344, -0.10759353637695312, -0.09924507141113281, -0.0908966064453125, -0.08254814147949219, -0.07419967651367188, -0.06585121154785156, -0.05750274658203125, -0.04915428161621094, -0.040805816650390625, -0.03245735168457031, -0.02410888671875, -0.015760421752929688, -0.007411956787109375, 0.0009365081787109375, 0.00928497314453125, 0.017633438110351562, 0.025981903076171875, 0.03433036804199219, 0.0426788330078125, 0.05102729797363281, 0.059375762939453125, 0.06772422790527344, 0.07607269287109375, 0.08442115783691406, 0.09276962280273438, 0.10111808776855469, 0.109466552734375, 0.11781501770019531, 0.12616348266601562, 0.13451194763183594, 0.14286041259765625, 0.15120887756347656, 0.15955734252929688, 0.1679058074951172, 0.1762542724609375, 0.1846027374267578, 0.19295120239257812, 0.20129966735839844, 0.20964813232421875, 0.21799659729003906, 0.22634506225585938, 0.2346935272216797, 0.2430419921875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 4.0, 8.0, 7.0, 9.0, 20.0, 19.0, 26.0, 47.0, 82.0, 106.0, 170.0, 221.0, 352.0, 490.0, 597.0, 516.0, 367.0, 281.0, 224.0, 170.0, 108.0, 85.0, 48.0, 31.0, 34.0, 14.0, 6.0, 11.0, 5.0, 6.0, 6.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1529541015625, -0.1485271453857422, -0.14410018920898438, -0.13967323303222656, -0.13524627685546875, -0.13081932067871094, -0.12639236450195312, -0.12196540832519531, -0.1175384521484375, -0.11311149597167969, -0.10868453979492188, -0.10425758361816406, -0.09983062744140625, -0.09540367126464844, -0.09097671508789062, -0.08654975891113281, -0.082122802734375, -0.07769584655761719, -0.07326889038085938, -0.06884193420410156, -0.06441497802734375, -0.05998802185058594, -0.055561065673828125, -0.05113410949707031, -0.0467071533203125, -0.04228019714355469, -0.037853240966796875, -0.03342628479003906, -0.02899932861328125, -0.024572372436523438, -0.020145416259765625, -0.015718460083007812, -0.01129150390625, -0.0068645477294921875, -0.002437591552734375, 0.0019893646240234375, 0.00641632080078125, 0.010843276977539062, 0.015270233154296875, 0.019697189331054688, 0.0241241455078125, 0.028551101684570312, 0.032978057861328125, 0.03740501403808594, 0.04183197021484375, 0.04625892639160156, 0.050685882568359375, 0.05511283874511719, 0.059539794921875, 0.06396675109863281, 0.06839370727539062, 0.07282066345214844, 0.07724761962890625, 0.08167457580566406, 0.08610153198242188, 0.09052848815917969, 0.0949554443359375, 0.09938240051269531, 0.10380935668945312, 0.10823631286621094, 0.11266326904296875, 0.11709022521972656, 0.12151718139648438, 0.1259441375732422, 0.13037109375]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 7.0, 22.0, 38.0, 111.0, 218.0, 295.0, 204.0, 84.0, 23.0, 9.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9779017567634583, -0.9374116063117981, -0.8969214558601379, -0.8564313054084778, -0.8159412145614624, -0.7754510641098022, -0.7349609136581421, -0.6944707632064819, -0.6539806127548218, -0.6134904623031616, -0.5730003118515015, -0.5325101613998413, -0.49202004075050354, -0.4515298902988434, -0.4110397696495056, -0.37054961919784546, -0.3300594687461853, -0.28956931829452515, -0.24907918274402618, -0.20858904719352722, -0.16809889674186707, -0.1276087462902069, -0.08711861073970795, -0.046628475189208984, -0.006138324737548828, 0.03435181826353073, 0.07484196126461029, 0.11533210426568985, 0.1558222472667694, 0.19631239771842957, 0.23680253326892853, 0.2772926688194275, 0.3177828788757324, 0.3582730293273926, 0.39876317977905273, 0.4392533004283905, 0.47974345088005066, 0.5202336311340332, 0.5607237219810486, 0.6012138724327087, 0.6417040228843689, 0.682194173336029, 0.7226843237876892, 0.7631744742393494, 0.8036645650863647, 0.8441547155380249, 0.8846448659896851, 0.9251350164413452, 0.9656251668930054, 1.0061153173446655, 1.0466054677963257, 1.0870956182479858, 1.127585768699646, 1.1680759191513062, 1.2085660696029663, 1.249056100845337, 1.289546251296997, 1.3300364017486572, 1.3705265522003174, 1.4110167026519775, 1.4515068531036377, 1.4919970035552979, 1.532487154006958, 1.5729773044586182, 1.6134674549102783]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 11.0, 15.0, 17.0, 14.0, 22.0, 26.0, 25.0, 29.0, 34.0, 44.0, 29.0, 47.0, 46.0, 60.0, 44.0, 42.0, 54.0, 55.0, 59.0, 39.0, 48.0, 40.0, 49.0, 33.0, 32.0, 11.0, 18.0, 14.0, 15.0, 7.0, 7.0, 3.0, 1.0, 12.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.7536828517913818, -0.7352420687675476, -0.7168012857437134, -0.6983605027198792, -0.6799197196960449, -0.6614788770675659, -0.6430381536483765, -0.6245973110198975, -0.6061565279960632, -0.587715744972229, -0.5692749619483948, -0.5508341789245605, -0.5323933959007263, -0.5139526128768921, -0.4955118000507355, -0.47707098722457886, -0.458630234003067, -0.4401894509792328, -0.42174866795539856, -0.40330785512924194, -0.3848670721054077, -0.3664262890815735, -0.34798550605773926, -0.32954472303390503, -0.3111039400100708, -0.2926631569862366, -0.27422237396240234, -0.2557815909385681, -0.2373407781124115, -0.21889999508857727, -0.20045921206474304, -0.18201841413974762, -0.1635776162147522, -0.14513683319091797, -0.12669603526592255, -0.10825525224208832, -0.08981446176767349, -0.07137367129325867, -0.05293288826942444, -0.034492090344429016, -0.016051307320594788, 0.0023894812911748886, 0.020830269902944565, 0.03927105665206909, 0.05771184712648392, 0.07615263760089874, 0.09459342062473297, 0.1130342185497284, 0.13147500157356262, 0.14991578459739685, 0.16835658252239227, 0.1867973655462265, 0.20523816347122192, 0.22367894649505615, 0.24211972951889038, 0.2605605125427246, 0.27900129556655884, 0.29744207859039307, 0.3158828616142273, 0.3343236446380615, 0.35276445746421814, 0.37120524048805237, 0.3896460235118866, 0.4080868363380432, 0.42652761936187744]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 9.0, 7.0, 17.0, 11.0, 18.0, 28.0, 52.0, 73.0, 136.0, 226.0, 403.0, 788.0, 1574.0, 3159.0, 6637.0, 15134.0, 41099.0, 144244.0, 422118.0, 289577.0, 78441.0, 25123.0, 10203.0, 4636.0, 2260.0, 1175.0, 625.0, 316.0, 171.0, 103.0, 66.0, 43.0, 26.0, 14.0, 16.0, 12.0, 5.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2412109375, -0.2331085205078125, -0.225006103515625, -0.2169036865234375, -0.20880126953125, -0.2006988525390625, -0.192596435546875, -0.1844940185546875, -0.1763916015625, -0.1682891845703125, -0.160186767578125, -0.1520843505859375, -0.14398193359375, -0.1358795166015625, -0.127777099609375, -0.1196746826171875, -0.111572265625, -0.1034698486328125, -0.095367431640625, -0.0872650146484375, -0.07916259765625, -0.0710601806640625, -0.062957763671875, -0.0548553466796875, -0.0467529296875, -0.0386505126953125, -0.030548095703125, -0.0224456787109375, -0.01434326171875, -0.0062408447265625, 0.001861572265625, 0.0099639892578125, 0.01806640625, 0.0261688232421875, 0.034271240234375, 0.0423736572265625, 0.05047607421875, 0.0585784912109375, 0.066680908203125, 0.0747833251953125, 0.0828857421875, 0.0909881591796875, 0.099090576171875, 0.1071929931640625, 0.11529541015625, 0.1233978271484375, 0.131500244140625, 0.1396026611328125, 0.147705078125, 0.1558074951171875, 0.163909912109375, 0.1720123291015625, 0.18011474609375, 0.1882171630859375, 0.196319580078125, 0.2044219970703125, 0.2125244140625, 0.2206268310546875, 0.228729248046875, 0.2368316650390625, 0.24493408203125, 0.2530364990234375, 0.261138916015625, 0.2692413330078125, 0.27734375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 3.0, 6.0, 11.0, 19.0, 26.0, 35.0, 44.0, 82.0, 70.0, 107.0, 93.0, 81.0, 95.0, 71.0, 78.0, 56.0, 50.0, 30.0, 21.0, 13.0, 11.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1510009765625, -0.14564132690429688, -0.14028167724609375, -0.13492202758789062, -0.1295623779296875, -0.12420272827148438, -0.11884307861328125, -0.11348342895507812, -0.108123779296875, -0.10276412963867188, -0.09740447998046875, -0.09204483032226562, -0.0866851806640625, -0.08132553100585938, -0.07596588134765625, -0.07060623168945312, -0.06524658203125, -0.059886932373046875, -0.05452728271484375, -0.049167633056640625, -0.0438079833984375, -0.038448333740234375, -0.03308868408203125, -0.027729034423828125, -0.022369384765625, -0.017009735107421875, -0.01165008544921875, -0.006290435791015625, -0.0009307861328125, 0.004428863525390625, 0.00978851318359375, 0.015148162841796875, 0.0205078125, 0.025867462158203125, 0.03122711181640625, 0.036586761474609375, 0.0419464111328125, 0.047306060791015625, 0.05266571044921875, 0.058025360107421875, 0.063385009765625, 0.06874465942382812, 0.07410430908203125, 0.07946395874023438, 0.0848236083984375, 0.09018325805664062, 0.09554290771484375, 0.10090255737304688, 0.10626220703125, 0.11162185668945312, 0.11698150634765625, 0.12234115600585938, 0.1277008056640625, 0.13306045532226562, 0.13842010498046875, 0.14377975463867188, 0.149139404296875, 0.15449905395507812, 0.15985870361328125, 0.16521835327148438, 0.1705780029296875, 0.17593765258789062, 0.18129730224609375, 0.18665695190429688, 0.1920166015625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 4.0, 7.0, 13.0, 8.0, 22.0, 19.0, 24.0, 38.0, 71.0, 78.0, 206.0, 404.0, 1327.0, 4686.0, 18045.0, 117232.0, 642693.0, 225366.0, 28536.0, 6892.0, 1791.0, 541.0, 209.0, 105.0, 75.0, 50.0, 31.0, 23.0, 19.0, 11.0, 8.0, 8.0, 3.0, 3.0, 2.0, 2.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.484619140625, -0.4713935852050781, -0.45816802978515625, -0.4449424743652344, -0.4317169189453125, -0.4184913635253906, -0.40526580810546875, -0.3920402526855469, -0.378814697265625, -0.3655891418457031, -0.35236358642578125, -0.3391380310058594, -0.3259124755859375, -0.3126869201660156, -0.29946136474609375, -0.2862358093261719, -0.27301025390625, -0.2597846984863281, -0.24655914306640625, -0.23333358764648438, -0.2201080322265625, -0.20688247680664062, -0.19365692138671875, -0.18043136596679688, -0.167205810546875, -0.15398025512695312, -0.14075469970703125, -0.12752914428710938, -0.1143035888671875, -0.10107803344726562, -0.08785247802734375, -0.07462692260742188, -0.0614013671875, -0.048175811767578125, -0.03495025634765625, -0.021724700927734375, -0.0084991455078125, 0.004726409912109375, 0.01795196533203125, 0.031177520751953125, 0.044403076171875, 0.057628631591796875, 0.07085418701171875, 0.08407974243164062, 0.0973052978515625, 0.11053085327148438, 0.12375640869140625, 0.13698196411132812, 0.15020751953125, 0.16343307495117188, 0.17665863037109375, 0.18988418579101562, 0.2031097412109375, 0.21633529663085938, 0.22956085205078125, 0.24278640747070312, 0.256011962890625, 0.2692375183105469, 0.28246307373046875, 0.2956886291503906, 0.3089141845703125, 0.3221397399902344, 0.33536529541015625, 0.3485908508300781, 0.36181640625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 9.0, 8.0, 11.0, 14.0, 10.0, 22.0, 26.0, 28.0, 35.0, 39.0, 33.0, 38.0, 48.0, 50.0, 55.0, 44.0, 53.0, 51.0, 54.0, 51.0, 42.0, 39.0, 49.0, 30.0, 35.0, 21.0, 20.0, 20.0, 16.0, 16.0, 9.0, 6.0, 9.0, 8.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.191162109375, -0.18412017822265625, -0.1770782470703125, -0.17003631591796875, -0.162994384765625, -0.15595245361328125, -0.1489105224609375, -0.14186859130859375, -0.13482666015625, -0.12778472900390625, -0.1207427978515625, -0.11370086669921875, -0.106658935546875, -0.09961700439453125, -0.0925750732421875, -0.08553314208984375, -0.0784912109375, -0.07144927978515625, -0.0644073486328125, -0.05736541748046875, -0.050323486328125, -0.04328155517578125, -0.0362396240234375, -0.02919769287109375, -0.02215576171875, -0.01511383056640625, -0.0080718994140625, -0.00102996826171875, 0.006011962890625, 0.01305389404296875, 0.0200958251953125, 0.02713775634765625, 0.0341796875, 0.04122161865234375, 0.0482635498046875, 0.05530548095703125, 0.062347412109375, 0.06938934326171875, 0.0764312744140625, 0.08347320556640625, 0.09051513671875, 0.09755706787109375, 0.1045989990234375, 0.11164093017578125, 0.118682861328125, 0.12572479248046875, 0.1327667236328125, 0.13980865478515625, 0.1468505859375, 0.15389251708984375, 0.1609344482421875, 0.16797637939453125, 0.175018310546875, 0.18206024169921875, 0.1891021728515625, 0.19614410400390625, 0.20318603515625, 0.21022796630859375, 0.2172698974609375, 0.22431182861328125, 0.231353759765625, 0.23839569091796875, 0.2454376220703125, 0.25247955322265625, 0.259521484375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 14.0, 19.0, 18.0, 36.0, 73.0, 135.0, 250.0, 454.0, 897.0, 2112.0, 5851.0, 21858.0, 188982.0, 703087.0, 101347.0, 15628.0, 4484.0, 1725.0, 738.0, 395.0, 180.0, 107.0, 62.0, 44.0, 21.0, 10.0, 8.0, 8.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.177001953125, -0.16872406005859375, -0.1604461669921875, -0.15216827392578125, -0.143890380859375, -0.13561248779296875, -0.1273345947265625, -0.11905670166015625, -0.11077880859375, -0.10250091552734375, -0.0942230224609375, -0.08594512939453125, -0.077667236328125, -0.06938934326171875, -0.0611114501953125, -0.05283355712890625, -0.0445556640625, -0.03627777099609375, -0.0279998779296875, -0.01972198486328125, -0.011444091796875, -0.00316619873046875, 0.0051116943359375, 0.01338958740234375, 0.02166748046875, 0.02994537353515625, 0.0382232666015625, 0.04650115966796875, 0.054779052734375, 0.06305694580078125, 0.0713348388671875, 0.07961273193359375, 0.087890625, 0.09616851806640625, 0.1044464111328125, 0.11272430419921875, 0.121002197265625, 0.12928009033203125, 0.1375579833984375, 0.14583587646484375, 0.15411376953125, 0.16239166259765625, 0.1706695556640625, 0.17894744873046875, 0.187225341796875, 0.19550323486328125, 0.2037811279296875, 0.21205902099609375, 0.2203369140625, 0.22861480712890625, 0.2368927001953125, 0.24517059326171875, 0.253448486328125, 0.26172637939453125, 0.2700042724609375, 0.27828216552734375, 0.28656005859375, 0.29483795166015625, 0.3031158447265625, 0.31139373779296875, 0.319671630859375, 0.32794952392578125, 0.3362274169921875, 0.34450531005859375, 0.352783203125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 5.0, 4.0, 2.0, 5.0, 5.0, 5.0, 12.0, 16.0, 32.0, 50.0, 90.0, 125.0, 157.0, 157.0, 113.0, 83.0, 58.0, 30.0, 14.0, 13.0, 12.0, 3.0, 6.0, 6.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.4345855712890625e-05, -4.3206848204135895e-05, -4.2067840695381165e-05, -4.0928833186626434e-05, -3.9789825677871704e-05, -3.8650818169116974e-05, -3.7511810660362244e-05, -3.6372803151607513e-05, -3.523379564285278e-05, -3.409478813409805e-05, -3.295578062534332e-05, -3.181677311658859e-05, -3.067776560783386e-05, -2.9538758099079132e-05, -2.8399750590324402e-05, -2.726074308156967e-05, -2.612173557281494e-05, -2.498272806406021e-05, -2.384372055530548e-05, -2.270471304655075e-05, -2.156570553779602e-05, -2.042669802904129e-05, -1.928769052028656e-05, -1.814868301153183e-05, -1.70096755027771e-05, -1.587066799402237e-05, -1.473166048526764e-05, -1.3592652976512909e-05, -1.2453645467758179e-05, -1.1314637959003448e-05, -1.0175630450248718e-05, -9.036622941493988e-06, -7.897615432739258e-06, -6.758607923984528e-06, -5.619600415229797e-06, -4.480592906475067e-06, -3.341585397720337e-06, -2.2025778889656067e-06, -1.0635703802108765e-06, 7.543712854385376e-08, 1.214444637298584e-06, 2.353452146053314e-06, 3.4924596548080444e-06, 4.631467163562775e-06, 5.770474672317505e-06, 6.909482181072235e-06, 8.048489689826965e-06, 9.187497198581696e-06, 1.0326504707336426e-05, 1.1465512216091156e-05, 1.2604519724845886e-05, 1.3743527233600616e-05, 1.4882534742355347e-05, 1.6021542251110077e-05, 1.7160549759864807e-05, 1.8299557268619537e-05, 1.9438564777374268e-05, 2.0577572286128998e-05, 2.1716579794883728e-05, 2.2855587303638458e-05, 2.399459481239319e-05, 2.513360232114792e-05, 2.627260982990265e-05, 2.741161733865738e-05, 2.855062484741211e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 3.0, 2.0, 8.0, 6.0, 4.0, 9.0, 23.0, 31.0, 51.0, 62.0, 78.0, 206.0, 444.0, 1062.0, 2741.0, 7022.0, 22000.0, 96637.0, 356389.0, 399363.0, 121633.0, 27110.0, 8280.0, 3117.0, 1183.0, 490.0, 242.0, 112.0, 75.0, 45.0, 23.0, 32.0, 16.0, 16.0, 10.0, 11.0, 5.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1212158203125, -0.11718559265136719, -0.11315536499023438, -0.10912513732910156, -0.10509490966796875, -0.10106468200683594, -0.09703445434570312, -0.09300422668457031, -0.0889739990234375, -0.08494377136230469, -0.08091354370117188, -0.07688331604003906, -0.07285308837890625, -0.06882286071777344, -0.06479263305664062, -0.06076240539550781, -0.056732177734375, -0.05270195007324219, -0.048671722412109375, -0.04464149475097656, -0.04061126708984375, -0.03658103942871094, -0.032550811767578125, -0.028520584106445312, -0.0244903564453125, -0.020460128784179688, -0.016429901123046875, -0.012399673461914062, -0.00836944580078125, -0.0043392181396484375, -0.000308990478515625, 0.0037212371826171875, 0.00775146484375, 0.011781692504882812, 0.015811920166015625, 0.019842147827148438, 0.02387237548828125, 0.027902603149414062, 0.031932830810546875, 0.03596305847167969, 0.0399932861328125, 0.04402351379394531, 0.048053741455078125, 0.05208396911621094, 0.05611419677734375, 0.06014442443847656, 0.06417465209960938, 0.06820487976074219, 0.072235107421875, 0.07626533508300781, 0.08029556274414062, 0.08432579040527344, 0.08835601806640625, 0.09238624572753906, 0.09641647338867188, 0.10044670104980469, 0.1044769287109375, 0.10850715637207031, 0.11253738403320312, 0.11656761169433594, 0.12059783935546875, 0.12462806701660156, 0.12865829467773438, 0.1326885223388672, 0.13671875]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 4.0, 4.0, 0.0, 6.0, 6.0, 2.0, 10.0, 12.0, 10.0, 22.0, 39.0, 43.0, 54.0, 61.0, 86.0, 86.0, 83.0, 98.0, 71.0, 68.0, 46.0, 43.0, 34.0, 35.0, 19.0, 14.0, 11.0, 6.0, 7.0, 5.0, 1.0, 6.0, 3.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.07916259765625, -0.07666206359863281, -0.07416152954101562, -0.07166099548339844, -0.06916046142578125, -0.06665992736816406, -0.06415939331054688, -0.06165885925292969, -0.0591583251953125, -0.05665779113769531, -0.054157257080078125, -0.05165672302246094, -0.04915618896484375, -0.04665565490722656, -0.044155120849609375, -0.04165458679199219, -0.039154052734375, -0.03665351867675781, -0.034152984619140625, -0.03165245056152344, -0.02915191650390625, -0.026651382446289062, -0.024150848388671875, -0.021650314331054688, -0.0191497802734375, -0.016649246215820312, -0.014148712158203125, -0.011648178100585938, -0.00914764404296875, -0.0066471099853515625, -0.004146575927734375, -0.0016460418701171875, 0.0008544921875, 0.0033550262451171875, 0.005855560302734375, 0.008356094360351562, 0.01085662841796875, 0.013357162475585938, 0.015857696533203125, 0.018358230590820312, 0.0208587646484375, 0.023359298706054688, 0.025859832763671875, 0.028360366821289062, 0.03086090087890625, 0.03336143493652344, 0.035861968994140625, 0.03836250305175781, 0.040863037109375, 0.04336357116699219, 0.045864105224609375, 0.04836463928222656, 0.05086517333984375, 0.05336570739746094, 0.055866241455078125, 0.05836677551269531, 0.0608673095703125, 0.06336784362792969, 0.06586837768554688, 0.06836891174316406, 0.07086944580078125, 0.07336997985839844, 0.07587051391601562, 0.07837104797363281, 0.08087158203125]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [11.0, 225.0, 710.0, 65.0, 6.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3859019875526428, -0.21582376956939697, -0.04574555158615112, 0.12433266639709473, 0.2944108843803406, 0.4644891023635864, 0.6345673203468323, 0.8046454787254333, 0.974723756313324, 1.1448019742965698, 1.314880132675171, 1.4849584102630615, 1.6550366878509521, 1.8251148462295532, 1.9951930046081543, 2.165271282196045, 2.3353495597839355, 2.505427837371826, 2.675506114959717, 2.8455841541290283, 3.015662431716919, 3.1857407093048096, 3.355818748474121, 3.5258970260620117, 3.6959753036499023, 3.866053581237793, 4.036131858825684, 4.206210136413574, 4.376288414001465, 4.546366214752197, 4.716444492340088, 4.8865227699279785, 5.056600570678711, 5.226678848266602, 5.396757125854492, 5.566835403442383, 5.736913681030273, 5.906991481781006, 6.0770697593688965, 6.247148036956787, 6.417226314544678, 6.587304592132568, 6.757382869720459, 6.92746114730835, 7.097538948059082, 7.267617225646973, 7.437695503234863, 7.607773780822754, 7.7778520584106445, 7.947930335998535, 8.118008613586426, 8.288086891174316, 8.458165168762207, 8.628243446350098, 8.798321723937988, 8.968399047851562, 9.138477325439453, 9.308555603027344, 9.478633880615234, 9.648712158203125, 9.818790435791016, 9.988868713378906, 10.158946990966797, 10.329025268554688, 10.499103546142578]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 3.0, 4.0, 5.0, 9.0, 8.0, 8.0, 12.0, 15.0, 14.0, 25.0, 24.0, 27.0, 29.0, 23.0, 27.0, 34.0, 35.0, 27.0, 56.0, 49.0, 34.0, 46.0, 43.0, 53.0, 35.0, 41.0, 34.0, 32.0, 30.0, 32.0, 23.0, 23.0, 25.0, 26.0, 21.0, 13.0, 16.0, 13.0, 11.0, 6.0, 6.0, 3.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5564454197883606, -0.5384952425956726, -0.5205450654029846, -0.5025948286056519, -0.48464465141296387, -0.4666944742202759, -0.4487442970275879, -0.4307940900325775, -0.41284388303756714, -0.39489370584487915, -0.3769434988498688, -0.3589933216571808, -0.3410431146621704, -0.3230929374694824, -0.30514276027679443, -0.28719255328178406, -0.26924237608909607, -0.2512921988964081, -0.2333419919013977, -0.21539181470870972, -0.19744160771369934, -0.17949143052101135, -0.16154123842716217, -0.143591046333313, -0.1256408542394638, -0.10769066214561462, -0.08974047005176544, -0.07179028540849686, -0.053840093314647675, -0.03588990122079849, -0.017939716577529907, 1.0475516319274902e-05, 0.017960667610168457, 0.03591085970401764, 0.05386104807257652, 0.0718112364411354, 0.08976142853498459, 0.10771162062883377, 0.12566180527210236, 0.14361199736595154, 0.16156218945980072, 0.1795123815536499, 0.19746257364749908, 0.21541276574134827, 0.23336294293403625, 0.25131314992904663, 0.2692633271217346, 0.2872135043144226, 0.305163711309433, 0.32311388850212097, 0.34106409549713135, 0.35901427268981934, 0.3769644796848297, 0.3949146568775177, 0.4128648638725281, 0.43081504106521606, 0.44876521825790405, 0.46671539545059204, 0.4846656024456024, 0.5026158094406128, 0.5205659866333008, 0.5385161638259888, 0.5564663410186768, 0.5744165182113647, 0.5923667550086975]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 7.0, 7.0, 7.0, 11.0, 8.0, 23.0, 34.0, 33.0, 74.0, 151.0, 226.0, 561.0, 994.0, 2739.0, 9165.0, 48417.0, 581795.0, 2952296.0, 539566.0, 45556.0, 8242.0, 2498.0, 955.0, 416.0, 192.0, 132.0, 59.0, 31.0, 29.0, 20.0, 14.0, 6.0, 8.0, 3.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.171630859375, -0.16538619995117188, -0.15914154052734375, -0.15289688110351562, -0.1466522216796875, -0.14040756225585938, -0.13416290283203125, -0.12791824340820312, -0.121673583984375, -0.11542892456054688, -0.10918426513671875, -0.10293960571289062, -0.0966949462890625, -0.09045028686523438, -0.08420562744140625, -0.07796096801757812, -0.07171630859375, -0.06547164916992188, -0.05922698974609375, -0.052982330322265625, -0.0467376708984375, -0.040493011474609375, -0.03424835205078125, -0.028003692626953125, -0.021759033203125, -0.015514373779296875, -0.00926971435546875, -0.003025054931640625, 0.0032196044921875, 0.009464263916015625, 0.01570892333984375, 0.021953582763671875, 0.0281982421875, 0.034442901611328125, 0.04068756103515625, 0.046932220458984375, 0.0531768798828125, 0.059421539306640625, 0.06566619873046875, 0.07191085815429688, 0.078155517578125, 0.08440017700195312, 0.09064483642578125, 0.09688949584960938, 0.1031341552734375, 0.10937881469726562, 0.11562347412109375, 0.12186813354492188, 0.12811279296875, 0.13435745239257812, 0.14060211181640625, 0.14684677124023438, 0.1530914306640625, 0.15933609008789062, 0.16558074951171875, 0.17182540893554688, 0.178070068359375, 0.18431472778320312, 0.19055938720703125, 0.19680404663085938, 0.2030487060546875, 0.20929336547851562, 0.21553802490234375, 0.22178268432617188, 0.22802734375]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 8.0, 17.0, 18.0, 26.0, 59.0, 53.0, 65.0, 74.0, 109.0, 93.0, 88.0, 105.0, 78.0, 55.0, 60.0, 43.0, 21.0, 19.0, 8.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1541748046875, -0.1486072540283203, -0.14303970336914062, -0.13747215270996094, -0.13190460205078125, -0.12633705139160156, -0.12076950073242188, -0.11520195007324219, -0.1096343994140625, -0.10406684875488281, -0.09849929809570312, -0.09293174743652344, -0.08736419677734375, -0.08179664611816406, -0.07622909545898438, -0.07066154479980469, -0.065093994140625, -0.05952644348144531, -0.053958892822265625, -0.04839134216308594, -0.04282379150390625, -0.03725624084472656, -0.031688690185546875, -0.026121139526367188, -0.0205535888671875, -0.014986038208007812, -0.009418487548828125, -0.0038509368896484375, 0.00171661376953125, 0.0072841644287109375, 0.012851715087890625, 0.018419265747070312, 0.02398681640625, 0.029554367065429688, 0.035121917724609375, 0.04068946838378906, 0.04625701904296875, 0.05182456970214844, 0.057392120361328125, 0.06295967102050781, 0.0685272216796875, 0.07409477233886719, 0.07966232299804688, 0.08522987365722656, 0.09079742431640625, 0.09636497497558594, 0.10193252563476562, 0.10750007629394531, 0.113067626953125, 0.11863517761230469, 0.12420272827148438, 0.12977027893066406, 0.13533782958984375, 0.14090538024902344, 0.14647293090820312, 0.1520404815673828, 0.1576080322265625, 0.1631755828857422, 0.16874313354492188, 0.17431068420410156, 0.17987823486328125, 0.18544578552246094, 0.19101333618164062, 0.1965808868408203, 0.2021484375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 3.0, 3.0, 2.0, 8.0, 9.0, 13.0, 26.0, 27.0, 31.0, 64.0, 77.0, 141.0, 187.0, 260.0, 474.0, 811.0, 2171.0, 7290.0, 34396.0, 200386.0, 1119387.0, 2087070.0, 613566.0, 101694.0, 18685.0, 4516.0, 1434.0, 584.0, 363.0, 173.0, 151.0, 91.0, 58.0, 39.0, 26.0, 21.0, 15.0, 12.0, 4.0, 6.0, 5.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1666259765625, -0.16130447387695312, -0.15598297119140625, -0.15066146850585938, -0.1453399658203125, -0.14001846313476562, -0.13469696044921875, -0.12937545776367188, -0.124053955078125, -0.11873245239257812, -0.11341094970703125, -0.10808944702148438, -0.1027679443359375, -0.09744644165039062, -0.09212493896484375, -0.08680343627929688, -0.08148193359375, -0.07616043090820312, -0.07083892822265625, -0.06551742553710938, -0.0601959228515625, -0.054874420166015625, -0.04955291748046875, -0.044231414794921875, -0.038909912109375, -0.033588409423828125, -0.02826690673828125, -0.022945404052734375, -0.0176239013671875, -0.012302398681640625, -0.00698089599609375, -0.001659393310546875, 0.003662109375, 0.008983612060546875, 0.01430511474609375, 0.019626617431640625, 0.0249481201171875, 0.030269622802734375, 0.03559112548828125, 0.040912628173828125, 0.046234130859375, 0.051555633544921875, 0.05687713623046875, 0.062198638916015625, 0.0675201416015625, 0.07284164428710938, 0.07816314697265625, 0.08348464965820312, 0.08880615234375, 0.09412765502929688, 0.09944915771484375, 0.10477066040039062, 0.1100921630859375, 0.11541366577148438, 0.12073516845703125, 0.12605667114257812, 0.131378173828125, 0.13669967651367188, 0.14202117919921875, 0.14734268188476562, 0.1526641845703125, 0.15798568725585938, 0.16330718994140625, 0.16862869262695312, 0.1739501953125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 4.0, 8.0, 7.0, 15.0, 15.0, 13.0, 31.0, 23.0, 43.0, 40.0, 67.0, 91.0, 105.0, 127.0, 168.0, 165.0, 231.0, 248.0, 291.0, 309.0, 281.0, 272.0, 253.0, 224.0, 206.0, 157.0, 147.0, 121.0, 90.0, 70.0, 62.0, 48.0, 34.0, 35.0, 24.0, 11.0, 14.0, 7.0, 3.0, 5.0, 6.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.11328125, -0.11002540588378906, -0.10676956176757812, -0.10351371765136719, -0.10025787353515625, -0.09700202941894531, -0.09374618530273438, -0.09049034118652344, -0.0872344970703125, -0.08397865295410156, -0.08072280883789062, -0.07746696472167969, -0.07421112060546875, -0.07095527648925781, -0.06769943237304688, -0.06444358825683594, -0.061187744140625, -0.05793190002441406, -0.054676055908203125, -0.05142021179199219, -0.04816436767578125, -0.04490852355957031, -0.041652679443359375, -0.03839683532714844, -0.0351409912109375, -0.03188514709472656, -0.028629302978515625, -0.025373458862304688, -0.02211761474609375, -0.018861770629882812, -0.015605926513671875, -0.012350082397460938, -0.00909423828125, -0.0058383941650390625, -0.002582550048828125, 0.0006732940673828125, 0.00392913818359375, 0.0071849822998046875, 0.010440826416015625, 0.013696670532226562, 0.0169525146484375, 0.020208358764648438, 0.023464202880859375, 0.026720046997070312, 0.02997589111328125, 0.03323173522949219, 0.036487579345703125, 0.03974342346191406, 0.042999267578125, 0.04625511169433594, 0.049510955810546875, 0.05276679992675781, 0.05602264404296875, 0.05927848815917969, 0.06253433227539062, 0.06579017639160156, 0.0690460205078125, 0.07230186462402344, 0.07555770874023438, 0.07881355285644531, 0.08206939697265625, 0.08532524108886719, 0.08858108520507812, 0.09183692932128906, 0.0950927734375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 7.0, 29.0, 179.0, 499.0, 250.0, 49.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8006916046142578, -0.7077322602272034, -0.6147728562355042, -0.5218135118484497, -0.4288541376590729, -0.33589476346969604, -0.2429354190826416, -0.14997601509094238, -0.05701667070388794, 0.035942696034908295, 0.12890206277370453, 0.22186142206192017, 0.314820796251297, 0.40778017044067383, 0.5007395148277283, 0.5936989188194275, 0.6866582632064819, 0.7796176075935364, 0.8725770115852356, 0.96553635597229, 1.0584957599639893, 1.1514551639556885, 1.2444144487380981, 1.3373738527297974, 1.430333137512207, 1.5232925415039062, 1.616251826286316, 1.7092112302780151, 1.8021706342697144, 1.895129919052124, 1.9880893230438232, 2.0810487270355225, 2.1740081310272217, 2.266967535018921, 2.35992693901062, 2.4528861045837402, 2.5458455085754395, 2.6388049125671387, 2.731764316558838, 2.824723720550537, 2.9176831245422363, 3.0106425285339355, 3.1036019325256348, 3.196561336517334, 3.289520502090454, 3.3824799060821533, 3.4754393100738525, 3.5683987140655518, 3.661357879638672, 3.754317283630371, 3.8472766876220703, 3.9402360916137695, 4.033195495605469, 4.126154899597168, 4.219114303588867, 4.312073707580566, 4.405033111572266, 4.497992515563965, 4.590951919555664, 4.683911323547363, 4.7768707275390625, 4.869830131530762, 4.962789535522461, 5.05574893951416, 5.148707866668701]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 5.0, 3.0, 1.0, 5.0, 4.0, 8.0, 4.0, 4.0, 8.0, 13.0, 9.0, 18.0, 17.0, 17.0, 23.0, 23.0, 21.0, 26.0, 27.0, 41.0, 35.0, 31.0, 26.0, 34.0, 49.0, 32.0, 44.0, 35.0, 42.0, 27.0, 32.0, 27.0, 35.0, 34.0, 32.0, 19.0, 23.0, 26.0, 29.0, 27.0, 15.0, 14.0, 8.0, 13.0, 4.0, 12.0, 9.0, 7.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.4398230314254761, -0.42530906200408936, -0.41079509258270264, -0.3962811231613159, -0.3817671537399292, -0.3672531843185425, -0.35273921489715576, -0.33822524547576904, -0.3237112760543823, -0.3091973066329956, -0.2946833372116089, -0.28016936779022217, -0.26565539836883545, -0.25114142894744873, -0.236627459526062, -0.2221134901046753, -0.20759953558444977, -0.19308556616306305, -0.17857159674167633, -0.1640576273202896, -0.1495436578989029, -0.13502970337867737, -0.12051572650671005, -0.10600175708532333, -0.09148778766393661, -0.0769738182425499, -0.06245984882116318, -0.04794588312506676, -0.03343191370368004, -0.018917948007583618, -0.004403978586196899, 0.01010999083518982, 0.024623960256576538, 0.03913792967796326, 0.053651899099349976, 0.0681658685207367, 0.08267983794212341, 0.09719379991292953, 0.11170776933431625, 0.12622174620628357, 0.1407357156276703, 0.155249685049057, 0.16976365447044373, 0.18427762389183044, 0.19879159331321716, 0.21330556273460388, 0.2278195321559906, 0.24233350157737732, 0.25684744119644165, 0.27136141061782837, 0.2858753800392151, 0.3003893494606018, 0.3149033188819885, 0.32941728830337524, 0.34393125772476196, 0.3584452271461487, 0.3729591965675354, 0.3874731659889221, 0.40198713541030884, 0.41650110483169556, 0.4310150742530823, 0.445529043674469, 0.4600430130958557, 0.47455698251724243, 0.48907095193862915]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 4.0, 10.0, 14.0, 21.0, 27.0, 32.0, 48.0, 67.0, 106.0, 181.0, 262.0, 488.0, 824.0, 1698.0, 3582.0, 7615.0, 16802.0, 38992.0, 92966.0, 214204.0, 318081.0, 200557.0, 86465.0, 36045.0, 15511.0, 7006.0, 3233.0, 1657.0, 839.0, 432.0, 276.0, 166.0, 99.0, 70.0, 48.0, 38.0, 21.0, 23.0, 7.0, 15.0, 5.0, 7.0, 4.0, 4.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2010498046875, -0.1946582794189453, -0.18826675415039062, -0.18187522888183594, -0.17548370361328125, -0.16909217834472656, -0.16270065307617188, -0.1563091278076172, -0.1499176025390625, -0.1435260772705078, -0.13713455200195312, -0.13074302673339844, -0.12435150146484375, -0.11795997619628906, -0.11156845092773438, -0.10517692565917969, -0.098785400390625, -0.09239387512207031, -0.08600234985351562, -0.07961082458496094, -0.07321929931640625, -0.06682777404785156, -0.060436248779296875, -0.05404472351074219, -0.0476531982421875, -0.04126167297363281, -0.034870147705078125, -0.028478622436523438, -0.02208709716796875, -0.015695571899414062, -0.009304046630859375, -0.0029125213623046875, 0.00347900390625, 0.009870529174804688, 0.016262054443359375, 0.022653579711914062, 0.02904510498046875, 0.03543663024902344, 0.041828155517578125, 0.04821968078613281, 0.0546112060546875, 0.06100273132324219, 0.06739425659179688, 0.07378578186035156, 0.08017730712890625, 0.08656883239746094, 0.09296035766601562, 0.09935188293457031, 0.105743408203125, 0.11213493347167969, 0.11852645874023438, 0.12491798400878906, 0.13130950927734375, 0.13770103454589844, 0.14409255981445312, 0.1504840850830078, 0.1568756103515625, 0.1632671356201172, 0.16965866088867188, 0.17605018615722656, 0.18244171142578125, 0.18883323669433594, 0.19522476196289062, 0.2016162872314453, 0.2080078125]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 14.0, 19.0, 34.0, 37.0, 55.0, 84.0, 92.0, 105.0, 89.0, 100.0, 85.0, 70.0, 78.0, 52.0, 33.0, 25.0, 16.0, 9.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.152099609375, -0.14660263061523438, -0.14110565185546875, -0.13560867309570312, -0.1301116943359375, -0.12461471557617188, -0.11911773681640625, -0.11362075805664062, -0.108123779296875, -0.10262680053710938, -0.09712982177734375, -0.09163284301757812, -0.0861358642578125, -0.08063888549804688, -0.07514190673828125, -0.06964492797851562, -0.06414794921875, -0.058650970458984375, -0.05315399169921875, -0.047657012939453125, -0.0421600341796875, -0.036663055419921875, -0.03116607666015625, -0.025669097900390625, -0.020172119140625, -0.014675140380859375, -0.00917816162109375, -0.003681182861328125, 0.0018157958984375, 0.007312774658203125, 0.01280975341796875, 0.018306732177734375, 0.0238037109375, 0.029300689697265625, 0.03479766845703125, 0.040294647216796875, 0.0457916259765625, 0.051288604736328125, 0.05678558349609375, 0.062282562255859375, 0.067779541015625, 0.07327651977539062, 0.07877349853515625, 0.08427047729492188, 0.0897674560546875, 0.09526443481445312, 0.10076141357421875, 0.10625839233398438, 0.11175537109375, 0.11725234985351562, 0.12274932861328125, 0.12824630737304688, 0.1337432861328125, 0.13924026489257812, 0.14473724365234375, 0.15023422241210938, 0.155731201171875, 0.16122817993164062, 0.16672515869140625, 0.17222213745117188, 0.1777191162109375, 0.18321609497070312, 0.18871307373046875, 0.19421005249023438, 0.19970703125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 5.0, 5.0, 7.0, 8.0, 25.0, 32.0, 62.0, 83.0, 107.0, 215.0, 446.0, 1028.0, 2383.0, 6734.0, 18422.0, 51454.0, 145228.0, 334606.0, 299591.0, 119929.0, 43086.0, 15492.0, 5646.0, 2247.0, 818.0, 399.0, 188.0, 103.0, 65.0, 44.0, 35.0, 22.0, 14.0, 12.0, 5.0, 4.0, 3.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.294189453125, -0.2857627868652344, -0.27733612060546875, -0.2689094543457031, -0.2604827880859375, -0.2520561218261719, -0.24362945556640625, -0.23520278930664062, -0.226776123046875, -0.21834945678710938, -0.20992279052734375, -0.20149612426757812, -0.1930694580078125, -0.18464279174804688, -0.17621612548828125, -0.16778945922851562, -0.15936279296875, -0.15093612670898438, -0.14250946044921875, -0.13408279418945312, -0.1256561279296875, -0.11722946166992188, -0.10880279541015625, -0.10037612915039062, -0.091949462890625, -0.08352279663085938, -0.07509613037109375, -0.06666946411132812, -0.0582427978515625, -0.049816131591796875, -0.04138946533203125, -0.032962799072265625, -0.0245361328125, -0.016109466552734375, -0.00768280029296875, 0.000743865966796875, 0.0091705322265625, 0.017597198486328125, 0.02602386474609375, 0.034450531005859375, 0.042877197265625, 0.051303863525390625, 0.05973052978515625, 0.06815719604492188, 0.0765838623046875, 0.08501052856445312, 0.09343719482421875, 0.10186386108398438, 0.11029052734375, 0.11871719360351562, 0.12714385986328125, 0.13557052612304688, 0.1439971923828125, 0.15242385864257812, 0.16085052490234375, 0.16927719116210938, 0.177703857421875, 0.18613052368164062, 0.19455718994140625, 0.20298385620117188, 0.2114105224609375, 0.21983718872070312, 0.22826385498046875, 0.23669052124023438, 0.2451171875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 9.0, 14.0, 4.0, 5.0, 11.0, 9.0, 17.0, 14.0, 17.0, 21.0, 27.0, 23.0, 34.0, 29.0, 41.0, 34.0, 45.0, 36.0, 45.0, 49.0, 48.0, 47.0, 47.0, 49.0, 34.0, 42.0, 34.0, 43.0, 32.0, 27.0, 19.0, 14.0, 24.0, 14.0, 9.0, 9.0, 5.0, 5.0, 11.0, 6.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2197265625, -0.21307945251464844, -0.20643234252929688, -0.1997852325439453, -0.19313812255859375, -0.1864910125732422, -0.17984390258789062, -0.17319679260253906, -0.1665496826171875, -0.15990257263183594, -0.15325546264648438, -0.1466083526611328, -0.13996124267578125, -0.1333141326904297, -0.12666702270507812, -0.12001991271972656, -0.113372802734375, -0.10672569274902344, -0.10007858276367188, -0.09343147277832031, -0.08678436279296875, -0.08013725280761719, -0.07349014282226562, -0.06684303283691406, -0.0601959228515625, -0.05354881286621094, -0.046901702880859375, -0.04025459289550781, -0.03360748291015625, -0.026960372924804688, -0.020313262939453125, -0.013666152954101562, -0.00701904296875, -0.0003719329833984375, 0.006275177001953125, 0.012922286987304688, 0.01956939697265625, 0.026216506958007812, 0.032863616943359375, 0.03951072692871094, 0.0461578369140625, 0.05280494689941406, 0.059452056884765625, 0.06609916687011719, 0.07274627685546875, 0.07939338684082031, 0.08604049682617188, 0.09268760681152344, 0.099334716796875, 0.10598182678222656, 0.11262893676757812, 0.11927604675292969, 0.12592315673828125, 0.1325702667236328, 0.13921737670898438, 0.14586448669433594, 0.1525115966796875, 0.15915870666503906, 0.16580581665039062, 0.1724529266357422, 0.17910003662109375, 0.1857471466064453, 0.19239425659179688, 0.19904136657714844, 0.2056884765625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 1.0, 3.0, 8.0, 4.0, 9.0, 8.0, 13.0, 24.0, 27.0, 49.0, 58.0, 75.0, 121.0, 156.0, 257.0, 464.0, 802.0, 1766.0, 4798.0, 16255.0, 73455.0, 319976.0, 449362.0, 139075.0, 28967.0, 7520.0, 2541.0, 1159.0, 606.0, 339.0, 203.0, 140.0, 95.0, 59.0, 41.0, 33.0, 29.0, 12.0, 20.0, 12.0, 6.0, 5.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.21435546875, -0.20808792114257812, -0.20182037353515625, -0.19555282592773438, -0.1892852783203125, -0.18301773071289062, -0.17675018310546875, -0.17048263549804688, -0.164215087890625, -0.15794754028320312, -0.15167999267578125, -0.14541244506835938, -0.1391448974609375, -0.13287734985351562, -0.12660980224609375, -0.12034225463867188, -0.11407470703125, -0.10780715942382812, -0.10153961181640625, -0.09527206420898438, -0.0890045166015625, -0.08273696899414062, -0.07646942138671875, -0.07020187377929688, -0.063934326171875, -0.057666778564453125, -0.05139923095703125, -0.045131683349609375, -0.0388641357421875, -0.032596588134765625, -0.02632904052734375, -0.020061492919921875, -0.0137939453125, -0.007526397705078125, -0.00125885009765625, 0.005008697509765625, 0.0112762451171875, 0.017543792724609375, 0.02381134033203125, 0.030078887939453125, 0.036346435546875, 0.042613983154296875, 0.04888153076171875, 0.055149078369140625, 0.0614166259765625, 0.06768417358398438, 0.07395172119140625, 0.08021926879882812, 0.08648681640625, 0.09275436401367188, 0.09902191162109375, 0.10528945922851562, 0.1115570068359375, 0.11782455444335938, 0.12409210205078125, 0.13035964965820312, 0.136627197265625, 0.14289474487304688, 0.14916229248046875, 0.15542984008789062, 0.1616973876953125, 0.16796493530273438, 0.17423248291015625, 0.18050003051757812, 0.186767578125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 7.0, 10.0, 8.0, 9.0, 16.0, 28.0, 30.0, 35.0, 47.0, 58.0, 90.0, 121.0, 111.0, 108.0, 83.0, 69.0, 37.0, 38.0, 28.0, 23.0, 12.0, 13.0, 7.0, 2.0, 5.0, 2.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.814697265625e-05, -3.6937184631824493e-05, -3.572739660739899e-05, -3.451760858297348e-05, -3.3307820558547974e-05, -3.209803253412247e-05, -3.088824450969696e-05, -2.9678456485271454e-05, -2.8468668460845947e-05, -2.725888043642044e-05, -2.6049092411994934e-05, -2.4839304387569427e-05, -2.362951636314392e-05, -2.2419728338718414e-05, -2.1209940314292908e-05, -2.00001522898674e-05, -1.8790364265441895e-05, -1.7580576241016388e-05, -1.637078821659088e-05, -1.5161000192165375e-05, -1.3951212167739868e-05, -1.2741424143314362e-05, -1.1531636118888855e-05, -1.0321848094463348e-05, -9.112060070037842e-06, -7.902272045612335e-06, -6.692484021186829e-06, -5.482695996761322e-06, -4.2729079723358154e-06, -3.063119947910309e-06, -1.8533319234848022e-06, -6.435438990592957e-07, 5.662441253662109e-07, 1.7760321497917175e-06, 2.985820174217224e-06, 4.195608198642731e-06, 5.405396223068237e-06, 6.615184247493744e-06, 7.82497227191925e-06, 9.034760296344757e-06, 1.0244548320770264e-05, 1.145433634519577e-05, 1.2664124369621277e-05, 1.3873912394046783e-05, 1.508370041847229e-05, 1.6293488442897797e-05, 1.7503276467323303e-05, 1.871306449174881e-05, 1.9922852516174316e-05, 2.1132640540599823e-05, 2.234242856502533e-05, 2.3552216589450836e-05, 2.4762004613876343e-05, 2.597179263830185e-05, 2.7181580662727356e-05, 2.8391368687152863e-05, 2.960115671157837e-05, 3.0810944736003876e-05, 3.202073276042938e-05, 3.323052078485489e-05, 3.4440308809280396e-05, 3.56500968337059e-05, 3.685988485813141e-05, 3.8069672882556915e-05, 3.927946090698242e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 5.0, 4.0, 7.0, 3.0, 9.0, 9.0, 13.0, 20.0, 22.0, 29.0, 44.0, 45.0, 84.0, 120.0, 168.0, 237.0, 369.0, 553.0, 843.0, 1326.0, 2242.0, 3960.0, 7535.0, 15126.0, 32521.0, 67812.0, 132597.0, 207889.0, 228516.0, 166572.0, 92151.0, 44514.0, 20926.0, 10028.0, 4997.0, 2698.0, 1533.0, 1042.0, 663.0, 393.0, 319.0, 195.0, 129.0, 87.0, 62.0, 45.0, 38.0, 26.0, 13.0, 11.0, 6.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.0716552734375, -0.06928348541259766, -0.06691169738769531, -0.06453990936279297, -0.062168121337890625, -0.05979633331298828, -0.05742454528808594, -0.055052757263183594, -0.05268096923828125, -0.050309181213378906, -0.04793739318847656, -0.04556560516357422, -0.043193817138671875, -0.04082202911376953, -0.03845024108886719, -0.036078453063964844, -0.0337066650390625, -0.031334877014160156, -0.028963088989257812, -0.02659130096435547, -0.024219512939453125, -0.02184772491455078, -0.019475936889648438, -0.017104148864746094, -0.01473236083984375, -0.012360572814941406, -0.009988784790039062, -0.007616996765136719, -0.005245208740234375, -0.0028734207153320312, -0.0005016326904296875, 0.0018701553344726562, 0.004241943359375, 0.006613731384277344, 0.008985519409179688, 0.011357307434082031, 0.013729095458984375, 0.01610088348388672, 0.018472671508789062, 0.020844459533691406, 0.02321624755859375, 0.025588035583496094, 0.027959823608398438, 0.03033161163330078, 0.032703399658203125, 0.03507518768310547, 0.03744697570800781, 0.039818763732910156, 0.0421905517578125, 0.044562339782714844, 0.04693412780761719, 0.04930591583251953, 0.051677703857421875, 0.05404949188232422, 0.05642127990722656, 0.058793067932128906, 0.06116485595703125, 0.0635366439819336, 0.06590843200683594, 0.06828022003173828, 0.07065200805664062, 0.07302379608154297, 0.07539558410644531, 0.07776737213134766, 0.08013916015625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 1.0, 4.0, 3.0, 5.0, 9.0, 11.0, 23.0, 26.0, 23.0, 14.0, 31.0, 37.0, 28.0, 41.0, 58.0, 50.0, 60.0, 61.0, 51.0, 52.0, 56.0, 53.0, 48.0, 41.0, 43.0, 26.0, 25.0, 22.0, 15.0, 14.0, 14.0, 9.0, 10.0, 8.0, 8.0, 4.0, 5.0, 6.0, 3.0, 1.0, 4.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0694580078125, -0.0673818588256836, -0.06530570983886719, -0.06322956085205078, -0.061153411865234375, -0.05907726287841797, -0.05700111389160156, -0.054924964904785156, -0.05284881591796875, -0.050772666931152344, -0.04869651794433594, -0.04662036895751953, -0.044544219970703125, -0.04246807098388672, -0.04039192199707031, -0.038315773010253906, -0.0362396240234375, -0.034163475036621094, -0.03208732604980469, -0.03001117706298828, -0.027935028076171875, -0.02585887908935547, -0.023782730102539062, -0.021706581115722656, -0.01963043212890625, -0.017554283142089844, -0.015478134155273438, -0.013401985168457031, -0.011325836181640625, -0.009249687194824219, -0.0071735382080078125, -0.005097389221191406, -0.003021240234375, -0.0009450912475585938, 0.0011310577392578125, 0.0032072067260742188, 0.005283355712890625, 0.007359504699707031, 0.009435653686523438, 0.011511802673339844, 0.01358795166015625, 0.015664100646972656, 0.017740249633789062, 0.01981639862060547, 0.021892547607421875, 0.02396869659423828, 0.026044845581054688, 0.028120994567871094, 0.0301971435546875, 0.032273292541503906, 0.03434944152832031, 0.03642559051513672, 0.038501739501953125, 0.04057788848876953, 0.04265403747558594, 0.044730186462402344, 0.04680633544921875, 0.048882484436035156, 0.05095863342285156, 0.05303478240966797, 0.055110931396484375, 0.05718708038330078, 0.05926322937011719, 0.061339378356933594, 0.06341552734375]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 9.0, 21.0, 105.0, 311.0, 353.0, 160.0, 46.0, 9.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4857500791549683, -1.399176001548767, -1.3126018047332764, -1.2260277271270752, -1.139453649520874, -1.0528795719146729, -0.9663053750991821, -0.879731297492981, -0.793157160282135, -0.7065830230712891, -0.6200089454650879, -0.5334348082542419, -0.4468607008457184, -0.3602865934371948, -0.2737124562263489, -0.1871383786201477, -0.10056424140930176, -0.013990126550197601, 0.07258398830890656, 0.1591581106185913, 0.24573221802711487, 0.3323063254356384, 0.4188804626464844, 0.5054545402526855, 0.5920286774635315, 0.6786028146743774, 0.7651768922805786, 0.8517510294914246, 0.9383251667022705, 1.0248992443084717, 1.1114733219146729, 1.198047399520874, 1.2846214771270752, 1.3711955547332764, 1.457769751548767, 1.5443438291549683, 1.6309179067611694, 1.7174921035766602, 1.8040661811828613, 1.8906402587890625, 1.9772143363952637, 2.063788414001465, 2.150362491607666, 2.236936569213867, 2.3235108852386475, 2.4100849628448486, 2.49665904045105, 2.583233118057251, 2.6698074340820312, 2.7563815116882324, 2.8429555892944336, 2.9295296669006348, 3.016103982925415, 3.102678060531616, 3.1892521381378174, 3.2758262157440186, 3.3624002933502197, 3.448974370956421, 3.535548448562622, 3.6221227645874023, 3.7086968421936035, 3.7952709197998047, 3.881844997406006, 3.968419075012207, 4.054993152618408]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 5.0, 6.0, 11.0, 9.0, 9.0, 13.0, 17.0, 25.0, 26.0, 31.0, 36.0, 50.0, 36.0, 62.0, 58.0, 54.0, 48.0, 42.0, 62.0, 46.0, 58.0, 51.0, 30.0, 43.0, 37.0, 31.0, 25.0, 23.0, 10.0, 11.0, 13.0, 9.0, 5.0, 5.0, 5.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-1.0124988555908203, -0.9869032502174377, -0.9613076448440552, -0.9357119798660278, -0.9101163744926453, -0.8845207691192627, -0.8589251041412354, -0.8333294987678528, -0.8077338933944702, -0.7821382880210876, -0.7565426826477051, -0.7309470176696777, -0.7053514122962952, -0.6797558069229126, -0.6541601419448853, -0.6285645365715027, -0.6029689311981201, -0.5773733258247375, -0.551777720451355, -0.5261820554733276, -0.5005864500999451, -0.4749908447265625, -0.44939520955085754, -0.4237995743751526, -0.39820396900177, -0.37260836362838745, -0.3470127284526825, -0.32141709327697754, -0.29582148790359497, -0.2702258825302124, -0.24463024735450745, -0.21903462707996368, -0.19343894720077515, -0.16784332692623138, -0.14224770665168762, -0.11665208637714386, -0.0910564661026001, -0.06546084582805634, -0.03986522555351257, -0.014269605278968811, 0.011326014995574951, 0.03692163527011871, 0.06251725554466248, 0.08811287581920624, 0.11370849609375, 0.13930411636829376, 0.16489973664283752, 0.1904953569173813, 0.21609097719192505, 0.2416865974664688, 0.2672822177410126, 0.29287785291671753, 0.3184734582901001, 0.34406906366348267, 0.3696646988391876, 0.3952603340148926, 0.42085593938827515, 0.4464515447616577, 0.47204717993736267, 0.4976428151130676, 0.5232384204864502, 0.5488340258598328, 0.5744296312332153, 0.6000252962112427, 0.6256209015846252]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 9.0, 3.0, 9.0, 13.0, 22.0, 42.0, 74.0, 106.0, 201.0, 409.0, 1395.0, 21000.0, 2647006.0, 1510511.0, 11655.0, 1048.0, 370.0, 169.0, 100.0, 51.0, 40.0, 20.0, 12.0, 6.0, 7.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32763671875, -0.3149986267089844, -0.30236053466796875, -0.2897224426269531, -0.2770843505859375, -0.2644462585449219, -0.25180816650390625, -0.23917007446289062, -0.226531982421875, -0.21389389038085938, -0.20125579833984375, -0.18861770629882812, -0.1759796142578125, -0.16334152221679688, -0.15070343017578125, -0.13806533813476562, -0.12542724609375, -0.11278915405273438, -0.10015106201171875, -0.08751296997070312, -0.0748748779296875, -0.062236785888671875, -0.04959869384765625, -0.036960601806640625, -0.024322509765625, -0.011684417724609375, 0.00095367431640625, 0.013591766357421875, 0.0262298583984375, 0.038867950439453125, 0.05150604248046875, 0.06414413452148438, 0.0767822265625, 0.08942031860351562, 0.10205841064453125, 0.11469650268554688, 0.1273345947265625, 0.13997268676757812, 0.15261077880859375, 0.16524887084960938, 0.177886962890625, 0.19052505493164062, 0.20316314697265625, 0.21580123901367188, 0.2284393310546875, 0.24107742309570312, 0.25371551513671875, 0.2663536071777344, 0.27899169921875, 0.2916297912597656, 0.30426788330078125, 0.3169059753417969, 0.3295440673828125, 0.3421821594238281, 0.35482025146484375, 0.3674583435058594, 0.380096435546875, 0.3927345275878906, 0.40537261962890625, 0.4180107116699219, 0.4306488037109375, 0.4432868957519531, 0.45592498779296875, 0.4685630798339844, 0.481201171875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 2.0, 6.0, 15.0, 22.0, 25.0, 47.0, 66.0, 70.0, 86.0, 86.0, 101.0, 93.0, 82.0, 77.0, 75.0, 47.0, 35.0, 31.0, 18.0, 12.0, 5.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1478271484375, -0.14230918884277344, -0.13679122924804688, -0.1312732696533203, -0.12575531005859375, -0.12023735046386719, -0.11471939086914062, -0.10920143127441406, -0.1036834716796875, -0.09816551208496094, -0.09264755249023438, -0.08712959289550781, -0.08161163330078125, -0.07609367370605469, -0.07057571411132812, -0.06505775451660156, -0.059539794921875, -0.05402183532714844, -0.048503875732421875, -0.04298591613769531, -0.03746795654296875, -0.03194999694824219, -0.026432037353515625, -0.020914077758789062, -0.0153961181640625, -0.009878158569335938, -0.004360198974609375, 0.0011577606201171875, 0.00667572021484375, 0.012193679809570312, 0.017711639404296875, 0.023229598999023438, 0.02874755859375, 0.03426551818847656, 0.039783477783203125, 0.04530143737792969, 0.05081939697265625, 0.05633735656738281, 0.061855316162109375, 0.06737327575683594, 0.0728912353515625, 0.07840919494628906, 0.08392715454101562, 0.08944511413574219, 0.09496307373046875, 0.10048103332519531, 0.10599899291992188, 0.11151695251464844, 0.117034912109375, 0.12255287170410156, 0.12807083129882812, 0.1335887908935547, 0.13910675048828125, 0.1446247100830078, 0.15014266967773438, 0.15566062927246094, 0.1611785888671875, 0.16669654846191406, 0.17221450805664062, 0.1777324676513672, 0.18325042724609375, 0.1887683868408203, 0.19428634643554688, 0.19980430603027344, 0.205322265625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 4.0, 2.0, 9.0, 9.0, 23.0, 26.0, 34.0, 97.0, 156.0, 243.0, 547.0, 1425.0, 5282.0, 34246.0, 366438.0, 2463748.0, 1194017.0, 111253.0, 12528.0, 2478.0, 875.0, 382.0, 209.0, 99.0, 60.0, 40.0, 18.0, 13.0, 10.0, 10.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.233154296875, -0.22603607177734375, -0.2189178466796875, -0.21179962158203125, -0.204681396484375, -0.19756317138671875, -0.1904449462890625, -0.18332672119140625, -0.17620849609375, -0.16909027099609375, -0.1619720458984375, -0.15485382080078125, -0.147735595703125, -0.14061737060546875, -0.1334991455078125, -0.12638092041015625, -0.1192626953125, -0.11214447021484375, -0.1050262451171875, -0.09790802001953125, -0.090789794921875, -0.08367156982421875, -0.0765533447265625, -0.06943511962890625, -0.06231689453125, -0.05519866943359375, -0.0480804443359375, -0.04096221923828125, -0.033843994140625, -0.02672576904296875, -0.0196075439453125, -0.01248931884765625, -0.00537109375, 0.00174713134765625, 0.0088653564453125, 0.01598358154296875, 0.023101806640625, 0.03022003173828125, 0.0373382568359375, 0.04445648193359375, 0.05157470703125, 0.05869293212890625, 0.0658111572265625, 0.07292938232421875, 0.080047607421875, 0.08716583251953125, 0.0942840576171875, 0.10140228271484375, 0.1085205078125, 0.11563873291015625, 0.1227569580078125, 0.12987518310546875, 0.136993408203125, 0.14411163330078125, 0.1512298583984375, 0.15834808349609375, 0.16546630859375, 0.17258453369140625, 0.1797027587890625, 0.18682098388671875, 0.193939208984375, 0.20105743408203125, 0.2081756591796875, 0.21529388427734375, 0.222412109375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 6.0, 6.0, 7.0, 12.0, 19.0, 18.0, 20.0, 36.0, 66.0, 72.0, 116.0, 165.0, 236.0, 318.0, 354.0, 432.0, 472.0, 424.0, 326.0, 280.0, 227.0, 148.0, 105.0, 62.0, 43.0, 41.0, 25.0, 20.0, 14.0, 5.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1456298828125, -0.140960693359375, -0.13629150390625, -0.131622314453125, -0.126953125, -0.122283935546875, -0.11761474609375, -0.112945556640625, -0.1082763671875, -0.103607177734375, -0.09893798828125, -0.094268798828125, -0.089599609375, -0.084930419921875, -0.08026123046875, -0.075592041015625, -0.0709228515625, -0.066253662109375, -0.06158447265625, -0.056915283203125, -0.05224609375, -0.047576904296875, -0.04290771484375, -0.038238525390625, -0.0335693359375, -0.028900146484375, -0.02423095703125, -0.019561767578125, -0.014892578125, -0.010223388671875, -0.00555419921875, -0.000885009765625, 0.0037841796875, 0.008453369140625, 0.01312255859375, 0.017791748046875, 0.0224609375, 0.027130126953125, 0.03179931640625, 0.036468505859375, 0.0411376953125, 0.045806884765625, 0.05047607421875, 0.055145263671875, 0.059814453125, 0.064483642578125, 0.06915283203125, 0.073822021484375, 0.0784912109375, 0.083160400390625, 0.08782958984375, 0.092498779296875, 0.09716796875, 0.101837158203125, 0.10650634765625, 0.111175537109375, 0.1158447265625, 0.120513916015625, 0.12518310546875, 0.129852294921875, 0.134521484375, 0.139190673828125, 0.14385986328125, 0.148529052734375, 0.1531982421875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 9.0, 7.0, 26.0, 84.0, 202.0, 245.0, 214.0, 132.0, 65.0, 19.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.067141056060791, -1.0202186107635498, -0.9732961654663086, -0.9263737201690674, -0.8794512748718262, -0.832528829574585, -0.7856063842773438, -0.7386839389801025, -0.6917614936828613, -0.6448390483856201, -0.5979166030883789, -0.5509941577911377, -0.5040717124938965, -0.4571492671966553, -0.41022685170173645, -0.36330440640449524, -0.3163819909095764, -0.2694595456123352, -0.222537100315094, -0.17561466991901398, -0.12869222462177277, -0.08176977932453156, -0.03484734892845154, 0.012075096368789673, 0.058997541666030884, 0.1059199869632721, 0.1528424322605133, 0.19976486265659332, 0.24668730795383453, 0.29360973834991455, 0.34053218364715576, 0.387454628944397, 0.4343770742416382, 0.4812995195388794, 0.5282219648361206, 0.5751444101333618, 0.622066855430603, 0.6689893007278442, 0.7159117460250854, 0.7628341913223267, 0.8097566366195679, 0.8566790819168091, 0.9036015272140503, 0.9505239725112915, 0.9974464178085327, 1.044368863105774, 1.0912913084030151, 1.1382137537002563, 1.185136079788208, 1.2320585250854492, 1.2789809703826904, 1.3259034156799316, 1.3728258609771729, 1.419748306274414, 1.4666707515716553, 1.5135931968688965, 1.5605156421661377, 1.607438087463379, 1.6543605327606201, 1.7012829780578613, 1.7482054233551025, 1.7951278686523438, 1.842050313949585, 1.8889727592468262, 1.9358952045440674]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 8.0, 2.0, 8.0, 9.0, 9.0, 9.0, 13.0, 15.0, 23.0, 29.0, 31.0, 41.0, 36.0, 40.0, 46.0, 40.0, 43.0, 41.0, 51.0, 52.0, 52.0, 53.0, 36.0, 60.0, 51.0, 27.0, 25.0, 39.0, 22.0, 20.0, 16.0, 15.0, 14.0, 13.0, 4.0, 5.0, 6.0, 2.0, 5.0, 5.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.6626296043395996, -0.6454196572303772, -0.6282097101211548, -0.6109997630119324, -0.59378981590271, -0.5765798687934875, -0.5593699216842651, -0.5421599745750427, -0.5249500274658203, -0.5077400803565979, -0.4905301332473755, -0.4733201861381531, -0.45611023902893066, -0.43890029191970825, -0.42169034481048584, -0.4044803977012634, -0.387270450592041, -0.3700605034828186, -0.3528505563735962, -0.3356406092643738, -0.31843066215515137, -0.30122071504592896, -0.28401076793670654, -0.26680082082748413, -0.24959087371826172, -0.2323809266090393, -0.2151709794998169, -0.19796103239059448, -0.18075108528137207, -0.16354113817214966, -0.14633119106292725, -0.12912124395370483, -0.11191123723983765, -0.09470129013061523, -0.07749134302139282, -0.06028139591217041, -0.043071448802948, -0.025861501693725586, -0.008651554584503174, 0.008558392524719238, 0.02576833963394165, 0.04297828674316406, 0.060188233852386475, 0.07739818096160889, 0.0946081280708313, 0.11181807518005371, 0.12902802228927612, 0.14623796939849854, 0.16344791650772095, 0.18065786361694336, 0.19786781072616577, 0.21507775783538818, 0.2322877049446106, 0.249497652053833, 0.2667075991630554, 0.28391754627227783, 0.30112749338150024, 0.31833744049072266, 0.33554738759994507, 0.3527573347091675, 0.3699672818183899, 0.3871772289276123, 0.4043871760368347, 0.42159712314605713, 0.43880707025527954]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 7.0, 6.0, 10.0, 17.0, 8.0, 15.0, 27.0, 29.0, 49.0, 93.0, 158.0, 260.0, 596.0, 1212.0, 2703.0, 6158.0, 14564.0, 38073.0, 116917.0, 328279.0, 344230.0, 126640.0, 40899.0, 15545.0, 6601.0, 2912.0, 1214.0, 587.0, 322.0, 168.0, 74.0, 54.0, 42.0, 27.0, 17.0, 17.0, 7.0, 3.0, 6.0, 9.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2379150390625, -0.2299938201904297, -0.22207260131835938, -0.21415138244628906, -0.20623016357421875, -0.19830894470214844, -0.19038772583007812, -0.1824665069580078, -0.1745452880859375, -0.1666240692138672, -0.15870285034179688, -0.15078163146972656, -0.14286041259765625, -0.13493919372558594, -0.12701797485351562, -0.11909675598144531, -0.111175537109375, -0.10325431823730469, -0.09533309936523438, -0.08741188049316406, -0.07949066162109375, -0.07156944274902344, -0.06364822387695312, -0.05572700500488281, -0.0478057861328125, -0.03988456726074219, -0.031963348388671875, -0.024042129516601562, -0.01612091064453125, -0.008199691772460938, -0.000278472900390625, 0.0076427459716796875, 0.01556396484375, 0.023485183715820312, 0.031406402587890625, 0.03932762145996094, 0.04724884033203125, 0.05517005920410156, 0.06309127807617188, 0.07101249694824219, 0.0789337158203125, 0.08685493469238281, 0.09477615356445312, 0.10269737243652344, 0.11061859130859375, 0.11853981018066406, 0.12646102905273438, 0.1343822479248047, 0.142303466796875, 0.1502246856689453, 0.15814590454101562, 0.16606712341308594, 0.17398834228515625, 0.18190956115722656, 0.18983078002929688, 0.1977519989013672, 0.2056732177734375, 0.2135944366455078, 0.22151565551757812, 0.22943687438964844, 0.23735809326171875, 0.24527931213378906, 0.2532005310058594, 0.2611217498779297, 0.26904296875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 7.0, 13.0, 11.0, 27.0, 41.0, 56.0, 64.0, 96.0, 92.0, 104.0, 69.0, 97.0, 90.0, 71.0, 53.0, 33.0, 35.0, 24.0, 11.0, 9.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1451416015625, -0.1397705078125, -0.1343994140625, -0.1290283203125, -0.1236572265625, -0.1182861328125, -0.1129150390625, -0.1075439453125, -0.1021728515625, -0.0968017578125, -0.0914306640625, -0.0860595703125, -0.0806884765625, -0.0753173828125, -0.0699462890625, -0.0645751953125, -0.0592041015625, -0.0538330078125, -0.0484619140625, -0.0430908203125, -0.0377197265625, -0.0323486328125, -0.0269775390625, -0.0216064453125, -0.0162353515625, -0.0108642578125, -0.0054931640625, -0.0001220703125, 0.0052490234375, 0.0106201171875, 0.0159912109375, 0.0213623046875, 0.0267333984375, 0.0321044921875, 0.0374755859375, 0.0428466796875, 0.0482177734375, 0.0535888671875, 0.0589599609375, 0.0643310546875, 0.0697021484375, 0.0750732421875, 0.0804443359375, 0.0858154296875, 0.0911865234375, 0.0965576171875, 0.1019287109375, 0.1072998046875, 0.1126708984375, 0.1180419921875, 0.1234130859375, 0.1287841796875, 0.1341552734375, 0.1395263671875, 0.1448974609375, 0.1502685546875, 0.1556396484375, 0.1610107421875, 0.1663818359375, 0.1717529296875, 0.1771240234375, 0.1824951171875, 0.1878662109375, 0.1932373046875, 0.1986083984375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 14.0, 11.0, 13.0, 18.0, 35.0, 42.0, 53.0, 76.0, 118.0, 157.0, 244.0, 436.0, 944.0, 2228.0, 5975.0, 16642.0, 49408.0, 143472.0, 321431.0, 306453.0, 131432.0, 44486.0, 15450.0, 5392.0, 2041.0, 817.0, 437.0, 231.0, 139.0, 91.0, 74.0, 57.0, 27.0, 26.0, 23.0, 9.0, 16.0, 11.0, 6.0, 4.0, 6.0, 5.0, 0.0, 1.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2225341796875, -0.2153453826904297, -0.20815658569335938, -0.20096778869628906, -0.19377899169921875, -0.18659019470214844, -0.17940139770507812, -0.1722126007080078, -0.1650238037109375, -0.1578350067138672, -0.15064620971679688, -0.14345741271972656, -0.13626861572265625, -0.12907981872558594, -0.12189102172851562, -0.11470222473144531, -0.107513427734375, -0.10032463073730469, -0.09313583374023438, -0.08594703674316406, -0.07875823974609375, -0.07156944274902344, -0.06438064575195312, -0.05719184875488281, -0.0500030517578125, -0.04281425476074219, -0.035625457763671875, -0.028436660766601562, -0.02124786376953125, -0.014059066772460938, -0.006870269775390625, 0.0003185272216796875, 0.00750732421875, 0.014696121215820312, 0.021884918212890625, 0.029073715209960938, 0.03626251220703125, 0.04345130920410156, 0.050640106201171875, 0.05782890319824219, 0.0650177001953125, 0.07220649719238281, 0.07939529418945312, 0.08658409118652344, 0.09377288818359375, 0.10096168518066406, 0.10815048217773438, 0.11533927917480469, 0.122528076171875, 0.1297168731689453, 0.13690567016601562, 0.14409446716308594, 0.15128326416015625, 0.15847206115722656, 0.16566085815429688, 0.1728496551513672, 0.1800384521484375, 0.1872272491455078, 0.19441604614257812, 0.20160484313964844, 0.20879364013671875, 0.21598243713378906, 0.22317123413085938, 0.2303600311279297, 0.237548828125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 6.0, 4.0, 4.0, 2.0, 6.0, 9.0, 15.0, 11.0, 13.0, 9.0, 26.0, 30.0, 18.0, 31.0, 40.0, 43.0, 42.0, 42.0, 42.0, 49.0, 39.0, 57.0, 43.0, 48.0, 35.0, 32.0, 35.0, 42.0, 36.0, 35.0, 22.0, 20.0, 21.0, 22.0, 15.0, 14.0, 7.0, 7.0, 8.0, 4.0, 7.0, 6.0, 5.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2237548828125, -0.2169017791748047, -0.21004867553710938, -0.20319557189941406, -0.19634246826171875, -0.18948936462402344, -0.18263626098632812, -0.1757831573486328, -0.1689300537109375, -0.1620769500732422, -0.15522384643554688, -0.14837074279785156, -0.14151763916015625, -0.13466453552246094, -0.12781143188476562, -0.12095832824707031, -0.114105224609375, -0.10725212097167969, -0.10039901733398438, -0.09354591369628906, -0.08669281005859375, -0.07983970642089844, -0.07298660278320312, -0.06613349914550781, -0.0592803955078125, -0.05242729187011719, -0.045574188232421875, -0.03872108459472656, -0.03186798095703125, -0.025014877319335938, -0.018161773681640625, -0.011308670043945312, -0.00445556640625, 0.0023975372314453125, 0.009250640869140625, 0.016103744506835938, 0.02295684814453125, 0.029809951782226562, 0.036663055419921875, 0.04351615905761719, 0.0503692626953125, 0.05722236633300781, 0.06407546997070312, 0.07092857360839844, 0.07778167724609375, 0.08463478088378906, 0.09148788452148438, 0.09834098815917969, 0.105194091796875, 0.11204719543457031, 0.11890029907226562, 0.12575340270996094, 0.13260650634765625, 0.13945960998535156, 0.14631271362304688, 0.1531658172607422, 0.1600189208984375, 0.1668720245361328, 0.17372512817382812, 0.18057823181152344, 0.18743133544921875, 0.19428443908691406, 0.20113754272460938, 0.2079906463623047, 0.21484375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 11.0, 12.0, 16.0, 22.0, 18.0, 41.0, 55.0, 82.0, 152.0, 225.0, 336.0, 584.0, 966.0, 1640.0, 2766.0, 4922.0, 8620.0, 15878.0, 29766.0, 57751.0, 110219.0, 181286.0, 220350.0, 180042.0, 109183.0, 57778.0, 29659.0, 15729.0, 8565.0, 4902.0, 2717.0, 1682.0, 1023.0, 591.0, 356.0, 219.0, 128.0, 92.0, 61.0, 37.0, 29.0, 12.0, 11.0, 12.0, 7.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.06475830078125, -0.06270217895507812, -0.06064605712890625, -0.058589935302734375, -0.0565338134765625, -0.054477691650390625, -0.05242156982421875, -0.050365447998046875, -0.048309326171875, -0.046253204345703125, -0.04419708251953125, -0.042140960693359375, -0.0400848388671875, -0.038028717041015625, -0.03597259521484375, -0.033916473388671875, -0.0318603515625, -0.029804229736328125, -0.02774810791015625, -0.025691986083984375, -0.0236358642578125, -0.021579742431640625, -0.01952362060546875, -0.017467498779296875, -0.015411376953125, -0.013355255126953125, -0.01129913330078125, -0.009243011474609375, -0.0071868896484375, -0.005130767822265625, -0.00307464599609375, -0.001018524169921875, 0.00103759765625, 0.003093719482421875, 0.00514984130859375, 0.007205963134765625, 0.0092620849609375, 0.011318206787109375, 0.01337432861328125, 0.015430450439453125, 0.017486572265625, 0.019542694091796875, 0.02159881591796875, 0.023654937744140625, 0.0257110595703125, 0.027767181396484375, 0.02982330322265625, 0.031879425048828125, 0.033935546875, 0.035991668701171875, 0.03804779052734375, 0.040103912353515625, 0.0421600341796875, 0.044216156005859375, 0.04627227783203125, 0.048328399658203125, 0.050384521484375, 0.052440643310546875, 0.05449676513671875, 0.056552886962890625, 0.0586090087890625, 0.060665130615234375, 0.06272125244140625, 0.06477737426757812, 0.06683349609375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 5.0, 7.0, 6.0, 8.0, 7.0, 13.0, 17.0, 13.0, 21.0, 32.0, 43.0, 38.0, 66.0, 52.0, 68.0, 76.0, 69.0, 77.0, 52.0, 62.0, 51.0, 22.0, 35.0, 33.0, 19.0, 18.0, 11.0, 17.0, 19.0, 6.0, 5.0, 8.0, 2.0, 2.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.6450881958007812e-05, -1.5895813703536987e-05, -1.5340745449066162e-05, -1.4785677194595337e-05, -1.4230608940124512e-05, -1.3675540685653687e-05, -1.3120472431182861e-05, -1.2565404176712036e-05, -1.2010335922241211e-05, -1.1455267667770386e-05, -1.090019941329956e-05, -1.0345131158828735e-05, -9.79006290435791e-06, -9.234994649887085e-06, -8.67992639541626e-06, -8.124858140945435e-06, -7.569789886474609e-06, -7.014721632003784e-06, -6.459653377532959e-06, -5.904585123062134e-06, -5.349516868591309e-06, -4.794448614120483e-06, -4.239380359649658e-06, -3.684312105178833e-06, -3.129243850708008e-06, -2.5741755962371826e-06, -2.0191073417663574e-06, -1.4640390872955322e-06, -9.08970832824707e-07, -3.5390257835388184e-07, 2.0116567611694336e-07, 7.562339305877686e-07, 1.3113021850585938e-06, 1.866370439529419e-06, 2.421438694000244e-06, 2.9765069484710693e-06, 3.5315752029418945e-06, 4.08664345741272e-06, 4.641711711883545e-06, 5.19677996635437e-06, 5.751848220825195e-06, 6.3069164752960205e-06, 6.861984729766846e-06, 7.417052984237671e-06, 7.972121238708496e-06, 8.527189493179321e-06, 9.082257747650146e-06, 9.637326002120972e-06, 1.0192394256591797e-05, 1.0747462511062622e-05, 1.1302530765533447e-05, 1.1857599020004272e-05, 1.2412667274475098e-05, 1.2967735528945923e-05, 1.3522803783416748e-05, 1.4077872037887573e-05, 1.4632940292358398e-05, 1.5188008546829224e-05, 1.574307680130005e-05, 1.6298145055770874e-05, 1.68532133102417e-05, 1.7408281564712524e-05, 1.796334981918335e-05, 1.8518418073654175e-05, 1.9073486328125e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 12.0, 12.0, 13.0, 17.0, 25.0, 50.0, 56.0, 52.0, 115.0, 186.0, 283.0, 491.0, 901.0, 1754.0, 3695.0, 7937.0, 18059.0, 43130.0, 103376.0, 210405.0, 275732.0, 206613.0, 101226.0, 41547.0, 17342.0, 7796.0, 3667.0, 1863.0, 929.0, 488.0, 274.0, 177.0, 110.0, 56.0, 45.0, 35.0, 31.0, 10.0, 16.0, 7.0, 13.0, 4.0, 2.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.08258056640625, -0.0801858901977539, -0.07779121398925781, -0.07539653778076172, -0.07300186157226562, -0.07060718536376953, -0.06821250915527344, -0.06581783294677734, -0.06342315673828125, -0.061028480529785156, -0.05863380432128906, -0.05623912811279297, -0.053844451904296875, -0.05144977569580078, -0.04905509948730469, -0.046660423278808594, -0.0442657470703125, -0.041871070861816406, -0.03947639465332031, -0.03708171844482422, -0.034687042236328125, -0.03229236602783203, -0.029897689819335938, -0.027503013610839844, -0.02510833740234375, -0.022713661193847656, -0.020318984985351562, -0.01792430877685547, -0.015529632568359375, -0.013134956359863281, -0.010740280151367188, -0.008345603942871094, -0.005950927734375, -0.0035562515258789062, -0.0011615753173828125, 0.0012331008911132812, 0.003627777099609375, 0.006022453308105469, 0.008417129516601562, 0.010811805725097656, 0.01320648193359375, 0.015601158142089844, 0.017995834350585938, 0.02039051055908203, 0.022785186767578125, 0.02517986297607422, 0.027574539184570312, 0.029969215393066406, 0.0323638916015625, 0.034758567810058594, 0.03715324401855469, 0.03954792022705078, 0.041942596435546875, 0.04433727264404297, 0.04673194885253906, 0.049126625061035156, 0.05152130126953125, 0.053915977478027344, 0.05631065368652344, 0.05870532989501953, 0.061100006103515625, 0.06349468231201172, 0.06588935852050781, 0.0682840347290039, 0.0706787109375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 7.0, 2.0, 2.0, 5.0, 5.0, 7.0, 7.0, 8.0, 10.0, 13.0, 10.0, 16.0, 17.0, 16.0, 23.0, 27.0, 34.0, 38.0, 37.0, 59.0, 51.0, 59.0, 50.0, 65.0, 52.0, 50.0, 53.0, 42.0, 41.0, 32.0, 32.0, 25.0, 17.0, 17.0, 12.0, 15.0, 10.0, 14.0, 2.0, 9.0, 2.0, 2.0, 6.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.06512451171875, -0.0632014274597168, -0.061278343200683594, -0.05935525894165039, -0.05743217468261719, -0.055509090423583984, -0.05358600616455078, -0.05166292190551758, -0.049739837646484375, -0.04781675338745117, -0.04589366912841797, -0.043970584869384766, -0.04204750061035156, -0.04012441635131836, -0.038201332092285156, -0.03627824783325195, -0.03435516357421875, -0.03243207931518555, -0.030508995056152344, -0.02858591079711914, -0.026662826538085938, -0.024739742279052734, -0.02281665802001953, -0.020893573760986328, -0.018970489501953125, -0.017047405242919922, -0.015124320983886719, -0.013201236724853516, -0.011278152465820312, -0.00935506820678711, -0.007431983947753906, -0.005508899688720703, -0.0035858154296875, -0.0016627311706542969, 0.00026035308837890625, 0.0021834373474121094, 0.0041065216064453125, 0.006029605865478516, 0.007952690124511719, 0.009875774383544922, 0.011798858642578125, 0.013721942901611328, 0.01564502716064453, 0.017568111419677734, 0.019491195678710938, 0.02141427993774414, 0.023337364196777344, 0.025260448455810547, 0.02718353271484375, 0.029106616973876953, 0.031029701232910156, 0.03295278549194336, 0.03487586975097656, 0.036798954010009766, 0.03872203826904297, 0.04064512252807617, 0.042568206787109375, 0.04449129104614258, 0.04641437530517578, 0.048337459564208984, 0.05026054382324219, 0.05218362808227539, 0.054106712341308594, 0.0560297966003418, 0.057952880859375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [2.0, 5.0, 28.0, 70.0, 145.0, 224.0, 229.0, 182.0, 88.0, 29.0, 11.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3603176176548004, -0.30144357681274414, -0.24256952106952667, -0.1836954653263092, -0.12482142448425293, -0.06594738364219666, -0.007073312997817993, 0.05180072784423828, 0.11067476868629456, 0.16954880952835083, 0.2284228652715683, 0.28729692101478577, 0.34617096185684204, 0.4050450026988983, 0.463919073343277, 0.5227931141853333, 0.5816671848297119, 0.6405412554740906, 0.6994152665138245, 0.7582893371582031, 0.817163348197937, 0.8760374188423157, 0.9349114894866943, 0.9937855005264282, 1.052659511566162, 1.111533522605896, 1.1704076528549194, 1.2292816638946533, 1.2881556749343872, 1.347029685974121, 1.4059038162231445, 1.4647778272628784, 1.5236518383026123, 1.5825258493423462, 1.6413999795913696, 1.7002739906311035, 1.7591480016708374, 1.8180220127105713, 1.8768961429595947, 1.9357701539993286, 1.9946441650390625, 2.053518295288086, 2.1123921871185303, 2.1712663173675537, 2.230140447616577, 2.2890143394470215, 2.347888469696045, 2.4067625999450684, 2.465636730194092, 2.5245108604431152, 2.5833847522735596, 2.642258882522583, 2.7011330127716064, 2.760006904602051, 2.818881034851074, 2.8777551651000977, 2.936629056930542, 2.9955031871795654, 3.0543770790100098, 3.113251209259033, 3.1721253395080566, 3.230999231338501, 3.2898733615875244, 3.348747491836548, 3.407621383666992]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 5.0, 4.0, 10.0, 15.0, 13.0, 13.0, 27.0, 19.0, 24.0, 22.0, 26.0, 39.0, 50.0, 46.0, 57.0, 44.0, 49.0, 46.0, 50.0, 46.0, 34.0, 64.0, 27.0, 50.0, 26.0, 32.0, 33.0, 28.0, 19.0, 21.0, 14.0, 16.0, 11.0, 2.0, 4.0, 8.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.8131624460220337, -0.7897802591323853, -0.7663980722427368, -0.7430158853530884, -0.7196336984634399, -0.6962515115737915, -0.6728693246841431, -0.6494871377944946, -0.6261049509048462, -0.6027227640151978, -0.5793405771255493, -0.5559583902359009, -0.5325762033462524, -0.509194016456604, -0.48581185936927795, -0.4624296724796295, -0.43904751539230347, -0.41566532850265503, -0.3922831416130066, -0.36890095472335815, -0.3455187678337097, -0.3221365809440613, -0.29875442385673523, -0.2753722369670868, -0.25199005007743835, -0.22860786318778992, -0.20522567629814148, -0.18184350430965424, -0.1584613174200058, -0.13507913053035736, -0.11169695854187012, -0.08831477165222168, -0.06493264436721802, -0.04155046120285988, -0.01816827803850174, 0.005213901400566101, 0.02859608829021454, 0.051978275179862976, 0.07536044716835022, 0.09874263405799866, 0.1221248209476471, 0.14550700783729553, 0.16888919472694397, 0.1922713667154312, 0.21565355360507965, 0.2390357404947281, 0.26241791248321533, 0.28580009937286377, 0.3091822862625122, 0.33256447315216064, 0.3559466600418091, 0.3793288469314575, 0.40271103382110596, 0.4260932207107544, 0.44947537779808044, 0.4728575646877289, 0.4962397515773773, 0.5196219086647034, 0.5430040955543518, 0.5663862824440002, 0.5897684693336487, 0.6131506562232971, 0.6365328431129456, 0.659915030002594, 0.6832972168922424]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 4.0, 6.0, 10.0, 20.0, 28.0, 49.0, 71.0, 96.0, 184.0, 312.0, 687.0, 1847.0, 5915.0, 24542.0, 155312.0, 1406061.0, 2199637.0, 341593.0, 44255.0, 9128.0, 2580.0, 953.0, 428.0, 223.0, 131.0, 85.0, 39.0, 20.0, 20.0, 17.0, 9.0, 9.0, 6.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1531982421875, -0.14812088012695312, -0.14304351806640625, -0.13796615600585938, -0.1328887939453125, -0.12781143188476562, -0.12273406982421875, -0.11765670776367188, -0.112579345703125, -0.10750198364257812, -0.10242462158203125, -0.09734725952148438, -0.0922698974609375, -0.08719253540039062, -0.08211517333984375, -0.07703781127929688, -0.07196044921875, -0.06688308715820312, -0.06180572509765625, -0.056728363037109375, -0.0516510009765625, -0.046573638916015625, -0.04149627685546875, -0.036418914794921875, -0.031341552734375, -0.026264190673828125, -0.02118682861328125, -0.016109466552734375, -0.0110321044921875, -0.005954742431640625, -0.00087738037109375, 0.004199981689453125, 0.00927734375, 0.014354705810546875, 0.01943206787109375, 0.024509429931640625, 0.0295867919921875, 0.034664154052734375, 0.03974151611328125, 0.044818878173828125, 0.049896240234375, 0.054973602294921875, 0.06005096435546875, 0.06512832641601562, 0.0702056884765625, 0.07528305053710938, 0.08036041259765625, 0.08543777465820312, 0.09051513671875, 0.09559249877929688, 0.10066986083984375, 0.10574722290039062, 0.1108245849609375, 0.11590194702148438, 0.12097930908203125, 0.12605667114257812, 0.131134033203125, 0.13621139526367188, 0.14128875732421875, 0.14636611938476562, 0.1514434814453125, 0.15652084350585938, 0.16159820556640625, 0.16667556762695312, 0.1717529296875]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 5.0, 3.0, 12.0, 19.0, 22.0, 51.0, 63.0, 58.0, 77.0, 82.0, 80.0, 96.0, 94.0, 80.0, 89.0, 43.0, 57.0, 35.0, 20.0, 11.0, 8.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1522216796875, -0.14681053161621094, -0.14139938354492188, -0.1359882354736328, -0.13057708740234375, -0.1251659393310547, -0.11975479125976562, -0.11434364318847656, -0.1089324951171875, -0.10352134704589844, -0.09811019897460938, -0.09269905090332031, -0.08728790283203125, -0.08187675476074219, -0.07646560668945312, -0.07105445861816406, -0.065643310546875, -0.06023216247558594, -0.054821014404296875, -0.04940986633300781, -0.04399871826171875, -0.03858757019042969, -0.033176422119140625, -0.027765274047851562, -0.0223541259765625, -0.016942977905273438, -0.011531829833984375, -0.0061206817626953125, -0.00070953369140625, 0.0047016143798828125, 0.010112762451171875, 0.015523910522460938, 0.02093505859375, 0.026346206665039062, 0.031757354736328125, 0.03716850280761719, 0.04257965087890625, 0.04799079895019531, 0.053401947021484375, 0.05881309509277344, 0.0642242431640625, 0.06963539123535156, 0.07504653930664062, 0.08045768737792969, 0.08586883544921875, 0.09127998352050781, 0.09669113159179688, 0.10210227966308594, 0.107513427734375, 0.11292457580566406, 0.11833572387695312, 0.12374687194824219, 0.12915802001953125, 0.1345691680908203, 0.13998031616210938, 0.14539146423339844, 0.1508026123046875, 0.15621376037597656, 0.16162490844726562, 0.1670360565185547, 0.17244720458984375, 0.1778583526611328, 0.18326950073242188, 0.18868064880371094, 0.194091796875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 5.0, 4.0, 10.0, 15.0, 23.0, 31.0, 37.0, 61.0, 87.0, 152.0, 242.0, 500.0, 1352.0, 5408.0, 35816.0, 366231.0, 2533872.0, 1130092.0, 103879.0, 12512.0, 2365.0, 774.0, 349.0, 174.0, 103.0, 58.0, 45.0, 24.0, 22.0, 8.0, 9.0, 9.0, 6.0, 4.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.193115234375, -0.18615341186523438, -0.17919158935546875, -0.17222976684570312, -0.1652679443359375, -0.15830612182617188, -0.15134429931640625, -0.14438247680664062, -0.137420654296875, -0.13045883178710938, -0.12349700927734375, -0.11653518676757812, -0.1095733642578125, -0.10261154174804688, -0.09564971923828125, -0.08868789672851562, -0.08172607421875, -0.07476425170898438, -0.06780242919921875, -0.060840606689453125, -0.0538787841796875, -0.046916961669921875, -0.03995513916015625, -0.032993316650390625, -0.026031494140625, -0.019069671630859375, -0.01210784912109375, -0.005146026611328125, 0.0018157958984375, 0.008777618408203125, 0.01573944091796875, 0.022701263427734375, 0.0296630859375, 0.036624908447265625, 0.04358673095703125, 0.050548553466796875, 0.0575103759765625, 0.06447219848632812, 0.07143402099609375, 0.07839584350585938, 0.085357666015625, 0.09231948852539062, 0.09928131103515625, 0.10624313354492188, 0.1132049560546875, 0.12016677856445312, 0.12712860107421875, 0.13409042358398438, 0.14105224609375, 0.14801406860351562, 0.15497589111328125, 0.16193771362304688, 0.1688995361328125, 0.17586135864257812, 0.18282318115234375, 0.18978500366210938, 0.196746826171875, 0.20370864868164062, 0.21067047119140625, 0.21763229370117188, 0.2245941162109375, 0.23155593872070312, 0.23851776123046875, 0.24547958374023438, 0.25244140625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 4.0, 3.0, 3.0, 2.0, 10.0, 9.0, 9.0, 22.0, 19.0, 31.0, 25.0, 29.0, 61.0, 74.0, 91.0, 123.0, 151.0, 182.0, 230.0, 262.0, 306.0, 352.0, 350.0, 318.0, 274.0, 235.0, 196.0, 159.0, 122.0, 89.0, 84.0, 69.0, 35.0, 38.0, 26.0, 23.0, 12.0, 11.0, 11.0, 6.0, 7.0, 7.0, 2.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.11126708984375, -0.10807418823242188, -0.10488128662109375, -0.10168838500976562, -0.0984954833984375, -0.09530258178710938, -0.09210968017578125, -0.08891677856445312, -0.085723876953125, -0.08253097534179688, -0.07933807373046875, -0.07614517211914062, -0.0729522705078125, -0.06975936889648438, -0.06656646728515625, -0.06337356567382812, -0.0601806640625, -0.056987762451171875, -0.05379486083984375, -0.050601959228515625, -0.0474090576171875, -0.044216156005859375, -0.04102325439453125, -0.037830352783203125, -0.034637451171875, -0.031444549560546875, -0.02825164794921875, -0.025058746337890625, -0.0218658447265625, -0.018672943115234375, -0.01548004150390625, -0.012287139892578125, -0.00909423828125, -0.005901336669921875, -0.00270843505859375, 0.000484466552734375, 0.0036773681640625, 0.006870269775390625, 0.01006317138671875, 0.013256072998046875, 0.016448974609375, 0.019641876220703125, 0.02283477783203125, 0.026027679443359375, 0.0292205810546875, 0.032413482666015625, 0.03560638427734375, 0.038799285888671875, 0.0419921875, 0.045185089111328125, 0.04837799072265625, 0.051570892333984375, 0.0547637939453125, 0.057956695556640625, 0.06114959716796875, 0.06434249877929688, 0.067535400390625, 0.07072830200195312, 0.07392120361328125, 0.07711410522460938, 0.0803070068359375, 0.08349990844726562, 0.08669281005859375, 0.08988571166992188, 0.09307861328125]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 8.0, 50.0, 111.0, 199.0, 262.0, 216.0, 117.0, 34.0, 12.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6143922805786133, -0.5652784109115601, -0.5161645412445068, -0.4670507311820984, -0.41793686151504517, -0.36882299184799194, -0.3197091519832611, -0.2705953121185303, -0.22148144245147705, -0.17236758768558502, -0.123253732919693, -0.07413987815380096, -0.025026023387908936, 0.024087831377983093, 0.07320168614387512, 0.12231552600860596, 0.17142939567565918, 0.2205432504415512, 0.26965710520744324, 0.3187709450721741, 0.3678848147392273, 0.4169986844062805, 0.46611252427101135, 0.5152263641357422, 0.5643402338027954, 0.6134541034698486, 0.6625679731369019, 0.7116817831993103, 0.7607956528663635, 0.8099095225334167, 0.8590233325958252, 0.9081372022628784, 0.9572510719299316, 1.0063649415969849, 1.055478811264038, 1.1045926809310913, 1.1537065505981445, 1.2028203010559082, 1.2519341707229614, 1.3010480403900146, 1.3501619100570679, 1.399275779724121, 1.4483896493911743, 1.4975035190582275, 1.5466172695159912, 1.5957311391830444, 1.6448450088500977, 1.6939588785171509, 1.743072748184204, 1.7921866178512573, 1.8413004875183105, 1.8904143571853638, 1.939528226852417, 1.9886419773101807, 2.0377559661865234, 2.086869716644287, 2.135983467102051, 2.1850972175598145, 2.2342112064361572, 2.283324956893921, 2.3324389457702637, 2.3815526962280273, 2.43066668510437, 2.479780435562134, 2.5288944244384766]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 3.0, 9.0, 6.0, 7.0, 9.0, 11.0, 15.0, 10.0, 18.0, 20.0, 28.0, 36.0, 29.0, 32.0, 27.0, 44.0, 35.0, 44.0, 55.0, 45.0, 43.0, 47.0, 42.0, 36.0, 37.0, 40.0, 43.0, 36.0, 30.0, 21.0, 22.0, 16.0, 11.0, 16.0, 17.0, 12.0, 9.0, 11.0, 7.0, 8.0, 9.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.4745761752128601, -0.461346834897995, -0.4481174647808075, -0.4348881244659424, -0.4216587543487549, -0.40842941403388977, -0.39520007371902466, -0.38197070360183716, -0.36874133348464966, -0.35551199316978455, -0.34228262305259705, -0.32905328273773193, -0.31582391262054443, -0.3025945723056793, -0.2893652319908142, -0.2761358618736267, -0.2629065215587616, -0.2496771663427353, -0.23644781112670898, -0.22321847081184387, -0.20998910069465637, -0.19675976037979126, -0.18353040516376495, -0.17030104994773865, -0.15707169473171234, -0.14384233951568604, -0.13061298429965973, -0.11738363653421402, -0.10415428131818771, -0.09092492610216141, -0.0776955783367157, -0.06446622312068939, -0.051236867904663086, -0.03800751268863678, -0.024778161197900772, -0.011548809707164764, 0.0016805455088615417, 0.014909900724887848, 0.028139248490333557, 0.04136860370635986, 0.05459795892238617, 0.06782731413841248, 0.08105666935443878, 0.09428601711988449, 0.1075153723359108, 0.1207447275519371, 0.1339740753173828, 0.14720343053340912, 0.16043278574943542, 0.17366214096546173, 0.18689149618148804, 0.20012083649635315, 0.21335020661354065, 0.22657954692840576, 0.23980890214443207, 0.2530382573604584, 0.2662675976753235, 0.2794969379901886, 0.2927263081073761, 0.3059556484222412, 0.3191850185394287, 0.3324143588542938, 0.34564369916915894, 0.35887306928634644, 0.37210243940353394]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 8.0, 3.0, 14.0, 18.0, 16.0, 27.0, 44.0, 66.0, 95.0, 167.0, 280.0, 519.0, 892.0, 1862.0, 3909.0, 8866.0, 20559.0, 50161.0, 122034.0, 267447.0, 303823.0, 156084.0, 64075.0, 26631.0, 11239.0, 4882.0, 2197.0, 1174.0, 575.0, 351.0, 197.0, 115.0, 75.0, 47.0, 35.0, 20.0, 24.0, 1.0, 8.0, 6.0, 6.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18994140625, -0.18384170532226562, -0.17774200439453125, -0.17164230346679688, -0.1655426025390625, -0.15944290161132812, -0.15334320068359375, -0.14724349975585938, -0.141143798828125, -0.13504409790039062, -0.12894439697265625, -0.12284469604492188, -0.1167449951171875, -0.11064529418945312, -0.10454559326171875, -0.09844589233398438, -0.09234619140625, -0.08624649047851562, -0.08014678955078125, -0.07404708862304688, -0.0679473876953125, -0.061847686767578125, -0.05574798583984375, -0.049648284912109375, -0.043548583984375, -0.037448883056640625, -0.03134918212890625, -0.025249481201171875, -0.0191497802734375, -0.013050079345703125, -0.00695037841796875, -0.000850677490234375, 0.0052490234375, 0.011348724365234375, 0.01744842529296875, 0.023548126220703125, 0.0296478271484375, 0.035747528076171875, 0.04184722900390625, 0.047946929931640625, 0.054046630859375, 0.060146331787109375, 0.06624603271484375, 0.07234573364257812, 0.0784454345703125, 0.08454513549804688, 0.09064483642578125, 0.09674453735351562, 0.10284423828125, 0.10894393920898438, 0.11504364013671875, 0.12114334106445312, 0.1272430419921875, 0.13334274291992188, 0.13944244384765625, 0.14554214477539062, 0.151641845703125, 0.15774154663085938, 0.16384124755859375, 0.16994094848632812, 0.1760406494140625, 0.18214035034179688, 0.18824005126953125, 0.19433975219726562, 0.200439453125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 10.0, 19.0, 20.0, 40.0, 55.0, 74.0, 79.0, 77.0, 76.0, 96.0, 93.0, 95.0, 66.0, 57.0, 50.0, 43.0, 28.0, 9.0, 7.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1474609375, -0.1422595977783203, -0.13705825805664062, -0.13185691833496094, -0.12665557861328125, -0.12145423889160156, -0.11625289916992188, -0.11105155944824219, -0.1058502197265625, -0.10064888000488281, -0.09544754028320312, -0.09024620056152344, -0.08504486083984375, -0.07984352111816406, -0.07464218139648438, -0.06944084167480469, -0.064239501953125, -0.05903816223144531, -0.053836822509765625, -0.04863548278808594, -0.04343414306640625, -0.03823280334472656, -0.033031463623046875, -0.027830123901367188, -0.0226287841796875, -0.017427444458007812, -0.012226104736328125, -0.0070247650146484375, -0.00182342529296875, 0.0033779144287109375, 0.008579254150390625, 0.013780593872070312, 0.01898193359375, 0.024183273315429688, 0.029384613037109375, 0.03458595275878906, 0.03978729248046875, 0.04498863220214844, 0.050189971923828125, 0.05539131164550781, 0.0605926513671875, 0.06579399108886719, 0.07099533081054688, 0.07619667053222656, 0.08139801025390625, 0.08659934997558594, 0.09180068969726562, 0.09700202941894531, 0.102203369140625, 0.10740470886230469, 0.11260604858398438, 0.11780738830566406, 0.12300872802734375, 0.12821006774902344, 0.13341140747070312, 0.1386127471923828, 0.1438140869140625, 0.1490154266357422, 0.15421676635742188, 0.15941810607910156, 0.16461944580078125, 0.16982078552246094, 0.17502212524414062, 0.1802234649658203, 0.1854248046875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 6.0, 2.0, 3.0, 4.0, 3.0, 8.0, 9.0, 10.0, 17.0, 20.0, 20.0, 27.0, 49.0, 57.0, 64.0, 106.0, 239.0, 564.0, 1532.0, 4449.0, 13498.0, 39601.0, 109859.0, 267224.0, 338600.0, 173267.0, 64991.0, 22601.0, 7444.0, 2568.0, 875.0, 324.0, 152.0, 85.0, 71.0, 42.0, 40.0, 31.0, 15.0, 11.0, 17.0, 12.0, 6.0, 9.0, 8.0, 5.0, 6.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.224609375, -0.21741867065429688, -0.21022796630859375, -0.20303726196289062, -0.1958465576171875, -0.18865585327148438, -0.18146514892578125, -0.17427444458007812, -0.167083740234375, -0.15989303588867188, -0.15270233154296875, -0.14551162719726562, -0.1383209228515625, -0.13113021850585938, -0.12393951416015625, -0.11674880981445312, -0.10955810546875, -0.10236740112304688, -0.09517669677734375, -0.08798599243164062, -0.0807952880859375, -0.07360458374023438, -0.06641387939453125, -0.059223175048828125, -0.052032470703125, -0.044841766357421875, -0.03765106201171875, -0.030460357666015625, -0.0232696533203125, -0.016078948974609375, -0.00888824462890625, -0.001697540283203125, 0.0054931640625, 0.012683868408203125, 0.01987457275390625, 0.027065277099609375, 0.0342559814453125, 0.041446685791015625, 0.04863739013671875, 0.055828094482421875, 0.063018798828125, 0.07020950317382812, 0.07740020751953125, 0.08459091186523438, 0.0917816162109375, 0.09897232055664062, 0.10616302490234375, 0.11335372924804688, 0.12054443359375, 0.12773513793945312, 0.13492584228515625, 0.14211654663085938, 0.1493072509765625, 0.15649795532226562, 0.16368865966796875, 0.17087936401367188, 0.178070068359375, 0.18526077270507812, 0.19245147705078125, 0.19964218139648438, 0.2068328857421875, 0.21402359008789062, 0.22121429443359375, 0.22840499877929688, 0.235595703125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 5.0, 3.0, 2.0, 5.0, 4.0, 6.0, 6.0, 10.0, 6.0, 1.0, 17.0, 8.0, 18.0, 18.0, 26.0, 16.0, 22.0, 32.0, 31.0, 27.0, 34.0, 32.0, 30.0, 39.0, 23.0, 48.0, 46.0, 35.0, 39.0, 40.0, 32.0, 32.0, 42.0, 34.0, 32.0, 22.0, 17.0, 22.0, 19.0, 19.0, 20.0, 14.0, 19.0, 11.0, 8.0, 9.0, 4.0, 1.0, 6.0, 4.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0], "bins": [-0.2122802734375, -0.20601654052734375, -0.1997528076171875, -0.19348907470703125, -0.187225341796875, -0.18096160888671875, -0.1746978759765625, -0.16843414306640625, -0.16217041015625, -0.15590667724609375, -0.1496429443359375, -0.14337921142578125, -0.137115478515625, -0.13085174560546875, -0.1245880126953125, -0.11832427978515625, -0.112060546875, -0.10579681396484375, -0.0995330810546875, -0.09326934814453125, -0.087005615234375, -0.08074188232421875, -0.0744781494140625, -0.06821441650390625, -0.06195068359375, -0.05568695068359375, -0.0494232177734375, -0.04315948486328125, -0.036895751953125, -0.03063201904296875, -0.0243682861328125, -0.01810455322265625, -0.0118408203125, -0.00557708740234375, 0.0006866455078125, 0.00695037841796875, 0.013214111328125, 0.01947784423828125, 0.0257415771484375, 0.03200531005859375, 0.03826904296875, 0.04453277587890625, 0.0507965087890625, 0.05706024169921875, 0.063323974609375, 0.06958770751953125, 0.0758514404296875, 0.08211517333984375, 0.08837890625, 0.09464263916015625, 0.1009063720703125, 0.10717010498046875, 0.113433837890625, 0.11969757080078125, 0.1259613037109375, 0.13222503662109375, 0.13848876953125, 0.14475250244140625, 0.1510162353515625, 0.15727996826171875, 0.163543701171875, 0.16980743408203125, 0.1760711669921875, 0.18233489990234375, 0.1885986328125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 6.0, 11.0, 5.0, 16.0, 18.0, 41.0, 40.0, 81.0, 139.0, 185.0, 320.0, 518.0, 792.0, 1372.0, 2267.0, 3917.0, 6541.0, 11445.0, 19525.0, 32881.0, 54395.0, 84397.0, 119233.0, 148313.0, 155876.0, 135337.0, 100666.0, 67205.0, 42403.0, 25102.0, 14622.0, 8685.0, 4937.0, 2847.0, 1718.0, 1037.0, 620.0, 361.0, 235.0, 137.0, 118.0, 62.0, 42.0, 34.0, 17.0, 12.0, 9.0, 6.0, 7.0, 1.0, 5.0, 1.0, 0.0, 1.0, 4.0, 1.0], "bins": [-0.043975830078125, -0.04261159896850586, -0.04124736785888672, -0.03988313674926758, -0.03851890563964844, -0.0371546745300293, -0.035790443420410156, -0.034426212310791016, -0.033061981201171875, -0.031697750091552734, -0.030333518981933594, -0.028969287872314453, -0.027605056762695312, -0.026240825653076172, -0.02487659454345703, -0.02351236343383789, -0.02214813232421875, -0.02078390121459961, -0.01941967010498047, -0.018055438995361328, -0.016691207885742188, -0.015326976776123047, -0.013962745666503906, -0.012598514556884766, -0.011234283447265625, -0.009870052337646484, -0.008505821228027344, -0.007141590118408203, -0.0057773590087890625, -0.004413127899169922, -0.0030488967895507812, -0.0016846656799316406, -0.0003204345703125, 0.0010437965393066406, 0.0024080276489257812, 0.003772258758544922, 0.0051364898681640625, 0.006500720977783203, 0.007864952087402344, 0.009229183197021484, 0.010593414306640625, 0.011957645416259766, 0.013321876525878906, 0.014686107635498047, 0.016050338745117188, 0.017414569854736328, 0.01877880096435547, 0.02014303207397461, 0.02150726318359375, 0.02287149429321289, 0.02423572540283203, 0.025599956512451172, 0.026964187622070312, 0.028328418731689453, 0.029692649841308594, 0.031056880950927734, 0.032421112060546875, 0.033785343170166016, 0.035149574279785156, 0.0365138053894043, 0.03787803649902344, 0.03924226760864258, 0.04060649871826172, 0.04197072982788086, 0.0433349609375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 2.0, 6.0, 3.0, 2.0, 9.0, 8.0, 5.0, 7.0, 11.0, 18.0, 19.0, 35.0, 40.0, 35.0, 34.0, 59.0, 63.0, 69.0, 71.0, 68.0, 73.0, 73.0, 54.0, 55.0, 29.0, 37.0, 23.0, 11.0, 16.0, 18.0, 10.0, 7.0, 8.0, 3.0, 5.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5854835510253906e-05, -1.5280209481716156e-05, -1.4705583453178406e-05, -1.4130957424640656e-05, -1.3556331396102905e-05, -1.2981705367565155e-05, -1.2407079339027405e-05, -1.1832453310489655e-05, -1.1257827281951904e-05, -1.0683201253414154e-05, -1.0108575224876404e-05, -9.533949196338654e-06, -8.959323167800903e-06, -8.384697139263153e-06, -7.810071110725403e-06, -7.235445082187653e-06, -6.660819053649902e-06, -6.086193025112152e-06, -5.511566996574402e-06, -4.936940968036652e-06, -4.362314939498901e-06, -3.787688910961151e-06, -3.213062882423401e-06, -2.6384368538856506e-06, -2.0638108253479004e-06, -1.4891847968101501e-06, -9.145587682723999e-07, -3.3993273973464966e-07, 2.3469328880310059e-07, 8.093193173408508e-07, 1.383945345878601e-06, 1.9585713744163513e-06, 2.5331974029541016e-06, 3.107823431491852e-06, 3.682449460029602e-06, 4.257075488567352e-06, 4.8317015171051025e-06, 5.406327545642853e-06, 5.980953574180603e-06, 6.555579602718353e-06, 7.1302056312561035e-06, 7.704831659793854e-06, 8.279457688331604e-06, 8.854083716869354e-06, 9.428709745407104e-06, 1.0003335773944855e-05, 1.0577961802482605e-05, 1.1152587831020355e-05, 1.1727213859558105e-05, 1.2301839888095856e-05, 1.2876465916633606e-05, 1.3451091945171356e-05, 1.4025717973709106e-05, 1.4600344002246857e-05, 1.5174970030784607e-05, 1.5749596059322357e-05, 1.6324222087860107e-05, 1.6898848116397858e-05, 1.7473474144935608e-05, 1.8048100173473358e-05, 1.862272620201111e-05, 1.919735223054886e-05, 1.977197825908661e-05, 2.034660428762436e-05, 2.092123031616211e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 5.0, 4.0, 4.0, 7.0, 16.0, 22.0, 19.0, 21.0, 43.0, 74.0, 121.0, 212.0, 406.0, 872.0, 1819.0, 4409.0, 9705.0, 22209.0, 48038.0, 96278.0, 166862.0, 220272.0, 204588.0, 136431.0, 73175.0, 34711.0, 15566.0, 6930.0, 3076.0, 1280.0, 646.0, 337.0, 144.0, 84.0, 55.0, 37.0, 21.0, 16.0, 10.0, 12.0, 4.0, 7.0, 8.0, 1.0, 1.0, 3.0, 2.0], "bins": [-0.07025146484375, -0.06844043731689453, -0.06662940979003906, -0.0648183822631836, -0.06300735473632812, -0.061196327209472656, -0.05938529968261719, -0.05757427215576172, -0.05576324462890625, -0.05395221710205078, -0.05214118957519531, -0.050330162048339844, -0.048519134521484375, -0.046708106994628906, -0.04489707946777344, -0.04308605194091797, -0.0412750244140625, -0.03946399688720703, -0.03765296936035156, -0.035841941833496094, -0.034030914306640625, -0.032219886779785156, -0.030408859252929688, -0.02859783172607422, -0.02678680419921875, -0.02497577667236328, -0.023164749145507812, -0.021353721618652344, -0.019542694091796875, -0.017731666564941406, -0.015920639038085938, -0.014109611511230469, -0.012298583984375, -0.010487556457519531, -0.008676528930664062, -0.006865501403808594, -0.005054473876953125, -0.0032434463500976562, -0.0014324188232421875, 0.00037860870361328125, 0.00218963623046875, 0.004000663757324219, 0.0058116912841796875, 0.007622718811035156, 0.009433746337890625, 0.011244773864746094, 0.013055801391601562, 0.014866828918457031, 0.0166778564453125, 0.01848888397216797, 0.020299911499023438, 0.022110939025878906, 0.023921966552734375, 0.025732994079589844, 0.027544021606445312, 0.02935504913330078, 0.03116607666015625, 0.03297710418701172, 0.03478813171386719, 0.036599159240722656, 0.038410186767578125, 0.040221214294433594, 0.04203224182128906, 0.04384326934814453, 0.045654296875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 5.0, 4.0, 2.0, 10.0, 6.0, 6.0, 9.0, 17.0, 9.0, 15.0, 23.0, 26.0, 22.0, 22.0, 32.0, 34.0, 48.0, 40.0, 57.0, 49.0, 46.0, 45.0, 55.0, 40.0, 35.0, 37.0, 42.0, 48.0, 29.0, 35.0, 31.0, 25.0, 18.0, 15.0, 19.0, 11.0, 17.0, 9.0, 5.0, 3.0, 1.0, 2.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.038848876953125, -0.03727006912231445, -0.035691261291503906, -0.03411245346069336, -0.03253364562988281, -0.030954837799072266, -0.02937602996826172, -0.027797222137451172, -0.026218414306640625, -0.024639606475830078, -0.02306079864501953, -0.021481990814208984, -0.019903182983398438, -0.01832437515258789, -0.016745567321777344, -0.015166759490966797, -0.01358795166015625, -0.012009143829345703, -0.010430335998535156, -0.00885152816772461, -0.0072727203369140625, -0.005693912506103516, -0.004115104675292969, -0.002536296844482422, -0.000957489013671875, 0.0006213188171386719, 0.0022001266479492188, 0.0037789344787597656, 0.0053577423095703125, 0.006936550140380859, 0.008515357971191406, 0.010094165802001953, 0.0116729736328125, 0.013251781463623047, 0.014830589294433594, 0.01640939712524414, 0.017988204956054688, 0.019567012786865234, 0.02114582061767578, 0.022724628448486328, 0.024303436279296875, 0.025882244110107422, 0.02746105194091797, 0.029039859771728516, 0.030618667602539062, 0.03219747543334961, 0.033776283264160156, 0.0353550910949707, 0.03693389892578125, 0.0385127067565918, 0.040091514587402344, 0.04167032241821289, 0.04324913024902344, 0.044827938079833984, 0.04640674591064453, 0.04798555374145508, 0.049564361572265625, 0.05114316940307617, 0.05272197723388672, 0.054300785064697266, 0.05587959289550781, 0.05745840072631836, 0.059037208557128906, 0.06061601638793945, 0.06219482421875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 11.0, 35.0, 84.0, 146.0, 240.0, 224.0, 148.0, 78.0, 29.0, 9.0, 4.0, 3.0, 2.0, 2.0, 2.0], "bins": [-3.090036392211914, -3.03291654586792, -2.9757964611053467, -2.9186766147613525, -2.8615565299987793, -2.804436683654785, -2.747316598892212, -2.6901967525482178, -2.6330766677856445, -2.5759568214416504, -2.518836736679077, -2.461716890335083, -2.4045968055725098, -2.3474769592285156, -2.2903568744659424, -2.2332370281219482, -2.176117181777954, -2.11899733543396, -2.0618772506713867, -2.0047574043273926, -1.9476373195648193, -1.8905174732208252, -1.8333975076675415, -1.7762775421142578, -1.7191575765609741, -1.6620376110076904, -1.6049176454544067, -1.547797679901123, -1.490677833557129, -1.4335577487945557, -1.3764379024505615, -1.3193179368972778, -1.2621978521347046, -1.205077886581421, -1.1479579210281372, -1.0908379554748535, -1.0337181091308594, -0.9765980839729309, -0.919478178024292, -0.8623582124710083, -0.8052382469177246, -0.7481182813644409, -0.6909983158111572, -0.6338784098625183, -0.5767584443092346, -0.5196384787559509, -0.4625185430049896, -0.4053986072540283, -0.34827864170074463, -0.29115867614746094, -0.23403874039649963, -0.17691878974437714, -0.11979883909225464, -0.06267887353897095, -0.0055589377880096436, 0.05156099796295166, 0.10868096351623535, 0.16580091416835785, 0.22292086482048035, 0.28004080057144165, 0.33716076612472534, 0.39428073167800903, 0.45140066742897034, 0.5085206031799316, 0.5656405687332153]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 6.0, 10.0, 8.0, 9.0, 8.0, 16.0, 19.0, 17.0, 22.0, 20.0, 27.0, 27.0, 23.0, 31.0, 34.0, 37.0, 34.0, 34.0, 32.0, 35.0, 35.0, 38.0, 38.0, 41.0, 43.0, 25.0, 28.0, 31.0, 37.0, 31.0, 28.0, 21.0, 17.0, 24.0, 19.0, 15.0, 15.0, 8.0, 14.0, 5.0, 6.0, 5.0, 4.0, 4.0, 3.0, 2.0, 5.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0], "bins": [-0.6487107872962952, -0.6286462545394897, -0.6085817217826843, -0.5885172486305237, -0.5684527158737183, -0.5483881831169128, -0.5283236503601074, -0.5082591772079468, -0.48819464445114136, -0.46813011169433594, -0.4480656087398529, -0.4280010759830475, -0.40793657302856445, -0.38787204027175903, -0.3678075075149536, -0.3477430045604706, -0.32767847180366516, -0.30761393904685974, -0.2875494360923767, -0.2674849033355713, -0.24742040038108826, -0.22735586762428284, -0.2072913497686386, -0.18722683191299438, -0.16716231405735016, -0.14709779620170593, -0.1270332783460617, -0.10696875303983688, -0.08690423518419266, -0.06683971732854843, -0.04677519202232361, -0.026710674166679382, -0.006646156311035156, 0.013418363407254219, 0.033482883125543594, 0.05354740470647812, 0.07361192256212234, 0.09367644041776657, 0.1137409657239914, 0.13380548357963562, 0.15387000143527985, 0.17393451929092407, 0.1939990371465683, 0.21406355500221252, 0.23412808775901794, 0.254192590713501, 0.2742571234703064, 0.2943216562271118, 0.31438615918159485, 0.33445069193840027, 0.3545151948928833, 0.3745797276496887, 0.39464423060417175, 0.4147087633609772, 0.4347732663154602, 0.4548377990722656, 0.47490233182907104, 0.49496686458587646, 0.5150313973426819, 0.5350958704948425, 0.555160403251648, 0.5752249360084534, 0.5952894687652588, 0.6153539419174194, 0.6354184746742249]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 6.0, 12.0, 16.0, 30.0, 60.0, 92.0, 187.0, 584.0, 2469.0, 19703.0, 518747.0, 3461816.0, 178267.0, 10066.0, 1550.0, 382.0, 140.0, 75.0, 37.0, 27.0, 13.0, 0.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28466796875, -0.2746315002441406, -0.26459503173828125, -0.2545585632324219, -0.2445220947265625, -0.23448562622070312, -0.22444915771484375, -0.21441268920898438, -0.204376220703125, -0.19433975219726562, -0.18430328369140625, -0.17426681518554688, -0.1642303466796875, -0.15419387817382812, -0.14415740966796875, -0.13412094116210938, -0.12408447265625, -0.11404800415039062, -0.10401153564453125, -0.09397506713867188, -0.0839385986328125, -0.07390213012695312, -0.06386566162109375, -0.053829193115234375, -0.043792724609375, -0.033756256103515625, -0.02371978759765625, -0.013683319091796875, -0.0036468505859375, 0.006389617919921875, 0.01642608642578125, 0.026462554931640625, 0.0364990234375, 0.046535491943359375, 0.05657196044921875, 0.06660842895507812, 0.0766448974609375, 0.08668136596679688, 0.09671783447265625, 0.10675430297851562, 0.116790771484375, 0.12682723999023438, 0.13686370849609375, 0.14690017700195312, 0.1569366455078125, 0.16697311401367188, 0.17700958251953125, 0.18704605102539062, 0.19708251953125, 0.20711898803710938, 0.21715545654296875, 0.22719192504882812, 0.2372283935546875, 0.24726486206054688, 0.25730133056640625, 0.2673377990722656, 0.277374267578125, 0.2874107360839844, 0.29744720458984375, 0.3074836730957031, 0.3175201416015625, 0.3275566101074219, 0.33759307861328125, 0.3476295471191406, 0.357666015625]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 11.0, 11.0, 19.0, 28.0, 44.0, 42.0, 66.0, 88.0, 86.0, 89.0, 76.0, 81.0, 81.0, 69.0, 55.0, 44.0, 43.0, 31.0, 16.0, 11.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1441650390625, -0.1390552520751953, -0.13394546508789062, -0.12883567810058594, -0.12372589111328125, -0.11861610412597656, -0.11350631713867188, -0.10839653015136719, -0.1032867431640625, -0.09817695617675781, -0.09306716918945312, -0.08795738220214844, -0.08284759521484375, -0.07773780822753906, -0.07262802124023438, -0.06751823425292969, -0.062408447265625, -0.05729866027832031, -0.052188873291015625, -0.04707908630371094, -0.04196929931640625, -0.03685951232910156, -0.031749725341796875, -0.026639938354492188, -0.0215301513671875, -0.016420364379882812, -0.011310577392578125, -0.0062007904052734375, -0.00109100341796875, 0.0040187835693359375, 0.009128570556640625, 0.014238357543945312, 0.01934814453125, 0.024457931518554688, 0.029567718505859375, 0.03467750549316406, 0.03978729248046875, 0.04489707946777344, 0.050006866455078125, 0.05511665344238281, 0.0602264404296875, 0.06533622741699219, 0.07044601440429688, 0.07555580139160156, 0.08066558837890625, 0.08577537536621094, 0.09088516235351562, 0.09599494934082031, 0.101104736328125, 0.10621452331542969, 0.11132431030273438, 0.11643409729003906, 0.12154388427734375, 0.12665367126464844, 0.13176345825195312, 0.1368732452392578, 0.1419830322265625, 0.1470928192138672, 0.15220260620117188, 0.15731239318847656, 0.16242218017578125, 0.16753196716308594, 0.17264175415039062, 0.1777515411376953, 0.182861328125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 12.0, 12.0, 23.0, 24.0, 33.0, 49.0, 122.0, 243.0, 483.0, 1776.0, 10681.0, 131133.0, 2181451.0, 1759828.0, 97634.0, 8430.0, 1475.0, 447.0, 170.0, 106.0, 63.0, 37.0, 32.0, 3.0, 4.0, 8.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2034912109375, -0.1946239471435547, -0.18575668334960938, -0.17688941955566406, -0.16802215576171875, -0.15915489196777344, -0.15028762817382812, -0.1414203643798828, -0.1325531005859375, -0.12368583679199219, -0.11481857299804688, -0.10595130920410156, -0.09708404541015625, -0.08821678161621094, -0.07934951782226562, -0.07048225402832031, -0.061614990234375, -0.05274772644042969, -0.043880462646484375, -0.03501319885253906, -0.02614593505859375, -0.017278671264648438, -0.008411407470703125, 0.0004558563232421875, 0.0093231201171875, 0.018190383911132812, 0.027057647705078125, 0.03592491149902344, 0.04479217529296875, 0.05365943908691406, 0.06252670288085938, 0.07139396667480469, 0.08026123046875, 0.08912849426269531, 0.09799575805664062, 0.10686302185058594, 0.11573028564453125, 0.12459754943847656, 0.13346481323242188, 0.1423320770263672, 0.1511993408203125, 0.1600666046142578, 0.16893386840820312, 0.17780113220214844, 0.18666839599609375, 0.19553565979003906, 0.20440292358398438, 0.2132701873779297, 0.222137451171875, 0.2310047149658203, 0.23987197875976562, 0.24873924255371094, 0.25760650634765625, 0.26647377014160156, 0.2753410339355469, 0.2842082977294922, 0.2930755615234375, 0.3019428253173828, 0.3108100891113281, 0.31967735290527344, 0.32854461669921875, 0.33741188049316406, 0.3462791442871094, 0.3551464080810547, 0.364013671875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 9.0, 14.0, 13.0, 24.0, 37.0, 40.0, 62.0, 110.0, 110.0, 191.0, 265.0, 312.0, 411.0, 471.0, 468.0, 392.0, 305.0, 233.0, 198.0, 124.0, 87.0, 69.0, 36.0, 28.0, 20.0, 11.0, 13.0, 9.0, 7.0, 0.0, 4.0, 3.0, 3.0, 1.0, 1.0], "bins": [-0.1884765625, -0.18407344818115234, -0.1796703338623047, -0.17526721954345703, -0.17086410522460938, -0.16646099090576172, -0.16205787658691406, -0.1576547622680664, -0.15325164794921875, -0.1488485336303711, -0.14444541931152344, -0.14004230499267578, -0.13563919067382812, -0.13123607635498047, -0.1268329620361328, -0.12242984771728516, -0.1180267333984375, -0.11362361907958984, -0.10922050476074219, -0.10481739044189453, -0.10041427612304688, -0.09601116180419922, -0.09160804748535156, -0.0872049331665039, -0.08280181884765625, -0.0783987045288086, -0.07399559020996094, -0.06959247589111328, -0.06518936157226562, -0.06078624725341797, -0.05638313293457031, -0.051980018615722656, -0.047576904296875, -0.043173789978027344, -0.03877067565917969, -0.03436756134033203, -0.029964447021484375, -0.02556133270263672, -0.021158218383789062, -0.016755104064941406, -0.01235198974609375, -0.007948875427246094, -0.0035457611083984375, 0.0008573532104492188, 0.005260467529296875, 0.009663581848144531, 0.014066696166992188, 0.018469810485839844, 0.0228729248046875, 0.027276039123535156, 0.03167915344238281, 0.03608226776123047, 0.040485382080078125, 0.04488849639892578, 0.04929161071777344, 0.053694725036621094, 0.05809783935546875, 0.0625009536743164, 0.06690406799316406, 0.07130718231201172, 0.07571029663085938, 0.08011341094970703, 0.08451652526855469, 0.08891963958740234, 0.09332275390625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 11.0, 26.0, 72.0, 104.0, 171.0, 190.0, 182.0, 124.0, 80.0, 28.0, 16.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5648368000984192, -0.5249695777893066, -0.48510241508483887, -0.4452351927757263, -0.40536803007125854, -0.365500807762146, -0.32563361525535583, -0.2857664227485657, -0.2458992302417755, -0.20603203773498535, -0.1661648452281952, -0.12629763782024384, -0.08643044531345367, -0.04656325280666351, -0.006696045398712158, 0.033171147108078, 0.07303833961486816, 0.11290553212165833, 0.1527727246284485, 0.19263993203639984, 0.23250712454319, 0.27237433195114136, 0.3122415244579315, 0.3521087169647217, 0.39197590947151184, 0.431843101978302, 0.47171029448509216, 0.5115774869918823, 0.5514447093009949, 0.5913118720054626, 0.6311790943145752, 0.671046257019043, 0.7109134197235107, 0.7507806420326233, 0.7906478047370911, 0.8305150270462036, 0.8703821897506714, 0.9102494120597839, 0.9501166343688965, 0.9899837970733643, 1.029850959777832, 1.0697181224822998, 1.1095854043960571, 1.149452567100525, 1.1893197298049927, 1.2291868925094604, 1.2690541744232178, 1.3089213371276855, 1.3487884998321533, 1.388655662536621, 1.4285229444503784, 1.4683901071548462, 1.508257269859314, 1.5481244325637817, 1.587991714477539, 1.6278588771820068, 1.6677261590957642, 1.707593321800232, 1.7474606037139893, 1.787327766418457, 1.8271949291229248, 1.8670620918273926, 1.90692937374115, 1.9467965364456177, 1.9866636991500854]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 8.0, 2.0, 5.0, 6.0, 11.0, 11.0, 12.0, 9.0, 16.0, 17.0, 24.0, 24.0, 37.0, 27.0, 39.0, 32.0, 41.0, 43.0, 45.0, 45.0, 43.0, 54.0, 50.0, 33.0, 39.0, 36.0, 46.0, 52.0, 27.0, 39.0, 24.0, 22.0, 18.0, 14.0, 17.0, 11.0, 8.0, 1.0, 6.0, 3.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5098126530647278, -0.4945524334907532, -0.4792921841144562, -0.46403196454048157, -0.44877171516418457, -0.43351149559020996, -0.41825127601623535, -0.40299102663993835, -0.38773080706596375, -0.37247058749198914, -0.35721033811569214, -0.34195011854171753, -0.32668986916542053, -0.3114296495914459, -0.2961694002151489, -0.2809091806411743, -0.2656489610671997, -0.2503887414932251, -0.2351284921169281, -0.2198682725429535, -0.2046080380678177, -0.18934780359268188, -0.17408756911754608, -0.15882733464241028, -0.14356708526611328, -0.12830685079097748, -0.11304662376642227, -0.09778638929128647, -0.08252616226673126, -0.06726592779159546, -0.052005693316459656, -0.03674546629190445, -0.021485239267349243, -0.006225007586181164, 0.009035224094986916, 0.02429545670747757, 0.039555687457323074, 0.05481591820716858, 0.07007615268230438, 0.08533637970685959, 0.10059661418199539, 0.1158568486571312, 0.1311170756816864, 0.1463773101568222, 0.161637544631958, 0.17689776420593262, 0.19215801358222961, 0.20741823315620422, 0.22267846763134003, 0.23793870210647583, 0.25319892168045044, 0.26845917105674744, 0.28371939063072205, 0.29897964000701904, 0.31423985958099365, 0.32950007915496826, 0.34476032853126526, 0.36002054810523987, 0.37528079748153687, 0.3905410170555115, 0.40580126643180847, 0.4210614860057831, 0.4363217353820801, 0.4515819549560547, 0.4668421745300293]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 3.0, 6.0, 8.0, 10.0, 11.0, 24.0, 27.0, 34.0, 58.0, 86.0, 148.0, 247.0, 505.0, 1033.0, 2267.0, 5250.0, 12583.0, 31884.0, 86479.0, 225825.0, 350243.0, 205786.0, 76708.0, 28910.0, 11525.0, 4706.0, 2124.0, 971.0, 453.0, 227.0, 147.0, 93.0, 44.0, 40.0, 27.0, 20.0, 15.0, 9.0, 5.0, 8.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.346435546875, -0.3350563049316406, -0.32367706298828125, -0.3122978210449219, -0.3009185791015625, -0.2895393371582031, -0.27816009521484375, -0.2667808532714844, -0.255401611328125, -0.24402236938476562, -0.23264312744140625, -0.22126388549804688, -0.2098846435546875, -0.19850540161132812, -0.18712615966796875, -0.17574691772460938, -0.16436767578125, -0.15298843383789062, -0.14160919189453125, -0.13022994995117188, -0.1188507080078125, -0.10747146606445312, -0.09609222412109375, -0.08471298217773438, -0.073333740234375, -0.061954498291015625, -0.05057525634765625, -0.039196014404296875, -0.0278167724609375, -0.016437530517578125, -0.00505828857421875, 0.006320953369140625, 0.0177001953125, 0.029079437255859375, 0.04045867919921875, 0.051837921142578125, 0.0632171630859375, 0.07459640502929688, 0.08597564697265625, 0.09735488891601562, 0.108734130859375, 0.12011337280273438, 0.13149261474609375, 0.14287185668945312, 0.1542510986328125, 0.16563034057617188, 0.17700958251953125, 0.18838882446289062, 0.19976806640625, 0.21114730834960938, 0.22252655029296875, 0.23390579223632812, 0.2452850341796875, 0.2566642761230469, 0.26804351806640625, 0.2794227600097656, 0.290802001953125, 0.3021812438964844, 0.31356048583984375, 0.3249397277832031, 0.3363189697265625, 0.3476982116699219, 0.35907745361328125, 0.3704566955566406, 0.3818359375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 7.0, 10.0, 21.0, 16.0, 29.0, 39.0, 49.0, 73.0, 79.0, 91.0, 105.0, 82.0, 79.0, 68.0, 67.0, 55.0, 50.0, 39.0, 18.0, 13.0, 11.0, 1.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1431884765625, -0.1380748748779297, -0.13296127319335938, -0.12784767150878906, -0.12273406982421875, -0.11762046813964844, -0.11250686645507812, -0.10739326477050781, -0.1022796630859375, -0.09716606140136719, -0.09205245971679688, -0.08693885803222656, -0.08182525634765625, -0.07671165466308594, -0.07159805297851562, -0.06648445129394531, -0.061370849609375, -0.05625724792480469, -0.051143646240234375, -0.04603004455566406, -0.04091644287109375, -0.03580284118652344, -0.030689239501953125, -0.025575637817382812, -0.0204620361328125, -0.015348434448242188, -0.010234832763671875, -0.0051212310791015625, -7.62939453125e-06, 0.0051059722900390625, 0.010219573974609375, 0.015333175659179688, 0.02044677734375, 0.025560379028320312, 0.030673980712890625, 0.03578758239746094, 0.04090118408203125, 0.04601478576660156, 0.051128387451171875, 0.05624198913574219, 0.0613555908203125, 0.06646919250488281, 0.07158279418945312, 0.07669639587402344, 0.08180999755859375, 0.08692359924316406, 0.09203720092773438, 0.09715080261230469, 0.102264404296875, 0.10737800598144531, 0.11249160766601562, 0.11760520935058594, 0.12271881103515625, 0.12783241271972656, 0.13294601440429688, 0.1380596160888672, 0.1431732177734375, 0.1482868194580078, 0.15340042114257812, 0.15851402282714844, 0.16362762451171875, 0.16874122619628906, 0.17385482788085938, 0.1789684295654297, 0.18408203125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 2.0, 4.0, 5.0, 9.0, 6.0, 12.0, 16.0, 24.0, 33.0, 45.0, 67.0, 99.0, 154.0, 214.0, 413.0, 697.0, 1274.0, 2464.0, 4977.0, 10409.0, 23488.0, 53877.0, 116563.0, 209419.0, 255326.0, 187861.0, 98982.0, 44750.0, 19577.0, 8752.0, 4179.0, 2117.0, 1117.0, 625.0, 331.0, 226.0, 134.0, 91.0, 53.0, 48.0, 37.0, 19.0, 20.0, 8.0, 10.0, 3.0, 7.0, 7.0, 4.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.2264404296875, -0.21898841857910156, -0.21153640747070312, -0.2040843963623047, -0.19663238525390625, -0.1891803741455078, -0.18172836303710938, -0.17427635192871094, -0.1668243408203125, -0.15937232971191406, -0.15192031860351562, -0.1444683074951172, -0.13701629638671875, -0.1295642852783203, -0.12211227416992188, -0.11466026306152344, -0.107208251953125, -0.09975624084472656, -0.09230422973632812, -0.08485221862792969, -0.07740020751953125, -0.06994819641113281, -0.062496185302734375, -0.05504417419433594, -0.0475921630859375, -0.04014015197753906, -0.032688140869140625, -0.025236129760742188, -0.01778411865234375, -0.010332107543945312, -0.002880096435546875, 0.0045719146728515625, 0.01202392578125, 0.019475936889648438, 0.026927947998046875, 0.03437995910644531, 0.04183197021484375, 0.04928398132324219, 0.056735992431640625, 0.06418800354003906, 0.0716400146484375, 0.07909202575683594, 0.08654403686523438, 0.09399604797363281, 0.10144805908203125, 0.10890007019042969, 0.11635208129882812, 0.12380409240722656, 0.131256103515625, 0.13870811462402344, 0.14616012573242188, 0.1536121368408203, 0.16106414794921875, 0.1685161590576172, 0.17596817016601562, 0.18342018127441406, 0.1908721923828125, 0.19832420349121094, 0.20577621459960938, 0.2132282257080078, 0.22068023681640625, 0.2281322479248047, 0.23558425903320312, 0.24303627014160156, 0.25048828125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 10.0, 7.0, 4.0, 8.0, 6.0, 15.0, 10.0, 31.0, 23.0, 24.0, 25.0, 29.0, 28.0, 43.0, 40.0, 32.0, 48.0, 43.0, 44.0, 39.0, 38.0, 44.0, 38.0, 49.0, 35.0, 24.0, 33.0, 36.0, 26.0, 19.0, 29.0, 28.0, 19.0, 9.0, 15.0, 12.0, 7.0, 9.0, 7.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.251708984375, -0.24383163452148438, -0.23595428466796875, -0.22807693481445312, -0.2201995849609375, -0.21232223510742188, -0.20444488525390625, -0.19656753540039062, -0.188690185546875, -0.18081283569335938, -0.17293548583984375, -0.16505813598632812, -0.1571807861328125, -0.14930343627929688, -0.14142608642578125, -0.13354873657226562, -0.12567138671875, -0.11779403686523438, -0.10991668701171875, -0.10203933715820312, -0.0941619873046875, -0.08628463745117188, -0.07840728759765625, -0.07052993774414062, -0.062652587890625, -0.054775238037109375, -0.04689788818359375, -0.039020538330078125, -0.0311431884765625, -0.023265838623046875, -0.01538848876953125, -0.007511138916015625, 0.0003662109375, 0.008243560791015625, 0.01612091064453125, 0.023998260498046875, 0.0318756103515625, 0.039752960205078125, 0.04763031005859375, 0.055507659912109375, 0.063385009765625, 0.07126235961914062, 0.07913970947265625, 0.08701705932617188, 0.0948944091796875, 0.10277175903320312, 0.11064910888671875, 0.11852645874023438, 0.12640380859375, 0.13428115844726562, 0.14215850830078125, 0.15003585815429688, 0.1579132080078125, 0.16579055786132812, 0.17366790771484375, 0.18154525756835938, 0.189422607421875, 0.19729995727539062, 0.20517730712890625, 0.21305465698242188, 0.2209320068359375, 0.22880935668945312, 0.23668670654296875, 0.24456405639648438, 0.25244140625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 6.0, 14.0, 16.0, 13.0, 43.0, 55.0, 68.0, 104.0, 141.0, 225.0, 338.0, 553.0, 734.0, 1286.0, 2007.0, 2930.0, 4674.0, 7538.0, 12259.0, 20241.0, 35323.0, 63822.0, 114401.0, 183029.0, 211416.0, 162658.0, 96726.0, 52763.0, 29335.0, 17391.0, 10444.0, 6420.0, 4049.0, 2612.0, 1683.0, 1091.0, 730.0, 466.0, 274.0, 209.0, 141.0, 103.0, 74.0, 41.0, 30.0, 23.0, 22.0, 13.0, 10.0, 5.0, 6.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.08770751953125, -0.08490943908691406, -0.08211135864257812, -0.07931327819824219, -0.07651519775390625, -0.07371711730957031, -0.07091903686523438, -0.06812095642089844, -0.0653228759765625, -0.06252479553222656, -0.059726715087890625, -0.05692863464355469, -0.05413055419921875, -0.05133247375488281, -0.048534393310546875, -0.04573631286621094, -0.042938232421875, -0.04014015197753906, -0.037342071533203125, -0.03454399108886719, -0.03174591064453125, -0.028947830200195312, -0.026149749755859375, -0.023351669311523438, -0.0205535888671875, -0.017755508422851562, -0.014957427978515625, -0.012159347534179688, -0.00936126708984375, -0.0065631866455078125, -0.003765106201171875, -0.0009670257568359375, 0.0018310546875, 0.0046291351318359375, 0.007427215576171875, 0.010225296020507812, 0.01302337646484375, 0.015821456909179688, 0.018619537353515625, 0.021417617797851562, 0.0242156982421875, 0.027013778686523438, 0.029811859130859375, 0.03260993957519531, 0.03540802001953125, 0.03820610046386719, 0.041004180908203125, 0.04380226135253906, 0.046600341796875, 0.04939842224121094, 0.052196502685546875, 0.05499458312988281, 0.05779266357421875, 0.06059074401855469, 0.06338882446289062, 0.06618690490722656, 0.0689849853515625, 0.07178306579589844, 0.07458114624023438, 0.07737922668457031, 0.08017730712890625, 0.08297538757324219, 0.08577346801757812, 0.08857154846191406, 0.09136962890625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 5.0, 9.0, 6.0, 12.0, 12.0, 25.0, 23.0, 29.0, 40.0, 37.0, 52.0, 45.0, 69.0, 69.0, 81.0, 69.0, 64.0, 68.0, 45.0, 41.0, 41.0, 26.0, 28.0, 17.0, 17.0, 18.0, 7.0, 7.0, 11.0, 11.0, 4.0, 4.0, 4.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.872943878173828e-05, -2.775713801383972e-05, -2.6784837245941162e-05, -2.5812536478042603e-05, -2.4840235710144043e-05, -2.3867934942245483e-05, -2.2895634174346924e-05, -2.1923333406448364e-05, -2.0951032638549805e-05, -1.9978731870651245e-05, -1.9006431102752686e-05, -1.8034130334854126e-05, -1.7061829566955566e-05, -1.6089528799057007e-05, -1.5117228031158447e-05, -1.4144927263259888e-05, -1.3172626495361328e-05, -1.2200325727462769e-05, -1.1228024959564209e-05, -1.025572419166565e-05, -9.28342342376709e-06, -8.31112265586853e-06, -7.338821887969971e-06, -6.366521120071411e-06, -5.3942203521728516e-06, -4.421919584274292e-06, -3.4496188163757324e-06, -2.477318048477173e-06, -1.5050172805786133e-06, -5.327165126800537e-07, 4.3958425521850586e-07, 1.4118850231170654e-06, 2.384185791015625e-06, 3.3564865589141846e-06, 4.328787326812744e-06, 5.301088094711304e-06, 6.273388862609863e-06, 7.245689630508423e-06, 8.217990398406982e-06, 9.190291166305542e-06, 1.0162591934204102e-05, 1.1134892702102661e-05, 1.210719347000122e-05, 1.307949423789978e-05, 1.405179500579834e-05, 1.50240957736969e-05, 1.599639654159546e-05, 1.696869730949402e-05, 1.7940998077392578e-05, 1.8913298845291138e-05, 1.9885599613189697e-05, 2.0857900381088257e-05, 2.1830201148986816e-05, 2.2802501916885376e-05, 2.3774802684783936e-05, 2.4747103452682495e-05, 2.5719404220581055e-05, 2.6691704988479614e-05, 2.7664005756378174e-05, 2.8636306524276733e-05, 2.9608607292175293e-05, 3.058090806007385e-05, 3.155320882797241e-05, 3.252550959587097e-05, 3.349781036376953e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 9.0, 11.0, 14.0, 24.0, 28.0, 38.0, 70.0, 101.0, 142.0, 218.0, 349.0, 535.0, 1088.0, 1934.0, 3847.0, 7825.0, 17578.0, 42134.0, 119450.0, 304379.0, 325938.0, 137749.0, 47804.0, 19487.0, 8830.0, 3991.0, 2115.0, 1170.0, 635.0, 367.0, 235.0, 134.0, 113.0, 75.0, 42.0, 24.0, 18.0, 9.0, 19.0, 5.0, 6.0, 4.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.1346435546875, -0.13016510009765625, -0.1256866455078125, -0.12120819091796875, -0.116729736328125, -0.11225128173828125, -0.1077728271484375, -0.10329437255859375, -0.09881591796875, -0.09433746337890625, -0.0898590087890625, -0.08538055419921875, -0.080902099609375, -0.07642364501953125, -0.0719451904296875, -0.06746673583984375, -0.06298828125, -0.05850982666015625, -0.0540313720703125, -0.04955291748046875, -0.045074462890625, -0.04059600830078125, -0.0361175537109375, -0.03163909912109375, -0.02716064453125, -0.02268218994140625, -0.0182037353515625, -0.01372528076171875, -0.009246826171875, -0.00476837158203125, -0.0002899169921875, 0.00418853759765625, 0.0086669921875, 0.01314544677734375, 0.0176239013671875, 0.02210235595703125, 0.026580810546875, 0.03105926513671875, 0.0355377197265625, 0.04001617431640625, 0.04449462890625, 0.04897308349609375, 0.0534515380859375, 0.05792999267578125, 0.062408447265625, 0.06688690185546875, 0.0713653564453125, 0.07584381103515625, 0.080322265625, 0.08480072021484375, 0.0892791748046875, 0.09375762939453125, 0.098236083984375, 0.10271453857421875, 0.1071929931640625, 0.11167144775390625, 0.11614990234375, 0.12062835693359375, 0.1251068115234375, 0.12958526611328125, 0.134063720703125, 0.13854217529296875, 0.1430206298828125, 0.14749908447265625, 0.1519775390625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 6.0, 5.0, 4.0, 11.0, 5.0, 1.0, 9.0, 13.0, 21.0, 23.0, 21.0, 39.0, 61.0, 71.0, 79.0, 91.0, 105.0, 82.0, 66.0, 63.0, 56.0, 27.0, 35.0, 18.0, 24.0, 19.0, 12.0, 9.0, 9.0, 8.0, 5.0, 1.0, 6.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1322021484375, -0.12809181213378906, -0.12398147583007812, -0.11987113952636719, -0.11576080322265625, -0.11165046691894531, -0.10754013061523438, -0.10342979431152344, -0.0993194580078125, -0.09520912170410156, -0.09109878540039062, -0.08698844909667969, -0.08287811279296875, -0.07876777648925781, -0.07465744018554688, -0.07054710388183594, -0.066436767578125, -0.06232643127441406, -0.058216094970703125, -0.05410575866699219, -0.04999542236328125, -0.04588508605957031, -0.041774749755859375, -0.03766441345214844, -0.0335540771484375, -0.029443740844726562, -0.025333404541015625, -0.021223068237304688, -0.01711273193359375, -0.013002395629882812, -0.008892059326171875, -0.0047817230224609375, -0.00067138671875, 0.0034389495849609375, 0.007549285888671875, 0.011659622192382812, 0.01576995849609375, 0.019880294799804688, 0.023990631103515625, 0.028100967407226562, 0.0322113037109375, 0.03632164001464844, 0.040431976318359375, 0.04454231262207031, 0.04865264892578125, 0.05276298522949219, 0.056873321533203125, 0.06098365783691406, 0.065093994140625, 0.06920433044433594, 0.07331466674804688, 0.07742500305175781, 0.08153533935546875, 0.08564567565917969, 0.08975601196289062, 0.09386634826660156, 0.0979766845703125, 0.10208702087402344, 0.10619735717773438, 0.11030769348144531, 0.11441802978515625, 0.11852836608886719, 0.12263870239257812, 0.12674903869628906, 0.130859375]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 8.0, 2.0, 12.0, 15.0, 35.0, 51.0, 62.0, 79.0, 100.0, 111.0, 120.0, 111.0, 104.0, 55.0, 40.0, 41.0, 26.0, 17.0, 9.0, 7.0, 5.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7709758281707764, -0.7264986634254456, -0.6820214986801147, -0.6375443339347839, -0.5930671691894531, -0.5485900044441223, -0.5041128396987915, -0.4596356451511383, -0.4151584804058075, -0.3706813156604767, -0.3262041509151459, -0.2817269563674927, -0.23724980652332306, -0.19277264177799225, -0.14829546213150024, -0.10381829738616943, -0.05934113264083862, -0.014863964170217514, 0.029613204300403595, 0.074090376496315, 0.11856754124164581, 0.16304470598697662, 0.20752188563346863, 0.25199905037879944, 0.29647621512413025, 0.34095337986946106, 0.38543054461479187, 0.42990773916244507, 0.4743849039077759, 0.5188620686531067, 0.5633392333984375, 0.6078163981437683, 0.6522935628890991, 0.6967707276344299, 0.7412478923797607, 0.7857250571250916, 0.8302022218704224, 0.8746793866157532, 0.919156551361084, 0.9636337757110596, 1.0081108808517456, 1.0525881052017212, 1.0970652103424072, 1.1415424346923828, 1.1860195398330688, 1.2304967641830444, 1.2749738693237305, 1.319451093673706, 1.3639283180236816, 1.4084055423736572, 1.4528826475143433, 1.4973598718643188, 1.5418369770050049, 1.5863142013549805, 1.6307913064956665, 1.675268530845642, 1.7197456359863281, 1.7642228603363037, 1.8086999654769897, 1.8531771898269653, 1.8976542949676514, 1.942131519317627, 1.986608624458313, 2.031085729598999, 2.0755629539489746]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 4.0, 8.0, 4.0, 8.0, 8.0, 14.0, 17.0, 19.0, 23.0, 17.0, 26.0, 18.0, 25.0, 34.0, 26.0, 39.0, 33.0, 37.0, 38.0, 35.0, 32.0, 39.0, 39.0, 44.0, 30.0, 43.0, 32.0, 34.0, 34.0, 30.0, 31.0, 24.0, 22.0, 18.0, 22.0, 23.0, 11.0, 13.0, 4.0, 3.0, 7.0, 7.0, 5.0, 4.0, 7.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0], "bins": [-0.8873392939567566, -0.8595561385154724, -0.8317729830741882, -0.8039898872375488, -0.7762067317962646, -0.7484235763549805, -0.7206404209136963, -0.6928572654724121, -0.6650741100311279, -0.6372909545898438, -0.6095077991485596, -0.5817246437072754, -0.553941547870636, -0.5261583924293518, -0.4983752369880676, -0.47059208154678345, -0.44280898571014404, -0.41502583026885986, -0.38724270462989807, -0.3594595491886139, -0.3316764235496521, -0.3038932681083679, -0.27611011266708374, -0.24832697212696075, -0.22054383158683777, -0.19276069104671478, -0.1649775505065918, -0.13719439506530762, -0.10941125452518463, -0.08162811398506165, -0.053844958543777466, -0.02606181800365448, 0.0017213821411132812, 0.029504526406526566, 0.05728767067193985, 0.08507081866264343, 0.11285395920276642, 0.1406370997428894, 0.16842025518417358, 0.19620339572429657, 0.22398653626441956, 0.25176969170570374, 0.2795528173446655, 0.3073359727859497, 0.3351191282272339, 0.3629022538661957, 0.39068540930747986, 0.41846853494644165, 0.44625169038772583, 0.47403484582901, 0.5018180012702942, 0.5296010971069336, 0.5573842525482178, 0.585167407989502, 0.6129505634307861, 0.6407337188720703, 0.6685168743133545, 0.6963000297546387, 0.7240831851959229, 0.751866340637207, 0.7796494364738464, 0.8074325919151306, 0.8352157473564148, 0.862998902797699, 0.8907819986343384]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 3.0, 5.0, 5.0, 4.0, 7.0, 10.0, 8.0, 9.0, 16.0, 16.0, 34.0, 54.0, 101.0, 153.0, 242.0, 369.0, 683.0, 1267.0, 2514.0, 5365.0, 13184.0, 37483.0, 128208.0, 560952.0, 1698366.0, 1284423.0, 334834.0, 82525.0, 25432.0, 9551.0, 4122.0, 1892.0, 1033.0, 563.0, 305.0, 192.0, 126.0, 79.0, 52.0, 30.0, 23.0, 12.0, 14.0, 4.0, 9.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.13134765625, -0.12708663940429688, -0.12282562255859375, -0.11856460571289062, -0.1143035888671875, -0.11004257202148438, -0.10578155517578125, -0.10152053833007812, -0.097259521484375, -0.09299850463867188, -0.08873748779296875, -0.08447647094726562, -0.0802154541015625, -0.07595443725585938, -0.07169342041015625, -0.06743240356445312, -0.06317138671875, -0.058910369873046875, -0.05464935302734375, -0.050388336181640625, -0.0461273193359375, -0.041866302490234375, -0.03760528564453125, -0.033344268798828125, -0.029083251953125, -0.024822235107421875, -0.02056121826171875, -0.016300201416015625, -0.0120391845703125, -0.007778167724609375, -0.00351715087890625, 0.000743865966796875, 0.0050048828125, 0.009265899658203125, 0.01352691650390625, 0.017787933349609375, 0.0220489501953125, 0.026309967041015625, 0.03057098388671875, 0.034832000732421875, 0.039093017578125, 0.043354034423828125, 0.04761505126953125, 0.051876068115234375, 0.0561370849609375, 0.060398101806640625, 0.06465911865234375, 0.06892013549804688, 0.07318115234375, 0.07744216918945312, 0.08170318603515625, 0.08596420288085938, 0.0902252197265625, 0.09448623657226562, 0.09874725341796875, 0.10300827026367188, 0.107269287109375, 0.11153030395507812, 0.11579132080078125, 0.12005233764648438, 0.1243133544921875, 0.12857437133789062, 0.13283538818359375, 0.13709640502929688, 0.141357421875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 11.0, 9.0, 12.0, 24.0, 23.0, 28.0, 48.0, 55.0, 63.0, 69.0, 54.0, 71.0, 75.0, 66.0, 66.0, 66.0, 58.0, 49.0, 42.0, 30.0, 29.0, 18.0, 14.0, 8.0, 6.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1334228515625, -0.1281585693359375, -0.122894287109375, -0.1176300048828125, -0.11236572265625, -0.1071014404296875, -0.101837158203125, -0.0965728759765625, -0.09130859375, -0.0860443115234375, -0.080780029296875, -0.0755157470703125, -0.07025146484375, -0.0649871826171875, -0.059722900390625, -0.0544586181640625, -0.0491943359375, -0.0439300537109375, -0.038665771484375, -0.0334014892578125, -0.02813720703125, -0.0228729248046875, -0.017608642578125, -0.0123443603515625, -0.007080078125, -0.0018157958984375, 0.003448486328125, 0.0087127685546875, 0.01397705078125, 0.0192413330078125, 0.024505615234375, 0.0297698974609375, 0.0350341796875, 0.0402984619140625, 0.045562744140625, 0.0508270263671875, 0.05609130859375, 0.0613555908203125, 0.066619873046875, 0.0718841552734375, 0.0771484375, 0.0824127197265625, 0.087677001953125, 0.0929412841796875, 0.09820556640625, 0.1034698486328125, 0.108734130859375, 0.1139984130859375, 0.1192626953125, 0.1245269775390625, 0.129791259765625, 0.1350555419921875, 0.14031982421875, 0.1455841064453125, 0.150848388671875, 0.1561126708984375, 0.161376953125, 0.1666412353515625, 0.171905517578125, 0.1771697998046875, 0.18243408203125, 0.1876983642578125, 0.192962646484375, 0.1982269287109375, 0.2034912109375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 5.0, 9.0, 11.0, 22.0, 43.0, 42.0, 62.0, 108.0, 178.0, 335.0, 688.0, 1539.0, 3622.0, 10077.0, 31313.0, 120591.0, 576030.0, 1993992.0, 1135870.0, 238032.0, 55410.0, 16198.0, 5810.0, 2244.0, 982.0, 471.0, 249.0, 136.0, 78.0, 39.0, 26.0, 25.0, 13.0, 10.0, 10.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2159423828125, -0.21006202697753906, -0.20418167114257812, -0.1983013153076172, -0.19242095947265625, -0.1865406036376953, -0.18066024780273438, -0.17477989196777344, -0.1688995361328125, -0.16301918029785156, -0.15713882446289062, -0.1512584686279297, -0.14537811279296875, -0.1394977569580078, -0.13361740112304688, -0.12773704528808594, -0.121856689453125, -0.11597633361816406, -0.11009597778320312, -0.10421562194824219, -0.09833526611328125, -0.09245491027832031, -0.08657455444335938, -0.08069419860839844, -0.0748138427734375, -0.06893348693847656, -0.06305313110351562, -0.05717277526855469, -0.05129241943359375, -0.04541206359863281, -0.039531707763671875, -0.03365135192871094, -0.02777099609375, -0.021890640258789062, -0.016010284423828125, -0.010129928588867188, -0.00424957275390625, 0.0016307830810546875, 0.007511138916015625, 0.013391494750976562, 0.0192718505859375, 0.025152206420898438, 0.031032562255859375, 0.03691291809082031, 0.04279327392578125, 0.04867362976074219, 0.054553985595703125, 0.06043434143066406, 0.066314697265625, 0.07219505310058594, 0.07807540893554688, 0.08395576477050781, 0.08983612060546875, 0.09571647644042969, 0.10159683227539062, 0.10747718811035156, 0.1133575439453125, 0.11923789978027344, 0.12511825561523438, 0.1309986114501953, 0.13687896728515625, 0.1427593231201172, 0.14863967895507812, 0.15452003479003906, 0.160400390625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 6.0, 2.0, 6.0, 11.0, 12.0, 11.0, 15.0, 39.0, 45.0, 63.0, 99.0, 127.0, 177.0, 280.0, 340.0, 435.0, 506.0, 501.0, 434.0, 266.0, 214.0, 156.0, 112.0, 77.0, 47.0, 33.0, 24.0, 16.0, 10.0, 7.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1328125, -0.12696456909179688, -0.12111663818359375, -0.11526870727539062, -0.1094207763671875, -0.10357284545898438, -0.09772491455078125, -0.09187698364257812, -0.086029052734375, -0.08018112182617188, -0.07433319091796875, -0.06848526000976562, -0.0626373291015625, -0.056789398193359375, -0.05094146728515625, -0.045093536376953125, -0.03924560546875, -0.033397674560546875, -0.02754974365234375, -0.021701812744140625, -0.0158538818359375, -0.010005950927734375, -0.00415802001953125, 0.001689910888671875, 0.007537841796875, 0.013385772705078125, 0.01923370361328125, 0.025081634521484375, 0.0309295654296875, 0.036777496337890625, 0.04262542724609375, 0.048473358154296875, 0.0543212890625, 0.060169219970703125, 0.06601715087890625, 0.07186508178710938, 0.0777130126953125, 0.08356094360351562, 0.08940887451171875, 0.09525680541992188, 0.101104736328125, 0.10695266723632812, 0.11280059814453125, 0.11864852905273438, 0.1244964599609375, 0.13034439086914062, 0.13619232177734375, 0.14204025268554688, 0.14788818359375, 0.15373611450195312, 0.15958404541015625, 0.16543197631835938, 0.1712799072265625, 0.17712783813476562, 0.18297576904296875, 0.18882369995117188, 0.194671630859375, 0.20051956176757812, 0.20636749267578125, 0.21221542358398438, 0.2180633544921875, 0.22391128540039062, 0.22975921630859375, 0.23560714721679688, 0.241455078125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 13.0, 22.0, 28.0, 50.0, 71.0, 106.0, 122.0, 137.0, 125.0, 118.0, 78.0, 55.0, 37.0, 18.0, 10.0, 4.0, 4.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.063889741897583, -1.026673436164856, -0.9894572496414185, -0.9522410035133362, -0.9150247573852539, -0.8778085112571716, -0.8405922651290894, -0.8033759593963623, -0.7661597728729248, -0.7289435267448425, -0.6917272806167603, -0.654511034488678, -0.6172947883605957, -0.5800785422325134, -0.5428622961044312, -0.5056459903717041, -0.4684297442436218, -0.43121349811553955, -0.3939972519874573, -0.356781005859375, -0.3195647597312927, -0.28234851360321045, -0.2451322376728058, -0.2079159915447235, -0.17069974541664124, -0.13348349928855896, -0.09626724570989609, -0.059050992131233215, -0.02183474600315094, 0.015381500124931335, 0.052597761154174805, 0.08981400728225708, 0.12703025341033936, 0.16424649953842163, 0.2014627456665039, 0.23867900669574738, 0.27589523792266846, 0.31311148405075073, 0.3503277599811554, 0.38754400610923767, 0.42476025223731995, 0.4619764983654022, 0.4991927444934845, 0.5364090204238892, 0.5736252665519714, 0.6108415126800537, 0.648057758808136, 0.6852740049362183, 0.7224902510643005, 0.7597064971923828, 0.7969227433204651, 0.8341389894485474, 0.8713552355766296, 0.9085714817047119, 0.945787787437439, 0.9830039739608765, 1.0202202796936035, 1.0574365854263306, 1.094652771949768, 1.1318690776824951, 1.1690852642059326, 1.2063015699386597, 1.2435177564620972, 1.2807340621948242, 1.3179502487182617]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 6.0, 10.0, 7.0, 9.0, 8.0, 12.0, 16.0, 24.0, 17.0, 20.0, 25.0, 24.0, 26.0, 27.0, 28.0, 41.0, 33.0, 47.0, 33.0, 32.0, 49.0, 34.0, 45.0, 36.0, 40.0, 38.0, 39.0, 27.0, 35.0, 26.0, 24.0, 29.0, 33.0, 14.0, 16.0, 13.0, 14.0, 7.0, 6.0, 5.0, 4.0, 5.0, 1.0, 8.0, 6.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.48807013034820557, -0.4713576138019562, -0.4546450972557068, -0.4379325807094574, -0.421220064163208, -0.4045075476169586, -0.38779503107070923, -0.37108248472213745, -0.35436999797821045, -0.33765748143196106, -0.32094496488571167, -0.3042324483394623, -0.2875199317932129, -0.2708074152469635, -0.2540948987007141, -0.23738236725330353, -0.22066983580589294, -0.20395731925964355, -0.18724480271339417, -0.17053228616714478, -0.15381976962089539, -0.137107253074646, -0.12039472162723541, -0.10368220508098602, -0.08696968853473663, -0.07025717198848724, -0.053544651716947556, -0.03683213144540787, -0.020119614899158478, -0.003407098352909088, 0.013305425643920898, 0.030017942190170288, 0.04673045873641968, 0.06344297528266907, 0.08015549182891846, 0.09686801582574844, 0.11358053237199783, 0.13029304146766663, 0.1470055729150772, 0.1637180894613266, 0.180430606007576, 0.19714312255382538, 0.21385563910007477, 0.23056817054748535, 0.24728068709373474, 0.26399320363998413, 0.2807057201862335, 0.2974182367324829, 0.3141307532787323, 0.3308432698249817, 0.3475557863712311, 0.36426830291748047, 0.38098081946372986, 0.39769333600997925, 0.414405882358551, 0.431118369102478, 0.4478309154510498, 0.4645434319972992, 0.4812559485435486, 0.497968465089798, 0.5146809816360474, 0.5313935279846191, 0.5481060147285461, 0.5648185610771179, 0.5815310478210449]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 5.0, 4.0, 6.0, 3.0, 6.0, 14.0, 27.0, 34.0, 60.0, 78.0, 115.0, 213.0, 316.0, 500.0, 918.0, 1778.0, 3338.0, 6623.0, 12546.0, 24641.0, 51614.0, 118008.0, 254698.0, 292757.0, 152156.0, 65205.0, 30550.0, 15341.0, 7928.0, 4158.0, 2120.0, 1184.0, 658.0, 373.0, 201.0, 116.0, 87.0, 50.0, 36.0, 17.0, 17.0, 14.0, 14.0, 8.0, 6.0, 4.0, 3.0, 3.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.24072265625, -0.23273849487304688, -0.22475433349609375, -0.21677017211914062, -0.2087860107421875, -0.20080184936523438, -0.19281768798828125, -0.18483352661132812, -0.176849365234375, -0.16886520385742188, -0.16088104248046875, -0.15289688110351562, -0.1449127197265625, -0.13692855834960938, -0.12894439697265625, -0.12096023559570312, -0.11297607421875, -0.10499191284179688, -0.09700775146484375, -0.08902359008789062, -0.0810394287109375, -0.07305526733398438, -0.06507110595703125, -0.057086944580078125, -0.049102783203125, -0.041118621826171875, -0.03313446044921875, -0.025150299072265625, -0.0171661376953125, -0.009181976318359375, -0.00119781494140625, 0.006786346435546875, 0.0147705078125, 0.022754669189453125, 0.03073883056640625, 0.038722991943359375, 0.0467071533203125, 0.054691314697265625, 0.06267547607421875, 0.07065963745117188, 0.078643798828125, 0.08662796020507812, 0.09461212158203125, 0.10259628295898438, 0.1105804443359375, 0.11856460571289062, 0.12654876708984375, 0.13453292846679688, 0.14251708984375, 0.15050125122070312, 0.15848541259765625, 0.16646957397460938, 0.1744537353515625, 0.18243789672851562, 0.19042205810546875, 0.19840621948242188, 0.206390380859375, 0.21437454223632812, 0.22235870361328125, 0.23034286499023438, 0.2383270263671875, 0.24631118774414062, 0.25429534912109375, 0.2622795104980469, 0.270263671875]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 9.0, 10.0, 17.0, 20.0, 20.0, 26.0, 34.0, 45.0, 61.0, 57.0, 58.0, 81.0, 66.0, 65.0, 67.0, 62.0, 49.0, 64.0, 49.0, 38.0, 34.0, 21.0, 15.0, 16.0, 5.0, 11.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13525390625, -0.130218505859375, -0.12518310546875, -0.120147705078125, -0.1151123046875, -0.110076904296875, -0.10504150390625, -0.100006103515625, -0.094970703125, -0.089935302734375, -0.08489990234375, -0.079864501953125, -0.0748291015625, -0.069793701171875, -0.06475830078125, -0.059722900390625, -0.0546875, -0.049652099609375, -0.04461669921875, -0.039581298828125, -0.0345458984375, -0.029510498046875, -0.02447509765625, -0.019439697265625, -0.014404296875, -0.009368896484375, -0.00433349609375, 0.000701904296875, 0.0057373046875, 0.010772705078125, 0.01580810546875, 0.020843505859375, 0.02587890625, 0.030914306640625, 0.03594970703125, 0.040985107421875, 0.0460205078125, 0.051055908203125, 0.05609130859375, 0.061126708984375, 0.066162109375, 0.071197509765625, 0.07623291015625, 0.081268310546875, 0.0863037109375, 0.091339111328125, 0.09637451171875, 0.101409912109375, 0.1064453125, 0.111480712890625, 0.11651611328125, 0.121551513671875, 0.1265869140625, 0.131622314453125, 0.13665771484375, 0.141693115234375, 0.146728515625, 0.151763916015625, 0.15679931640625, 0.161834716796875, 0.1668701171875, 0.171905517578125, 0.17694091796875, 0.181976318359375, 0.18701171875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 8.0, 4.0, 3.0, 10.0, 24.0, 22.0, 28.0, 29.0, 52.0, 73.0, 93.0, 134.0, 304.0, 591.0, 1615.0, 5370.0, 19540.0, 73019.0, 286168.0, 452503.0, 153700.0, 39528.0, 10770.0, 3033.0, 886.0, 398.0, 232.0, 119.0, 83.0, 71.0, 35.0, 32.0, 22.0, 16.0, 9.0, 7.0, 6.0, 1.0, 5.0, 3.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.353271484375, -0.3412017822265625, -0.329132080078125, -0.3170623779296875, -0.30499267578125, -0.2929229736328125, -0.280853271484375, -0.2687835693359375, -0.2567138671875, -0.2446441650390625, -0.232574462890625, -0.2205047607421875, -0.20843505859375, -0.1963653564453125, -0.184295654296875, -0.1722259521484375, -0.16015625, -0.1480865478515625, -0.136016845703125, -0.1239471435546875, -0.11187744140625, -0.0998077392578125, -0.087738037109375, -0.0756683349609375, -0.0635986328125, -0.0515289306640625, -0.039459228515625, -0.0273895263671875, -0.01531982421875, -0.0032501220703125, 0.008819580078125, 0.0208892822265625, 0.032958984375, 0.0450286865234375, 0.057098388671875, 0.0691680908203125, 0.08123779296875, 0.0933074951171875, 0.105377197265625, 0.1174468994140625, 0.1295166015625, 0.1415863037109375, 0.153656005859375, 0.1657257080078125, 0.17779541015625, 0.1898651123046875, 0.201934814453125, 0.2140045166015625, 0.22607421875, 0.2381439208984375, 0.250213623046875, 0.2622833251953125, 0.27435302734375, 0.2864227294921875, 0.298492431640625, 0.3105621337890625, 0.3226318359375, 0.3347015380859375, 0.346771240234375, 0.3588409423828125, 0.37091064453125, 0.3829803466796875, 0.395050048828125, 0.4071197509765625, 0.419189453125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 6.0, 4.0, 7.0, 4.0, 8.0, 13.0, 10.0, 23.0, 21.0, 30.0, 25.0, 33.0, 41.0, 38.0, 43.0, 50.0, 59.0, 41.0, 55.0, 58.0, 39.0, 36.0, 46.0, 40.0, 46.0, 42.0, 30.0, 26.0, 25.0, 18.0, 16.0, 21.0, 10.0, 17.0, 6.0, 5.0, 3.0, 5.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.372802734375, -0.3613777160644531, -0.34995269775390625, -0.3385276794433594, -0.3271026611328125, -0.3156776428222656, -0.30425262451171875, -0.2928276062011719, -0.281402587890625, -0.2699775695800781, -0.25855255126953125, -0.24712753295898438, -0.2357025146484375, -0.22427749633789062, -0.21285247802734375, -0.20142745971679688, -0.19000244140625, -0.17857742309570312, -0.16715240478515625, -0.15572738647460938, -0.1443023681640625, -0.13287734985351562, -0.12145233154296875, -0.11002731323242188, -0.098602294921875, -0.08717727661132812, -0.07575225830078125, -0.06432723999023438, -0.0529022216796875, -0.041477203369140625, -0.03005218505859375, -0.018627166748046875, -0.0072021484375, 0.004222869873046875, 0.01564788818359375, 0.027072906494140625, 0.0384979248046875, 0.049922943115234375, 0.06134796142578125, 0.07277297973632812, 0.084197998046875, 0.09562301635742188, 0.10704803466796875, 0.11847305297851562, 0.1298980712890625, 0.14132308959960938, 0.15274810791015625, 0.16417312622070312, 0.17559814453125, 0.18702316284179688, 0.19844818115234375, 0.20987319946289062, 0.2212982177734375, 0.23272323608398438, 0.24414825439453125, 0.2555732727050781, 0.266998291015625, 0.2784233093261719, 0.28984832763671875, 0.3012733459472656, 0.3126983642578125, 0.3241233825683594, 0.33554840087890625, 0.3469734191894531, 0.3583984375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 5.0, 3.0, 8.0, 8.0, 19.0, 18.0, 34.0, 56.0, 96.0, 103.0, 223.0, 354.0, 687.0, 1177.0, 1983.0, 3584.0, 6338.0, 11139.0, 18510.0, 32021.0, 56796.0, 107505.0, 187626.0, 230225.0, 173654.0, 96179.0, 50919.0, 28939.0, 17014.0, 10084.0, 5824.0, 3236.0, 1763.0, 1037.0, 541.0, 344.0, 216.0, 96.0, 60.0, 50.0, 33.0, 17.0, 13.0, 8.0, 5.0, 5.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09637451171875, -0.09340095520019531, -0.09042739868164062, -0.08745384216308594, -0.08448028564453125, -0.08150672912597656, -0.07853317260742188, -0.07555961608886719, -0.0725860595703125, -0.06961250305175781, -0.06663894653320312, -0.06366539001464844, -0.06069183349609375, -0.05771827697753906, -0.054744720458984375, -0.05177116394042969, -0.048797607421875, -0.04582405090332031, -0.042850494384765625, -0.03987693786621094, -0.03690338134765625, -0.03392982482910156, -0.030956268310546875, -0.027982711791992188, -0.0250091552734375, -0.022035598754882812, -0.019062042236328125, -0.016088485717773438, -0.01311492919921875, -0.010141372680664062, -0.007167816162109375, -0.0041942596435546875, -0.001220703125, 0.0017528533935546875, 0.004726409912109375, 0.0076999664306640625, 0.01067352294921875, 0.013647079467773438, 0.016620635986328125, 0.019594192504882812, 0.0225677490234375, 0.025541305541992188, 0.028514862060546875, 0.03148841857910156, 0.03446197509765625, 0.03743553161621094, 0.040409088134765625, 0.04338264465332031, 0.046356201171875, 0.04932975769042969, 0.052303314208984375, 0.05527687072753906, 0.05825042724609375, 0.06122398376464844, 0.06419754028320312, 0.06717109680175781, 0.0701446533203125, 0.07311820983886719, 0.07609176635742188, 0.07906532287597656, 0.08203887939453125, 0.08501243591308594, 0.08798599243164062, 0.09095954895019531, 0.09393310546875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 2.0, 3.0, 10.0, 10.0, 11.0, 14.0, 10.0, 15.0, 21.0, 34.0, 50.0, 64.0, 74.0, 86.0, 81.0, 105.0, 93.0, 95.0, 55.0, 31.0, 32.0, 26.0, 28.0, 9.0, 11.0, 10.0, 5.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.07099723815918e-05, -3.9546750485897064e-05, -3.838352859020233e-05, -3.72203066945076e-05, -3.6057084798812866e-05, -3.4893862903118134e-05, -3.37306410074234e-05, -3.256741911172867e-05, -3.1404197216033936e-05, -3.0240975320339203e-05, -2.907775342464447e-05, -2.7914531528949738e-05, -2.6751309633255005e-05, -2.5588087737560272e-05, -2.442486584186554e-05, -2.3261643946170807e-05, -2.2098422050476074e-05, -2.093520015478134e-05, -1.977197825908661e-05, -1.8608756363391876e-05, -1.7445534467697144e-05, -1.628231257200241e-05, -1.5119090676307678e-05, -1.3955868780612946e-05, -1.2792646884918213e-05, -1.162942498922348e-05, -1.0466203093528748e-05, -9.302981197834015e-06, -8.139759302139282e-06, -6.9765374064445496e-06, -5.813315510749817e-06, -4.650093615055084e-06, -3.4868717193603516e-06, -2.323649823665619e-06, -1.1604279279708862e-06, 2.7939677238464355e-09, 1.166015863418579e-06, 2.3292377591133118e-06, 3.4924596548080444e-06, 4.655681550502777e-06, 5.81890344619751e-06, 6.9821253418922424e-06, 8.145347237586975e-06, 9.308569133281708e-06, 1.047179102897644e-05, 1.1635012924671173e-05, 1.2798234820365906e-05, 1.3961456716060638e-05, 1.5124678611755371e-05, 1.6287900507450104e-05, 1.7451122403144836e-05, 1.861434429883957e-05, 1.9777566194534302e-05, 2.0940788090229034e-05, 2.2104009985923767e-05, 2.32672318816185e-05, 2.4430453777313232e-05, 2.5593675673007965e-05, 2.6756897568702698e-05, 2.792011946439743e-05, 2.9083341360092163e-05, 3.0246563255786896e-05, 3.140978515148163e-05, 3.257300704717636e-05, 3.3736228942871094e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 6.0, 6.0, 7.0, 16.0, 29.0, 47.0, 81.0, 109.0, 251.0, 497.0, 1169.0, 3237.0, 9852.0, 28171.0, 80671.0, 293172.0, 427811.0, 136176.0, 43491.0, 15412.0, 5169.0, 1808.0, 646.0, 303.0, 168.0, 88.0, 58.0, 37.0, 23.0, 14.0, 6.0, 7.0, 2.0, 2.0, 6.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2076416015625, -0.2022075653076172, -0.19677352905273438, -0.19133949279785156, -0.18590545654296875, -0.18047142028808594, -0.17503738403320312, -0.1696033477783203, -0.1641693115234375, -0.1587352752685547, -0.15330123901367188, -0.14786720275878906, -0.14243316650390625, -0.13699913024902344, -0.13156509399414062, -0.1261310577392578, -0.120697021484375, -0.11526298522949219, -0.10982894897460938, -0.10439491271972656, -0.09896087646484375, -0.09352684020996094, -0.08809280395507812, -0.08265876770019531, -0.0772247314453125, -0.07179069519042969, -0.06635665893554688, -0.06092262268066406, -0.05548858642578125, -0.05005455017089844, -0.044620513916015625, -0.03918647766113281, -0.03375244140625, -0.028318405151367188, -0.022884368896484375, -0.017450332641601562, -0.01201629638671875, -0.0065822601318359375, -0.001148223876953125, 0.0042858123779296875, 0.0097198486328125, 0.015153884887695312, 0.020587921142578125, 0.026021957397460938, 0.03145599365234375, 0.03689002990722656, 0.042324066162109375, 0.04775810241699219, 0.053192138671875, 0.05862617492675781, 0.06406021118164062, 0.06949424743652344, 0.07492828369140625, 0.08036231994628906, 0.08579635620117188, 0.09123039245605469, 0.0966644287109375, 0.10209846496582031, 0.10753250122070312, 0.11296653747558594, 0.11840057373046875, 0.12383460998535156, 0.12926864624023438, 0.1347026824951172, 0.14013671875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 4.0, 5.0, 7.0, 10.0, 11.0, 16.0, 20.0, 23.0, 24.0, 60.0, 74.0, 94.0, 122.0, 127.0, 96.0, 85.0, 65.0, 42.0, 29.0, 22.0, 16.0, 16.0, 13.0, 9.0, 4.0, 7.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1380615234375, -0.1321125030517578, -0.12616348266601562, -0.12021446228027344, -0.11426544189453125, -0.10831642150878906, -0.10236740112304688, -0.09641838073730469, -0.0904693603515625, -0.08452033996582031, -0.07857131958007812, -0.07262229919433594, -0.06667327880859375, -0.06072425842285156, -0.054775238037109375, -0.04882621765136719, -0.042877197265625, -0.03692817687988281, -0.030979156494140625, -0.025030136108398438, -0.01908111572265625, -0.013132095336914062, -0.007183074951171875, -0.0012340545654296875, 0.0047149658203125, 0.010663986206054688, 0.016613006591796875, 0.022562026977539062, 0.02851104736328125, 0.03446006774902344, 0.040409088134765625, 0.04635810852050781, 0.05230712890625, 0.05825614929199219, 0.06420516967773438, 0.07015419006347656, 0.07610321044921875, 0.08205223083496094, 0.08800125122070312, 0.09395027160644531, 0.0998992919921875, 0.10584831237792969, 0.11179733276367188, 0.11774635314941406, 0.12369537353515625, 0.12964439392089844, 0.13559341430664062, 0.1415424346923828, 0.147491455078125, 0.1534404754638672, 0.15938949584960938, 0.16533851623535156, 0.17128753662109375, 0.17723655700683594, 0.18318557739257812, 0.1891345977783203, 0.1950836181640625, 0.2010326385498047, 0.20698165893554688, 0.21293067932128906, 0.21887969970703125, 0.22482872009277344, 0.23077774047851562, 0.2367267608642578, 0.24267578125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 24.0, 75.0, 163.0, 276.0, 243.0, 157.0, 53.0, 15.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.321749210357666, -5.217210292816162, -5.112671375274658, -5.0081329345703125, -4.903594017028809, -4.799055099487305, -4.694516181945801, -4.589977264404297, -4.485438346862793, -4.380899429321289, -4.276360511779785, -4.171821594238281, -4.0672831535339355, -3.9627442359924316, -3.8582053184509277, -3.753666400909424, -3.649127721786499, -3.544588804244995, -3.4400501251220703, -3.3355112075805664, -3.2309722900390625, -3.1264333724975586, -3.021894693374634, -2.91735577583313, -2.812817096710205, -2.708278179168701, -2.6037395000457764, -2.4992005825042725, -2.3946616649627686, -2.2901229858398438, -2.18558406829834, -2.081045150756836, -1.976505994796753, -1.8719671964645386, -1.7674282789230347, -1.6628894805908203, -1.5583505630493164, -1.453811764717102, -1.3492729663848877, -1.2447340488433838, -1.1401952505111694, -1.035656452178955, -0.9311175346374512, -0.8265787363052368, -0.7220398783683777, -0.6175010204315186, -0.5129622220993042, -0.40842336416244507, -0.30388450622558594, -0.199345663189888, -0.09480682015419006, 0.00973200798034668, 0.11427086591720581, 0.21880972385406494, 0.3233485221862793, 0.4278873801231384, 0.5324262380599976, 0.6369650959968567, 0.7415039539337158, 0.8460427522659302, 0.9505816102027893, 1.0551204681396484, 1.1596592664718628, 1.2641980648040771, 1.368736982345581]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 1.0, 2.0, 4.0, 13.0, 18.0, 15.0, 10.0, 13.0, 18.0, 21.0, 20.0, 26.0, 16.0, 22.0, 24.0, 26.0, 33.0, 29.0, 41.0, 33.0, 20.0, 44.0, 34.0, 34.0, 40.0, 33.0, 37.0, 35.0, 25.0, 33.0, 31.0, 28.0, 28.0, 32.0, 24.0, 20.0, 15.0, 20.0, 20.0, 10.0, 5.0, 9.0, 7.0, 10.0, 7.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.8618771433830261, -0.8344240188598633, -0.8069709539413452, -0.7795178294181824, -0.7520647048950195, -0.7246116399765015, -0.6971585154533386, -0.6697053909301758, -0.6422523260116577, -0.6147992014884949, -0.5873461365699768, -0.559893012046814, -0.5324398875236511, -0.5049867630004883, -0.4775336980819702, -0.4500805735588074, -0.42262744903564453, -0.3951743543148041, -0.36772122979164124, -0.3402681350708008, -0.31281501054763794, -0.2853619158267975, -0.25790882110595703, -0.23045571148395538, -0.20300260186195374, -0.1755494922399521, -0.14809638261795044, -0.12064328789710999, -0.09319017827510834, -0.06573706865310669, -0.038283973932266235, -0.010830864310264587, 0.016622304916381836, 0.044075410813093185, 0.07152851670980453, 0.09898161888122559, 0.12643472850322723, 0.15388783812522888, 0.18134093284606934, 0.20879404246807098, 0.23624715209007263, 0.2637002468109131, 0.2911533713340759, 0.3186064660549164, 0.34605956077575684, 0.3735126852989197, 0.40096578001976013, 0.4284188747406006, 0.4558719992637634, 0.4833250939846039, 0.5107781887054443, 0.5382313132286072, 0.56568443775177, 0.5931375026702881, 0.6205906271934509, 0.6480437517166138, 0.6754968166351318, 0.7029499411582947, 0.7304030060768127, 0.7578561305999756, 0.7853092551231384, 0.8127623796463013, 0.8402154445648193, 0.8676685690879822, 0.895121693611145]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 5.0, 1.0, 6.0, 10.0, 19.0, 21.0, 28.0, 51.0, 76.0, 133.0, 212.0, 360.0, 693.0, 1361.0, 3138.0, 7275.0, 20717.0, 75012.0, 378606.0, 1673021.0, 1582912.0, 348682.0, 70018.0, 19409.0, 6824.0, 2873.0, 1338.0, 669.0, 379.0, 208.0, 91.0, 55.0, 30.0, 22.0, 9.0, 14.0, 9.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1732177734375, -0.16762542724609375, -0.1620330810546875, -0.15644073486328125, -0.150848388671875, -0.14525604248046875, -0.1396636962890625, -0.13407135009765625, -0.12847900390625, -0.12288665771484375, -0.1172943115234375, -0.11170196533203125, -0.106109619140625, -0.10051727294921875, -0.0949249267578125, -0.08933258056640625, -0.083740234375, -0.07814788818359375, -0.0725555419921875, -0.06696319580078125, -0.061370849609375, -0.05577850341796875, -0.0501861572265625, -0.04459381103515625, -0.03900146484375, -0.03340911865234375, -0.0278167724609375, -0.02222442626953125, -0.016632080078125, -0.01103973388671875, -0.0054473876953125, 0.00014495849609375, 0.0057373046875, 0.01132965087890625, 0.0169219970703125, 0.02251434326171875, 0.028106689453125, 0.03369903564453125, 0.0392913818359375, 0.04488372802734375, 0.05047607421875, 0.05606842041015625, 0.0616607666015625, 0.06725311279296875, 0.072845458984375, 0.07843780517578125, 0.0840301513671875, 0.08962249755859375, 0.09521484375, 0.10080718994140625, 0.1063995361328125, 0.11199188232421875, 0.117584228515625, 0.12317657470703125, 0.1287689208984375, 0.13436126708984375, 0.13995361328125, 0.14554595947265625, 0.1511383056640625, 0.15673065185546875, 0.162322998046875, 0.16791534423828125, 0.1735076904296875, 0.17910003662109375, 0.1846923828125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 1.0, 7.0, 7.0, 5.0, 11.0, 17.0, 14.0, 27.0, 40.0, 27.0, 49.0, 45.0, 67.0, 60.0, 57.0, 58.0, 73.0, 53.0, 62.0, 59.0, 55.0, 36.0, 47.0, 32.0, 21.0, 20.0, 19.0, 8.0, 9.0, 11.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.137451171875, -0.13236045837402344, -0.12726974487304688, -0.12217903137207031, -0.11708831787109375, -0.11199760437011719, -0.10690689086914062, -0.10181617736816406, -0.0967254638671875, -0.09163475036621094, -0.08654403686523438, -0.08145332336425781, -0.07636260986328125, -0.07127189636230469, -0.06618118286132812, -0.06109046936035156, -0.055999755859375, -0.05090904235839844, -0.045818328857421875, -0.04072761535644531, -0.03563690185546875, -0.030546188354492188, -0.025455474853515625, -0.020364761352539062, -0.0152740478515625, -0.010183334350585938, -0.005092620849609375, -1.9073486328125e-06, 0.00508880615234375, 0.010179519653320312, 0.015270233154296875, 0.020360946655273438, 0.02545166015625, 0.030542373657226562, 0.035633087158203125, 0.04072380065917969, 0.04581451416015625, 0.05090522766113281, 0.055995941162109375, 0.06108665466308594, 0.0661773681640625, 0.07126808166503906, 0.07635879516601562, 0.08144950866699219, 0.08654022216796875, 0.09163093566894531, 0.09672164916992188, 0.10181236267089844, 0.106903076171875, 0.11199378967285156, 0.11708450317382812, 0.12217521667480469, 0.12726593017578125, 0.1323566436767578, 0.13744735717773438, 0.14253807067871094, 0.1476287841796875, 0.15271949768066406, 0.15781021118164062, 0.1629009246826172, 0.16799163818359375, 0.1730823516845703, 0.17817306518554688, 0.18326377868652344, 0.1883544921875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 8.0, 10.0, 15.0, 13.0, 33.0, 32.0, 64.0, 79.0, 114.0, 163.0, 304.0, 519.0, 939.0, 1846.0, 4337.0, 10088.0, 27684.0, 90408.0, 347059.0, 1284302.0, 1683175.0, 542306.0, 136505.0, 39762.0, 13656.0, 5607.0, 2516.0, 1136.0, 635.0, 327.0, 222.0, 164.0, 76.0, 64.0, 39.0, 25.0, 21.0, 10.0, 4.0, 8.0, 3.0, 3.0, 1.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1923828125, -0.18620872497558594, -0.18003463745117188, -0.1738605499267578, -0.16768646240234375, -0.1615123748779297, -0.15533828735351562, -0.14916419982910156, -0.1429901123046875, -0.13681602478027344, -0.13064193725585938, -0.12446784973144531, -0.11829376220703125, -0.11211967468261719, -0.10594558715820312, -0.09977149963378906, -0.093597412109375, -0.08742332458496094, -0.08124923706054688, -0.07507514953613281, -0.06890106201171875, -0.06272697448730469, -0.056552886962890625, -0.05037879943847656, -0.0442047119140625, -0.03803062438964844, -0.031856536865234375, -0.025682449340820312, -0.01950836181640625, -0.013334274291992188, -0.007160186767578125, -0.0009860992431640625, 0.00518798828125, 0.011362075805664062, 0.017536163330078125, 0.023710250854492188, 0.02988433837890625, 0.03605842590332031, 0.042232513427734375, 0.04840660095214844, 0.0545806884765625, 0.06075477600097656, 0.06692886352539062, 0.07310295104980469, 0.07927703857421875, 0.08545112609863281, 0.09162521362304688, 0.09779930114746094, 0.103973388671875, 0.11014747619628906, 0.11632156372070312, 0.12249565124511719, 0.12866973876953125, 0.1348438262939453, 0.14101791381835938, 0.14719200134277344, 0.1533660888671875, 0.15954017639160156, 0.16571426391601562, 0.1718883514404297, 0.17806243896484375, 0.1842365264892578, 0.19041061401367188, 0.19658470153808594, 0.2027587890625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 11.0, 17.0, 16.0, 19.0, 30.0, 38.0, 48.0, 75.0, 101.0, 156.0, 218.0, 322.0, 434.0, 472.0, 515.0, 460.0, 348.0, 247.0, 173.0, 110.0, 103.0, 50.0, 27.0, 28.0, 21.0, 9.0, 9.0, 8.0, 0.0, 5.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.259765625, -0.2529563903808594, -0.24614715576171875, -0.23933792114257812, -0.2325286865234375, -0.22571945190429688, -0.21891021728515625, -0.21210098266601562, -0.205291748046875, -0.19848251342773438, -0.19167327880859375, -0.18486404418945312, -0.1780548095703125, -0.17124557495117188, -0.16443634033203125, -0.15762710571289062, -0.15081787109375, -0.14400863647460938, -0.13719940185546875, -0.13039016723632812, -0.1235809326171875, -0.11677169799804688, -0.10996246337890625, -0.10315322875976562, -0.096343994140625, -0.08953475952148438, -0.08272552490234375, -0.07591629028320312, -0.0691070556640625, -0.062297821044921875, -0.05548858642578125, -0.048679351806640625, -0.0418701171875, -0.035060882568359375, -0.02825164794921875, -0.021442413330078125, -0.0146331787109375, -0.007823944091796875, -0.00101470947265625, 0.005794525146484375, 0.012603759765625, 0.019412994384765625, 0.02622222900390625, 0.033031463623046875, 0.0398406982421875, 0.046649932861328125, 0.05345916748046875, 0.060268402099609375, 0.06707763671875, 0.07388687133789062, 0.08069610595703125, 0.08750534057617188, 0.0943145751953125, 0.10112380981445312, 0.10793304443359375, 0.11474227905273438, 0.121551513671875, 0.12836074829101562, 0.13516998291015625, 0.14197921752929688, 0.1487884521484375, 0.15559768676757812, 0.16240692138671875, 0.16921615600585938, 0.176025390625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 4.0, 1.0, 9.0, 5.0, 15.0, 14.0, 26.0, 22.0, 40.0, 39.0, 44.0, 49.0, 74.0, 70.0, 82.0, 65.0, 79.0, 79.0, 70.0, 51.0, 44.0, 34.0, 32.0, 21.0, 12.0, 10.0, 10.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.1174962520599365, -1.0912173986434937, -1.0649385452270508, -1.038659691810608, -1.012380838394165, -0.9861020445823669, -0.9598232507705688, -0.933544397354126, -0.9072655439376831, -0.8809866905212402, -0.8547078371047974, -0.8284290432929993, -0.8021501898765564, -0.7758713364601135, -0.7495925426483154, -0.7233136892318726, -0.6970348358154297, -0.6707559823989868, -0.644477128982544, -0.6181983351707458, -0.591919481754303, -0.5656406283378601, -0.539361834526062, -0.5130829811096191, -0.48680412769317627, -0.4605252742767334, -0.4342464506626129, -0.40796762704849243, -0.38168877363204956, -0.3554099202156067, -0.3291310966014862, -0.3028522729873657, -0.2765734791755676, -0.25029462575912476, -0.22401580214500427, -0.1977369636297226, -0.17145812511444092, -0.14517928659915924, -0.11890044808387756, -0.09262160956859589, -0.06634277105331421, -0.04006393253803253, -0.013785094022750854, 0.012493744492530823, 0.0387725830078125, 0.06505142152309418, 0.09133026003837585, 0.11760909855365753, 0.1438879370689392, 0.1701667755842209, 0.19644561409950256, 0.22272445261478424, 0.24900329113006592, 0.2752821445465088, 0.3015609681606293, 0.32783979177474976, 0.3541186451911926, 0.3803974986076355, 0.406676322221756, 0.43295514583587646, 0.45923399925231934, 0.4855128526687622, 0.5117917060852051, 0.5380704998970032, 0.564349353313446]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 3.0, 3.0, 6.0, 6.0, 7.0, 4.0, 10.0, 18.0, 12.0, 4.0, 22.0, 19.0, 25.0, 19.0, 24.0, 26.0, 25.0, 31.0, 30.0, 43.0, 45.0, 48.0, 35.0, 41.0, 34.0, 45.0, 47.0, 30.0, 36.0, 35.0, 26.0, 35.0, 24.0, 28.0, 14.0, 29.0, 13.0, 21.0, 14.0, 16.0, 12.0, 10.0, 4.0, 8.0, 4.0, 2.0, 1.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.6893699169158936, -0.6683332324028015, -0.6472965478897095, -0.6262598633766174, -0.6052231788635254, -0.5841864943504333, -0.5631498098373413, -0.5421131253242493, -0.5210764408111572, -0.5000397562980652, -0.47900307178497314, -0.4579663872718811, -0.43692970275878906, -0.415893018245697, -0.394856333732605, -0.37381964921951294, -0.3527829647064209, -0.33174628019332886, -0.3107095956802368, -0.2896729111671448, -0.26863622665405273, -0.2475995421409607, -0.22656285762786865, -0.2055261731147766, -0.18448948860168457, -0.16345280408859253, -0.1424161195755005, -0.12137943506240845, -0.1003427505493164, -0.07930606603622437, -0.058269381523132324, -0.03723269701004028, -0.016196012496948242, 0.004840672016143799, 0.02587735652923584, 0.04691404104232788, 0.06795072555541992, 0.08898741006851196, 0.110024094581604, 0.13106077909469604, 0.15209746360778809, 0.17313414812088013, 0.19417083263397217, 0.2152075171470642, 0.23624420166015625, 0.2572808861732483, 0.27831757068634033, 0.2993542551994324, 0.3203909397125244, 0.34142762422561646, 0.3624643087387085, 0.38350099325180054, 0.4045376777648926, 0.4255743622779846, 0.44661104679107666, 0.4676477313041687, 0.48868441581726074, 0.5097211003303528, 0.5307577848434448, 0.5517944693565369, 0.5728311538696289, 0.593867838382721, 0.614904522895813, 0.635941207408905, 0.6569778919219971]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 6.0, 7.0, 8.0, 7.0, 16.0, 19.0, 25.0, 47.0, 93.0, 147.0, 291.0, 552.0, 1062.0, 2215.0, 4594.0, 9498.0, 19364.0, 38873.0, 80436.0, 177698.0, 296413.0, 219781.0, 102207.0, 48297.0, 23570.0, 11834.0, 5833.0, 2776.0, 1384.0, 699.0, 346.0, 188.0, 101.0, 64.0, 38.0, 29.0, 13.0, 13.0, 9.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.291015625, -0.2823677062988281, -0.27371978759765625, -0.2650718688964844, -0.2564239501953125, -0.24777603149414062, -0.23912811279296875, -0.23048019409179688, -0.221832275390625, -0.21318435668945312, -0.20453643798828125, -0.19588851928710938, -0.1872406005859375, -0.17859268188476562, -0.16994476318359375, -0.16129684448242188, -0.15264892578125, -0.14400100708007812, -0.13535308837890625, -0.12670516967773438, -0.1180572509765625, -0.10940933227539062, -0.10076141357421875, -0.09211349487304688, -0.083465576171875, -0.07481765747070312, -0.06616973876953125, -0.057521820068359375, -0.0488739013671875, -0.040225982666015625, -0.03157806396484375, -0.022930145263671875, -0.0142822265625, -0.005634307861328125, 0.00301361083984375, 0.011661529541015625, 0.0203094482421875, 0.028957366943359375, 0.03760528564453125, 0.046253204345703125, 0.054901123046875, 0.06354904174804688, 0.07219696044921875, 0.08084487915039062, 0.0894927978515625, 0.09814071655273438, 0.10678863525390625, 0.11543655395507812, 0.12408447265625, 0.13273239135742188, 0.14138031005859375, 0.15002822875976562, 0.1586761474609375, 0.16732406616210938, 0.17597198486328125, 0.18461990356445312, 0.193267822265625, 0.20191574096679688, 0.21056365966796875, 0.21921157836914062, 0.2278594970703125, 0.23650741577148438, 0.24515533447265625, 0.2538032531738281, 0.262451171875]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 3.0, 11.0, 13.0, 13.0, 21.0, 18.0, 28.0, 37.0, 34.0, 49.0, 44.0, 54.0, 53.0, 62.0, 61.0, 59.0, 64.0, 52.0, 62.0, 46.0, 42.0, 28.0, 40.0, 20.0, 20.0, 20.0, 13.0, 11.0, 9.0, 5.0, 1.0, 1.0, 6.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12939453125, -0.12457466125488281, -0.11975479125976562, -0.11493492126464844, -0.11011505126953125, -0.10529518127441406, -0.10047531127929688, -0.09565544128417969, -0.0908355712890625, -0.08601570129394531, -0.08119583129882812, -0.07637596130371094, -0.07155609130859375, -0.06673622131347656, -0.061916351318359375, -0.05709648132324219, -0.052276611328125, -0.04745674133300781, -0.042636871337890625, -0.03781700134277344, -0.03299713134765625, -0.028177261352539062, -0.023357391357421875, -0.018537521362304688, -0.0137176513671875, -0.008897781372070312, -0.004077911376953125, 0.0007419586181640625, 0.00556182861328125, 0.010381698608398438, 0.015201568603515625, 0.020021438598632812, 0.02484130859375, 0.029661178588867188, 0.034481048583984375, 0.03930091857910156, 0.04412078857421875, 0.04894065856933594, 0.053760528564453125, 0.05858039855957031, 0.0634002685546875, 0.06822013854980469, 0.07304000854492188, 0.07785987854003906, 0.08267974853515625, 0.08749961853027344, 0.09231948852539062, 0.09713935852050781, 0.101959228515625, 0.10677909851074219, 0.11159896850585938, 0.11641883850097656, 0.12123870849609375, 0.12605857849121094, 0.13087844848632812, 0.1356983184814453, 0.1405181884765625, 0.1453380584716797, 0.15015792846679688, 0.15497779846191406, 0.15979766845703125, 0.16461753845214844, 0.16943740844726562, 0.1742572784423828, 0.1790771484375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 6.0, 7.0, 8.0, 14.0, 10.0, 20.0, 27.0, 36.0, 55.0, 71.0, 106.0, 195.0, 368.0, 883.0, 2136.0, 5941.0, 16294.0, 43538.0, 122628.0, 336837.0, 331352.0, 119754.0, 42628.0, 15605.0, 5982.0, 2195.0, 854.0, 417.0, 202.0, 114.0, 83.0, 49.0, 29.0, 28.0, 18.0, 19.0, 12.0, 5.0, 7.0, 1.0, 3.0, 4.0, 3.0, 4.0, 5.0, 0.0, 0.0, 3.0, 1.0, 1.0], "bins": [-0.39208984375, -0.38055419921875, -0.3690185546875, -0.35748291015625, -0.345947265625, -0.33441162109375, -0.3228759765625, -0.31134033203125, -0.2998046875, -0.28826904296875, -0.2767333984375, -0.26519775390625, -0.253662109375, -0.24212646484375, -0.2305908203125, -0.21905517578125, -0.20751953125, -0.19598388671875, -0.1844482421875, -0.17291259765625, -0.161376953125, -0.14984130859375, -0.1383056640625, -0.12677001953125, -0.115234375, -0.10369873046875, -0.0921630859375, -0.08062744140625, -0.069091796875, -0.05755615234375, -0.0460205078125, -0.03448486328125, -0.02294921875, -0.01141357421875, 0.0001220703125, 0.01165771484375, 0.023193359375, 0.03472900390625, 0.0462646484375, 0.05780029296875, 0.0693359375, 0.08087158203125, 0.0924072265625, 0.10394287109375, 0.115478515625, 0.12701416015625, 0.1385498046875, 0.15008544921875, 0.16162109375, 0.17315673828125, 0.1846923828125, 0.19622802734375, 0.207763671875, 0.21929931640625, 0.2308349609375, 0.24237060546875, 0.25390625, 0.26544189453125, 0.2769775390625, 0.28851318359375, 0.300048828125, 0.31158447265625, 0.3231201171875, 0.33465576171875, 0.34619140625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 5.0, 3.0, 2.0, 5.0, 6.0, 13.0, 6.0, 5.0, 11.0, 10.0, 17.0, 18.0, 28.0, 19.0, 35.0, 35.0, 32.0, 43.0, 34.0, 24.0, 39.0, 49.0, 38.0, 51.0, 43.0, 51.0, 49.0, 49.0, 30.0, 22.0, 35.0, 33.0, 28.0, 20.0, 26.0, 11.0, 14.0, 18.0, 8.0, 12.0, 6.0, 7.0, 7.0, 6.0, 5.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.3193359375, -0.3073005676269531, -0.29526519775390625, -0.2832298278808594, -0.2711944580078125, -0.2591590881347656, -0.24712371826171875, -0.23508834838867188, -0.223052978515625, -0.21101760864257812, -0.19898223876953125, -0.18694686889648438, -0.1749114990234375, -0.16287612915039062, -0.15084075927734375, -0.13880538940429688, -0.12677001953125, -0.11473464965820312, -0.10269927978515625, -0.09066390991210938, -0.0786285400390625, -0.06659317016601562, -0.05455780029296875, -0.042522430419921875, -0.030487060546875, -0.018451690673828125, -0.00641632080078125, 0.005619049072265625, 0.0176544189453125, 0.029689788818359375, 0.04172515869140625, 0.053760528564453125, 0.0657958984375, 0.07783126831054688, 0.08986663818359375, 0.10190200805664062, 0.1139373779296875, 0.12597274780273438, 0.13800811767578125, 0.15004348754882812, 0.162078857421875, 0.17411422729492188, 0.18614959716796875, 0.19818496704101562, 0.2102203369140625, 0.22225570678710938, 0.23429107666015625, 0.24632644653320312, 0.25836181640625, 0.2703971862792969, 0.28243255615234375, 0.2944679260253906, 0.3065032958984375, 0.3185386657714844, 0.33057403564453125, 0.3426094055175781, 0.354644775390625, 0.3666801452636719, 0.37871551513671875, 0.3907508850097656, 0.4027862548828125, 0.4148216247558594, 0.42685699462890625, 0.4388923645019531, 0.450927734375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 5.0, 12.0, 8.0, 12.0, 25.0, 25.0, 45.0, 73.0, 101.0, 128.0, 258.0, 418.0, 782.0, 1311.0, 2476.0, 4556.0, 8872.0, 16986.0, 33287.0, 66466.0, 136451.0, 240126.0, 247059.0, 145160.0, 70506.0, 35298.0, 17924.0, 9183.0, 4919.0, 2603.0, 1424.0, 795.0, 488.0, 259.0, 174.0, 111.0, 86.0, 46.0, 39.0, 16.0, 19.0, 9.0, 5.0, 3.0, 5.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1190185546875, -0.11505699157714844, -0.11109542846679688, -0.10713386535644531, -0.10317230224609375, -0.09921073913574219, -0.09524917602539062, -0.09128761291503906, -0.0873260498046875, -0.08336448669433594, -0.07940292358398438, -0.07544136047363281, -0.07147979736328125, -0.06751823425292969, -0.06355667114257812, -0.05959510803222656, -0.055633544921875, -0.05167198181152344, -0.047710418701171875, -0.04374885559082031, -0.03978729248046875, -0.03582572937011719, -0.031864166259765625, -0.027902603149414062, -0.0239410400390625, -0.019979476928710938, -0.016017913818359375, -0.012056350708007812, -0.00809478759765625, -0.0041332244873046875, -0.000171661376953125, 0.0037899017333984375, 0.00775146484375, 0.011713027954101562, 0.015674591064453125, 0.019636154174804688, 0.02359771728515625, 0.027559280395507812, 0.031520843505859375, 0.03548240661621094, 0.0394439697265625, 0.04340553283691406, 0.047367095947265625, 0.05132865905761719, 0.05529022216796875, 0.05925178527832031, 0.06321334838867188, 0.06717491149902344, 0.071136474609375, 0.07509803771972656, 0.07905960083007812, 0.08302116394042969, 0.08698272705078125, 0.09094429016113281, 0.09490585327148438, 0.09886741638183594, 0.1028289794921875, 0.10679054260253906, 0.11075210571289062, 0.11471366882324219, 0.11867523193359375, 0.12263679504394531, 0.12659835815429688, 0.13055992126464844, 0.134521484375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 0.0, 2.0, 2.0, 6.0, 9.0, 6.0, 7.0, 4.0, 5.0, 8.0, 10.0, 14.0, 21.0, 25.0, 27.0, 28.0, 30.0, 43.0, 43.0, 71.0, 58.0, 64.0, 67.0, 77.0, 52.0, 41.0, 49.0, 46.0, 35.0, 34.0, 27.0, 23.0, 11.0, 12.0, 11.0, 10.0, 2.0, 8.0, 6.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.147125244140625e-05, -3.052130341529846e-05, -2.9571354389190674e-05, -2.8621405363082886e-05, -2.7671456336975098e-05, -2.672150731086731e-05, -2.577155828475952e-05, -2.4821609258651733e-05, -2.3871660232543945e-05, -2.2921711206436157e-05, -2.197176218032837e-05, -2.102181315422058e-05, -2.0071864128112793e-05, -1.9121915102005005e-05, -1.8171966075897217e-05, -1.722201704978943e-05, -1.627206802368164e-05, -1.5322118997573853e-05, -1.4372169971466064e-05, -1.3422220945358276e-05, -1.2472271919250488e-05, -1.15223228931427e-05, -1.0572373867034912e-05, -9.622424840927124e-06, -8.672475814819336e-06, -7.722526788711548e-06, -6.77257776260376e-06, -5.822628736495972e-06, -4.872679710388184e-06, -3.9227306842803955e-06, -2.9727816581726074e-06, -2.0228326320648193e-06, -1.0728836059570312e-06, -1.2293457984924316e-07, 8.270144462585449e-07, 1.776963472366333e-06, 2.726912498474121e-06, 3.676861524581909e-06, 4.626810550689697e-06, 5.576759576797485e-06, 6.5267086029052734e-06, 7.4766576290130615e-06, 8.42660665512085e-06, 9.376555681228638e-06, 1.0326504707336426e-05, 1.1276453733444214e-05, 1.2226402759552002e-05, 1.317635178565979e-05, 1.4126300811767578e-05, 1.5076249837875366e-05, 1.6026198863983154e-05, 1.6976147890090942e-05, 1.792609691619873e-05, 1.887604594230652e-05, 1.9825994968414307e-05, 2.0775943994522095e-05, 2.1725893020629883e-05, 2.267584204673767e-05, 2.362579107284546e-05, 2.4575740098953247e-05, 2.5525689125061035e-05, 2.6475638151168823e-05, 2.742558717727661e-05, 2.83755362033844e-05, 2.9325485229492188e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 2.0, 1.0, 5.0, 5.0, 2.0, 3.0, 2.0, 9.0, 9.0, 12.0, 14.0, 27.0, 32.0, 35.0, 47.0, 67.0, 133.0, 189.0, 294.0, 519.0, 888.0, 1624.0, 3194.0, 6256.0, 12556.0, 25296.0, 51724.0, 108022.0, 215339.0, 273675.0, 178650.0, 85947.0, 41958.0, 20856.0, 10190.0, 5035.0, 2619.0, 1450.0, 764.0, 402.0, 248.0, 155.0, 95.0, 64.0, 31.0, 29.0, 23.0, 10.0, 8.0, 13.0, 8.0, 4.0, 13.0, 4.0, 1.0, 5.0, 0.0, 3.0, 2.0, 0.0, 3.0], "bins": [-0.1273193359375, -0.1233835220336914, -0.11944770812988281, -0.11551189422607422, -0.11157608032226562, -0.10764026641845703, -0.10370445251464844, -0.09976863861083984, -0.09583282470703125, -0.09189701080322266, -0.08796119689941406, -0.08402538299560547, -0.08008956909179688, -0.07615375518798828, -0.07221794128417969, -0.0682821273803711, -0.0643463134765625, -0.060410499572753906, -0.05647468566894531, -0.05253887176513672, -0.048603057861328125, -0.04466724395751953, -0.04073143005371094, -0.036795616149902344, -0.03285980224609375, -0.028923988342285156, -0.024988174438476562, -0.02105236053466797, -0.017116546630859375, -0.013180732727050781, -0.009244918823242188, -0.005309104919433594, -0.001373291015625, 0.0025625228881835938, 0.0064983367919921875, 0.010434150695800781, 0.014369964599609375, 0.01830577850341797, 0.022241592407226562, 0.026177406311035156, 0.03011322021484375, 0.034049034118652344, 0.03798484802246094, 0.04192066192626953, 0.045856475830078125, 0.04979228973388672, 0.05372810363769531, 0.057663917541503906, 0.0615997314453125, 0.0655355453491211, 0.06947135925292969, 0.07340717315673828, 0.07734298706054688, 0.08127880096435547, 0.08521461486816406, 0.08915042877197266, 0.09308624267578125, 0.09702205657958984, 0.10095787048339844, 0.10489368438720703, 0.10882949829101562, 0.11276531219482422, 0.11670112609863281, 0.1206369400024414, 0.12457275390625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 1.0, 7.0, 8.0, 14.0, 17.0, 20.0, 19.0, 37.0, 37.0, 46.0, 57.0, 57.0, 73.0, 89.0, 77.0, 81.0, 75.0, 63.0, 54.0, 27.0, 32.0, 26.0, 18.0, 23.0, 9.0, 5.0, 5.0, 5.0, 8.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16357421875, -0.1584930419921875, -0.153411865234375, -0.1483306884765625, -0.14324951171875, -0.1381683349609375, -0.133087158203125, -0.1280059814453125, -0.1229248046875, -0.1178436279296875, -0.112762451171875, -0.1076812744140625, -0.10260009765625, -0.0975189208984375, -0.092437744140625, -0.0873565673828125, -0.082275390625, -0.0771942138671875, -0.072113037109375, -0.0670318603515625, -0.06195068359375, -0.0568695068359375, -0.051788330078125, -0.0467071533203125, -0.0416259765625, -0.0365447998046875, -0.031463623046875, -0.0263824462890625, -0.02130126953125, -0.0162200927734375, -0.011138916015625, -0.0060577392578125, -0.0009765625, 0.0041046142578125, 0.009185791015625, 0.0142669677734375, 0.01934814453125, 0.0244293212890625, 0.029510498046875, 0.0345916748046875, 0.0396728515625, 0.0447540283203125, 0.049835205078125, 0.0549163818359375, 0.05999755859375, 0.0650787353515625, 0.070159912109375, 0.0752410888671875, 0.080322265625, 0.0854034423828125, 0.090484619140625, 0.0955657958984375, 0.10064697265625, 0.1057281494140625, 0.110809326171875, 0.1158905029296875, 0.1209716796875, 0.1260528564453125, 0.131134033203125, 0.1362152099609375, 0.14129638671875, 0.1463775634765625, 0.151458740234375, 0.1565399169921875, 0.16162109375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 16.0, 19.0, 22.0, 25.0, 34.0, 42.0, 60.0, 52.0, 84.0, 93.0, 76.0, 87.0, 84.0, 61.0, 65.0, 50.0, 40.0, 30.0, 23.0, 15.0, 8.0, 10.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5658867359161377, -1.5251084566116333, -1.4843300580978394, -1.443551778793335, -1.4027734994888306, -1.3619952201843262, -1.3212168216705322, -1.2804385423660278, -1.2396602630615234, -1.198881983757019, -1.158103585243225, -1.1173253059387207, -1.0765470266342163, -1.035768747329712, -0.994990348815918, -0.9542120695114136, -0.9134336709976196, -0.8726553320884705, -0.8318770527839661, -0.7910987138748169, -0.7503204345703125, -0.7095420956611633, -0.6687637567520142, -0.6279854774475098, -0.5872071385383606, -0.5464287996292114, -0.505650520324707, -0.46487218141555786, -0.4240938723087311, -0.3833155632019043, -0.3425372242927551, -0.30175891518592834, -0.2609807252883911, -0.22020241618156433, -0.17942409217357635, -0.13864576816558838, -0.0978674590587616, -0.057089149951934814, -0.01631082594394684, 0.024467498064041138, 0.06524580717086792, 0.1060241237282753, 0.14680244028568268, 0.18758076429367065, 0.22835907340049744, 0.2691373825073242, 0.3099157214164734, 0.35069403052330017, 0.39147233963012695, 0.43225064873695374, 0.4730289578437805, 0.5138072967529297, 0.5545855760574341, 0.5953639149665833, 0.6361422538757324, 0.6769205331802368, 0.717698872089386, 0.7584772109985352, 0.7992554903030396, 0.8400338292121887, 0.8808121681213379, 0.9215904474258423, 0.9623687863349915, 1.0031471252441406, 1.043925404548645]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 5.0, 4.0, 2.0, 4.0, 5.0, 9.0, 9.0, 10.0, 9.0, 19.0, 21.0, 17.0, 21.0, 29.0, 29.0, 21.0, 26.0, 39.0, 28.0, 32.0, 34.0, 34.0, 38.0, 37.0, 46.0, 28.0, 37.0, 35.0, 35.0, 30.0, 35.0, 22.0, 32.0, 24.0, 35.0, 20.0, 22.0, 25.0, 16.0, 16.0, 9.0, 10.0, 12.0, 10.0, 7.0, 6.0, 3.0, 1.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.9692829847335815, -0.9388770461082458, -0.9084711074829102, -0.8780651688575745, -0.8476592302322388, -0.8172532916069031, -0.7868473529815674, -0.7564414739608765, -0.726035475730896, -0.6956295371055603, -0.6652235984802246, -0.6348176598548889, -0.6044117212295532, -0.5740057826042175, -0.5435998439788818, -0.5131939649581909, -0.4827880263328552, -0.45238208770751953, -0.42197614908218384, -0.39157021045684814, -0.36116427183151245, -0.33075833320617676, -0.30035242438316345, -0.26994648575782776, -0.23954054713249207, -0.20913460850715637, -0.17872866988182068, -0.14832274615764618, -0.11791680753231049, -0.08751086890697479, -0.05710494518280029, -0.0266990065574646, 0.0037068724632263184, 0.03411280736327171, 0.06451874226331711, 0.0949246734380722, 0.1253306120634079, 0.1557365506887436, 0.1861424744129181, 0.21654841303825378, 0.24695435166358948, 0.27736029028892517, 0.30776622891426086, 0.33817213773727417, 0.36857807636260986, 0.39898401498794556, 0.42938995361328125, 0.45979589223861694, 0.49020183086395264, 0.5206077694892883, 0.551013708114624, 0.5814196467399597, 0.6118255853652954, 0.6422315239906311, 0.6726374626159668, 0.7030433416366577, 0.7334493398666382, 0.7638552784919739, 0.7942612171173096, 0.8246671557426453, 0.855073094367981, 0.8854790329933167, 0.9158849716186523, 0.9462908506393433, 0.976696789264679]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 1.0, 5.0, 3.0, 6.0, 11.0, 7.0, 13.0, 17.0, 29.0, 25.0, 31.0, 51.0, 69.0, 146.0, 356.0, 960.0, 3343.0, 15489.0, 89942.0, 699257.0, 2618165.0, 660612.0, 85479.0, 14832.0, 3542.0, 1090.0, 368.0, 146.0, 84.0, 55.0, 29.0, 23.0, 22.0, 14.0, 10.0, 10.0, 8.0, 11.0, 8.0, 5.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.259521484375, -0.2500801086425781, -0.24063873291015625, -0.23119735717773438, -0.2217559814453125, -0.21231460571289062, -0.20287322998046875, -0.19343185424804688, -0.183990478515625, -0.17454910278320312, -0.16510772705078125, -0.15566635131835938, -0.1462249755859375, -0.13678359985351562, -0.12734222412109375, -0.11790084838867188, -0.10845947265625, -0.09901809692382812, -0.08957672119140625, -0.08013534545898438, -0.0706939697265625, -0.061252593994140625, -0.05181121826171875, -0.042369842529296875, -0.032928466796875, -0.023487091064453125, -0.01404571533203125, -0.004604339599609375, 0.0048370361328125, 0.014278411865234375, 0.02371978759765625, 0.033161163330078125, 0.0426025390625, 0.052043914794921875, 0.06148529052734375, 0.07092666625976562, 0.0803680419921875, 0.08980941772460938, 0.09925079345703125, 0.10869216918945312, 0.118133544921875, 0.12757492065429688, 0.13701629638671875, 0.14645767211914062, 0.1558990478515625, 0.16534042358398438, 0.17478179931640625, 0.18422317504882812, 0.19366455078125, 0.20310592651367188, 0.21254730224609375, 0.22198867797851562, 0.2314300537109375, 0.24087142944335938, 0.25031280517578125, 0.2597541809082031, 0.269195556640625, 0.2786369323730469, 0.28807830810546875, 0.2975196838378906, 0.3069610595703125, 0.3164024353027344, 0.32584381103515625, 0.3352851867675781, 0.3447265625]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 6.0, 2.0, 10.0, 2.0, 9.0, 10.0, 9.0, 13.0, 21.0, 20.0, 23.0, 20.0, 34.0, 33.0, 47.0, 49.0, 39.0, 51.0, 49.0, 54.0, 58.0, 43.0, 58.0, 38.0, 38.0, 36.0, 41.0, 25.0, 29.0, 20.0, 27.0, 18.0, 16.0, 13.0, 11.0, 8.0, 9.0, 6.0, 4.0, 2.0, 7.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.123046875, -0.11855316162109375, -0.1140594482421875, -0.10956573486328125, -0.105072021484375, -0.10057830810546875, -0.0960845947265625, -0.09159088134765625, -0.08709716796875, -0.08260345458984375, -0.0781097412109375, -0.07361602783203125, -0.069122314453125, -0.06462860107421875, -0.0601348876953125, -0.05564117431640625, -0.0511474609375, -0.04665374755859375, -0.0421600341796875, -0.03766632080078125, -0.033172607421875, -0.02867889404296875, -0.0241851806640625, -0.01969146728515625, -0.01519775390625, -0.01070404052734375, -0.0062103271484375, -0.00171661376953125, 0.002777099609375, 0.00727081298828125, 0.0117645263671875, 0.01625823974609375, 0.020751953125, 0.02524566650390625, 0.0297393798828125, 0.03423309326171875, 0.038726806640625, 0.04322052001953125, 0.0477142333984375, 0.05220794677734375, 0.05670166015625, 0.06119537353515625, 0.0656890869140625, 0.07018280029296875, 0.074676513671875, 0.07917022705078125, 0.0836639404296875, 0.08815765380859375, 0.0926513671875, 0.09714508056640625, 0.1016387939453125, 0.10613250732421875, 0.110626220703125, 0.11511993408203125, 0.1196136474609375, 0.12410736083984375, 0.12860107421875, 0.13309478759765625, 0.1375885009765625, 0.14208221435546875, 0.146575927734375, 0.15106964111328125, 0.1555633544921875, 0.16005706787109375, 0.16455078125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 4.0, 17.0, 12.0, 20.0, 28.0, 40.0, 67.0, 103.0, 145.0, 265.0, 387.0, 686.0, 1186.0, 2047.0, 3795.0, 7417.0, 14765.0, 32628.0, 76088.0, 191714.0, 501071.0, 1173643.0, 1257771.0, 560092.0, 216082.0, 84511.0, 35919.0, 16217.0, 7990.0, 4133.0, 2241.0, 1273.0, 702.0, 466.0, 269.0, 195.0, 97.0, 61.0, 41.0, 35.0, 25.0, 16.0, 7.0, 6.0, 3.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2159423828125, -0.20960235595703125, -0.2032623291015625, -0.19692230224609375, -0.190582275390625, -0.18424224853515625, -0.1779022216796875, -0.17156219482421875, -0.16522216796875, -0.15888214111328125, -0.1525421142578125, -0.14620208740234375, -0.139862060546875, -0.13352203369140625, -0.1271820068359375, -0.12084197998046875, -0.114501953125, -0.10816192626953125, -0.1018218994140625, -0.09548187255859375, -0.089141845703125, -0.08280181884765625, -0.0764617919921875, -0.07012176513671875, -0.06378173828125, -0.05744171142578125, -0.0511016845703125, -0.04476165771484375, -0.038421630859375, -0.03208160400390625, -0.0257415771484375, -0.01940155029296875, -0.0130615234375, -0.00672149658203125, -0.0003814697265625, 0.00595855712890625, 0.012298583984375, 0.01863861083984375, 0.0249786376953125, 0.03131866455078125, 0.03765869140625, 0.04399871826171875, 0.0503387451171875, 0.05667877197265625, 0.063018798828125, 0.06935882568359375, 0.0756988525390625, 0.08203887939453125, 0.08837890625, 0.09471893310546875, 0.1010589599609375, 0.10739898681640625, 0.113739013671875, 0.12007904052734375, 0.1264190673828125, 0.13275909423828125, 0.13909912109375, 0.14543914794921875, 0.1517791748046875, 0.15811920166015625, 0.164459228515625, 0.17079925537109375, 0.1771392822265625, 0.18347930908203125, 0.1898193359375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 5.0, 7.0, 9.0, 8.0, 25.0, 22.0, 27.0, 50.0, 60.0, 87.0, 132.0, 183.0, 222.0, 290.0, 356.0, 474.0, 460.0, 370.0, 312.0, 254.0, 180.0, 156.0, 102.0, 82.0, 53.0, 42.0, 22.0, 24.0, 7.0, 15.0, 10.0, 6.0, 6.0, 6.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.21435546875, -0.20700836181640625, -0.1996612548828125, -0.19231414794921875, -0.184967041015625, -0.17761993408203125, -0.1702728271484375, -0.16292572021484375, -0.15557861328125, -0.14823150634765625, -0.1408843994140625, -0.13353729248046875, -0.126190185546875, -0.11884307861328125, -0.1114959716796875, -0.10414886474609375, -0.0968017578125, -0.08945465087890625, -0.0821075439453125, -0.07476043701171875, -0.067413330078125, -0.06006622314453125, -0.0527191162109375, -0.04537200927734375, -0.03802490234375, -0.03067779541015625, -0.0233306884765625, -0.01598358154296875, -0.008636474609375, -0.00128936767578125, 0.0060577392578125, 0.01340484619140625, 0.020751953125, 0.02809906005859375, 0.0354461669921875, 0.04279327392578125, 0.050140380859375, 0.05748748779296875, 0.0648345947265625, 0.07218170166015625, 0.07952880859375, 0.08687591552734375, 0.0942230224609375, 0.10157012939453125, 0.108917236328125, 0.11626434326171875, 0.1236114501953125, 0.13095855712890625, 0.1383056640625, 0.14565277099609375, 0.1529998779296875, 0.16034698486328125, 0.167694091796875, 0.17504119873046875, 0.1823883056640625, 0.18973541259765625, 0.19708251953125, 0.20442962646484375, 0.2117767333984375, 0.21912384033203125, 0.226470947265625, 0.23381805419921875, 0.2411651611328125, 0.24851226806640625, 0.255859375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [6.0, 1.0, 17.0, 21.0, 40.0, 77.0, 101.0, 132.0, 128.0, 138.0, 117.0, 83.0, 79.0, 30.0, 30.0, 12.0, 5.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5251754522323608, -0.4611527919769287, -0.3971301317214966, -0.33310744166374207, -0.26908478140830994, -0.2050621211528778, -0.1410394310951233, -0.07701677083969116, -0.012994110584259033, 0.05102855712175369, 0.11505122482776642, 0.17907389998435974, 0.24309656023979187, 0.307119220495224, 0.3711419105529785, 0.43516457080841064, 0.4991872310638428, 0.5632098913192749, 0.627232551574707, 0.6912552118301392, 0.7552778720855713, 0.8193005323410034, 0.8833232522010803, 0.9473459124565125, 1.0113685131072998, 1.075391173362732, 1.139413833618164, 1.2034364938735962, 1.2674591541290283, 1.3314818143844604, 1.3955044746398926, 1.4595272541046143, 1.5235497951507568, 1.587572455406189, 1.651595115661621, 1.7156177759170532, 1.7796404361724854, 1.8436630964279175, 1.9076857566833496, 1.9717085361480713, 2.035731077194214, 2.0997538566589355, 2.163776397705078, 2.2277991771698, 2.2918217182159424, 2.355844497680664, 2.4198670387268066, 2.4838898181915283, 2.54791259765625, 2.6119353771209717, 2.6759579181671143, 2.739980697631836, 2.8040032386779785, 2.8680260181427, 2.9320485591888428, 2.9960713386535645, 3.060093879699707, 3.1241166591644287, 3.1881392002105713, 3.252161979675293, 3.3161845207214355, 3.3802073001861572, 3.4442298412323, 3.5082526206970215, 3.572275161743164]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 2.0, 7.0, 8.0, 7.0, 10.0, 13.0, 18.0, 23.0, 20.0, 28.0, 29.0, 22.0, 27.0, 23.0, 30.0, 43.0, 41.0, 32.0, 48.0, 41.0, 40.0, 32.0, 31.0, 53.0, 43.0, 33.0, 39.0, 29.0, 45.0, 37.0, 22.0, 16.0, 18.0, 20.0, 18.0, 15.0, 7.0, 9.0, 9.0, 8.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.882178783416748, -0.8557850122451782, -0.8293912410736084, -0.8029974699020386, -0.7766036987304688, -0.7502099275588989, -0.7238161563873291, -0.6974223256111145, -0.6710285544395447, -0.6446347832679749, -0.618241012096405, -0.5918472409248352, -0.5654534697532654, -0.5390596389770508, -0.512665867805481, -0.48627209663391113, -0.4598783552646637, -0.43348458409309387, -0.40709081292152405, -0.38069701194763184, -0.354303240776062, -0.3279094696044922, -0.30151569843292236, -0.27512192726135254, -0.24872814118862152, -0.2223343700170517, -0.19594058394432068, -0.16954681277275085, -0.14315304160118103, -0.11675925552845001, -0.09036548435688019, -0.06397169828414917, -0.037577927112579346, -0.011184150353074074, 0.015209626406431198, 0.04160340130329132, 0.06799717992544174, 0.09439095854759216, 0.12078472971916199, 0.147178515791893, 0.17357228696346283, 0.19996605813503265, 0.22635984420776367, 0.2527536153793335, 0.2791473865509033, 0.30554115772247314, 0.33193492889404297, 0.3583287298679352, 0.384722501039505, 0.41111627221107483, 0.43751004338264465, 0.46390384435653687, 0.4902976155281067, 0.5166913866996765, 0.5430851578712463, 0.5694789290428162, 0.595872700214386, 0.6222664713859558, 0.6486602425575256, 0.6750540137290955, 0.7014477849006653, 0.7278416156768799, 0.7542353868484497, 0.7806291580200195, 0.8070229291915894]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 3.0, 2.0, 7.0, 11.0, 25.0, 30.0, 93.0, 175.0, 407.0, 839.0, 1938.0, 3968.0, 8841.0, 19607.0, 43623.0, 115730.0, 324090.0, 329109.0, 118997.0, 44430.0, 19954.0, 8960.0, 4232.0, 1909.0, 855.0, 370.0, 165.0, 89.0, 34.0, 26.0, 17.0, 11.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.348876953125, -0.3394508361816406, -0.33002471923828125, -0.3205986022949219, -0.3111724853515625, -0.3017463684082031, -0.29232025146484375, -0.2828941345214844, -0.273468017578125, -0.2640419006347656, -0.25461578369140625, -0.24518966674804688, -0.2357635498046875, -0.22633743286132812, -0.21691131591796875, -0.20748519897460938, -0.19805908203125, -0.18863296508789062, -0.17920684814453125, -0.16978073120117188, -0.1603546142578125, -0.15092849731445312, -0.14150238037109375, -0.13207626342773438, -0.122650146484375, -0.11322402954101562, -0.10379791259765625, -0.09437179565429688, -0.0849456787109375, -0.07551956176757812, -0.06609344482421875, -0.056667327880859375, -0.0472412109375, -0.037815093994140625, -0.02838897705078125, -0.018962860107421875, -0.0095367431640625, -0.000110626220703125, 0.00931549072265625, 0.018741607666015625, 0.028167724609375, 0.037593841552734375, 0.04701995849609375, 0.056446075439453125, 0.0658721923828125, 0.07529830932617188, 0.08472442626953125, 0.09415054321289062, 0.10357666015625, 0.11300277709960938, 0.12242889404296875, 0.13185501098632812, 0.1412811279296875, 0.15070724487304688, 0.16013336181640625, 0.16955947875976562, 0.178985595703125, 0.18841171264648438, 0.19783782958984375, 0.20726394653320312, 0.2166900634765625, 0.22611618041992188, 0.23554229736328125, 0.24496841430664062, 0.25439453125]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 5.0, 3.0, 2.0, 9.0, 3.0, 7.0, 11.0, 7.0, 16.0, 22.0, 17.0, 20.0, 29.0, 28.0, 33.0, 34.0, 34.0, 38.0, 39.0, 45.0, 39.0, 44.0, 54.0, 40.0, 42.0, 43.0, 27.0, 40.0, 44.0, 31.0, 27.0, 20.0, 25.0, 19.0, 16.0, 13.0, 13.0, 18.0, 7.0, 13.0, 7.0, 3.0, 7.0, 2.0, 3.0, 1.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.125244140625, -0.12113571166992188, -0.11702728271484375, -0.11291885375976562, -0.1088104248046875, -0.10470199584960938, -0.10059356689453125, -0.09648513793945312, -0.092376708984375, -0.08826828002929688, -0.08415985107421875, -0.08005142211914062, -0.0759429931640625, -0.07183456420898438, -0.06772613525390625, -0.06361770629882812, -0.05950927734375, -0.055400848388671875, -0.05129241943359375, -0.047183990478515625, -0.0430755615234375, -0.038967132568359375, -0.03485870361328125, -0.030750274658203125, -0.026641845703125, -0.022533416748046875, -0.01842498779296875, -0.014316558837890625, -0.0102081298828125, -0.006099700927734375, -0.00199127197265625, 0.002117156982421875, 0.0062255859375, 0.010334014892578125, 0.01444244384765625, 0.018550872802734375, 0.0226593017578125, 0.026767730712890625, 0.03087615966796875, 0.034984588623046875, 0.039093017578125, 0.043201446533203125, 0.04730987548828125, 0.051418304443359375, 0.0555267333984375, 0.059635162353515625, 0.06374359130859375, 0.06785202026367188, 0.07196044921875, 0.07606887817382812, 0.08017730712890625, 0.08428573608398438, 0.0883941650390625, 0.09250259399414062, 0.09661102294921875, 0.10071945190429688, 0.104827880859375, 0.10893630981445312, 0.11304473876953125, 0.11715316772460938, 0.1212615966796875, 0.12537002563476562, 0.12947845458984375, 0.13358688354492188, 0.1376953125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 9.0, 7.0, 8.0, 4.0, 1.0, 12.0, 9.0, 31.0, 31.0, 59.0, 81.0, 137.0, 326.0, 827.0, 2489.0, 8006.0, 28059.0, 116046.0, 573711.0, 249985.0, 49168.0, 13253.0, 4054.0, 1319.0, 468.0, 183.0, 93.0, 42.0, 28.0, 22.0, 22.0, 13.0, 13.0, 6.0, 14.0, 5.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.505859375, -0.48938751220703125, -0.4729156494140625, -0.45644378662109375, -0.439971923828125, -0.42350006103515625, -0.4070281982421875, -0.39055633544921875, -0.37408447265625, -0.35761260986328125, -0.3411407470703125, -0.32466888427734375, -0.308197021484375, -0.29172515869140625, -0.2752532958984375, -0.25878143310546875, -0.2423095703125, -0.22583770751953125, -0.2093658447265625, -0.19289398193359375, -0.176422119140625, -0.15995025634765625, -0.1434783935546875, -0.12700653076171875, -0.11053466796875, -0.09406280517578125, -0.0775909423828125, -0.06111907958984375, -0.044647216796875, -0.02817535400390625, -0.0117034912109375, 0.00476837158203125, 0.021240234375, 0.03771209716796875, 0.0541839599609375, 0.07065582275390625, 0.087127685546875, 0.10359954833984375, 0.1200714111328125, 0.13654327392578125, 0.15301513671875, 0.16948699951171875, 0.1859588623046875, 0.20243072509765625, 0.218902587890625, 0.23537445068359375, 0.2518463134765625, 0.26831817626953125, 0.2847900390625, 0.30126190185546875, 0.3177337646484375, 0.33420562744140625, 0.350677490234375, 0.36714935302734375, 0.3836212158203125, 0.40009307861328125, 0.41656494140625, 0.43303680419921875, 0.4495086669921875, 0.46598052978515625, 0.482452392578125, 0.49892425537109375, 0.5153961181640625, 0.5318679809570312, 0.54833984375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 3.0, 4.0, 5.0, 4.0, 4.0, 12.0, 14.0, 20.0, 18.0, 26.0, 24.0, 26.0, 37.0, 42.0, 57.0, 56.0, 65.0, 66.0, 60.0, 65.0, 59.0, 57.0, 40.0, 55.0, 41.0, 30.0, 28.0, 26.0, 20.0, 6.0, 5.0, 14.0, 5.0, 5.0, 5.0, 0.0, 4.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62353515625, -0.6042022705078125, -0.584869384765625, -0.5655364990234375, -0.54620361328125, -0.5268707275390625, -0.507537841796875, -0.4882049560546875, -0.4688720703125, -0.4495391845703125, -0.430206298828125, -0.4108734130859375, -0.39154052734375, -0.3722076416015625, -0.352874755859375, -0.3335418701171875, -0.314208984375, -0.2948760986328125, -0.275543212890625, -0.2562103271484375, -0.23687744140625, -0.2175445556640625, -0.198211669921875, -0.1788787841796875, -0.1595458984375, -0.1402130126953125, -0.120880126953125, -0.1015472412109375, -0.08221435546875, -0.0628814697265625, -0.043548583984375, -0.0242156982421875, -0.0048828125, 0.0144500732421875, 0.033782958984375, 0.0531158447265625, 0.07244873046875, 0.0917816162109375, 0.111114501953125, 0.1304473876953125, 0.1497802734375, 0.1691131591796875, 0.188446044921875, 0.2077789306640625, 0.22711181640625, 0.2464447021484375, 0.265777587890625, 0.2851104736328125, 0.304443359375, 0.3237762451171875, 0.343109130859375, 0.3624420166015625, 0.38177490234375, 0.4011077880859375, 0.420440673828125, 0.4397735595703125, 0.4591064453125, 0.4784393310546875, 0.497772216796875, 0.5171051025390625, 0.53643798828125, 0.5557708740234375, 0.575103759765625, 0.5944366455078125, 0.61376953125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 6.0, 8.0, 7.0, 21.0, 24.0, 33.0, 72.0, 99.0, 132.0, 243.0, 357.0, 617.0, 1058.0, 1664.0, 2961.0, 5094.0, 9005.0, 16041.0, 28738.0, 59394.0, 148163.0, 346277.0, 246481.0, 91805.0, 40962.0, 20922.0, 12008.0, 6711.0, 3872.0, 2245.0, 1372.0, 845.0, 506.0, 275.0, 190.0, 125.0, 80.0, 55.0, 16.0, 26.0, 11.0, 17.0, 4.0, 6.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1669921875, -0.16204452514648438, -0.15709686279296875, -0.15214920043945312, -0.1472015380859375, -0.14225387573242188, -0.13730621337890625, -0.13235855102539062, -0.127410888671875, -0.12246322631835938, -0.11751556396484375, -0.11256790161132812, -0.1076202392578125, -0.10267257690429688, -0.09772491455078125, -0.09277725219726562, -0.08782958984375, -0.08288192749023438, -0.07793426513671875, -0.07298660278320312, -0.0680389404296875, -0.06309127807617188, -0.05814361572265625, -0.053195953369140625, -0.048248291015625, -0.043300628662109375, -0.03835296630859375, -0.033405303955078125, -0.0284576416015625, -0.023509979248046875, -0.01856231689453125, -0.013614654541015625, -0.0086669921875, -0.003719329833984375, 0.00122833251953125, 0.006175994873046875, 0.0111236572265625, 0.016071319580078125, 0.02101898193359375, 0.025966644287109375, 0.030914306640625, 0.035861968994140625, 0.04080963134765625, 0.045757293701171875, 0.0507049560546875, 0.055652618408203125, 0.06060028076171875, 0.06554794311523438, 0.07049560546875, 0.07544326782226562, 0.08039093017578125, 0.08533859252929688, 0.0902862548828125, 0.09523391723632812, 0.10018157958984375, 0.10512924194335938, 0.110076904296875, 0.11502456665039062, 0.11997222900390625, 0.12491989135742188, 0.1298675537109375, 0.13481521606445312, 0.13976287841796875, 0.14471054077148438, 0.149658203125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 5.0, 2.0, 5.0, 5.0, 12.0, 11.0, 12.0, 15.0, 16.0, 19.0, 25.0, 33.0, 48.0, 73.0, 89.0, 83.0, 102.0, 95.0, 78.0, 85.0, 45.0, 25.0, 23.0, 6.0, 7.0, 16.0, 10.0, 9.0, 4.0, 8.0, 8.0, 7.0, 4.0, 4.0, 1.0, 3.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.410743713378906e-05, -4.292838275432587e-05, -4.174932837486267e-05, -4.0570273995399475e-05, -3.939121961593628e-05, -3.8212165236473083e-05, -3.703311085700989e-05, -3.585405647754669e-05, -3.4675002098083496e-05, -3.34959477186203e-05, -3.2316893339157104e-05, -3.113783895969391e-05, -2.9958784580230713e-05, -2.8779730200767517e-05, -2.760067582130432e-05, -2.6421621441841125e-05, -2.524256706237793e-05, -2.4063512682914734e-05, -2.2884458303451538e-05, -2.1705403923988342e-05, -2.0526349544525146e-05, -1.934729516506195e-05, -1.8168240785598755e-05, -1.698918640613556e-05, -1.5810132026672363e-05, -1.4631077647209167e-05, -1.3452023267745972e-05, -1.2272968888282776e-05, -1.109391450881958e-05, -9.914860129356384e-06, -8.735805749893188e-06, -7.556751370429993e-06, -6.377696990966797e-06, -5.198642611503601e-06, -4.019588232040405e-06, -2.8405338525772095e-06, -1.6614794731140137e-06, -4.824250936508179e-07, 6.966292858123779e-07, 1.8756836652755737e-06, 3.0547380447387695e-06, 4.233792424201965e-06, 5.412846803665161e-06, 6.591901183128357e-06, 7.770955562591553e-06, 8.950009942054749e-06, 1.0129064321517944e-05, 1.130811870098114e-05, 1.2487173080444336e-05, 1.3666227459907532e-05, 1.4845281839370728e-05, 1.6024336218833923e-05, 1.720339059829712e-05, 1.8382444977760315e-05, 1.956149935722351e-05, 2.0740553736686707e-05, 2.1919608116149902e-05, 2.3098662495613098e-05, 2.4277716875076294e-05, 2.545677125453949e-05, 2.6635825634002686e-05, 2.781488001346588e-05, 2.8993934392929077e-05, 3.0172988772392273e-05, 3.135204315185547e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 6.0, 8.0, 13.0, 5.0, 16.0, 25.0, 53.0, 81.0, 156.0, 314.0, 723.0, 1571.0, 3635.0, 9256.0, 24229.0, 75119.0, 334349.0, 448221.0, 100434.0, 30859.0, 11351.0, 4454.0, 1947.0, 874.0, 433.0, 188.0, 92.0, 44.0, 31.0, 26.0, 15.0, 9.0, 6.0, 5.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.252685546875, -0.24456405639648438, -0.23644256591796875, -0.22832107543945312, -0.2201995849609375, -0.21207809448242188, -0.20395660400390625, -0.19583511352539062, -0.187713623046875, -0.17959213256835938, -0.17147064208984375, -0.16334915161132812, -0.1552276611328125, -0.14710617065429688, -0.13898468017578125, -0.13086318969726562, -0.12274169921875, -0.11462020874023438, -0.10649871826171875, -0.09837722778320312, -0.0902557373046875, -0.08213424682617188, -0.07401275634765625, -0.06589126586914062, -0.057769775390625, -0.049648284912109375, -0.04152679443359375, -0.033405303955078125, -0.0252838134765625, -0.017162322998046875, -0.00904083251953125, -0.000919342041015625, 0.0072021484375, 0.015323638916015625, 0.02344512939453125, 0.031566619873046875, 0.0396881103515625, 0.047809600830078125, 0.05593109130859375, 0.06405258178710938, 0.072174072265625, 0.08029556274414062, 0.08841705322265625, 0.09653854370117188, 0.1046600341796875, 0.11278152465820312, 0.12090301513671875, 0.12902450561523438, 0.13714599609375, 0.14526748657226562, 0.15338897705078125, 0.16151046752929688, 0.1696319580078125, 0.17775344848632812, 0.18587493896484375, 0.19399642944335938, 0.202117919921875, 0.21023941040039062, 0.21836090087890625, 0.22648239135742188, 0.2346038818359375, 0.24272537231445312, 0.25084686279296875, 0.2589683532714844, 0.26708984375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 5.0, 4.0, 7.0, 9.0, 6.0, 5.0, 9.0, 16.0, 21.0, 23.0, 33.0, 50.0, 65.0, 77.0, 109.0, 110.0, 103.0, 96.0, 52.0, 41.0, 32.0, 27.0, 19.0, 21.0, 18.0, 8.0, 4.0, 3.0, 3.0, 4.0, 4.0, 4.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.19873046875, -0.1926288604736328, -0.18652725219726562, -0.18042564392089844, -0.17432403564453125, -0.16822242736816406, -0.16212081909179688, -0.1560192108154297, -0.1499176025390625, -0.1438159942626953, -0.13771438598632812, -0.13161277770996094, -0.12551116943359375, -0.11940956115722656, -0.11330795288085938, -0.10720634460449219, -0.101104736328125, -0.09500312805175781, -0.08890151977539062, -0.08279991149902344, -0.07669830322265625, -0.07059669494628906, -0.06449508666992188, -0.05839347839355469, -0.0522918701171875, -0.04619026184082031, -0.040088653564453125, -0.03398704528808594, -0.02788543701171875, -0.021783828735351562, -0.015682220458984375, -0.009580612182617188, -0.00347900390625, 0.0026226043701171875, 0.008724212646484375, 0.014825820922851562, 0.02092742919921875, 0.027029037475585938, 0.033130645751953125, 0.03923225402832031, 0.0453338623046875, 0.05143547058105469, 0.057537078857421875, 0.06363868713378906, 0.06974029541015625, 0.07584190368652344, 0.08194351196289062, 0.08804512023925781, 0.094146728515625, 0.10024833679199219, 0.10634994506835938, 0.11245155334472656, 0.11855316162109375, 0.12465476989746094, 0.13075637817382812, 0.1368579864501953, 0.1429595947265625, 0.1490612030029297, 0.15516281127929688, 0.16126441955566406, 0.16736602783203125, 0.17346763610839844, 0.17956924438476562, 0.1856708526611328, 0.1917724609375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 7.0, 6.0, 15.0, 18.0, 29.0, 34.0, 54.0, 54.0, 68.0, 90.0, 88.0, 72.0, 90.0, 71.0, 77.0, 55.0, 52.0, 42.0, 28.0, 14.0, 14.0, 9.0, 8.0, 3.0, 4.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.4024068117141724, -1.3567535877227783, -1.3111002445220947, -1.2654470205307007, -1.2197937965393066, -1.174140453338623, -1.128487229347229, -1.082834005355835, -1.0371806621551514, -0.9915273785591125, -0.9458740949630737, -0.9002208709716797, -0.8545675873756409, -0.808914303779602, -0.763261079788208, -0.7176077961921692, -0.6719545125961304, -0.6263012290000916, -0.5806479454040527, -0.5349947214126587, -0.4893414378166199, -0.44368815422058105, -0.3980349004268646, -0.3523816466331482, -0.3067283630371094, -0.26107507944107056, -0.21542182564735413, -0.1697685569524765, -0.12411528825759888, -0.07846201956272125, -0.03280875086784363, 0.012844502925872803, 0.05849766731262207, 0.1041509360074997, 0.14980420470237732, 0.19545747339725494, 0.24111074209213257, 0.2867640256881714, 0.3324172794818878, 0.37807053327560425, 0.42372381687164307, 0.4693771004676819, 0.5150303840637207, 0.5606836080551147, 0.6063368916511536, 0.6519901752471924, 0.6976433992385864, 0.7432966828346252, 0.7889499664306641, 0.8346032500267029, 0.8802565336227417, 0.9259097576141357, 0.9715630412101746, 1.0172163248062134, 1.0628695487976074, 1.108522891998291, 1.154176115989685, 1.199829339981079, 1.2454826831817627, 1.2911359071731567, 1.3367891311645508, 1.3824424743652344, 1.4280956983566284, 1.4737489223480225, 1.519402265548706]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 5.0, 4.0, 3.0, 6.0, 4.0, 5.0, 8.0, 11.0, 9.0, 11.0, 20.0, 22.0, 32.0, 25.0, 22.0, 30.0, 43.0, 37.0, 29.0, 35.0, 25.0, 48.0, 39.0, 42.0, 35.0, 49.0, 37.0, 43.0, 40.0, 42.0, 28.0, 30.0, 28.0, 21.0, 25.0, 17.0, 21.0, 21.0, 10.0, 11.0, 9.0, 8.0, 5.0, 2.0, 5.0, 5.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1258656978607178, -1.0838481187820435, -1.0418305397033691, -0.9998130202293396, -0.9577955007553101, -0.9157779216766357, -0.8737603425979614, -0.8317427635192871, -0.7897252440452576, -0.7477076649665833, -0.7056901454925537, -0.6636725664138794, -0.6216549873352051, -0.5796374678611755, -0.5376198887825012, -0.4956023395061493, -0.45358479022979736, -0.41156724095344543, -0.3695496916770935, -0.3275321125984192, -0.28551456332206726, -0.24349701404571533, -0.20147943496704102, -0.1594618856906891, -0.11744433641433716, -0.07542677968740463, -0.03340922296047211, 0.008608341217041016, 0.050625890493392944, 0.09264343976974487, 0.1346610188484192, 0.17667856812477112, 0.21869611740112305, 0.260713666677475, 0.3027312159538269, 0.3447487950325012, 0.38676634430885315, 0.4287838935852051, 0.4708014726638794, 0.5128190517425537, 0.5548365712165833, 0.5968541502952576, 0.6388716697692871, 0.6808892488479614, 0.7229068279266357, 0.7649243474006653, 0.8069419264793396, 0.8489594459533691, 0.8909770250320435, 0.9329946041107178, 0.9750121235847473, 1.0170297622680664, 1.0590472221374512, 1.1010648012161255, 1.1430823802947998, 1.1850999593734741, 1.2271175384521484, 1.2691351175308228, 1.311152696609497, 1.3531701564788818, 1.3951877355575562, 1.4372053146362305, 1.4792228937149048, 1.521240472793579, 1.5632579326629639]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 5.0, 4.0, 9.0, 10.0, 8.0, 10.0, 10.0, 13.0, 26.0, 38.0, 36.0, 64.0, 79.0, 112.0, 235.0, 544.0, 1418.0, 4286.0, 14175.0, 58089.0, 288951.0, 1773895.0, 1695549.0, 280188.0, 56256.0, 13910.0, 3933.0, 1285.0, 485.0, 236.0, 137.0, 68.0, 41.0, 47.0, 29.0, 21.0, 16.0, 9.0, 13.0, 11.0, 7.0, 7.0, 4.0, 4.0, 5.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0], "bins": [-0.313720703125, -0.3042106628417969, -0.29470062255859375, -0.2851905822753906, -0.2756805419921875, -0.2661705017089844, -0.25666046142578125, -0.24715042114257812, -0.237640380859375, -0.22813034057617188, -0.21862030029296875, -0.20911026000976562, -0.1996002197265625, -0.19009017944335938, -0.18058013916015625, -0.17107009887695312, -0.16156005859375, -0.15205001831054688, -0.14253997802734375, -0.13302993774414062, -0.1235198974609375, -0.11400985717773438, -0.10449981689453125, -0.09498977661132812, -0.085479736328125, -0.07596969604492188, -0.06645965576171875, -0.056949615478515625, -0.0474395751953125, -0.037929534912109375, -0.02841949462890625, -0.018909454345703125, -0.0093994140625, 0.000110626220703125, 0.00962066650390625, 0.019130706787109375, 0.0286407470703125, 0.038150787353515625, 0.04766082763671875, 0.057170867919921875, 0.066680908203125, 0.07619094848632812, 0.08570098876953125, 0.09521102905273438, 0.1047210693359375, 0.11423110961914062, 0.12374114990234375, 0.13325119018554688, 0.14276123046875, 0.15227127075195312, 0.16178131103515625, 0.17129135131835938, 0.1808013916015625, 0.19031143188476562, 0.19982147216796875, 0.20933151245117188, 0.218841552734375, 0.22835159301757812, 0.23786163330078125, 0.24737167358398438, 0.2568817138671875, 0.2663917541503906, 0.27590179443359375, 0.2854118347167969, 0.294921875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 11.0, 5.0, 6.0, 11.0, 10.0, 13.0, 12.0, 13.0, 15.0, 21.0, 23.0, 26.0, 28.0, 27.0, 38.0, 28.0, 34.0, 41.0, 31.0, 48.0, 40.0, 42.0, 32.0, 45.0, 35.0, 33.0, 45.0, 34.0, 35.0, 26.0, 22.0, 36.0, 9.0, 15.0, 21.0, 20.0, 14.0, 13.0, 7.0, 5.0, 5.0, 5.0, 7.0, 5.0, 2.0, 5.0, 2.0, 0.0, 3.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.1309814453125, -0.12670516967773438, -0.12242889404296875, -0.11815261840820312, -0.1138763427734375, -0.10960006713867188, -0.10532379150390625, -0.10104751586914062, -0.096771240234375, -0.09249496459960938, -0.08821868896484375, -0.08394241333007812, -0.0796661376953125, -0.07538986206054688, -0.07111358642578125, -0.06683731079101562, -0.06256103515625, -0.058284759521484375, -0.05400848388671875, -0.049732208251953125, -0.0454559326171875, -0.041179656982421875, -0.03690338134765625, -0.032627105712890625, -0.028350830078125, -0.024074554443359375, -0.01979827880859375, -0.015522003173828125, -0.0112457275390625, -0.006969451904296875, -0.00269317626953125, 0.001583099365234375, 0.005859375, 0.010135650634765625, 0.01441192626953125, 0.018688201904296875, 0.0229644775390625, 0.027240753173828125, 0.03151702880859375, 0.035793304443359375, 0.040069580078125, 0.044345855712890625, 0.04862213134765625, 0.052898406982421875, 0.0571746826171875, 0.061450958251953125, 0.06572723388671875, 0.07000350952148438, 0.07427978515625, 0.07855606079101562, 0.08283233642578125, 0.08710861206054688, 0.0913848876953125, 0.09566116333007812, 0.09993743896484375, 0.10421371459960938, 0.108489990234375, 0.11276626586914062, 0.11704254150390625, 0.12131881713867188, 0.1255950927734375, 0.12987136840820312, 0.13414764404296875, 0.13842391967773438, 0.1427001953125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 5.0, 5.0, 16.0, 18.0, 17.0, 33.0, 29.0, 66.0, 100.0, 126.0, 202.0, 290.0, 474.0, 713.0, 1143.0, 1886.0, 3356.0, 6465.0, 13716.0, 31633.0, 82927.0, 233985.0, 693349.0, 1656241.0, 955660.0, 322932.0, 111677.0, 41924.0, 17434.0, 7946.0, 4126.0, 2174.0, 1283.0, 809.0, 488.0, 331.0, 234.0, 133.0, 95.0, 86.0, 51.0, 40.0, 22.0, 14.0, 6.0, 11.0, 10.0, 5.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.30078125, -0.2915687561035156, -0.28235626220703125, -0.2731437683105469, -0.2639312744140625, -0.2547187805175781, -0.24550628662109375, -0.23629379272460938, -0.227081298828125, -0.21786880493164062, -0.20865631103515625, -0.19944381713867188, -0.1902313232421875, -0.18101882934570312, -0.17180633544921875, -0.16259384155273438, -0.15338134765625, -0.14416885375976562, -0.13495635986328125, -0.12574386596679688, -0.1165313720703125, -0.10731887817382812, -0.09810638427734375, -0.08889389038085938, -0.079681396484375, -0.07046890258789062, -0.06125640869140625, -0.052043914794921875, -0.0428314208984375, -0.033618927001953125, -0.02440643310546875, -0.015193939208984375, -0.0059814453125, 0.003231048583984375, 0.01244354248046875, 0.021656036376953125, 0.0308685302734375, 0.040081024169921875, 0.04929351806640625, 0.058506011962890625, 0.067718505859375, 0.07693099975585938, 0.08614349365234375, 0.09535598754882812, 0.1045684814453125, 0.11378097534179688, 0.12299346923828125, 0.13220596313476562, 0.14141845703125, 0.15063095092773438, 0.15984344482421875, 0.16905593872070312, 0.1782684326171875, 0.18748092651367188, 0.19669342041015625, 0.20590591430664062, 0.215118408203125, 0.22433090209960938, 0.23354339599609375, 0.24275588989257812, 0.2519683837890625, 0.2611808776855469, 0.27039337158203125, 0.2796058654785156, 0.288818359375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 5.0, 5.0, 9.0, 25.0, 25.0, 27.0, 37.0, 53.0, 84.0, 114.0, 150.0, 231.0, 300.0, 422.0, 561.0, 474.0, 425.0, 311.0, 259.0, 164.0, 117.0, 80.0, 58.0, 42.0, 29.0, 20.0, 10.0, 8.0, 3.0, 3.0, 6.0, 5.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.289794921875, -0.2807655334472656, -0.27173614501953125, -0.2627067565917969, -0.2536773681640625, -0.24464797973632812, -0.23561859130859375, -0.22658920288085938, -0.217559814453125, -0.20853042602539062, -0.19950103759765625, -0.19047164916992188, -0.1814422607421875, -0.17241287231445312, -0.16338348388671875, -0.15435409545898438, -0.14532470703125, -0.13629531860351562, -0.12726593017578125, -0.11823654174804688, -0.1092071533203125, -0.10017776489257812, -0.09114837646484375, -0.08211898803710938, -0.073089599609375, -0.06406021118164062, -0.05503082275390625, -0.046001434326171875, -0.0369720458984375, -0.027942657470703125, -0.01891326904296875, -0.009883880615234375, -0.0008544921875, 0.008174896240234375, 0.01720428466796875, 0.026233673095703125, 0.0352630615234375, 0.044292449951171875, 0.05332183837890625, 0.062351226806640625, 0.071380615234375, 0.08041000366210938, 0.08943939208984375, 0.09846878051757812, 0.1074981689453125, 0.11652755737304688, 0.12555694580078125, 0.13458633422851562, 0.14361572265625, 0.15264511108398438, 0.16167449951171875, 0.17070388793945312, 0.1797332763671875, 0.18876266479492188, 0.19779205322265625, 0.20682144165039062, 0.215850830078125, 0.22488021850585938, 0.23390960693359375, 0.24293899536132812, 0.2519683837890625, 0.2609977722167969, 0.27002716064453125, 0.2790565490722656, 0.2880859375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 10.0, 24.0, 56.0, 81.0, 131.0, 197.0, 193.0, 153.0, 87.0, 47.0, 19.0, 6.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8189446926116943, -1.7262909412384033, -1.6336370706558228, -1.5409832000732422, -1.4483294486999512, -1.3556756973266602, -1.2630218267440796, -1.170367956161499, -1.077714204788208, -0.9850603938102722, -0.8924065828323364, -0.7997527718544006, -0.7070989608764648, -0.614445149898529, -0.5217913389205933, -0.42913752794265747, -0.3364837169647217, -0.2438299059867859, -0.1511760950088501, -0.05852228403091431, 0.034131526947021484, 0.12678533792495728, 0.21943914890289307, 0.31209295988082886, 0.40474677085876465, 0.49740058183670044, 0.5900543928146362, 0.682708203792572, 0.7753620147705078, 0.8680158257484436, 0.9606696367263794, 1.05332350730896, 1.1459770202636719, 1.238630771636963, 1.3312846422195435, 1.423938512802124, 1.516592264175415, 1.609246015548706, 1.7018998861312866, 1.7945537567138672, 1.8872075080871582, 1.9798612594604492, 2.0725150108337402, 2.1651690006256104, 2.2578227519989014, 2.3504765033721924, 2.4431304931640625, 2.5357842445373535, 2.6284379959106445, 2.7210917472839355, 2.8137454986572266, 2.9063994884490967, 2.9990532398223877, 3.0917069911956787, 3.184360980987549, 3.27701473236084, 3.369668483734131, 3.462322235107422, 3.554975986480713, 3.647629976272583, 3.740283727645874, 3.832937479019165, 3.925591468811035, 4.018245220184326, 4.110898971557617]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 4.0, 5.0, 6.0, 6.0, 8.0, 7.0, 9.0, 9.0, 20.0, 14.0, 12.0, 24.0, 28.0, 35.0, 26.0, 32.0, 26.0, 33.0, 41.0, 38.0, 38.0, 40.0, 42.0, 40.0, 39.0, 36.0, 34.0, 31.0, 41.0, 43.0, 25.0, 32.0, 29.0, 19.0, 28.0, 20.0, 18.0, 10.0, 10.0, 7.0, 9.0, 8.0, 8.0, 10.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.8165557980537415, -0.7900149822235107, -0.7634741067886353, -0.7369332909584045, -0.710392415523529, -0.6838515996932983, -0.6573107242584229, -0.6307699084281921, -0.6042290925979614, -0.5776882767677307, -0.5511474013328552, -0.5246065855026245, -0.498065710067749, -0.4715248942375183, -0.4449840486049652, -0.4184432029724121, -0.3919023275375366, -0.3653614819049835, -0.3388206362724304, -0.3122798204421997, -0.2857389450073242, -0.2591981291770935, -0.2326572835445404, -0.2061164379119873, -0.1795755922794342, -0.1530347466468811, -0.126493901014328, -0.0999530702829361, -0.073412224650383, -0.046871379017829895, -0.02033054828643799, 0.006210297346115112, 0.03275120258331299, 0.05929204449057579, 0.08583288639783859, 0.1123737245798111, 0.1389145702123642, 0.1654554158449173, 0.1919962465763092, 0.2185370922088623, 0.2450779378414154, 0.2716187834739685, 0.2981596291065216, 0.3247004747390747, 0.3512412905693054, 0.3777821660041809, 0.4043229818344116, 0.4308638274669647, 0.4574046730995178, 0.4839455187320709, 0.510486364364624, 0.5370271801948547, 0.5635680556297302, 0.5901088714599609, 0.6166497468948364, 0.6431905627250671, 0.6697313785552979, 0.6962721943855286, 0.722813069820404, 0.7493538856506348, 0.7758947610855103, 0.802435576915741, 0.8289763927459717, 0.8555172681808472, 0.8820581436157227]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 2.0, 13.0, 21.0, 41.0, 49.0, 66.0, 125.0, 198.0, 321.0, 519.0, 811.0, 1384.0, 2209.0, 3368.0, 5489.0, 8426.0, 13089.0, 20472.0, 32263.0, 54802.0, 114699.0, 256649.0, 264915.0, 120236.0, 57306.0, 33405.0, 20750.0, 13294.0, 8668.0, 5598.0, 3495.0, 2222.0, 1410.0, 872.0, 539.0, 308.0, 206.0, 119.0, 70.0, 41.0, 36.0, 21.0, 4.0, 3.0, 5.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0], "bins": [-0.180419921875, -0.17441177368164062, -0.16840362548828125, -0.16239547729492188, -0.1563873291015625, -0.15037918090820312, -0.14437103271484375, -0.13836288452148438, -0.132354736328125, -0.12634658813476562, -0.12033843994140625, -0.11433029174804688, -0.1083221435546875, -0.10231399536132812, -0.09630584716796875, -0.09029769897460938, -0.08428955078125, -0.07828140258789062, -0.07227325439453125, -0.06626510620117188, -0.0602569580078125, -0.054248809814453125, -0.04824066162109375, -0.042232513427734375, -0.036224365234375, -0.030216217041015625, -0.02420806884765625, -0.018199920654296875, -0.0121917724609375, -0.006183624267578125, -0.00017547607421875, 0.005832672119140625, 0.0118408203125, 0.017848968505859375, 0.02385711669921875, 0.029865264892578125, 0.0358734130859375, 0.041881561279296875, 0.04788970947265625, 0.053897857666015625, 0.059906005859375, 0.06591415405273438, 0.07192230224609375, 0.07793045043945312, 0.0839385986328125, 0.08994674682617188, 0.09595489501953125, 0.10196304321289062, 0.10797119140625, 0.11397933959960938, 0.11998748779296875, 0.12599563598632812, 0.1320037841796875, 0.13801193237304688, 0.14402008056640625, 0.15002822875976562, 0.156036376953125, 0.16204452514648438, 0.16805267333984375, 0.17406082153320312, 0.1800689697265625, 0.18607711791992188, 0.19208526611328125, 0.19809341430664062, 0.2041015625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 2.0, 1.0, 9.0, 6.0, 4.0, 8.0, 12.0, 11.0, 13.0, 17.0, 18.0, 21.0, 17.0, 27.0, 37.0, 33.0, 25.0, 36.0, 40.0, 38.0, 43.0, 39.0, 55.0, 42.0, 40.0, 38.0, 38.0, 38.0, 42.0, 32.0, 28.0, 34.0, 24.0, 17.0, 16.0, 19.0, 10.0, 9.0, 10.0, 18.0, 9.0, 4.0, 8.0, 4.0, 3.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.1429443359375, -0.1384601593017578, -0.13397598266601562, -0.12949180603027344, -0.12500762939453125, -0.12052345275878906, -0.11603927612304688, -0.11155509948730469, -0.1070709228515625, -0.10258674621582031, -0.09810256958007812, -0.09361839294433594, -0.08913421630859375, -0.08465003967285156, -0.08016586303710938, -0.07568168640136719, -0.071197509765625, -0.06671333312988281, -0.062229156494140625, -0.05774497985839844, -0.05326080322265625, -0.04877662658691406, -0.044292449951171875, -0.03980827331542969, -0.0353240966796875, -0.030839920043945312, -0.026355743408203125, -0.021871566772460938, -0.01738739013671875, -0.012903213500976562, -0.008419036865234375, -0.0039348602294921875, 0.00054931640625, 0.0050334930419921875, 0.009517669677734375, 0.014001846313476562, 0.01848602294921875, 0.022970199584960938, 0.027454376220703125, 0.03193855285644531, 0.0364227294921875, 0.04090690612792969, 0.045391082763671875, 0.04987525939941406, 0.05435943603515625, 0.05884361267089844, 0.06332778930664062, 0.06781196594238281, 0.072296142578125, 0.07678031921386719, 0.08126449584960938, 0.08574867248535156, 0.09023284912109375, 0.09471702575683594, 0.09920120239257812, 0.10368537902832031, 0.1081695556640625, 0.11265373229980469, 0.11713790893554688, 0.12162208557128906, 0.12610626220703125, 0.13059043884277344, 0.13507461547851562, 0.1395587921142578, 0.14404296875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 8.0, 8.0, 10.0, 12.0, 19.0, 22.0, 33.0, 62.0, 71.0, 114.0, 218.0, 602.0, 2248.0, 8210.0, 28446.0, 103689.0, 625247.0, 214911.0, 46070.0, 13021.0, 3745.0, 1014.0, 349.0, 134.0, 71.0, 57.0, 42.0, 33.0, 19.0, 22.0, 7.0, 9.0, 5.0, 2.0, 5.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.56103515625, -0.5433349609375, -0.525634765625, -0.5079345703125, -0.490234375, -0.4725341796875, -0.454833984375, -0.4371337890625, -0.41943359375, -0.4017333984375, -0.384033203125, -0.3663330078125, -0.3486328125, -0.3309326171875, -0.313232421875, -0.2955322265625, -0.27783203125, -0.2601318359375, -0.242431640625, -0.2247314453125, -0.20703125, -0.1893310546875, -0.171630859375, -0.1539306640625, -0.13623046875, -0.1185302734375, -0.100830078125, -0.0831298828125, -0.0654296875, -0.0477294921875, -0.030029296875, -0.0123291015625, 0.00537109375, 0.0230712890625, 0.040771484375, 0.0584716796875, 0.076171875, 0.0938720703125, 0.111572265625, 0.1292724609375, 0.14697265625, 0.1646728515625, 0.182373046875, 0.2000732421875, 0.2177734375, 0.2354736328125, 0.253173828125, 0.2708740234375, 0.28857421875, 0.3062744140625, 0.323974609375, 0.3416748046875, 0.359375, 0.3770751953125, 0.394775390625, 0.4124755859375, 0.43017578125, 0.4478759765625, 0.465576171875, 0.4832763671875, 0.5009765625, 0.5186767578125, 0.536376953125, 0.5540771484375, 0.57177734375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 4.0, 1.0, 2.0, 3.0, 1.0, 9.0, 10.0, 12.0, 17.0, 23.0, 32.0, 36.0, 36.0, 51.0, 43.0, 41.0, 71.0, 65.0, 55.0, 71.0, 53.0, 43.0, 51.0, 54.0, 40.0, 39.0, 26.0, 23.0, 19.0, 22.0, 11.0, 9.0, 4.0, 9.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.63232421875, -0.6123886108398438, -0.5924530029296875, -0.5725173950195312, -0.552581787109375, -0.5326461791992188, -0.5127105712890625, -0.49277496337890625, -0.47283935546875, -0.45290374755859375, -0.4329681396484375, -0.41303253173828125, -0.393096923828125, -0.37316131591796875, -0.3532257080078125, -0.33329010009765625, -0.3133544921875, -0.29341888427734375, -0.2734832763671875, -0.25354766845703125, -0.233612060546875, -0.21367645263671875, -0.1937408447265625, -0.17380523681640625, -0.15386962890625, -0.13393402099609375, -0.1139984130859375, -0.09406280517578125, -0.074127197265625, -0.05419158935546875, -0.0342559814453125, -0.01432037353515625, 0.005615234375, 0.02555084228515625, 0.0454864501953125, 0.06542205810546875, 0.085357666015625, 0.10529327392578125, 0.1252288818359375, 0.14516448974609375, 0.16510009765625, 0.18503570556640625, 0.2049713134765625, 0.22490692138671875, 0.244842529296875, 0.26477813720703125, 0.2847137451171875, 0.30464935302734375, 0.3245849609375, 0.34452056884765625, 0.3644561767578125, 0.38439178466796875, 0.404327392578125, 0.42426300048828125, 0.4441986083984375, 0.46413421630859375, 0.48406982421875, 0.5040054321289062, 0.5239410400390625, 0.5438766479492188, 0.563812255859375, 0.5837478637695312, 0.6036834716796875, 0.6236190795898438, 0.6435546875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 0.0, 4.0, 5.0, 8.0, 10.0, 23.0, 19.0, 24.0, 51.0, 74.0, 100.0, 194.0, 238.0, 417.0, 589.0, 939.0, 1526.0, 2507.0, 3689.0, 5752.0, 8724.0, 13659.0, 22189.0, 41080.0, 95161.0, 275502.0, 334620.0, 123087.0, 49604.0, 25530.0, 15418.0, 9849.0, 6343.0, 4221.0, 2685.0, 1709.0, 1076.0, 678.0, 453.0, 296.0, 169.0, 111.0, 68.0, 43.0, 33.0, 26.0, 16.0, 21.0, 8.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.1407470703125, -0.1363658905029297, -0.13198471069335938, -0.12760353088378906, -0.12322235107421875, -0.11884117126464844, -0.11445999145507812, -0.11007881164550781, -0.1056976318359375, -0.10131645202636719, -0.09693527221679688, -0.09255409240722656, -0.08817291259765625, -0.08379173278808594, -0.07941055297851562, -0.07502937316894531, -0.070648193359375, -0.06626701354980469, -0.061885833740234375, -0.05750465393066406, -0.05312347412109375, -0.04874229431152344, -0.044361114501953125, -0.03997993469238281, -0.0355987548828125, -0.031217575073242188, -0.026836395263671875, -0.022455215454101562, -0.01807403564453125, -0.013692855834960938, -0.009311676025390625, -0.0049304962158203125, -0.00054931640625, 0.0038318634033203125, 0.008213043212890625, 0.012594223022460938, 0.01697540283203125, 0.021356582641601562, 0.025737762451171875, 0.030118942260742188, 0.0345001220703125, 0.03888130187988281, 0.043262481689453125, 0.04764366149902344, 0.05202484130859375, 0.05640602111816406, 0.060787200927734375, 0.06516838073730469, 0.069549560546875, 0.07393074035644531, 0.07831192016601562, 0.08269309997558594, 0.08707427978515625, 0.09145545959472656, 0.09583663940429688, 0.10021781921386719, 0.1045989990234375, 0.10898017883300781, 0.11336135864257812, 0.11774253845214844, 0.12212371826171875, 0.12650489807128906, 0.13088607788085938, 0.1352672576904297, 0.1396484375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 2.0, 1.0, 2.0, 4.0, 8.0, 6.0, 5.0, 10.0, 19.0, 13.0, 21.0, 32.0, 52.0, 79.0, 83.0, 104.0, 133.0, 102.0, 86.0, 52.0, 41.0, 28.0, 27.0, 13.0, 15.0, 6.0, 7.0, 8.0, 3.0, 8.0, 3.0, 3.0, 3.0, 7.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.2842159271240234e-05, -3.168080002069473e-05, -3.051944077014923e-05, -2.935808151960373e-05, -2.8196722269058228e-05, -2.7035363018512726e-05, -2.5874003767967224e-05, -2.4712644517421722e-05, -2.355128526687622e-05, -2.238992601633072e-05, -2.1228566765785217e-05, -2.0067207515239716e-05, -1.8905848264694214e-05, -1.7744489014148712e-05, -1.658312976360321e-05, -1.542177051305771e-05, -1.4260411262512207e-05, -1.3099052011966705e-05, -1.1937692761421204e-05, -1.0776333510875702e-05, -9.6149742603302e-06, -8.453615009784698e-06, -7.292255759239197e-06, -6.130896508693695e-06, -4.969537258148193e-06, -3.8081780076026917e-06, -2.64681875705719e-06, -1.4854595065116882e-06, -3.241002559661865e-07, 8.372589945793152e-07, 1.998618245124817e-06, 3.1599774956703186e-06, 4.32133674621582e-06, 5.482695996761322e-06, 6.644055247306824e-06, 7.805414497852325e-06, 8.966773748397827e-06, 1.0128132998943329e-05, 1.128949224948883e-05, 1.2450851500034332e-05, 1.3612210750579834e-05, 1.4773570001125336e-05, 1.5934929251670837e-05, 1.709628850221634e-05, 1.825764775276184e-05, 1.9419007003307343e-05, 2.0580366253852844e-05, 2.1741725504398346e-05, 2.2903084754943848e-05, 2.406444400548935e-05, 2.522580325603485e-05, 2.6387162506580353e-05, 2.7548521757125854e-05, 2.8709881007671356e-05, 2.9871240258216858e-05, 3.103259950876236e-05, 3.219395875930786e-05, 3.335531800985336e-05, 3.4516677260398865e-05, 3.5678036510944366e-05, 3.683939576148987e-05, 3.800075501203537e-05, 3.916211426258087e-05, 4.032347351312637e-05, 4.1484832763671875e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 3.0, 4.0, 8.0, 6.0, 19.0, 11.0, 25.0, 34.0, 52.0, 100.0, 140.0, 232.0, 413.0, 824.0, 1566.0, 3138.0, 6117.0, 12418.0, 25424.0, 60673.0, 211067.0, 487118.0, 148257.0, 48457.0, 21429.0, 10342.0, 5118.0, 2661.0, 1306.0, 688.0, 377.0, 208.0, 104.0, 68.0, 47.0, 22.0, 22.0, 13.0, 8.0, 9.0, 4.0, 3.0, 7.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.212646484375, -0.2066364288330078, -0.20062637329101562, -0.19461631774902344, -0.18860626220703125, -0.18259620666503906, -0.17658615112304688, -0.1705760955810547, -0.1645660400390625, -0.1585559844970703, -0.15254592895507812, -0.14653587341308594, -0.14052581787109375, -0.13451576232910156, -0.12850570678710938, -0.12249565124511719, -0.116485595703125, -0.11047554016113281, -0.10446548461914062, -0.09845542907714844, -0.09244537353515625, -0.08643531799316406, -0.08042526245117188, -0.07441520690917969, -0.0684051513671875, -0.06239509582519531, -0.056385040283203125, -0.05037498474121094, -0.04436492919921875, -0.03835487365722656, -0.032344818115234375, -0.026334762573242188, -0.02032470703125, -0.014314651489257812, -0.008304595947265625, -0.0022945404052734375, 0.00371551513671875, 0.009725570678710938, 0.015735626220703125, 0.021745681762695312, 0.0277557373046875, 0.03376579284667969, 0.039775848388671875, 0.04578590393066406, 0.05179595947265625, 0.05780601501464844, 0.06381607055664062, 0.06982612609863281, 0.075836181640625, 0.08184623718261719, 0.08785629272460938, 0.09386634826660156, 0.09987640380859375, 0.10588645935058594, 0.11189651489257812, 0.11790657043457031, 0.1239166259765625, 0.1299266815185547, 0.13593673706054688, 0.14194679260253906, 0.14795684814453125, 0.15396690368652344, 0.15997695922851562, 0.1659870147705078, 0.1719970703125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 3.0, 0.0, 2.0, 1.0, 4.0, 2.0, 9.0, 5.0, 4.0, 6.0, 14.0, 25.0, 31.0, 49.0, 71.0, 116.0, 131.0, 162.0, 124.0, 80.0, 49.0, 24.0, 16.0, 17.0, 11.0, 8.0, 8.0, 5.0, 5.0, 1.0, 5.0, 6.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.184814453125, -0.17796707153320312, -0.17111968994140625, -0.16427230834960938, -0.1574249267578125, -0.15057754516601562, -0.14373016357421875, -0.13688278198242188, -0.130035400390625, -0.12318801879882812, -0.11634063720703125, -0.10949325561523438, -0.1026458740234375, -0.09579849243164062, -0.08895111083984375, -0.08210372924804688, -0.07525634765625, -0.06840896606445312, -0.06156158447265625, -0.054714202880859375, -0.0478668212890625, -0.041019439697265625, -0.03417205810546875, -0.027324676513671875, -0.020477294921875, -0.013629913330078125, -0.00678253173828125, 6.4849853515625e-05, 0.0069122314453125, 0.013759613037109375, 0.02060699462890625, 0.027454376220703125, 0.0343017578125, 0.041149139404296875, 0.04799652099609375, 0.054843902587890625, 0.0616912841796875, 0.06853866577148438, 0.07538604736328125, 0.08223342895507812, 0.089080810546875, 0.09592819213867188, 0.10277557373046875, 0.10962295532226562, 0.1164703369140625, 0.12331771850585938, 0.13016510009765625, 0.13701248168945312, 0.14385986328125, 0.15070724487304688, 0.15755462646484375, 0.16440200805664062, 0.1712493896484375, 0.17809677124023438, 0.18494415283203125, 0.19179153442382812, 0.198638916015625, 0.20548629760742188, 0.21233367919921875, 0.21918106079101562, 0.2260284423828125, 0.23287582397460938, 0.23972320556640625, 0.24657058715820312, 0.25341796875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 7.0, 13.0, 58.0, 128.0, 208.0, 243.0, 169.0, 98.0, 57.0, 24.0, 7.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.615866661071777, -4.492478370666504, -4.3690900802612305, -4.245701789855957, -4.122313499450684, -3.99892520904541, -3.8755369186401367, -3.7521486282348633, -3.62876033782959, -3.5053720474243164, -3.381983757019043, -3.2585954666137695, -3.135207176208496, -3.0118188858032227, -2.888430595397949, -2.765042304992676, -2.6416540145874023, -2.518265724182129, -2.3948774337768555, -2.271489143371582, -2.1481008529663086, -2.024712562561035, -1.9013242721557617, -1.7779359817504883, -1.654547929763794, -1.5311596393585205, -1.407771348953247, -1.2843830585479736, -1.1609947681427002, -1.0376064777374268, -0.9142182469367981, -0.7908299565315247, -0.6674416065216064, -0.544053316116333, -0.42066502571105957, -0.2972767651081085, -0.17388847470283508, -0.05050021409988403, 0.0728880763053894, 0.19627636671066284, 0.3196646571159363, 0.4430529475212097, 0.5664412379264832, 0.6898294687271118, 0.8132177591323853, 0.9366060495376587, 1.0599943399429321, 1.1833826303482056, 1.306770920753479, 1.4301592111587524, 1.5535475015640259, 1.6769357919692993, 1.8003240823745728, 1.9237122535705566, 2.04710054397583, 2.1704888343811035, 2.293877124786377, 2.4172654151916504, 2.540653705596924, 2.6640419960021973, 2.7874302864074707, 2.910818576812744, 3.0342068672180176, 3.157595157623291, 3.2809834480285645]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 5.0, 1.0, 5.0, 2.0, 8.0, 11.0, 13.0, 12.0, 9.0, 13.0, 14.0, 21.0, 31.0, 29.0, 35.0, 31.0, 35.0, 43.0, 53.0, 48.0, 51.0, 50.0, 42.0, 36.0, 36.0, 40.0, 46.0, 31.0, 33.0, 23.0, 33.0, 18.0, 20.0, 25.0, 22.0, 19.0, 9.0, 13.0, 10.0, 7.0, 5.0, 3.0, 8.0, 2.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0], "bins": [-1.59968900680542, -1.5522652864456177, -1.5048415660858154, -1.4574178457260132, -1.409994125366211, -1.3625702857971191, -1.3151466846466064, -1.2677228450775146, -1.2202991247177124, -1.1728754043579102, -1.125451683998108, -1.0780279636383057, -1.0306042432785034, -0.9831804633140564, -0.9357567429542542, -0.8883329629898071, -0.8409093022346497, -0.7934855818748474, -0.7460618615150452, -0.6986380815505981, -0.6512143611907959, -0.6037906408309937, -0.5563669204711914, -0.5089432001113892, -0.4615194499492645, -0.4140957295894623, -0.36667197942733765, -0.3192482590675354, -0.27182453870773315, -0.22440078854560852, -0.17697706818580627, -0.12955331802368164, -0.0821295976638794, -0.03470586612820625, 0.012717865407466888, 0.06014159321784973, 0.10756532847881317, 0.1549890637397766, 0.20241278409957886, 0.2498365342617035, 0.29726025462150574, 0.344683974981308, 0.3921077251434326, 0.43953144550323486, 0.4869551658630371, 0.5343788862228394, 0.5818026065826416, 0.6292263865470886, 0.6766501069068909, 0.7240738272666931, 0.7714975476264954, 0.8189213275909424, 0.8663450479507446, 0.9137687683105469, 0.9611924886703491, 1.0086162090301514, 1.0560399293899536, 1.1034636497497559, 1.150887370109558, 1.1983110904693604, 1.2457348108291626, 1.2931585311889648, 1.3405823707580566, 1.3880060911178589, 1.4354298114776611]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 5.0, 7.0, 1.0, 9.0, 14.0, 13.0, 21.0, 15.0, 26.0, 39.0, 52.0, 85.0, 114.0, 184.0, 355.0, 650.0, 1295.0, 2849.0, 6364.0, 15362.0, 39801.0, 112640.0, 369410.0, 1725198.0, 1427256.0, 328103.0, 102384.0, 36159.0, 14264.0, 6177.0, 2631.0, 1249.0, 638.0, 336.0, 180.0, 107.0, 70.0, 66.0, 34.0, 35.0, 18.0, 19.0, 11.0, 14.0, 9.0, 3.0, 9.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.237548828125, -0.22961807250976562, -0.22168731689453125, -0.21375656127929688, -0.2058258056640625, -0.19789505004882812, -0.18996429443359375, -0.18203353881835938, -0.174102783203125, -0.16617202758789062, -0.15824127197265625, -0.15031051635742188, -0.1423797607421875, -0.13444900512695312, -0.12651824951171875, -0.11858749389648438, -0.11065673828125, -0.10272598266601562, -0.09479522705078125, -0.08686447143554688, -0.0789337158203125, -0.07100296020507812, -0.06307220458984375, -0.055141448974609375, -0.047210693359375, -0.039279937744140625, -0.03134918212890625, -0.023418426513671875, -0.0154876708984375, -0.007556915283203125, 0.00037384033203125, 0.008304595947265625, 0.0162353515625, 0.024166107177734375, 0.03209686279296875, 0.040027618408203125, 0.0479583740234375, 0.055889129638671875, 0.06381988525390625, 0.07175064086914062, 0.079681396484375, 0.08761215209960938, 0.09554290771484375, 0.10347366333007812, 0.1114044189453125, 0.11933517456054688, 0.12726593017578125, 0.13519668579101562, 0.14312744140625, 0.15105819702148438, 0.15898895263671875, 0.16691970825195312, 0.1748504638671875, 0.18278121948242188, 0.19071197509765625, 0.19864273071289062, 0.206573486328125, 0.21450424194335938, 0.22243499755859375, 0.23036575317382812, 0.2382965087890625, 0.24622726440429688, 0.25415802001953125, 0.2620887756347656, 0.27001953125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 3.0, 6.0, 5.0, 10.0, 11.0, 16.0, 19.0, 15.0, 14.0, 30.0, 35.0, 16.0, 29.0, 47.0, 41.0, 47.0, 36.0, 48.0, 49.0, 57.0, 41.0, 50.0, 45.0, 37.0, 30.0, 32.0, 33.0, 30.0, 35.0, 21.0, 16.0, 16.0, 19.0, 14.0, 11.0, 9.0, 6.0, 6.0, 10.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.154541015625, -0.1491260528564453, -0.14371109008789062, -0.13829612731933594, -0.13288116455078125, -0.12746620178222656, -0.12205123901367188, -0.11663627624511719, -0.1112213134765625, -0.10580635070800781, -0.10039138793945312, -0.09497642517089844, -0.08956146240234375, -0.08414649963378906, -0.07873153686523438, -0.07331657409667969, -0.067901611328125, -0.06248664855957031, -0.057071685791015625, -0.05165672302246094, -0.04624176025390625, -0.04082679748535156, -0.035411834716796875, -0.029996871948242188, -0.0245819091796875, -0.019166946411132812, -0.013751983642578125, -0.008337020874023438, -0.00292205810546875, 0.0024929046630859375, 0.007907867431640625, 0.013322830200195312, 0.01873779296875, 0.024152755737304688, 0.029567718505859375, 0.03498268127441406, 0.04039764404296875, 0.04581260681152344, 0.051227569580078125, 0.05664253234863281, 0.0620574951171875, 0.06747245788574219, 0.07288742065429688, 0.07830238342285156, 0.08371734619140625, 0.08913230895996094, 0.09454727172851562, 0.09996223449707031, 0.105377197265625, 0.11079216003417969, 0.11620712280273438, 0.12162208557128906, 0.12703704833984375, 0.13245201110839844, 0.13786697387695312, 0.1432819366455078, 0.1486968994140625, 0.1541118621826172, 0.15952682495117188, 0.16494178771972656, 0.17035675048828125, 0.17577171325683594, 0.18118667602539062, 0.1866016387939453, 0.1920166015625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 7.0, 5.0, 16.0, 13.0, 20.0, 23.0, 36.0, 43.0, 67.0, 84.0, 121.0, 169.0, 245.0, 405.0, 666.0, 1030.0, 1851.0, 3339.0, 6664.0, 14448.0, 34109.0, 91890.0, 279271.0, 974774.0, 1914723.0, 585529.0, 177702.0, 61407.0, 23684.0, 10318.0, 5115.0, 2558.0, 1503.0, 863.0, 500.0, 353.0, 208.0, 127.0, 111.0, 87.0, 56.0, 39.0, 29.0, 28.0, 13.0, 6.0, 14.0, 8.0, 2.0, 1.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.357666015625, -0.3462409973144531, -0.33481597900390625, -0.3233909606933594, -0.3119659423828125, -0.3005409240722656, -0.28911590576171875, -0.2776908874511719, -0.266265869140625, -0.2548408508300781, -0.24341583251953125, -0.23199081420898438, -0.2205657958984375, -0.20914077758789062, -0.19771575927734375, -0.18629074096679688, -0.17486572265625, -0.16344070434570312, -0.15201568603515625, -0.14059066772460938, -0.1291656494140625, -0.11774063110351562, -0.10631561279296875, -0.09489059448242188, -0.083465576171875, -0.07204055786132812, -0.06061553955078125, -0.049190521240234375, -0.0377655029296875, -0.026340484619140625, -0.01491546630859375, -0.003490447998046875, 0.0079345703125, 0.019359588623046875, 0.03078460693359375, 0.042209625244140625, 0.0536346435546875, 0.06505966186523438, 0.07648468017578125, 0.08790969848632812, 0.099334716796875, 0.11075973510742188, 0.12218475341796875, 0.13360977172851562, 0.1450347900390625, 0.15645980834960938, 0.16788482666015625, 0.17930984497070312, 0.19073486328125, 0.20215988159179688, 0.21358489990234375, 0.22500991821289062, 0.2364349365234375, 0.24785995483398438, 0.25928497314453125, 0.2707099914550781, 0.282135009765625, 0.2935600280761719, 0.30498504638671875, 0.3164100646972656, 0.3278350830078125, 0.3392601013183594, 0.35068511962890625, 0.3621101379394531, 0.37353515625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 7.0, 8.0, 2.0, 3.0, 13.0, 16.0, 28.0, 31.0, 49.0, 45.0, 84.0, 130.0, 178.0, 268.0, 393.0, 555.0, 761.0, 526.0, 341.0, 237.0, 145.0, 85.0, 45.0, 34.0, 27.0, 21.0, 12.0, 14.0, 10.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.427490234375, -0.4160804748535156, -0.40467071533203125, -0.3932609558105469, -0.3818511962890625, -0.3704414367675781, -0.35903167724609375, -0.3476219177246094, -0.336212158203125, -0.3248023986816406, -0.31339263916015625, -0.3019828796386719, -0.2905731201171875, -0.2791633605957031, -0.26775360107421875, -0.2563438415527344, -0.24493408203125, -0.23352432250976562, -0.22211456298828125, -0.21070480346679688, -0.1992950439453125, -0.18788528442382812, -0.17647552490234375, -0.16506576538085938, -0.153656005859375, -0.14224624633789062, -0.13083648681640625, -0.11942672729492188, -0.1080169677734375, -0.09660720825195312, -0.08519744873046875, -0.07378768920898438, -0.0623779296875, -0.050968170166015625, -0.03955841064453125, -0.028148651123046875, -0.0167388916015625, -0.005329132080078125, 0.00608062744140625, 0.017490386962890625, 0.028900146484375, 0.040309906005859375, 0.05171966552734375, 0.06312942504882812, 0.0745391845703125, 0.08594894409179688, 0.09735870361328125, 0.10876846313476562, 0.12017822265625, 0.13158798217773438, 0.14299774169921875, 0.15440750122070312, 0.1658172607421875, 0.17722702026367188, 0.18863677978515625, 0.20004653930664062, 0.211456298828125, 0.22286605834960938, 0.23427581787109375, 0.24568557739257812, 0.2570953369140625, 0.2685050964355469, 0.27991485595703125, 0.2913246154785156, 0.302734375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 11.0, 29.0, 40.0, 66.0, 113.0, 144.0, 131.0, 130.0, 147.0, 80.0, 53.0, 32.0, 11.0, 8.0, 6.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6104118824005127, -1.5310784578323364, -1.4517451524734497, -1.3724117279052734, -1.2930784225463867, -1.2137449979782104, -1.1344115734100342, -1.0550782680511475, -0.9757448434829712, -0.8964114785194397, -0.8170781135559082, -0.7377446889877319, -0.6584113240242004, -0.579077959060669, -0.49974456429481506, -0.4204111695289612, -0.3410778045654297, -0.2617444396018982, -0.1824110448360443, -0.10307766497135162, -0.023744285106658936, 0.05558907985687256, 0.13492247462272644, 0.21425586938858032, 0.2935892343521118, 0.3729225993156433, 0.4522559940814972, 0.5315893888473511, 0.6109227538108826, 0.6902561187744141, 0.7695895433425903, 0.8489229083061218, 0.9282560348510742, 1.0075894594192505, 1.0869227647781372, 1.1662561893463135, 1.2455894947052002, 1.3249229192733765, 1.4042563438415527, 1.4835896492004395, 1.5629230737686157, 1.642256498336792, 1.7215898036956787, 1.800923228263855, 1.8802566528320312, 1.959589958190918, 2.0389232635498047, 2.1182568073272705, 2.1975901126861572, 2.276923418045044, 2.3562569618225098, 2.4355902671813965, 2.514923572540283, 2.59425687789917, 2.6735904216766357, 2.7529237270355225, 2.8322572708129883, 2.911590576171875, 2.990924119949341, 3.0702574253082275, 3.1495907306671143, 3.22892427444458, 3.308257579803467, 3.3875908851623535, 3.4669241905212402]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 2.0, 5.0, 3.0, 7.0, 7.0, 4.0, 7.0, 9.0, 12.0, 23.0, 10.0, 24.0, 19.0, 16.0, 26.0, 25.0, 28.0, 25.0, 35.0, 38.0, 36.0, 38.0, 31.0, 26.0, 39.0, 28.0, 41.0, 26.0, 49.0, 29.0, 28.0, 31.0, 35.0, 33.0, 17.0, 33.0, 22.0, 20.0, 28.0, 13.0, 11.0, 8.0, 12.0, 13.0, 7.0, 5.0, 4.0, 4.0, 4.0, 3.0, 2.0, 6.0], "bins": [-1.1062405109405518, -1.0761770009994507, -1.0461136102676392, -1.016050100326538, -0.9859866499900818, -0.9559231996536255, -0.9258596897125244, -0.8957962393760681, -0.8657327890396118, -0.8356693387031555, -0.8056058883666992, -0.7755423784255981, -0.7454789280891418, -0.7154154777526855, -0.6853519678115845, -0.6552885174751282, -0.6252250671386719, -0.5951616168022156, -0.5650981664657593, -0.5350346565246582, -0.5049712061882019, -0.4749077558517456, -0.4448442757129669, -0.41478079557418823, -0.38471734523773193, -0.35465389490127563, -0.32459041476249695, -0.29452693462371826, -0.26446348428726196, -0.23440001904964447, -0.20433655381202698, -0.17427308857440948, -0.144209623336792, -0.1141461580991745, -0.084082692861557, -0.054019227623939514, -0.02395576238632202, 0.006107702851295471, 0.036171168088912964, 0.06623463332653046, 0.09629809856414795, 0.12636156380176544, 0.15642502903938293, 0.18648849427700043, 0.21655195951461792, 0.2466154247522354, 0.2766788899898529, 0.3067423701286316, 0.3368058204650879, 0.3668692708015442, 0.3969327509403229, 0.42699623107910156, 0.45705968141555786, 0.48712313175201416, 0.5171866416931152, 0.5472500920295715, 0.5773135423660278, 0.6073769927024841, 0.6374404430389404, 0.6675039529800415, 0.6975674033164978, 0.7276308536529541, 0.7576943635940552, 0.7877578139305115, 0.8178212642669678]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 6.0, 6.0, 13.0, 24.0, 32.0, 44.0, 51.0, 107.0, 169.0, 298.0, 486.0, 743.0, 1287.0, 2053.0, 3298.0, 5316.0, 8343.0, 13041.0, 20602.0, 32164.0, 52129.0, 92926.0, 187999.0, 263403.0, 158639.0, 79609.0, 46091.0, 28944.0, 18740.0, 11989.0, 7614.0, 4724.0, 3019.0, 1777.0, 1140.0, 664.0, 429.0, 239.0, 142.0, 108.0, 51.0, 43.0, 25.0, 16.0, 11.0, 5.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.167236328125, -0.16190719604492188, -0.15657806396484375, -0.15124893188476562, -0.1459197998046875, -0.14059066772460938, -0.13526153564453125, -0.12993240356445312, -0.124603271484375, -0.11927413940429688, -0.11394500732421875, -0.10861587524414062, -0.1032867431640625, -0.09795761108398438, -0.09262847900390625, -0.08729934692382812, -0.08197021484375, -0.07664108276367188, -0.07131195068359375, -0.06598281860351562, -0.0606536865234375, -0.055324554443359375, -0.04999542236328125, -0.044666290283203125, -0.039337158203125, -0.034008026123046875, -0.02867889404296875, -0.023349761962890625, -0.0180206298828125, -0.012691497802734375, -0.00736236572265625, -0.002033233642578125, 0.0032958984375, 0.008625030517578125, 0.01395416259765625, 0.019283294677734375, 0.0246124267578125, 0.029941558837890625, 0.03527069091796875, 0.040599822998046875, 0.045928955078125, 0.051258087158203125, 0.05658721923828125, 0.061916351318359375, 0.0672454833984375, 0.07257461547851562, 0.07790374755859375, 0.08323287963867188, 0.08856201171875, 0.09389114379882812, 0.09922027587890625, 0.10454940795898438, 0.1098785400390625, 0.11520767211914062, 0.12053680419921875, 0.12586593627929688, 0.131195068359375, 0.13652420043945312, 0.14185333251953125, 0.14718246459960938, 0.1525115966796875, 0.15784072875976562, 0.16316986083984375, 0.16849899291992188, 0.173828125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 3.0, 8.0, 6.0, 7.0, 3.0, 8.0, 10.0, 10.0, 11.0, 14.0, 17.0, 24.0, 18.0, 42.0, 27.0, 39.0, 19.0, 45.0, 51.0, 49.0, 48.0, 55.0, 41.0, 44.0, 41.0, 35.0, 36.0, 41.0, 34.0, 37.0, 34.0, 30.0, 22.0, 15.0, 16.0, 7.0, 11.0, 9.0, 7.0, 10.0, 5.0, 2.0, 7.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.156982421875, -0.15175247192382812, -0.14652252197265625, -0.14129257202148438, -0.1360626220703125, -0.13083267211914062, -0.12560272216796875, -0.12037277221679688, -0.115142822265625, -0.10991287231445312, -0.10468292236328125, -0.09945297241210938, -0.0942230224609375, -0.08899307250976562, -0.08376312255859375, -0.07853317260742188, -0.07330322265625, -0.06807327270507812, -0.06284332275390625, -0.057613372802734375, -0.0523834228515625, -0.047153472900390625, -0.04192352294921875, -0.036693572998046875, -0.031463623046875, -0.026233673095703125, -0.02100372314453125, -0.015773773193359375, -0.0105438232421875, -0.005313873291015625, -8.392333984375e-05, 0.005146026611328125, 0.0103759765625, 0.015605926513671875, 0.02083587646484375, 0.026065826416015625, 0.0312957763671875, 0.036525726318359375, 0.04175567626953125, 0.046985626220703125, 0.052215576171875, 0.057445526123046875, 0.06267547607421875, 0.06790542602539062, 0.0731353759765625, 0.07836532592773438, 0.08359527587890625, 0.08882522583007812, 0.09405517578125, 0.09928512573242188, 0.10451507568359375, 0.10974502563476562, 0.1149749755859375, 0.12020492553710938, 0.12543487548828125, 0.13066482543945312, 0.135894775390625, 0.14112472534179688, 0.14635467529296875, 0.15158462524414062, 0.1568145751953125, 0.16204452514648438, 0.16727447509765625, 0.17250442504882812, 0.177734375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 5.0, 2.0, 7.0, 8.0, 12.0, 7.0, 14.0, 15.0, 17.0, 17.0, 45.0, 34.0, 43.0, 104.0, 202.0, 625.0, 3805.0, 25295.0, 173470.0, 712231.0, 112358.0, 16851.0, 2462.0, 475.0, 147.0, 78.0, 54.0, 34.0, 39.0, 21.0, 20.0, 15.0, 7.0, 11.0, 7.0, 4.0, 2.0, 4.0, 5.0, 5.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.63671875, -0.6142959594726562, -0.5918731689453125, -0.5694503784179688, -0.547027587890625, -0.5246047973632812, -0.5021820068359375, -0.47975921630859375, -0.45733642578125, -0.43491363525390625, -0.4124908447265625, -0.39006805419921875, -0.367645263671875, -0.34522247314453125, -0.3227996826171875, -0.30037689208984375, -0.2779541015625, -0.25553131103515625, -0.2331085205078125, -0.21068572998046875, -0.188262939453125, -0.16584014892578125, -0.1434173583984375, -0.12099456787109375, -0.09857177734375, -0.07614898681640625, -0.0537261962890625, -0.03130340576171875, -0.008880615234375, 0.01354217529296875, 0.0359649658203125, 0.05838775634765625, 0.080810546875, 0.10323333740234375, 0.1256561279296875, 0.14807891845703125, 0.170501708984375, 0.19292449951171875, 0.2153472900390625, 0.23777008056640625, 0.26019287109375, 0.28261566162109375, 0.3050384521484375, 0.32746124267578125, 0.349884033203125, 0.37230682373046875, 0.3947296142578125, 0.41715240478515625, 0.4395751953125, 0.46199798583984375, 0.4844207763671875, 0.5068435668945312, 0.529266357421875, 0.5516891479492188, 0.5741119384765625, 0.5965347290039062, 0.61895751953125, 0.6413803100585938, 0.6638031005859375, 0.6862258911132812, 0.708648681640625, 0.7310714721679688, 0.7534942626953125, 0.7759170532226562, 0.79833984375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 6.0, 6.0, 11.0, 6.0, 9.0, 12.0, 17.0, 27.0, 23.0, 34.0, 26.0, 44.0, 27.0, 45.0, 44.0, 52.0, 61.0, 60.0, 47.0, 52.0, 34.0, 56.0, 54.0, 43.0, 39.0, 30.0, 21.0, 27.0, 9.0, 19.0, 12.0, 8.0, 7.0, 7.0, 9.0, 6.0, 8.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.587890625, -0.5681991577148438, -0.5485076904296875, -0.5288162231445312, -0.509124755859375, -0.48943328857421875, -0.4697418212890625, -0.45005035400390625, -0.43035888671875, -0.41066741943359375, -0.3909759521484375, -0.37128448486328125, -0.351593017578125, -0.33190155029296875, -0.3122100830078125, -0.29251861572265625, -0.2728271484375, -0.25313568115234375, -0.2334442138671875, -0.21375274658203125, -0.194061279296875, -0.17436981201171875, -0.1546783447265625, -0.13498687744140625, -0.11529541015625, -0.09560394287109375, -0.0759124755859375, -0.05622100830078125, -0.036529541015625, -0.01683807373046875, 0.0028533935546875, 0.02254486083984375, 0.042236328125, 0.06192779541015625, 0.0816192626953125, 0.10131072998046875, 0.121002197265625, 0.14069366455078125, 0.1603851318359375, 0.18007659912109375, 0.19976806640625, 0.21945953369140625, 0.2391510009765625, 0.25884246826171875, 0.278533935546875, 0.29822540283203125, 0.3179168701171875, 0.33760833740234375, 0.3572998046875, 0.37699127197265625, 0.3966827392578125, 0.41637420654296875, 0.436065673828125, 0.45575714111328125, 0.4754486083984375, 0.49514007568359375, 0.51483154296875, 0.5345230102539062, 0.5542144775390625, 0.5739059448242188, 0.593597412109375, 0.6132888793945312, 0.6329803466796875, 0.6526718139648438, 0.67236328125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [7.0, 3.0, 2.0, 3.0, 4.0, 14.0, 17.0, 23.0, 28.0, 47.0, 70.0, 86.0, 155.0, 209.0, 356.0, 548.0, 868.0, 1557.0, 2817.0, 5034.0, 9633.0, 18471.0, 35353.0, 66042.0, 161037.0, 414104.0, 182244.0, 70525.0, 37265.0, 19449.0, 10056.0, 5344.0, 2991.0, 1600.0, 942.0, 577.0, 346.0, 221.0, 167.0, 114.0, 76.0, 58.0, 35.0, 30.0, 13.0, 9.0, 4.0, 9.0, 1.0, 2.0, 6.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.119384765625, -0.11471176147460938, -0.11003875732421875, -0.10536575317382812, -0.1006927490234375, -0.09601974487304688, -0.09134674072265625, -0.08667373657226562, -0.082000732421875, -0.07732772827148438, -0.07265472412109375, -0.06798171997070312, -0.0633087158203125, -0.058635711669921875, -0.05396270751953125, -0.049289703369140625, -0.04461669921875, -0.039943695068359375, -0.03527069091796875, -0.030597686767578125, -0.0259246826171875, -0.021251678466796875, -0.01657867431640625, -0.011905670166015625, -0.007232666015625, -0.002559661865234375, 0.00211334228515625, 0.006786346435546875, 0.0114593505859375, 0.016132354736328125, 0.02080535888671875, 0.025478363037109375, 0.0301513671875, 0.034824371337890625, 0.03949737548828125, 0.044170379638671875, 0.0488433837890625, 0.053516387939453125, 0.05818939208984375, 0.06286239624023438, 0.067535400390625, 0.07220840454101562, 0.07688140869140625, 0.08155441284179688, 0.0862274169921875, 0.09090042114257812, 0.09557342529296875, 0.10024642944335938, 0.10491943359375, 0.10959243774414062, 0.11426544189453125, 0.11893844604492188, 0.1236114501953125, 0.12828445434570312, 0.13295745849609375, 0.13763046264648438, 0.142303466796875, 0.14697647094726562, 0.15164947509765625, 0.15632247924804688, 0.1609954833984375, 0.16566848754882812, 0.17034149169921875, 0.17501449584960938, 0.1796875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 7.0, 8.0, 10.0, 9.0, 22.0, 13.0, 17.0, 24.0, 35.0, 56.0, 82.0, 118.0, 140.0, 121.0, 86.0, 72.0, 41.0, 32.0, 18.0, 18.0, 17.0, 9.0, 7.0, 8.0, 5.0, 7.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.023313522338867e-05, -3.892183303833008e-05, -3.7610530853271484e-05, -3.629922866821289e-05, -3.49879264831543e-05, -3.36766242980957e-05, -3.236532211303711e-05, -3.1054019927978516e-05, -2.9742717742919922e-05, -2.8431415557861328e-05, -2.7120113372802734e-05, -2.580881118774414e-05, -2.4497509002685547e-05, -2.3186206817626953e-05, -2.187490463256836e-05, -2.0563602447509766e-05, -1.9252300262451172e-05, -1.7940998077392578e-05, -1.6629695892333984e-05, -1.531839370727539e-05, -1.4007091522216797e-05, -1.2695789337158203e-05, -1.138448715209961e-05, -1.0073184967041016e-05, -8.761882781982422e-06, -7.450580596923828e-06, -6.139278411865234e-06, -4.827976226806641e-06, -3.516674041748047e-06, -2.205371856689453e-06, -8.940696716308594e-07, 4.172325134277344e-07, 1.7285346984863281e-06, 3.039836883544922e-06, 4.351139068603516e-06, 5.662441253662109e-06, 6.973743438720703e-06, 8.285045623779297e-06, 9.59634780883789e-06, 1.0907649993896484e-05, 1.2218952178955078e-05, 1.3530254364013672e-05, 1.4841556549072266e-05, 1.615285873413086e-05, 1.7464160919189453e-05, 1.8775463104248047e-05, 2.008676528930664e-05, 2.1398067474365234e-05, 2.2709369659423828e-05, 2.4020671844482422e-05, 2.5331974029541016e-05, 2.664327621459961e-05, 2.7954578399658203e-05, 2.9265880584716797e-05, 3.057718276977539e-05, 3.1888484954833984e-05, 3.319978713989258e-05, 3.451108932495117e-05, 3.5822391510009766e-05, 3.713369369506836e-05, 3.844499588012695e-05, 3.975629806518555e-05, 4.106760025024414e-05, 4.2378902435302734e-05, 4.369020462036133e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 4.0, 2.0, 9.0, 4.0, 11.0, 18.0, 23.0, 29.0, 36.0, 73.0, 116.0, 143.0, 231.0, 413.0, 783.0, 1541.0, 3202.0, 7499.0, 18125.0, 44174.0, 108682.0, 447692.0, 281036.0, 78480.0, 32499.0, 13064.0, 5555.0, 2493.0, 1143.0, 563.0, 322.0, 197.0, 108.0, 87.0, 55.0, 43.0, 28.0, 27.0, 16.0, 13.0, 6.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.20556640625, -0.19910812377929688, -0.19264984130859375, -0.18619155883789062, -0.1797332763671875, -0.17327499389648438, -0.16681671142578125, -0.16035842895507812, -0.153900146484375, -0.14744186401367188, -0.14098358154296875, -0.13452529907226562, -0.1280670166015625, -0.12160873413085938, -0.11515045166015625, -0.10869216918945312, -0.10223388671875, -0.09577560424804688, -0.08931732177734375, -0.08285903930664062, -0.0764007568359375, -0.06994247436523438, -0.06348419189453125, -0.057025909423828125, -0.050567626953125, -0.044109344482421875, -0.03765106201171875, -0.031192779541015625, -0.0247344970703125, -0.018276214599609375, -0.01181793212890625, -0.005359649658203125, 0.0010986328125, 0.007556915283203125, 0.01401519775390625, 0.020473480224609375, 0.0269317626953125, 0.033390045166015625, 0.03984832763671875, 0.046306610107421875, 0.052764892578125, 0.059223175048828125, 0.06568145751953125, 0.07213973999023438, 0.0785980224609375, 0.08505630493164062, 0.09151458740234375, 0.09797286987304688, 0.10443115234375, 0.11088943481445312, 0.11734771728515625, 0.12380599975585938, 0.1302642822265625, 0.13672256469726562, 0.14318084716796875, 0.14963912963867188, 0.156097412109375, 0.16255569458007812, 0.16901397705078125, 0.17547225952148438, 0.1819305419921875, 0.18838882446289062, 0.19484710693359375, 0.20130538940429688, 0.207763671875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 5.0, 3.0, 9.0, 10.0, 13.0, 10.0, 13.0, 19.0, 27.0, 17.0, 31.0, 45.0, 52.0, 78.0, 112.0, 119.0, 113.0, 74.0, 52.0, 28.0, 24.0, 23.0, 16.0, 16.0, 18.0, 13.0, 14.0, 14.0, 9.0, 8.0, 8.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.16748046875, -0.16214942932128906, -0.15681838989257812, -0.1514873504638672, -0.14615631103515625, -0.1408252716064453, -0.13549423217773438, -0.13016319274902344, -0.1248321533203125, -0.11950111389160156, -0.11417007446289062, -0.10883903503417969, -0.10350799560546875, -0.09817695617675781, -0.09284591674804688, -0.08751487731933594, -0.082183837890625, -0.07685279846191406, -0.07152175903320312, -0.06619071960449219, -0.06085968017578125, -0.05552864074707031, -0.050197601318359375, -0.04486656188964844, -0.0395355224609375, -0.03420448303222656, -0.028873443603515625, -0.023542404174804688, -0.01821136474609375, -0.012880325317382812, -0.007549285888671875, -0.0022182464599609375, 0.00311279296875, 0.008443832397460938, 0.013774871826171875, 0.019105911254882812, 0.02443695068359375, 0.029767990112304688, 0.035099029541015625, 0.04043006896972656, 0.0457611083984375, 0.05109214782714844, 0.056423187255859375, 0.06175422668457031, 0.06708526611328125, 0.07241630554199219, 0.07774734497070312, 0.08307838439941406, 0.088409423828125, 0.09374046325683594, 0.09907150268554688, 0.10440254211425781, 0.10973358154296875, 0.11506462097167969, 0.12039566040039062, 0.12572669982910156, 0.1310577392578125, 0.13638877868652344, 0.14171981811523438, 0.1470508575439453, 0.15238189697265625, 0.1577129364013672, 0.16304397583007812, 0.16837501525878906, 0.1737060546875]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 7.0, 103.0, 366.0, 422.0, 105.0, 12.0, 2.0], "bins": [-15.278075218200684, -15.023869514465332, -14.769662857055664, -14.515457153320312, -14.261250495910645, -14.007044792175293, -13.752838134765625, -13.498632431030273, -13.244425773620605, -12.990220069885254, -12.736013412475586, -12.481807708740234, -12.227601051330566, -11.973395347595215, -11.719188690185547, -11.464982986450195, -11.210777282714844, -10.956571578979492, -10.702364921569824, -10.448159217834473, -10.193952560424805, -9.939746856689453, -9.685540199279785, -9.431334495544434, -9.177127838134766, -8.922922134399414, -8.668715476989746, -8.414509773254395, -8.160303115844727, -7.906096935272217, -7.651890754699707, -7.3976850509643555, -7.143478870391846, -6.889272689819336, -6.635066509246826, -6.380860328674316, -6.126654148101807, -5.872447967529297, -5.618242263793945, -5.364035606384277, -5.109829425811768, -4.855623245239258, -4.601417064666748, -4.347210884094238, -4.0930047035217285, -3.8387985229492188, -3.584592580795288, -3.3303864002227783, -3.0761804580688477, -2.821974277496338, -2.567768096923828, -2.3135619163513184, -2.0593557357788086, -1.8051496744155884, -1.5509436130523682, -1.2967374324798584, -1.042531132698059, -0.7883249521255493, -0.5341188311576843, -0.27991271018981934, -0.02570652961730957, 0.2284996509552002, 0.4827057123184204, 0.7369118928909302, 0.9911180734634399]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 8.0, 7.0, 8.0, 6.0, 5.0, 28.0, 20.0, 20.0, 24.0, 28.0, 27.0, 29.0, 37.0, 24.0, 40.0, 36.0, 36.0, 45.0, 39.0, 37.0, 57.0, 36.0, 49.0, 33.0, 48.0, 28.0, 36.0, 27.0, 34.0, 31.0, 21.0, 25.0, 23.0, 11.0, 9.0, 6.0, 7.0, 7.0, 5.0, 2.0, 0.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1941161155700684, -1.1479588747024536, -1.1018016338348389, -1.0556445121765137, -1.009487271308899, -0.9633300304412842, -0.9171727895736694, -0.8710156083106995, -0.8248584270477295, -0.7787011861801147, -0.7325440049171448, -0.68638676404953, -0.6402295827865601, -0.5940723419189453, -0.5479151010513306, -0.5017579197883606, -0.45560067892074585, -0.4094434678554535, -0.36328625679016113, -0.3171290159225464, -0.2709718346595764, -0.22481460869312286, -0.1786573827266693, -0.13250017166137695, -0.0863429605960846, -0.04018574580550194, 0.005971468985080719, 0.052128687500953674, 0.09828589856624603, 0.1444431096315384, 0.19060033559799194, 0.2367575466632843, 0.28291475772857666, 0.329071968793869, 0.3752291798591614, 0.4213864207267761, 0.4675436019897461, 0.5137008428573608, 0.5598580837249756, 0.6060152649879456, 0.6521724462509155, 0.6983296871185303, 0.7444868683815002, 0.790644109249115, 0.836801290512085, 0.8829585313796997, 0.9291157722473145, 0.9752729535102844, 1.021430253982544, 1.0675874948501587, 1.1137447357177734, 1.1599018573760986, 1.2060590982437134, 1.2522163391113281, 1.2983735799789429, 1.3445308208465576, 1.3906879425048828, 1.4368451833724976, 1.4830024242401123, 1.5291595458984375, 1.5753167867660522, 1.621474027633667, 1.6676312685012817, 1.7137885093688965, 1.7599456310272217]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 9.0, 4.0, 12.0, 20.0, 18.0, 34.0, 34.0, 43.0, 105.0, 144.0, 195.0, 292.0, 443.0, 708.0, 1245.0, 2274.0, 4215.0, 8004.0, 16866.0, 38100.0, 92962.0, 247279.0, 778891.0, 1935857.0, 686396.0, 225970.0, 85995.0, 35563.0, 15778.0, 7692.0, 3932.0, 2115.0, 1139.0, 694.0, 445.0, 257.0, 201.0, 106.0, 78.0, 57.0, 37.0, 21.0, 18.0, 9.0, 11.0, 9.0, 8.0, 4.0, 2.0, 0.0, 1.0, 3.0], "bins": [-0.268310546875, -0.2607421875, -0.253173828125, -0.24560546875, -0.238037109375, -0.23046875, -0.222900390625, -0.21533203125, -0.207763671875, -0.2001953125, -0.192626953125, -0.18505859375, -0.177490234375, -0.169921875, -0.162353515625, -0.15478515625, -0.147216796875, -0.1396484375, -0.132080078125, -0.12451171875, -0.116943359375, -0.109375, -0.101806640625, -0.09423828125, -0.086669921875, -0.0791015625, -0.071533203125, -0.06396484375, -0.056396484375, -0.048828125, -0.041259765625, -0.03369140625, -0.026123046875, -0.0185546875, -0.010986328125, -0.00341796875, 0.004150390625, 0.01171875, 0.019287109375, 0.02685546875, 0.034423828125, 0.0419921875, 0.049560546875, 0.05712890625, 0.064697265625, 0.072265625, 0.079833984375, 0.08740234375, 0.094970703125, 0.1025390625, 0.110107421875, 0.11767578125, 0.125244140625, 0.1328125, 0.140380859375, 0.14794921875, 0.155517578125, 0.1630859375, 0.170654296875, 0.17822265625, 0.185791015625, 0.193359375, 0.200927734375, 0.20849609375, 0.216064453125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 4.0, 5.0, 8.0, 2.0, 8.0, 13.0, 9.0, 10.0, 12.0, 15.0, 13.0, 18.0, 23.0, 21.0, 30.0, 30.0, 40.0, 30.0, 43.0, 40.0, 45.0, 33.0, 36.0, 37.0, 33.0, 44.0, 37.0, 47.0, 45.0, 38.0, 32.0, 33.0, 23.0, 22.0, 15.0, 20.0, 17.0, 9.0, 12.0, 5.0, 9.0, 7.0, 9.0, 11.0, 2.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.14990234375, -0.1452178955078125, -0.140533447265625, -0.1358489990234375, -0.13116455078125, -0.1264801025390625, -0.121795654296875, -0.1171112060546875, -0.1124267578125, -0.1077423095703125, -0.103057861328125, -0.0983734130859375, -0.09368896484375, -0.0890045166015625, -0.084320068359375, -0.0796356201171875, -0.074951171875, -0.0702667236328125, -0.065582275390625, -0.0608978271484375, -0.05621337890625, -0.0515289306640625, -0.046844482421875, -0.0421600341796875, -0.0374755859375, -0.0327911376953125, -0.028106689453125, -0.0234222412109375, -0.01873779296875, -0.0140533447265625, -0.009368896484375, -0.0046844482421875, 0.0, 0.0046844482421875, 0.009368896484375, 0.0140533447265625, 0.01873779296875, 0.0234222412109375, 0.028106689453125, 0.0327911376953125, 0.0374755859375, 0.0421600341796875, 0.046844482421875, 0.0515289306640625, 0.05621337890625, 0.0608978271484375, 0.065582275390625, 0.0702667236328125, 0.074951171875, 0.0796356201171875, 0.084320068359375, 0.0890045166015625, 0.09368896484375, 0.0983734130859375, 0.103057861328125, 0.1077423095703125, 0.1124267578125, 0.1171112060546875, 0.121795654296875, 0.1264801025390625, 0.13116455078125, 0.1358489990234375, 0.140533447265625, 0.1452178955078125, 0.14990234375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 9.0, 9.0, 12.0, 23.0, 29.0, 30.0, 55.0, 100.0, 145.0, 223.0, 389.0, 639.0, 1235.0, 2325.0, 4750.0, 10175.0, 24146.0, 63859.0, 192443.0, 674964.0, 2038108.0, 827338.0, 228875.0, 74303.0, 27536.0, 11509.0, 5293.0, 2605.0, 1364.0, 727.0, 405.0, 257.0, 128.0, 91.0, 57.0, 35.0, 22.0, 20.0, 17.0, 11.0, 10.0, 5.0, 2.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0], "bins": [-0.41650390625, -0.40445709228515625, -0.3924102783203125, -0.38036346435546875, -0.368316650390625, -0.35626983642578125, -0.3442230224609375, -0.33217620849609375, -0.32012939453125, -0.30808258056640625, -0.2960357666015625, -0.28398895263671875, -0.271942138671875, -0.25989532470703125, -0.2478485107421875, -0.23580169677734375, -0.2237548828125, -0.21170806884765625, -0.1996612548828125, -0.18761444091796875, -0.175567626953125, -0.16352081298828125, -0.1514739990234375, -0.13942718505859375, -0.12738037109375, -0.11533355712890625, -0.1032867431640625, -0.09123992919921875, -0.079193115234375, -0.06714630126953125, -0.0550994873046875, -0.04305267333984375, -0.031005859375, -0.01895904541015625, -0.0069122314453125, 0.00513458251953125, 0.017181396484375, 0.02922821044921875, 0.0412750244140625, 0.05332183837890625, 0.06536865234375, 0.07741546630859375, 0.0894622802734375, 0.10150909423828125, 0.113555908203125, 0.12560272216796875, 0.1376495361328125, 0.14969635009765625, 0.1617431640625, 0.17378997802734375, 0.1858367919921875, 0.19788360595703125, 0.209930419921875, 0.22197723388671875, 0.2340240478515625, 0.24607086181640625, 0.25811767578125, 0.27016448974609375, 0.2822113037109375, 0.29425811767578125, 0.306304931640625, 0.31835174560546875, 0.3303985595703125, 0.34244537353515625, 0.3544921875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 5.0, 12.0, 14.0, 24.0, 32.0, 71.0, 98.0, 219.0, 341.0, 621.0, 1068.0, 701.0, 372.0, 226.0, 109.0, 61.0, 42.0, 28.0, 13.0, 9.0, 4.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.80810546875, -0.7882270812988281, -0.7683486938476562, -0.7484703063964844, -0.7285919189453125, -0.7087135314941406, -0.6888351440429688, -0.6689567565917969, -0.649078369140625, -0.6291999816894531, -0.6093215942382812, -0.5894432067871094, -0.5695648193359375, -0.5496864318847656, -0.5298080444335938, -0.5099296569824219, -0.49005126953125, -0.4701728820800781, -0.45029449462890625, -0.4304161071777344, -0.4105377197265625, -0.3906593322753906, -0.37078094482421875, -0.3509025573730469, -0.331024169921875, -0.3111457824707031, -0.29126739501953125, -0.2713890075683594, -0.2515106201171875, -0.23163223266601562, -0.21175384521484375, -0.19187545776367188, -0.1719970703125, -0.15211868286132812, -0.13224029541015625, -0.11236190795898438, -0.0924835205078125, -0.07260513305664062, -0.05272674560546875, -0.032848358154296875, -0.012969970703125, 0.006908416748046875, 0.02678680419921875, 0.046665191650390625, 0.0665435791015625, 0.08642196655273438, 0.10630035400390625, 0.12617874145507812, 0.14605712890625, 0.16593551635742188, 0.18581390380859375, 0.20569229125976562, 0.2255706787109375, 0.24544906616210938, 0.26532745361328125, 0.2852058410644531, 0.305084228515625, 0.3249626159667969, 0.34484100341796875, 0.3647193908691406, 0.3845977783203125, 0.4044761657714844, 0.42435455322265625, 0.4442329406738281, 0.464111328125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 2.0, 5.0, 12.0, 8.0, 16.0, 31.0, 34.0, 64.0, 83.0, 74.0, 97.0, 115.0, 112.0, 87.0, 89.0, 63.0, 41.0, 31.0, 16.0, 9.0, 10.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.248807907104492, -2.1808829307556152, -2.1129579544067383, -2.0450329780578613, -1.9771078824996948, -1.9091827869415283, -1.8412578105926514, -1.7733328342437744, -1.7054078578948975, -1.6374828815460205, -1.569557785987854, -1.501632809638977, -1.4337078332901, -1.3657827377319336, -1.2978577613830566, -1.2299327850341797, -1.1620076894760132, -1.0940827131271362, -1.0261576175689697, -0.9582326412200928, -0.8903076648712158, -0.8223826289176941, -0.7544575929641724, -0.6865326166152954, -0.6186075806617737, -0.550682544708252, -0.482757568359375, -0.41483253240585327, -0.34690752625465393, -0.2789825201034546, -0.21105748414993286, -0.14313247799873352, -0.07520747184753418, -0.007282458245754242, 0.060642555356025696, 0.12856757640838623, 0.19649258255958557, 0.2644175887107849, 0.33234262466430664, 0.400267630815506, 0.4681926369667053, 0.536117672920227, 0.604042649269104, 0.6719676852226257, 0.7398927211761475, 0.8078176975250244, 0.8757427334785461, 0.9436677694320679, 1.0115927457809448, 1.0795177221298218, 1.1474428176879883, 1.2153677940368652, 1.2832927703857422, 1.3512177467346191, 1.4191428422927856, 1.4870678186416626, 1.554992914199829, 1.622917890548706, 1.6908429861068726, 1.7587679624557495, 1.8266929388046265, 1.894618034362793, 1.96254301071167, 2.030467987060547, 2.098392963409424]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 6.0, 4.0, 5.0, 1.0, 8.0, 12.0, 10.0, 6.0, 11.0, 31.0, 22.0, 24.0, 21.0, 27.0, 28.0, 30.0, 37.0, 44.0, 33.0, 32.0, 38.0, 33.0, 48.0, 32.0, 50.0, 33.0, 44.0, 37.0, 24.0, 34.0, 35.0, 18.0, 23.0, 28.0, 16.0, 17.0, 15.0, 14.0, 12.0, 13.0, 4.0, 14.0, 9.0, 3.0, 4.0, 5.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.07252037525177, -1.0364145040512085, -1.000308632850647, -0.9642028212547302, -0.9280970096588135, -0.891991138458252, -0.8558852672576904, -0.8197793960571289, -0.7836735844612122, -0.7475677132606506, -0.7114619016647339, -0.6753560304641724, -0.6392501592636108, -0.6031443476676941, -0.5670384764671326, -0.5309326648712158, -0.4948267936706543, -0.45872095227241516, -0.422615110874176, -0.3865092396736145, -0.35040339827537537, -0.31429755687713623, -0.2781916856765747, -0.24208584427833557, -0.20598000288009644, -0.1698741614818573, -0.13376830518245697, -0.09766245633363724, -0.061556607484817505, -0.02545076608657837, 0.01065509021282196, 0.04676094651222229, 0.08286690711975098, 0.11897275596857071, 0.15507860481739044, 0.19118446111679077, 0.2272903025150299, 0.26339614391326904, 0.29950201511383057, 0.3356078565120697, 0.37171369791030884, 0.407819539308548, 0.4439253807067871, 0.48003125190734863, 0.5161371231079102, 0.5522429347038269, 0.5883488059043884, 0.6244546175003052, 0.6605604887008667, 0.6966663599014282, 0.732772171497345, 0.7688780426979065, 0.8049838542938232, 0.8410897254943848, 0.8771955966949463, 0.9133014678955078, 0.9494072794914246, 0.9855131506919861, 1.0216189622879028, 1.0577248334884644, 1.0938307046890259, 1.1299364566802979, 1.1660423278808594, 1.202148199081421, 1.2382540702819824]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 0.0, 2.0, 6.0, 9.0, 5.0, 15.0, 29.0, 36.0, 57.0, 89.0, 141.0, 204.0, 265.0, 404.0, 648.0, 983.0, 1383.0, 2126.0, 2987.0, 4564.0, 6433.0, 9452.0, 13923.0, 20477.0, 31159.0, 47979.0, 77900.0, 132413.0, 207044.0, 185716.0, 110830.0, 66391.0, 41111.0, 27093.0, 17925.0, 12332.0, 8404.0, 5759.0, 4003.0, 2635.0, 1746.0, 1295.0, 852.0, 554.0, 361.0, 284.0, 175.0, 110.0, 86.0, 46.0, 41.0, 34.0, 18.0, 17.0, 6.0, 5.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.2149658203125, -0.20821380615234375, -0.2014617919921875, -0.19470977783203125, -0.187957763671875, -0.18120574951171875, -0.1744537353515625, -0.16770172119140625, -0.16094970703125, -0.15419769287109375, -0.1474456787109375, -0.14069366455078125, -0.133941650390625, -0.12718963623046875, -0.1204376220703125, -0.11368560791015625, -0.10693359375, -0.10018157958984375, -0.0934295654296875, -0.08667755126953125, -0.079925537109375, -0.07317352294921875, -0.0664215087890625, -0.05966949462890625, -0.05291748046875, -0.04616546630859375, -0.0394134521484375, -0.03266143798828125, -0.025909423828125, -0.01915740966796875, -0.0124053955078125, -0.00565338134765625, 0.0010986328125, 0.00785064697265625, 0.0146026611328125, 0.02135467529296875, 0.028106689453125, 0.03485870361328125, 0.0416107177734375, 0.04836273193359375, 0.05511474609375, 0.06186676025390625, 0.0686187744140625, 0.07537078857421875, 0.082122802734375, 0.08887481689453125, 0.0956268310546875, 0.10237884521484375, 0.109130859375, 0.11588287353515625, 0.1226348876953125, 0.12938690185546875, 0.136138916015625, 0.14289093017578125, 0.1496429443359375, 0.15639495849609375, 0.16314697265625, 0.16989898681640625, 0.1766510009765625, 0.18340301513671875, 0.190155029296875, 0.19690704345703125, 0.2036590576171875, 0.21041107177734375, 0.2171630859375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 2.0, 7.0, 4.0, 3.0, 8.0, 11.0, 8.0, 14.0, 16.0, 20.0, 18.0, 21.0, 28.0, 25.0, 32.0, 30.0, 40.0, 39.0, 32.0, 30.0, 37.0, 41.0, 39.0, 39.0, 47.0, 29.0, 38.0, 28.0, 32.0, 25.0, 31.0, 21.0, 21.0, 25.0, 27.0, 18.0, 12.0, 20.0, 16.0, 15.0, 8.0, 12.0, 13.0, 6.0, 6.0, 2.0, 0.0, 3.0, 3.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0], "bins": [-0.147705078125, -0.1431121826171875, -0.138519287109375, -0.1339263916015625, -0.12933349609375, -0.1247406005859375, -0.120147705078125, -0.1155548095703125, -0.1109619140625, -0.1063690185546875, -0.101776123046875, -0.0971832275390625, -0.09259033203125, -0.0879974365234375, -0.083404541015625, -0.0788116455078125, -0.07421875, -0.0696258544921875, -0.065032958984375, -0.0604400634765625, -0.05584716796875, -0.0512542724609375, -0.046661376953125, -0.0420684814453125, -0.0374755859375, -0.0328826904296875, -0.028289794921875, -0.0236968994140625, -0.01910400390625, -0.0145111083984375, -0.009918212890625, -0.0053253173828125, -0.000732421875, 0.0038604736328125, 0.008453369140625, 0.0130462646484375, 0.01763916015625, 0.0222320556640625, 0.026824951171875, 0.0314178466796875, 0.0360107421875, 0.0406036376953125, 0.045196533203125, 0.0497894287109375, 0.05438232421875, 0.0589752197265625, 0.063568115234375, 0.0681610107421875, 0.07275390625, 0.0773468017578125, 0.081939697265625, 0.0865325927734375, 0.09112548828125, 0.0957183837890625, 0.100311279296875, 0.1049041748046875, 0.1094970703125, 0.1140899658203125, 0.118682861328125, 0.1232757568359375, 0.12786865234375, 0.1324615478515625, 0.137054443359375, 0.1416473388671875, 0.146240234375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 6.0, 5.0, 9.0, 14.0, 20.0, 34.0, 34.0, 39.0, 69.0, 113.0, 155.0, 241.0, 433.0, 1047.0, 2881.0, 8883.0, 29071.0, 97847.0, 352923.0, 392789.0, 112549.0, 33568.0, 10269.0, 3183.0, 1175.0, 478.0, 268.0, 153.0, 106.0, 59.0, 39.0, 30.0, 21.0, 16.0, 11.0, 8.0, 4.0, 2.0, 3.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51318359375, -0.4961090087890625, -0.479034423828125, -0.4619598388671875, -0.44488525390625, -0.4278106689453125, -0.410736083984375, -0.3936614990234375, -0.3765869140625, -0.3595123291015625, -0.342437744140625, -0.3253631591796875, -0.30828857421875, -0.2912139892578125, -0.274139404296875, -0.2570648193359375, -0.239990234375, -0.2229156494140625, -0.205841064453125, -0.1887664794921875, -0.17169189453125, -0.1546173095703125, -0.137542724609375, -0.1204681396484375, -0.1033935546875, -0.0863189697265625, -0.069244384765625, -0.0521697998046875, -0.03509521484375, -0.0180206298828125, -0.000946044921875, 0.0161285400390625, 0.033203125, 0.0502777099609375, 0.067352294921875, 0.0844268798828125, 0.10150146484375, 0.1185760498046875, 0.135650634765625, 0.1527252197265625, 0.1697998046875, 0.1868743896484375, 0.203948974609375, 0.2210235595703125, 0.23809814453125, 0.2551727294921875, 0.272247314453125, 0.2893218994140625, 0.306396484375, 0.3234710693359375, 0.340545654296875, 0.3576202392578125, 0.37469482421875, 0.3917694091796875, 0.408843994140625, 0.4259185791015625, 0.4429931640625, 0.4600677490234375, 0.477142333984375, 0.4942169189453125, 0.51129150390625, 0.5283660888671875, 0.545440673828125, 0.5625152587890625, 0.57958984375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 1.0, 4.0, 5.0, 9.0, 4.0, 14.0, 12.0, 17.0, 15.0, 19.0, 7.0, 22.0, 23.0, 27.0, 30.0, 38.0, 28.0, 29.0, 41.0, 39.0, 36.0, 41.0, 46.0, 38.0, 37.0, 42.0, 39.0, 32.0, 38.0, 33.0, 32.0, 32.0, 19.0, 15.0, 23.0, 17.0, 14.0, 10.0, 18.0, 14.0, 5.0, 9.0, 9.0, 6.0, 3.0, 4.0, 4.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.52197265625, -0.5056381225585938, -0.4893035888671875, -0.47296905517578125, -0.456634521484375, -0.44029998779296875, -0.4239654541015625, -0.40763092041015625, -0.39129638671875, -0.37496185302734375, -0.3586273193359375, -0.34229278564453125, -0.325958251953125, -0.30962371826171875, -0.2932891845703125, -0.27695465087890625, -0.2606201171875, -0.24428558349609375, -0.2279510498046875, -0.21161651611328125, -0.195281982421875, -0.17894744873046875, -0.1626129150390625, -0.14627838134765625, -0.12994384765625, -0.11360931396484375, -0.0972747802734375, -0.08094024658203125, -0.064605712890625, -0.04827117919921875, -0.0319366455078125, -0.01560211181640625, 0.000732421875, 0.01706695556640625, 0.0334014892578125, 0.04973602294921875, 0.066070556640625, 0.08240509033203125, 0.0987396240234375, 0.11507415771484375, 0.13140869140625, 0.14774322509765625, 0.1640777587890625, 0.18041229248046875, 0.196746826171875, 0.21308135986328125, 0.2294158935546875, 0.24575042724609375, 0.2620849609375, 0.27841949462890625, 0.2947540283203125, 0.31108856201171875, 0.327423095703125, 0.34375762939453125, 0.3600921630859375, 0.37642669677734375, 0.39276123046875, 0.40909576416015625, 0.4254302978515625, 0.44176483154296875, 0.458099365234375, 0.47443389892578125, 0.4907684326171875, 0.5071029663085938, 0.5234375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 3.0, 4.0, 3.0, 11.0, 12.0, 11.0, 22.0, 37.0, 67.0, 123.0, 202.0, 343.0, 645.0, 1224.0, 2348.0, 4777.0, 10129.0, 21595.0, 47136.0, 109126.0, 265742.0, 329196.0, 142690.0, 60786.0, 27126.0, 12970.0, 6125.0, 2936.0, 1399.0, 738.0, 432.0, 235.0, 123.0, 95.0, 68.0, 35.0, 16.0, 11.0, 4.0, 4.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2225341796875, -0.21637916564941406, -0.21022415161132812, -0.2040691375732422, -0.19791412353515625, -0.1917591094970703, -0.18560409545898438, -0.17944908142089844, -0.1732940673828125, -0.16713905334472656, -0.16098403930664062, -0.1548290252685547, -0.14867401123046875, -0.1425189971923828, -0.13636398315429688, -0.13020896911621094, -0.124053955078125, -0.11789894104003906, -0.11174392700195312, -0.10558891296386719, -0.09943389892578125, -0.09327888488769531, -0.08712387084960938, -0.08096885681152344, -0.0748138427734375, -0.06865882873535156, -0.06250381469726562, -0.05634880065917969, -0.05019378662109375, -0.04403877258300781, -0.037883758544921875, -0.03172874450683594, -0.02557373046875, -0.019418716430664062, -0.013263702392578125, -0.0071086883544921875, -0.00095367431640625, 0.0052013397216796875, 0.011356353759765625, 0.017511367797851562, 0.0236663818359375, 0.029821395874023438, 0.035976409912109375, 0.04213142395019531, 0.04828643798828125, 0.05444145202636719, 0.060596466064453125, 0.06675148010253906, 0.072906494140625, 0.07906150817871094, 0.08521652221679688, 0.09137153625488281, 0.09752655029296875, 0.10368156433105469, 0.10983657836914062, 0.11599159240722656, 0.1221466064453125, 0.12830162048339844, 0.13445663452148438, 0.1406116485595703, 0.14676666259765625, 0.1529216766357422, 0.15907669067382812, 0.16523170471191406, 0.17138671875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 3.0, 4.0, 7.0, 5.0, 7.0, 4.0, 15.0, 18.0, 21.0, 13.0, 20.0, 45.0, 63.0, 58.0, 85.0, 98.0, 114.0, 122.0, 59.0, 67.0, 44.0, 26.0, 19.0, 22.0, 11.0, 12.0, 10.0, 2.0, 6.0, 2.0, 6.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.109476089477539e-05, -5.945749580860138e-05, -5.782023072242737e-05, -5.618296563625336e-05, -5.4545700550079346e-05, -5.2908435463905334e-05, -5.127117037773132e-05, -4.963390529155731e-05, -4.79966402053833e-05, -4.635937511920929e-05, -4.472211003303528e-05, -4.308484494686127e-05, -4.1447579860687256e-05, -3.9810314774513245e-05, -3.8173049688339233e-05, -3.653578460216522e-05, -3.489851951599121e-05, -3.32612544298172e-05, -3.162398934364319e-05, -2.9986724257469177e-05, -2.8349459171295166e-05, -2.6712194085121155e-05, -2.5074928998947144e-05, -2.3437663912773132e-05, -2.180039882659912e-05, -2.016313374042511e-05, -1.85258686542511e-05, -1.6888603568077087e-05, -1.5251338481903076e-05, -1.3614073395729065e-05, -1.1976808309555054e-05, -1.0339543223381042e-05, -8.702278137207031e-06, -7.06501305103302e-06, -5.427747964859009e-06, -3.7904828786849976e-06, -2.1532177925109863e-06, -5.159527063369751e-07, 1.1213123798370361e-06, 2.7585774660110474e-06, 4.395842552185059e-06, 6.03310763835907e-06, 7.670372724533081e-06, 9.307637810707092e-06, 1.0944902896881104e-05, 1.2582167983055115e-05, 1.4219433069229126e-05, 1.5856698155403137e-05, 1.749396324157715e-05, 1.913122832775116e-05, 2.076849341392517e-05, 2.2405758500099182e-05, 2.4043023586273193e-05, 2.5680288672447205e-05, 2.7317553758621216e-05, 2.8954818844795227e-05, 3.059208393096924e-05, 3.222934901714325e-05, 3.386661410331726e-05, 3.550387918949127e-05, 3.714114427566528e-05, 3.8778409361839294e-05, 4.0415674448013306e-05, 4.205293953418732e-05, 4.369020462036133e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 13.0, 6.0, 4.0, 18.0, 15.0, 30.0, 53.0, 56.0, 87.0, 139.0, 213.0, 371.0, 683.0, 1301.0, 2878.0, 6778.0, 17251.0, 44145.0, 116970.0, 320451.0, 335736.0, 124025.0, 45957.0, 18137.0, 7073.0, 3133.0, 1320.0, 701.0, 391.0, 222.0, 140.0, 84.0, 57.0, 45.0, 27.0, 19.0, 6.0, 11.0, 6.0, 3.0, 4.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2100830078125, -0.20308685302734375, -0.1960906982421875, -0.18909454345703125, -0.182098388671875, -0.17510223388671875, -0.1681060791015625, -0.16110992431640625, -0.15411376953125, -0.14711761474609375, -0.1401214599609375, -0.13312530517578125, -0.126129150390625, -0.11913299560546875, -0.1121368408203125, -0.10514068603515625, -0.09814453125, -0.09114837646484375, -0.0841522216796875, -0.07715606689453125, -0.070159912109375, -0.06316375732421875, -0.0561676025390625, -0.04917144775390625, -0.04217529296875, -0.03517913818359375, -0.0281829833984375, -0.02118682861328125, -0.014190673828125, -0.00719451904296875, -0.0001983642578125, 0.00679779052734375, 0.0137939453125, 0.02079010009765625, 0.0277862548828125, 0.03478240966796875, 0.041778564453125, 0.04877471923828125, 0.0557708740234375, 0.06276702880859375, 0.06976318359375, 0.07675933837890625, 0.0837554931640625, 0.09075164794921875, 0.097747802734375, 0.10474395751953125, 0.1117401123046875, 0.11873626708984375, 0.125732421875, 0.13272857666015625, 0.1397247314453125, 0.14672088623046875, 0.153717041015625, 0.16071319580078125, 0.1677093505859375, 0.17470550537109375, 0.18170166015625, 0.18869781494140625, 0.1956939697265625, 0.20269012451171875, 0.209686279296875, 0.21668243408203125, 0.2236785888671875, 0.23067474365234375, 0.2376708984375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 7.0, 2.0, 7.0, 6.0, 14.0, 14.0, 18.0, 34.0, 46.0, 63.0, 109.0, 115.0, 163.0, 108.0, 76.0, 76.0, 48.0, 32.0, 23.0, 13.0, 10.0, 8.0, 6.0, 6.0, 2.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.327392578125, -0.3165740966796875, -0.305755615234375, -0.2949371337890625, -0.28411865234375, -0.2733001708984375, -0.262481689453125, -0.2516632080078125, -0.2408447265625, -0.2300262451171875, -0.219207763671875, -0.2083892822265625, -0.19757080078125, -0.1867523193359375, -0.175933837890625, -0.1651153564453125, -0.154296875, -0.1434783935546875, -0.132659912109375, -0.1218414306640625, -0.11102294921875, -0.1002044677734375, -0.089385986328125, -0.0785675048828125, -0.0677490234375, -0.0569305419921875, -0.046112060546875, -0.0352935791015625, -0.02447509765625, -0.0136566162109375, -0.002838134765625, 0.0079803466796875, 0.018798828125, 0.0296173095703125, 0.040435791015625, 0.0512542724609375, 0.06207275390625, 0.0728912353515625, 0.083709716796875, 0.0945281982421875, 0.1053466796875, 0.1161651611328125, 0.126983642578125, 0.1378021240234375, 0.14862060546875, 0.1594390869140625, 0.170257568359375, 0.1810760498046875, 0.19189453125, 0.2027130126953125, 0.213531494140625, 0.2243499755859375, 0.23516845703125, 0.2459869384765625, 0.256805419921875, 0.2676239013671875, 0.2784423828125, 0.2892608642578125, 0.300079345703125, 0.3108978271484375, 0.32171630859375, 0.3325347900390625, 0.343353271484375, 0.3541717529296875, 0.364990234375]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 7.0, 6.0, 7.0, 6.0, 11.0, 16.0, 28.0, 26.0, 51.0, 59.0, 78.0, 89.0, 93.0, 96.0, 107.0, 90.0, 65.0, 60.0, 36.0, 32.0, 18.0, 15.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.306152582168579, -3.234254837036133, -3.1623570919036865, -3.0904593467712402, -3.018561601638794, -2.9466638565063477, -2.8747661113739014, -2.802868366241455, -2.730970621109009, -2.6590728759765625, -2.587175130844116, -2.51527738571167, -2.4433796405792236, -2.3714818954467773, -2.299584150314331, -2.2276864051818848, -2.1557886600494385, -2.083890914916992, -2.011993169784546, -1.9400954246520996, -1.8681976795196533, -1.796299934387207, -1.7244021892547607, -1.6525044441223145, -1.5806066989898682, -1.5087089538574219, -1.4368112087249756, -1.3649134635925293, -1.293015718460083, -1.2211179733276367, -1.1492202281951904, -1.0773224830627441, -1.0054248571395874, -0.9335271120071411, -0.8616293668746948, -0.7897316217422485, -0.7178338766098022, -0.645936131477356, -0.5740383863449097, -0.5021406412124634, -0.4302428960800171, -0.3583451509475708, -0.2864474058151245, -0.21454966068267822, -0.14265191555023193, -0.07075417041778564, 0.0011435747146606445, 0.07304131984710693, 0.14493906497955322, 0.2168368101119995, 0.2887345552444458, 0.3606323003768921, 0.4325300455093384, 0.5044277906417847, 0.576325535774231, 0.6482232809066772, 0.7201210260391235, 0.7920187711715698, 0.8639165163040161, 0.9358142614364624, 1.0077120065689087, 1.079609751701355, 1.1515074968338013, 1.2234052419662476, 1.2953029870986938]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 8.0, 5.0, 4.0, 7.0, 9.0, 8.0, 13.0, 18.0, 17.0, 16.0, 15.0, 33.0, 29.0, 27.0, 44.0, 29.0, 35.0, 40.0, 47.0, 37.0, 41.0, 41.0, 39.0, 44.0, 45.0, 41.0, 32.0, 35.0, 36.0, 37.0, 28.0, 18.0, 19.0, 18.0, 16.0, 15.0, 12.0, 14.0, 6.0, 10.0, 3.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.7431740760803223, -1.6905277967453003, -1.6378815174102783, -1.585235357284546, -1.532589077949524, -1.479942798614502, -1.42729651927948, -1.374650239944458, -1.322003960609436, -1.269357681274414, -1.216711401939392, -1.1640651226043701, -1.1114189624786377, -1.0587726831436157, -1.0061264038085938, -0.9534801244735718, -0.9008339047431946, -0.8481876254081726, -0.7955414056777954, -0.7428951263427734, -0.6902488470077515, -0.6376025676727295, -0.5849563479423523, -0.5323100686073303, -0.47966381907463074, -0.42701756954193115, -0.3743712902069092, -0.3217250406742096, -0.26907879114151, -0.21643251180648804, -0.16378626227378845, -0.11113998293876648, -0.058493733406066895, -0.005847472697496414, 0.046798788011074066, 0.09944504499435425, 0.15209130942821503, 0.2047375738620758, 0.2573838233947754, 0.31003010272979736, 0.36267635226249695, 0.41532260179519653, 0.4679688811302185, 0.5206151008605957, 0.5732613801956177, 0.6259076595306396, 0.6785539388656616, 0.7312002182006836, 0.7838464379310608, 0.8364927172660828, 0.88913893699646, 0.9417852163314819, 0.9944314956665039, 1.0470777750015259, 1.0997240543365479, 1.1523702144622803, 1.2050164937973022, 1.2576627731323242, 1.3103090524673462, 1.3629553318023682, 1.4156014919281006, 1.4682477712631226, 1.5208940505981445, 1.5735403299331665, 1.6261866092681885]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 8.0, 7.0, 6.0, 7.0, 14.0, 21.0, 31.0, 46.0, 63.0, 95.0, 136.0, 183.0, 331.0, 484.0, 728.0, 1319.0, 2185.0, 3878.0, 7311.0, 14314.0, 29240.0, 62095.0, 138205.0, 324410.0, 886677.0, 1644921.0, 627253.0, 245030.0, 106913.0, 48822.0, 23381.0, 11703.0, 6089.0, 3295.0, 1906.0, 1161.0, 665.0, 435.0, 271.0, 200.0, 131.0, 108.0, 66.0, 45.0, 27.0, 25.0, 17.0, 8.0, 13.0, 9.0, 3.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2010498046875, -0.19442367553710938, -0.18779754638671875, -0.18117141723632812, -0.1745452880859375, -0.16791915893554688, -0.16129302978515625, -0.15466690063476562, -0.148040771484375, -0.14141464233398438, -0.13478851318359375, -0.12816238403320312, -0.1215362548828125, -0.11491012573242188, -0.10828399658203125, -0.10165786743164062, -0.09503173828125, -0.08840560913085938, -0.08177947998046875, -0.07515335083007812, -0.0685272216796875, -0.061901092529296875, -0.05527496337890625, -0.048648834228515625, -0.042022705078125, -0.035396575927734375, -0.02877044677734375, -0.022144317626953125, -0.0155181884765625, -0.008892059326171875, -0.00226593017578125, 0.004360198974609375, 0.010986328125, 0.017612457275390625, 0.02423858642578125, 0.030864715576171875, 0.0374908447265625, 0.044116973876953125, 0.05074310302734375, 0.057369232177734375, 0.063995361328125, 0.07062149047851562, 0.07724761962890625, 0.08387374877929688, 0.0904998779296875, 0.09712600708007812, 0.10375213623046875, 0.11037826538085938, 0.11700439453125, 0.12363052368164062, 0.13025665283203125, 0.13688278198242188, 0.1435089111328125, 0.15013504028320312, 0.15676116943359375, 0.16338729858398438, 0.170013427734375, 0.17663955688476562, 0.18326568603515625, 0.18989181518554688, 0.1965179443359375, 0.20314407348632812, 0.20977020263671875, 0.21639633178710938, 0.2230224609375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 2.0, 7.0, 9.0, 10.0, 13.0, 16.0, 13.0, 12.0, 23.0, 26.0, 35.0, 29.0, 47.0, 44.0, 40.0, 40.0, 50.0, 37.0, 40.0, 41.0, 45.0, 55.0, 40.0, 47.0, 35.0, 35.0, 33.0, 24.0, 26.0, 21.0, 16.0, 15.0, 18.0, 8.0, 9.0, 7.0, 11.0, 5.0, 4.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.161376953125, -0.15581512451171875, -0.1502532958984375, -0.14469146728515625, -0.139129638671875, -0.13356781005859375, -0.1280059814453125, -0.12244415283203125, -0.11688232421875, -0.11132049560546875, -0.1057586669921875, -0.10019683837890625, -0.094635009765625, -0.08907318115234375, -0.0835113525390625, -0.07794952392578125, -0.0723876953125, -0.06682586669921875, -0.0612640380859375, -0.05570220947265625, -0.050140380859375, -0.04457855224609375, -0.0390167236328125, -0.03345489501953125, -0.02789306640625, -0.02233123779296875, -0.0167694091796875, -0.01120758056640625, -0.005645751953125, -8.392333984375e-05, 0.0054779052734375, 0.01103973388671875, 0.0166015625, 0.02216339111328125, 0.0277252197265625, 0.03328704833984375, 0.038848876953125, 0.04441070556640625, 0.0499725341796875, 0.05553436279296875, 0.06109619140625, 0.06665802001953125, 0.0722198486328125, 0.07778167724609375, 0.083343505859375, 0.08890533447265625, 0.0944671630859375, 0.10002899169921875, 0.1055908203125, 0.11115264892578125, 0.1167144775390625, 0.12227630615234375, 0.127838134765625, 0.13339996337890625, 0.1389617919921875, 0.14452362060546875, 0.15008544921875, 0.15564727783203125, 0.1612091064453125, 0.16677093505859375, 0.172332763671875, 0.17789459228515625, 0.1834564208984375, 0.18901824951171875, 0.194580078125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 4.0, 10.0, 12.0, 15.0, 13.0, 24.0, 37.0, 37.0, 81.0, 125.0, 202.0, 371.0, 756.0, 1750.0, 4158.0, 11172.0, 31979.0, 97922.0, 322658.0, 1230264.0, 1801443.0, 478800.0, 141600.0, 45118.0, 15537.0, 5667.0, 2348.0, 1009.0, 488.0, 239.0, 154.0, 89.0, 59.0, 40.0, 36.0, 22.0, 10.0, 8.0, 3.0, 5.0, 5.0, 4.0, 7.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.400390625, -0.387939453125, -0.37548828125, -0.363037109375, -0.3505859375, -0.338134765625, -0.32568359375, -0.313232421875, -0.30078125, -0.288330078125, -0.27587890625, -0.263427734375, -0.2509765625, -0.238525390625, -0.22607421875, -0.213623046875, -0.201171875, -0.188720703125, -0.17626953125, -0.163818359375, -0.1513671875, -0.138916015625, -0.12646484375, -0.114013671875, -0.1015625, -0.089111328125, -0.07666015625, -0.064208984375, -0.0517578125, -0.039306640625, -0.02685546875, -0.014404296875, -0.001953125, 0.010498046875, 0.02294921875, 0.035400390625, 0.0478515625, 0.060302734375, 0.07275390625, 0.085205078125, 0.09765625, 0.110107421875, 0.12255859375, 0.135009765625, 0.1474609375, 0.159912109375, 0.17236328125, 0.184814453125, 0.197265625, 0.209716796875, 0.22216796875, 0.234619140625, 0.2470703125, 0.259521484375, 0.27197265625, 0.284423828125, 0.296875, 0.309326171875, 0.32177734375, 0.334228515625, 0.3466796875, 0.359130859375, 0.37158203125, 0.384033203125, 0.396484375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 7.0, 8.0, 16.0, 33.0, 53.0, 80.0, 142.0, 253.0, 423.0, 638.0, 890.0, 618.0, 360.0, 196.0, 132.0, 89.0, 59.0, 32.0, 25.0, 10.0, 8.0, 4.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8173828125, -0.7994003295898438, -0.7814178466796875, -0.7634353637695312, -0.745452880859375, -0.7274703979492188, -0.7094879150390625, -0.6915054321289062, -0.67352294921875, -0.6555404663085938, -0.6375579833984375, -0.6195755004882812, -0.601593017578125, -0.5836105346679688, -0.5656280517578125, -0.5476455688476562, -0.5296630859375, -0.5116806030273438, -0.4936981201171875, -0.47571563720703125, -0.457733154296875, -0.43975067138671875, -0.4217681884765625, -0.40378570556640625, -0.38580322265625, -0.36782073974609375, -0.3498382568359375, -0.33185577392578125, -0.313873291015625, -0.29589080810546875, -0.2779083251953125, -0.25992584228515625, -0.241943359375, -0.22396087646484375, -0.2059783935546875, -0.18799591064453125, -0.170013427734375, -0.15203094482421875, -0.1340484619140625, -0.11606597900390625, -0.09808349609375, -0.08010101318359375, -0.0621185302734375, -0.04413604736328125, -0.026153564453125, -0.00817108154296875, 0.0098114013671875, 0.02779388427734375, 0.0457763671875, 0.06375885009765625, 0.0817413330078125, 0.09972381591796875, 0.117706298828125, 0.13568878173828125, 0.1536712646484375, 0.17165374755859375, 0.18963623046875, 0.20761871337890625, 0.2256011962890625, 0.24358367919921875, 0.261566162109375, 0.27954864501953125, 0.2975311279296875, 0.31551361083984375, 0.33349609375]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 6.0, 12.0, 22.0, 34.0, 37.0, 70.0, 74.0, 112.0, 107.0, 109.0, 97.0, 98.0, 80.0, 62.0, 32.0, 23.0, 18.0, 10.0, 1.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.0508017539978027, -2.97878360748291, -2.9067654609680176, -2.834747076034546, -2.7627289295196533, -2.6907107830047607, -2.618692636489868, -2.5466744899749756, -2.474656105041504, -2.4026379585266113, -2.3306198120117188, -2.258601427078247, -2.1865832805633545, -2.114565134048462, -2.0425469875335693, -1.9705288410186768, -1.8985106945037842, -1.8264925479888916, -1.7544742822647095, -1.682456135749817, -1.6104378700256348, -1.5384197235107422, -1.4664015769958496, -1.394383430480957, -1.322365164756775, -1.2503470182418823, -1.1783287525177002, -1.1063106060028076, -1.034292459487915, -0.9622741937637329, -0.8902560472488403, -0.818237841129303, -0.7462195158004761, -0.6742013096809387, -0.6021831035614014, -0.5301649570465088, -0.45814675092697144, -0.3861285448074341, -0.3141103684902191, -0.24209219217300415, -0.1700739860534668, -0.09805579483509064, -0.026037603616714478, 0.04598058760166168, 0.11799877882003784, 0.1900169849395752, 0.26203516125679016, 0.3340533375740051, 0.4060715436935425, 0.47808974981307983, 0.5501079559326172, 0.6221261024475098, 0.6941443085670471, 0.7661625146865845, 0.838180661201477, 0.9101988673210144, 0.9822170734405518, 1.0542352199554443, 1.1262534856796265, 1.198271632194519, 1.2702898979187012, 1.3423080444335938, 1.4143261909484863, 1.486344337463379, 1.558362603187561]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 10.0, 3.0, 7.0, 14.0, 13.0, 12.0, 20.0, 12.0, 18.0, 16.0, 12.0, 31.0, 29.0, 40.0, 26.0, 40.0, 47.0, 46.0, 39.0, 52.0, 58.0, 45.0, 42.0, 50.0, 32.0, 44.0, 37.0, 29.0, 30.0, 28.0, 23.0, 14.0, 17.0, 17.0, 19.0, 7.0, 4.0, 5.0, 7.0, 3.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2122420072555542, -1.1747092008590698, -1.1371763944625854, -1.099643588066101, -1.0621106624603271, -1.0245778560638428, -0.9870450496673584, -0.949512243270874, -0.9119794368743896, -0.8744466304779053, -0.8369138240814209, -0.7993809580802917, -0.7618481516838074, -0.724315345287323, -0.6867824792861938, -0.6492496728897095, -0.6117168664932251, -0.5741840600967407, -0.5366512537002563, -0.4991183876991272, -0.4615855813026428, -0.42405277490615845, -0.3865199387073517, -0.3489871025085449, -0.31145429611206055, -0.27392148971557617, -0.2363886535167694, -0.19885583221912384, -0.16132301092147827, -0.1237901896238327, -0.08625736832618713, -0.04872453212738037, -0.011191844940185547, 0.026340976357460022, 0.06387379765510559, 0.10140661895275116, 0.13893944025039673, 0.1764722615480423, 0.21400508284568787, 0.25153791904449463, 0.289070725440979, 0.3266035318374634, 0.36413636803627014, 0.4016692042350769, 0.4392020106315613, 0.47673481702804565, 0.5142676830291748, 0.5518004894256592, 0.5893332958221436, 0.6268661022186279, 0.6643989086151123, 0.7019317746162415, 0.7394645810127258, 0.7769973874092102, 0.8145302534103394, 0.8520630598068237, 0.8895958662033081, 0.9271286725997925, 0.9646614789962769, 1.0021942853927612, 1.0397272109985352, 1.0772600173950195, 1.114792823791504, 1.1523256301879883, 1.1898584365844727]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 7.0, 6.0, 10.0, 15.0, 23.0, 33.0, 55.0, 76.0, 126.0, 166.0, 277.0, 387.0, 598.0, 936.0, 1346.0, 1983.0, 3103.0, 4633.0, 7393.0, 11911.0, 19380.0, 33311.0, 62239.0, 153144.0, 343912.0, 219456.0, 81327.0, 40749.0, 23127.0, 13879.0, 8854.0, 5510.0, 3630.0, 2340.0, 1504.0, 1052.0, 694.0, 471.0, 310.0, 199.0, 130.0, 84.0, 52.0, 39.0, 33.0, 17.0, 17.0, 6.0, 4.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2493896484375, -0.2412586212158203, -0.23312759399414062, -0.22499656677246094, -0.21686553955078125, -0.20873451232910156, -0.20060348510742188, -0.1924724578857422, -0.1843414306640625, -0.1762104034423828, -0.16807937622070312, -0.15994834899902344, -0.15181732177734375, -0.14368629455566406, -0.13555526733398438, -0.1274242401123047, -0.119293212890625, -0.11116218566894531, -0.10303115844726562, -0.09490013122558594, -0.08676910400390625, -0.07863807678222656, -0.07050704956054688, -0.06237602233886719, -0.0542449951171875, -0.04611396789550781, -0.037982940673828125, -0.029851913452148438, -0.02172088623046875, -0.013589859008789062, -0.005458831787109375, 0.0026721954345703125, 0.01080322265625, 0.018934249877929688, 0.027065277099609375, 0.03519630432128906, 0.04332733154296875, 0.05145835876464844, 0.059589385986328125, 0.06772041320800781, 0.0758514404296875, 0.08398246765136719, 0.09211349487304688, 0.10024452209472656, 0.10837554931640625, 0.11650657653808594, 0.12463760375976562, 0.1327686309814453, 0.140899658203125, 0.1490306854248047, 0.15716171264648438, 0.16529273986816406, 0.17342376708984375, 0.18155479431152344, 0.18968582153320312, 0.1978168487548828, 0.2059478759765625, 0.2140789031982422, 0.22220993041992188, 0.23034095764160156, 0.23847198486328125, 0.24660301208496094, 0.2547340393066406, 0.2628650665283203, 0.27099609375]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 3.0, 5.0, 7.0, 3.0, 7.0, 11.0, 8.0, 11.0, 21.0, 22.0, 17.0, 17.0, 23.0, 28.0, 32.0, 26.0, 32.0, 23.0, 42.0, 40.0, 48.0, 37.0, 39.0, 28.0, 38.0, 39.0, 44.0, 35.0, 35.0, 31.0, 29.0, 27.0, 30.0, 24.0, 13.0, 24.0, 17.0, 10.0, 16.0, 13.0, 8.0, 8.0, 9.0, 5.0, 3.0, 4.0, 0.0, 2.0, 1.0, 5.0, 0.0, 2.0, 4.0], "bins": [-0.1673583984375, -0.1623992919921875, -0.157440185546875, -0.1524810791015625, -0.14752197265625, -0.1425628662109375, -0.137603759765625, -0.1326446533203125, -0.127685546875, -0.1227264404296875, -0.117767333984375, -0.1128082275390625, -0.10784912109375, -0.1028900146484375, -0.097930908203125, -0.0929718017578125, -0.0880126953125, -0.0830535888671875, -0.078094482421875, -0.0731353759765625, -0.06817626953125, -0.0632171630859375, -0.058258056640625, -0.0532989501953125, -0.04833984375, -0.0433807373046875, -0.038421630859375, -0.0334625244140625, -0.02850341796875, -0.0235443115234375, -0.018585205078125, -0.0136260986328125, -0.0086669921875, -0.0037078857421875, 0.001251220703125, 0.0062103271484375, 0.01116943359375, 0.0161285400390625, 0.021087646484375, 0.0260467529296875, 0.031005859375, 0.0359649658203125, 0.040924072265625, 0.0458831787109375, 0.05084228515625, 0.0558013916015625, 0.060760498046875, 0.0657196044921875, 0.0706787109375, 0.0756378173828125, 0.080596923828125, 0.0855560302734375, 0.09051513671875, 0.0954742431640625, 0.100433349609375, 0.1053924560546875, 0.1103515625, 0.1153106689453125, 0.120269775390625, 0.1252288818359375, 0.13018798828125, 0.1351470947265625, 0.140106201171875, 0.1450653076171875, 0.1500244140625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 5.0, 8.0, 8.0, 24.0, 15.0, 29.0, 46.0, 48.0, 81.0, 119.0, 240.0, 480.0, 1000.0, 2349.0, 5823.0, 14346.0, 35834.0, 111316.0, 490641.0, 280530.0, 64840.0, 23730.0, 9765.0, 4004.0, 1654.0, 771.0, 355.0, 155.0, 108.0, 73.0, 43.0, 32.0, 26.0, 20.0, 9.0, 11.0, 5.0, 4.0, 2.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.48828125, -0.4742431640625, -0.460205078125, -0.4461669921875, -0.43212890625, -0.4180908203125, -0.404052734375, -0.3900146484375, -0.3759765625, -0.3619384765625, -0.347900390625, -0.3338623046875, -0.31982421875, -0.3057861328125, -0.291748046875, -0.2777099609375, -0.263671875, -0.2496337890625, -0.235595703125, -0.2215576171875, -0.20751953125, -0.1934814453125, -0.179443359375, -0.1654052734375, -0.1513671875, -0.1373291015625, -0.123291015625, -0.1092529296875, -0.09521484375, -0.0811767578125, -0.067138671875, -0.0531005859375, -0.0390625, -0.0250244140625, -0.010986328125, 0.0030517578125, 0.01708984375, 0.0311279296875, 0.045166015625, 0.0592041015625, 0.0732421875, 0.0872802734375, 0.101318359375, 0.1153564453125, 0.12939453125, 0.1434326171875, 0.157470703125, 0.1715087890625, 0.185546875, 0.1995849609375, 0.213623046875, 0.2276611328125, 0.24169921875, 0.2557373046875, 0.269775390625, 0.2838134765625, 0.2978515625, 0.3118896484375, 0.325927734375, 0.3399658203125, 0.35400390625, 0.3680419921875, 0.382080078125, 0.3961181640625, 0.41015625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 8.0, 4.0, 4.0, 9.0, 15.0, 14.0, 10.0, 21.0, 15.0, 20.0, 23.0, 26.0, 30.0, 29.0, 33.0, 36.0, 27.0, 38.0, 48.0, 43.0, 37.0, 38.0, 37.0, 49.0, 31.0, 31.0, 36.0, 33.0, 30.0, 31.0, 20.0, 30.0, 22.0, 10.0, 20.0, 12.0, 20.0, 10.0, 15.0, 10.0, 4.0, 9.0, 6.0, 2.0, 2.0, 4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.5361328125, -0.5201530456542969, -0.5041732788085938, -0.4881935119628906, -0.4722137451171875, -0.4562339782714844, -0.44025421142578125, -0.4242744445800781, -0.408294677734375, -0.3923149108886719, -0.37633514404296875, -0.3603553771972656, -0.3443756103515625, -0.3283958435058594, -0.31241607666015625, -0.2964363098144531, -0.28045654296875, -0.2644767761230469, -0.24849700927734375, -0.23251724243164062, -0.2165374755859375, -0.20055770874023438, -0.18457794189453125, -0.16859817504882812, -0.152618408203125, -0.13663864135742188, -0.12065887451171875, -0.10467910766601562, -0.0886993408203125, -0.07271957397460938, -0.05673980712890625, -0.040760040283203125, -0.0247802734375, -0.008800506591796875, 0.00717926025390625, 0.023159027099609375, 0.0391387939453125, 0.055118560791015625, 0.07109832763671875, 0.08707809448242188, 0.103057861328125, 0.11903762817382812, 0.13501739501953125, 0.15099716186523438, 0.1669769287109375, 0.18295669555664062, 0.19893646240234375, 0.21491622924804688, 0.23089599609375, 0.24687576293945312, 0.26285552978515625, 0.2788352966308594, 0.2948150634765625, 0.3107948303222656, 0.32677459716796875, 0.3427543640136719, 0.358734130859375, 0.3747138977050781, 0.39069366455078125, 0.4066734313964844, 0.4226531982421875, 0.4386329650878906, 0.45461273193359375, 0.4705924987792969, 0.486572265625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 10.0, 9.0, 12.0, 20.0, 43.0, 95.0, 136.0, 300.0, 577.0, 1363.0, 2945.0, 7156.0, 17589.0, 43983.0, 108336.0, 387470.0, 319389.0, 94348.0, 38535.0, 15282.0, 6140.0, 2562.0, 1131.0, 529.0, 275.0, 128.0, 69.0, 56.0, 33.0, 21.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2054443359375, -0.1993885040283203, -0.19333267211914062, -0.18727684020996094, -0.18122100830078125, -0.17516517639160156, -0.16910934448242188, -0.1630535125732422, -0.1569976806640625, -0.1509418487548828, -0.14488601684570312, -0.13883018493652344, -0.13277435302734375, -0.12671852111816406, -0.12066268920898438, -0.11460685729980469, -0.108551025390625, -0.10249519348144531, -0.09643936157226562, -0.09038352966308594, -0.08432769775390625, -0.07827186584472656, -0.07221603393554688, -0.06616020202636719, -0.0601043701171875, -0.05404853820800781, -0.047992706298828125, -0.04193687438964844, -0.03588104248046875, -0.029825210571289062, -0.023769378662109375, -0.017713546752929688, -0.01165771484375, -0.0056018829345703125, 0.000453948974609375, 0.0065097808837890625, 0.01256561279296875, 0.018621444702148438, 0.024677276611328125, 0.030733108520507812, 0.0367889404296875, 0.04284477233886719, 0.048900604248046875, 0.05495643615722656, 0.06101226806640625, 0.06706809997558594, 0.07312393188476562, 0.07917976379394531, 0.085235595703125, 0.09129142761230469, 0.09734725952148438, 0.10340309143066406, 0.10945892333984375, 0.11551475524902344, 0.12157058715820312, 0.1276264190673828, 0.1336822509765625, 0.1397380828857422, 0.14579391479492188, 0.15184974670410156, 0.15790557861328125, 0.16396141052246094, 0.17001724243164062, 0.1760730743408203, 0.18212890625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 4.0, 3.0, 3.0, 7.0, 12.0, 5.0, 22.0, 13.0, 30.0, 46.0, 72.0, 100.0, 162.0, 161.0, 112.0, 70.0, 47.0, 24.0, 28.0, 18.0, 13.0, 16.0, 4.0, 7.0, 4.0, 4.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.802776336669922e-05, -3.6372803151607513e-05, -3.471784293651581e-05, -3.30628827214241e-05, -3.14079225063324e-05, -2.9752962291240692e-05, -2.8098002076148987e-05, -2.644304186105728e-05, -2.4788081645965576e-05, -2.313312143087387e-05, -2.1478161215782166e-05, -1.982320100069046e-05, -1.8168240785598755e-05, -1.651328057050705e-05, -1.4858320355415344e-05, -1.3203360140323639e-05, -1.1548399925231934e-05, -9.893439710140228e-06, -8.238479495048523e-06, -6.583519279956818e-06, -4.928559064865112e-06, -3.273598849773407e-06, -1.6186386346817017e-06, 3.632158041000366e-08, 1.691281795501709e-06, 3.3462420105934143e-06, 5.00120222568512e-06, 6.656162440776825e-06, 8.31112265586853e-06, 9.966082870960236e-06, 1.1621043086051941e-05, 1.3276003301143646e-05, 1.4930963516235352e-05, 1.6585923731327057e-05, 1.8240883946418762e-05, 1.9895844161510468e-05, 2.1550804376602173e-05, 2.3205764591693878e-05, 2.4860724806785583e-05, 2.651568502187729e-05, 2.8170645236968994e-05, 2.98256054520607e-05, 3.1480565667152405e-05, 3.313552588224411e-05, 3.4790486097335815e-05, 3.644544631242752e-05, 3.8100406527519226e-05, 3.975536674261093e-05, 4.141032695770264e-05, 4.306528717279434e-05, 4.472024738788605e-05, 4.637520760297775e-05, 4.803016781806946e-05, 4.968512803316116e-05, 5.134008824825287e-05, 5.2995048463344574e-05, 5.465000867843628e-05, 5.6304968893527985e-05, 5.795992910861969e-05, 5.9614889323711395e-05, 6.12698495388031e-05, 6.29248097538948e-05, 6.457976996898651e-05, 6.623473018407822e-05, 6.788969039916992e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 11.0, 10.0, 12.0, 14.0, 25.0, 38.0, 47.0, 70.0, 88.0, 140.0, 218.0, 393.0, 759.0, 1507.0, 3598.0, 9065.0, 24900.0, 68543.0, 208849.0, 475587.0, 163154.0, 57295.0, 20625.0, 7636.0, 2953.0, 1279.0, 690.0, 376.0, 218.0, 147.0, 86.0, 52.0, 58.0, 36.0, 26.0, 18.0, 10.0, 8.0, 5.0, 6.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.1934814453125, -0.1871185302734375, -0.180755615234375, -0.1743927001953125, -0.16802978515625, -0.1616668701171875, -0.155303955078125, -0.1489410400390625, -0.142578125, -0.1362152099609375, -0.129852294921875, -0.1234893798828125, -0.11712646484375, -0.1107635498046875, -0.104400634765625, -0.0980377197265625, -0.0916748046875, -0.0853118896484375, -0.078948974609375, -0.0725860595703125, -0.06622314453125, -0.0598602294921875, -0.053497314453125, -0.0471343994140625, -0.040771484375, -0.0344085693359375, -0.028045654296875, -0.0216827392578125, -0.01531982421875, -0.0089569091796875, -0.002593994140625, 0.0037689208984375, 0.0101318359375, 0.0164947509765625, 0.022857666015625, 0.0292205810546875, 0.03558349609375, 0.0419464111328125, 0.048309326171875, 0.0546722412109375, 0.06103515625, 0.0673980712890625, 0.073760986328125, 0.0801239013671875, 0.08648681640625, 0.0928497314453125, 0.099212646484375, 0.1055755615234375, 0.1119384765625, 0.1183013916015625, 0.124664306640625, 0.1310272216796875, 0.13739013671875, 0.1437530517578125, 0.150115966796875, 0.1564788818359375, 0.162841796875, 0.1692047119140625, 0.175567626953125, 0.1819305419921875, 0.18829345703125, 0.1946563720703125, 0.201019287109375, 0.2073822021484375, 0.2137451171875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 6.0, 10.0, 10.0, 13.0, 20.0, 32.0, 38.0, 72.0, 89.0, 164.0, 174.0, 133.0, 83.0, 53.0, 34.0, 17.0, 22.0, 15.0, 8.0, 4.0, 3.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.352783203125, -0.3425102233886719, -0.33223724365234375, -0.3219642639160156, -0.3116912841796875, -0.3014183044433594, -0.29114532470703125, -0.2808723449707031, -0.270599365234375, -0.2603263854980469, -0.25005340576171875, -0.23978042602539062, -0.2295074462890625, -0.21923446655273438, -0.20896148681640625, -0.19868850708007812, -0.18841552734375, -0.17814254760742188, -0.16786956787109375, -0.15759658813476562, -0.1473236083984375, -0.13705062866210938, -0.12677764892578125, -0.11650466918945312, -0.106231689453125, -0.09595870971679688, -0.08568572998046875, -0.07541275024414062, -0.0651397705078125, -0.054866790771484375, -0.04459381103515625, -0.034320831298828125, -0.0240478515625, -0.013774871826171875, -0.00350189208984375, 0.006771087646484375, 0.0170440673828125, 0.027317047119140625, 0.03759002685546875, 0.047863006591796875, 0.058135986328125, 0.06840896606445312, 0.07868194580078125, 0.08895492553710938, 0.0992279052734375, 0.10950088500976562, 0.11977386474609375, 0.13004684448242188, 0.14031982421875, 0.15059280395507812, 0.16086578369140625, 0.17113876342773438, 0.1814117431640625, 0.19168472290039062, 0.20195770263671875, 0.21223068237304688, 0.222503662109375, 0.23277664184570312, 0.24304962158203125, 0.2533226013183594, 0.2635955810546875, 0.2738685607910156, 0.28414154052734375, 0.2944145202636719, 0.3046875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 69.0, 735.0, 193.0, 9.0, 5.0, 3.0, 0.0, 1.0], "bins": [-28.58197021484375, -28.085954666137695, -27.58993911743164, -27.09392547607422, -26.597909927368164, -26.10189437866211, -25.605878829956055, -25.10986328125, -24.613849639892578, -24.117834091186523, -23.62181854248047, -23.125804901123047, -22.629789352416992, -22.133773803710938, -21.637758255004883, -21.141742706298828, -20.645727157592773, -20.14971160888672, -19.653696060180664, -19.157682418823242, -18.661666870117188, -18.165651321411133, -17.669635772705078, -17.173620223999023, -16.67760467529297, -16.181589126586914, -15.685574531555176, -15.189558982849121, -14.693544387817383, -14.197528839111328, -13.701513290405273, -13.205497741699219, -12.709484100341797, -12.213468551635742, -11.717453956604004, -11.22143840789795, -10.725423812866211, -10.229408264160156, -9.733392715454102, -9.237377166748047, -8.741361618041992, -8.245346069335938, -7.749331474304199, -7.2533159255981445, -6.757300853729248, -6.261285781860352, -5.765270233154297, -5.2692551612854, -4.773240566253662, -4.277225494384766, -3.78121018409729, -3.2851948738098145, -2.789179801940918, -2.2931647300720215, -1.797149419784546, -1.3011341094970703, -0.8051190376281738, -0.3091038465499878, 0.18691134452819824, 0.6829265356063843, 1.1789417266845703, 1.6749567985534668, 2.1709721088409424, 2.666987419128418, 3.1630024909973145]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 13.0, 12.0, 13.0, 20.0, 14.0, 25.0, 32.0, 40.0, 33.0, 50.0, 54.0, 49.0, 63.0, 69.0, 73.0, 50.0, 59.0, 43.0, 50.0, 43.0, 38.0, 40.0, 30.0, 28.0, 15.0, 14.0, 18.0, 8.0, 6.0, 3.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3698962926864624, -1.3035523891448975, -1.237208366394043, -1.170864462852478, -1.104520559310913, -1.0381765365600586, -0.9718326330184937, -0.9054887294769287, -0.839144766330719, -0.7728008031845093, -0.7064568996429443, -0.6401129364967346, -0.5737689733505249, -0.50742506980896, -0.44108110666275024, -0.3747371733188629, -0.3083932399749756, -0.24204930663108826, -0.17570535838603973, -0.10936141014099121, -0.04301747679710388, 0.023326456546783447, 0.08967041969299316, 0.1560143530368805, 0.22235828638076782, 0.28870221972465515, 0.3550461530685425, 0.4213901162147522, 0.4877340495586395, 0.5540779829025269, 0.6204219460487366, 0.6867659091949463, 0.7531099319458008, 0.8194538950920105, 0.8857977986335754, 0.9521417617797852, 1.01848566532135, 1.084829568862915, 1.1511735916137695, 1.2175174951553345, 1.2838613986968994, 1.3502053022384644, 1.4165493249893188, 1.4828932285308838, 1.5492371320724487, 1.6155810356140137, 1.6819250583648682, 1.748268961906433, 1.8146129846572876, 1.8809568881988525, 1.947300910949707, 2.0136446952819824, 2.079988718032837, 2.1463327407836914, 2.212676525115967, 2.2790205478668213, 2.345364570617676, 2.4117085933685303, 2.4780523777008057, 2.54439640045166, 2.6107404232025146, 2.67708420753479, 2.7434282302856445, 2.809772253036499, 2.8761160373687744]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 5.0, 1.0, 7.0, 6.0, 9.0, 9.0, 21.0, 30.0, 51.0, 57.0, 61.0, 118.0, 173.0, 248.0, 369.0, 559.0, 911.0, 1485.0, 2624.0, 4943.0, 9134.0, 17600.0, 35861.0, 75215.0, 165626.0, 401896.0, 1281276.0, 1421669.0, 438709.0, 176661.0, 80374.0, 37888.0, 18782.0, 9500.0, 5154.0, 2700.0, 1578.0, 999.0, 656.0, 405.0, 269.0, 179.0, 136.0, 94.0, 77.0, 35.0, 39.0, 27.0, 18.0, 13.0, 13.0, 3.0, 10.0, 4.0, 2.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.1929931640625, -0.1861114501953125, -0.179229736328125, -0.1723480224609375, -0.16546630859375, -0.1585845947265625, -0.151702880859375, -0.1448211669921875, -0.137939453125, -0.1310577392578125, -0.124176025390625, -0.1172943115234375, -0.11041259765625, -0.1035308837890625, -0.096649169921875, -0.0897674560546875, -0.0828857421875, -0.0760040283203125, -0.069122314453125, -0.0622406005859375, -0.05535888671875, -0.0484771728515625, -0.041595458984375, -0.0347137451171875, -0.02783203125, -0.0209503173828125, -0.014068603515625, -0.0071868896484375, -0.00030517578125, 0.0065765380859375, 0.013458251953125, 0.0203399658203125, 0.0272216796875, 0.0341033935546875, 0.040985107421875, 0.0478668212890625, 0.05474853515625, 0.0616302490234375, 0.068511962890625, 0.0753936767578125, 0.082275390625, 0.0891571044921875, 0.096038818359375, 0.1029205322265625, 0.10980224609375, 0.1166839599609375, 0.123565673828125, 0.1304473876953125, 0.1373291015625, 0.1442108154296875, 0.151092529296875, 0.1579742431640625, 0.16485595703125, 0.1717376708984375, 0.178619384765625, 0.1855010986328125, 0.1923828125, 0.1992645263671875, 0.206146240234375, 0.2130279541015625, 0.21990966796875, 0.2267913818359375, 0.233673095703125, 0.2405548095703125, 0.2474365234375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 0.0, 2.0, 2.0, 6.0, 1.0, 7.0, 8.0, 10.0, 14.0, 15.0, 7.0, 22.0, 29.0, 20.0, 21.0, 22.0, 29.0, 30.0, 33.0, 29.0, 32.0, 43.0, 32.0, 45.0, 33.0, 41.0, 47.0, 37.0, 28.0, 34.0, 31.0, 44.0, 31.0, 30.0, 27.0, 23.0, 20.0, 23.0, 20.0, 18.0, 11.0, 8.0, 5.0, 7.0, 8.0, 5.0, 11.0, 6.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.137939453125, -0.13305091857910156, -0.12816238403320312, -0.12327384948730469, -0.11838531494140625, -0.11349678039550781, -0.10860824584960938, -0.10371971130371094, -0.0988311767578125, -0.09394264221191406, -0.08905410766601562, -0.08416557312011719, -0.07927703857421875, -0.07438850402832031, -0.06949996948242188, -0.06461143493652344, -0.059722900390625, -0.05483436584472656, -0.049945831298828125, -0.04505729675292969, -0.04016876220703125, -0.03528022766113281, -0.030391693115234375, -0.025503158569335938, -0.0206146240234375, -0.015726089477539062, -0.010837554931640625, -0.0059490203857421875, -0.00106048583984375, 0.0038280487060546875, 0.008716583251953125, 0.013605117797851562, 0.01849365234375, 0.023382186889648438, 0.028270721435546875, 0.03315925598144531, 0.03804779052734375, 0.04293632507324219, 0.047824859619140625, 0.05271339416503906, 0.0576019287109375, 0.06249046325683594, 0.06737899780273438, 0.07226753234863281, 0.07715606689453125, 0.08204460144042969, 0.08693313598632812, 0.09182167053222656, 0.096710205078125, 0.10159873962402344, 0.10648727416992188, 0.11137580871582031, 0.11626434326171875, 0.12115287780761719, 0.12604141235351562, 0.13092994689941406, 0.1358184814453125, 0.14070701599121094, 0.14559555053710938, 0.1504840850830078, 0.15537261962890625, 0.1602611541748047, 0.16514968872070312, 0.17003822326660156, 0.1749267578125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 5.0, 2.0, 5.0, 13.0, 12.0, 20.0, 35.0, 39.0, 76.0, 97.0, 135.0, 228.0, 388.0, 637.0, 1090.0, 1842.0, 3349.0, 6158.0, 11943.0, 23568.0, 47730.0, 101991.0, 226433.0, 569484.0, 1538406.0, 1005301.0, 360028.0, 154408.0, 70754.0, 34040.0, 16890.0, 8440.0, 4674.0, 2468.0, 1451.0, 807.0, 504.0, 311.0, 179.0, 128.0, 77.0, 50.0, 29.0, 26.0, 11.0, 10.0, 3.0, 3.0, 1.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.260498046875, -0.25229644775390625, -0.2440948486328125, -0.23589324951171875, -0.227691650390625, -0.21949005126953125, -0.2112884521484375, -0.20308685302734375, -0.19488525390625, -0.18668365478515625, -0.1784820556640625, -0.17028045654296875, -0.162078857421875, -0.15387725830078125, -0.1456756591796875, -0.13747406005859375, -0.1292724609375, -0.12107086181640625, -0.1128692626953125, -0.10466766357421875, -0.096466064453125, -0.08826446533203125, -0.0800628662109375, -0.07186126708984375, -0.06365966796875, -0.05545806884765625, -0.0472564697265625, -0.03905487060546875, -0.030853271484375, -0.02265167236328125, -0.0144500732421875, -0.00624847412109375, 0.001953125, 0.01015472412109375, 0.0183563232421875, 0.02655792236328125, 0.034759521484375, 0.04296112060546875, 0.0511627197265625, 0.05936431884765625, 0.06756591796875, 0.07576751708984375, 0.0839691162109375, 0.09217071533203125, 0.100372314453125, 0.10857391357421875, 0.1167755126953125, 0.12497711181640625, 0.1331787109375, 0.14138031005859375, 0.1495819091796875, 0.15778350830078125, 0.165985107421875, 0.17418670654296875, 0.1823883056640625, 0.19058990478515625, 0.19879150390625, 0.20699310302734375, 0.2151947021484375, 0.22339630126953125, 0.231597900390625, 0.23979949951171875, 0.2480010986328125, 0.25620269775390625, 0.264404296875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 6.0, 10.0, 5.0, 6.0, 6.0, 8.0, 11.0, 16.0, 16.0, 22.0, 23.0, 34.0, 33.0, 40.0, 47.0, 79.0, 80.0, 121.0, 167.0, 180.0, 262.0, 355.0, 437.0, 439.0, 385.0, 273.0, 237.0, 151.0, 140.0, 92.0, 63.0, 53.0, 58.0, 38.0, 36.0, 32.0, 24.0, 19.0, 11.0, 13.0, 8.0, 7.0, 4.0, 3.0, 8.0, 6.0, 3.0, 4.0, 3.0, 2.0, 0.0, 4.0], "bins": [-0.2880859375, -0.2798748016357422, -0.2716636657714844, -0.26345252990722656, -0.25524139404296875, -0.24703025817871094, -0.23881912231445312, -0.2306079864501953, -0.2223968505859375, -0.2141857147216797, -0.20597457885742188, -0.19776344299316406, -0.18955230712890625, -0.18134117126464844, -0.17313003540039062, -0.1649188995361328, -0.156707763671875, -0.1484966278076172, -0.14028549194335938, -0.13207435607910156, -0.12386322021484375, -0.11565208435058594, -0.10744094848632812, -0.09922981262207031, -0.0910186767578125, -0.08280754089355469, -0.07459640502929688, -0.06638526916503906, -0.05817413330078125, -0.04996299743652344, -0.041751861572265625, -0.03354072570800781, -0.02532958984375, -0.017118453979492188, -0.008907318115234375, -0.0006961822509765625, 0.00751495361328125, 0.015726089477539062, 0.023937225341796875, 0.03214836120605469, 0.0403594970703125, 0.04857063293457031, 0.056781768798828125, 0.06499290466308594, 0.07320404052734375, 0.08141517639160156, 0.08962631225585938, 0.09783744812011719, 0.106048583984375, 0.11425971984863281, 0.12247085571289062, 0.13068199157714844, 0.13889312744140625, 0.14710426330566406, 0.15531539916992188, 0.1635265350341797, 0.1717376708984375, 0.1799488067626953, 0.18815994262695312, 0.19637107849121094, 0.20458221435546875, 0.21279335021972656, 0.22100448608398438, 0.2292156219482422, 0.2374267578125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 6.0, 6.0, 4.0, 14.0, 22.0, 37.0, 43.0, 51.0, 59.0, 76.0, 81.0, 85.0, 89.0, 87.0, 70.0, 57.0, 62.0, 49.0, 25.0, 22.0, 9.0, 22.0, 10.0, 6.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.4226617813110352, -1.367058515548706, -1.3114553689956665, -1.2558521032333374, -1.2002488374710083, -1.1446456909179688, -1.0890424251556396, -1.0334391593933105, -0.977836012840271, -0.9222328066825867, -0.8666295409202576, -0.8110263347625732, -0.7554231286048889, -0.6998199224472046, -0.6442166566848755, -0.5886134505271912, -0.5330101847648621, -0.47740694880485535, -0.421803742647171, -0.3662005066871643, -0.31059730052948, -0.25499406456947327, -0.19939082860946655, -0.14378762245178223, -0.08818438649177551, -0.032581161707639694, 0.023022063076496124, 0.07862529158592224, 0.13422851264476776, 0.18983173370361328, 0.24543496966362, 0.3010381758213043, 0.35664141178131104, 0.41224464774131775, 0.4678478538990021, 0.5234510898590088, 0.5790542960166931, 0.6346575021743774, 0.6902607679367065, 0.7458639740943909, 0.8014671802520752, 0.8570703864097595, 0.9126736521720886, 0.968276858329773, 1.023880124092102, 1.0794832706451416, 1.1350865364074707, 1.1906898021697998, 1.246293067932129, 1.301896333694458, 1.3574994802474976, 1.4131027460098267, 1.4687060117721558, 1.5243091583251953, 1.5799124240875244, 1.6355156898498535, 1.691118836402893, 1.7467221021652222, 1.8023252487182617, 1.8579285144805908, 1.91353178024292, 1.9691349267959595, 2.024738311767578, 2.080341339111328, 2.1359446048736572]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 2.0, 8.0, 10.0, 3.0, 9.0, 18.0, 20.0, 9.0, 21.0, 13.0, 25.0, 15.0, 18.0, 30.0, 39.0, 26.0, 31.0, 35.0, 33.0, 40.0, 31.0, 38.0, 42.0, 41.0, 45.0, 36.0, 41.0, 33.0, 31.0, 27.0, 21.0, 28.0, 26.0, 15.0, 15.0, 20.0, 15.0, 19.0, 9.0, 14.0, 9.0, 9.0, 7.0, 10.0, 5.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0], "bins": [-1.0297563076019287, -0.9994377493858337, -0.969119131565094, -0.938800573348999, -0.9084819555282593, -0.8781633973121643, -0.8478448390960693, -0.8175262212753296, -0.7872076630592346, -0.7568891048431396, -0.7265704870223999, -0.6962519288063049, -0.66593337059021, -0.6356147527694702, -0.6052961945533752, -0.5749776363372803, -0.5446590185165405, -0.5143404603004456, -0.4840218424797058, -0.45370328426361084, -0.4233846962451935, -0.3930661082267761, -0.36274755001068115, -0.3324289619922638, -0.30211037397384644, -0.2717917859554291, -0.2414732128381729, -0.21115463972091675, -0.1808360517024994, -0.15051746368408203, -0.12019889056682587, -0.0898803174495697, -0.059561729431152344, -0.029243148863315582, 0.0010754317045211792, 0.03139401227235794, 0.0617125928401947, 0.09203118085861206, 0.12234975397586823, 0.1526683270931244, 0.18298691511154175, 0.2133055031299591, 0.24362407624721527, 0.27394264936447144, 0.3042612373828888, 0.33457982540130615, 0.3648983836174011, 0.3952169716358185, 0.42553555965423584, 0.4558541476726532, 0.48617273569107056, 0.5164912939071655, 0.5468099117279053, 0.5771284699440002, 0.6074470281600952, 0.637765645980835, 0.6680842041969299, 0.6984027624130249, 0.7287213802337646, 0.7590399384498596, 0.7893584966659546, 0.8196771144866943, 0.8499956727027893, 0.8803142309188843, 0.910632848739624]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 3.0, 6.0, 17.0, 18.0, 31.0, 42.0, 75.0, 139.0, 207.0, 323.0, 577.0, 1001.0, 1688.0, 2749.0, 4621.0, 7733.0, 13787.0, 28082.0, 73703.0, 242066.0, 399824.0, 169091.0, 52964.0, 21996.0, 11443.0, 6515.0, 3906.0, 2293.0, 1458.0, 865.0, 508.0, 324.0, 190.0, 117.0, 68.0, 49.0, 32.0, 17.0, 9.0, 2.0, 8.0, 5.0, 3.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.370849609375, -0.3609199523925781, -0.35099029541015625, -0.3410606384277344, -0.3311309814453125, -0.3212013244628906, -0.31127166748046875, -0.3013420104980469, -0.291412353515625, -0.2814826965332031, -0.27155303955078125, -0.2616233825683594, -0.2516937255859375, -0.24176406860351562, -0.23183441162109375, -0.22190475463867188, -0.21197509765625, -0.20204544067382812, -0.19211578369140625, -0.18218612670898438, -0.1722564697265625, -0.16232681274414062, -0.15239715576171875, -0.14246749877929688, -0.132537841796875, -0.12260818481445312, -0.11267852783203125, -0.10274887084960938, -0.0928192138671875, -0.08288955688476562, -0.07295989990234375, -0.06303024291992188, -0.0531005859375, -0.043170928955078125, -0.03324127197265625, -0.023311614990234375, -0.0133819580078125, -0.003452301025390625, 0.00647735595703125, 0.016407012939453125, 0.026336669921875, 0.036266326904296875, 0.04619598388671875, 0.056125640869140625, 0.0660552978515625, 0.07598495483398438, 0.08591461181640625, 0.09584426879882812, 0.10577392578125, 0.11570358276367188, 0.12563323974609375, 0.13556289672851562, 0.1454925537109375, 0.15542221069335938, 0.16535186767578125, 0.17528152465820312, 0.185211181640625, 0.19514083862304688, 0.20507049560546875, 0.21500015258789062, 0.2249298095703125, 0.23485946655273438, 0.24478912353515625, 0.2547187805175781, 0.2646484375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 4.0, 2.0, 2.0, 5.0, 4.0, 12.0, 4.0, 10.0, 14.0, 9.0, 15.0, 13.0, 22.0, 19.0, 14.0, 25.0, 25.0, 31.0, 29.0, 36.0, 40.0, 38.0, 37.0, 47.0, 40.0, 35.0, 37.0, 41.0, 42.0, 39.0, 31.0, 37.0, 39.0, 25.0, 30.0, 21.0, 29.0, 13.0, 16.0, 12.0, 12.0, 9.0, 13.0, 4.0, 8.0, 6.0, 7.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1373291015625, -0.13211822509765625, -0.1269073486328125, -0.12169647216796875, -0.116485595703125, -0.11127471923828125, -0.1060638427734375, -0.10085296630859375, -0.09564208984375, -0.09043121337890625, -0.0852203369140625, -0.08000946044921875, -0.074798583984375, -0.06958770751953125, -0.0643768310546875, -0.05916595458984375, -0.053955078125, -0.04874420166015625, -0.0435333251953125, -0.03832244873046875, -0.033111572265625, -0.02790069580078125, -0.0226898193359375, -0.01747894287109375, -0.01226806640625, -0.00705718994140625, -0.0018463134765625, 0.00336456298828125, 0.008575439453125, 0.01378631591796875, 0.0189971923828125, 0.02420806884765625, 0.0294189453125, 0.03462982177734375, 0.0398406982421875, 0.04505157470703125, 0.050262451171875, 0.05547332763671875, 0.0606842041015625, 0.06589508056640625, 0.07110595703125, 0.07631683349609375, 0.0815277099609375, 0.08673858642578125, 0.091949462890625, 0.09716033935546875, 0.1023712158203125, 0.10758209228515625, 0.11279296875, 0.11800384521484375, 0.1232147216796875, 0.12842559814453125, 0.133636474609375, 0.13884735107421875, 0.1440582275390625, 0.14926910400390625, 0.15447998046875, 0.15969085693359375, 0.1649017333984375, 0.17011260986328125, 0.175323486328125, 0.18053436279296875, 0.1857452392578125, 0.19095611572265625, 0.1961669921875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 10.0, 10.0, 7.0, 13.0, 15.0, 22.0, 32.0, 52.0, 78.0, 179.0, 348.0, 709.0, 1739.0, 4351.0, 11359.0, 33235.0, 162438.0, 577852.0, 197188.0, 38255.0, 12332.0, 4833.0, 1893.0, 786.0, 348.0, 187.0, 101.0, 63.0, 32.0, 30.0, 12.0, 11.0, 11.0, 7.0, 5.0, 4.0, 5.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.450927734375, -0.4361686706542969, -0.42140960693359375, -0.4066505432128906, -0.3918914794921875, -0.3771324157714844, -0.36237335205078125, -0.3476142883300781, -0.332855224609375, -0.3180961608886719, -0.30333709716796875, -0.2885780334472656, -0.2738189697265625, -0.2590599060058594, -0.24430084228515625, -0.22954177856445312, -0.21478271484375, -0.20002365112304688, -0.18526458740234375, -0.17050552368164062, -0.1557464599609375, -0.14098739624023438, -0.12622833251953125, -0.11146926879882812, -0.096710205078125, -0.08195114135742188, -0.06719207763671875, -0.052433013916015625, -0.0376739501953125, -0.022914886474609375, -0.00815582275390625, 0.006603240966796875, 0.0213623046875, 0.036121368408203125, 0.05088043212890625, 0.06563949584960938, 0.0803985595703125, 0.09515762329101562, 0.10991668701171875, 0.12467575073242188, 0.139434814453125, 0.15419387817382812, 0.16895294189453125, 0.18371200561523438, 0.1984710693359375, 0.21323013305664062, 0.22798919677734375, 0.24274826049804688, 0.25750732421875, 0.2722663879394531, 0.28702545166015625, 0.3017845153808594, 0.3165435791015625, 0.3313026428222656, 0.34606170654296875, 0.3608207702636719, 0.375579833984375, 0.3903388977050781, 0.40509796142578125, 0.4198570251464844, 0.4346160888671875, 0.4493751525878906, 0.46413421630859375, 0.4788932800292969, 0.49365234375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 3.0, 4.0, 8.0, 10.0, 10.0, 16.0, 14.0, 16.0, 11.0, 26.0, 22.0, 33.0, 28.0, 35.0, 48.0, 51.0, 46.0, 42.0, 46.0, 52.0, 46.0, 54.0, 51.0, 50.0, 55.0, 31.0, 37.0, 30.0, 22.0, 25.0, 17.0, 22.0, 17.0, 7.0, 11.0, 4.0, 2.0, 6.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59375, -0.5745086669921875, -0.555267333984375, -0.5360260009765625, -0.51678466796875, -0.4975433349609375, -0.478302001953125, -0.4590606689453125, -0.4398193359375, -0.4205780029296875, -0.401336669921875, -0.3820953369140625, -0.36285400390625, -0.3436126708984375, -0.324371337890625, -0.3051300048828125, -0.285888671875, -0.2666473388671875, -0.247406005859375, -0.2281646728515625, -0.20892333984375, -0.1896820068359375, -0.170440673828125, -0.1511993408203125, -0.1319580078125, -0.1127166748046875, -0.093475341796875, -0.0742340087890625, -0.05499267578125, -0.0357513427734375, -0.016510009765625, 0.0027313232421875, 0.02197265625, 0.0412139892578125, 0.060455322265625, 0.0796966552734375, 0.09893798828125, 0.1181793212890625, 0.137420654296875, 0.1566619873046875, 0.1759033203125, 0.1951446533203125, 0.214385986328125, 0.2336273193359375, 0.25286865234375, 0.2721099853515625, 0.291351318359375, 0.3105926513671875, 0.329833984375, 0.3490753173828125, 0.368316650390625, 0.3875579833984375, 0.40679931640625, 0.4260406494140625, 0.445281982421875, 0.4645233154296875, 0.4837646484375, 0.5030059814453125, 0.522247314453125, 0.5414886474609375, 0.56072998046875, 0.5799713134765625, 0.599212646484375, 0.6184539794921875, 0.6376953125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 5.0, 4.0, 5.0, 13.0, 18.0, 28.0, 48.0, 75.0, 179.0, 370.0, 664.0, 1433.0, 3170.0, 6834.0, 14712.0, 31765.0, 79373.0, 240307.0, 411109.0, 157666.0, 55949.0, 23963.0, 10893.0, 5232.0, 2403.0, 1079.0, 566.0, 306.0, 144.0, 91.0, 49.0, 30.0, 15.0, 16.0, 12.0, 6.0, 7.0, 2.0, 4.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1573486328125, -0.15232467651367188, -0.14730072021484375, -0.14227676391601562, -0.1372528076171875, -0.13222885131835938, -0.12720489501953125, -0.12218093872070312, -0.117156982421875, -0.11213302612304688, -0.10710906982421875, -0.10208511352539062, -0.0970611572265625, -0.09203720092773438, -0.08701324462890625, -0.08198928833007812, -0.07696533203125, -0.07194137573242188, -0.06691741943359375, -0.061893463134765625, -0.0568695068359375, -0.051845550537109375, -0.04682159423828125, -0.041797637939453125, -0.036773681640625, -0.031749725341796875, -0.02672576904296875, -0.021701812744140625, -0.0166778564453125, -0.011653900146484375, -0.00662994384765625, -0.001605987548828125, 0.00341796875, 0.008441925048828125, 0.01346588134765625, 0.018489837646484375, 0.0235137939453125, 0.028537750244140625, 0.03356170654296875, 0.038585662841796875, 0.043609619140625, 0.048633575439453125, 0.05365753173828125, 0.058681488037109375, 0.0637054443359375, 0.06872940063476562, 0.07375335693359375, 0.07877731323242188, 0.08380126953125, 0.08882522583007812, 0.09384918212890625, 0.09887313842773438, 0.1038970947265625, 0.10892105102539062, 0.11394500732421875, 0.11896896362304688, 0.123992919921875, 0.12901687622070312, 0.13404083251953125, 0.13906478881835938, 0.1440887451171875, 0.14911270141601562, 0.15413665771484375, 0.15916061401367188, 0.1641845703125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 7.0, 3.0, 6.0, 3.0, 12.0, 3.0, 15.0, 18.0, 18.0, 31.0, 47.0, 83.0, 112.0, 180.0, 136.0, 121.0, 64.0, 42.0, 30.0, 15.0, 11.0, 8.0, 8.0, 6.0, 6.0, 5.0, 6.0, 2.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.1915645599365234e-05, -5.0331465899944305e-05, -4.8747286200523376e-05, -4.716310650110245e-05, -4.557892680168152e-05, -4.399474710226059e-05, -4.241056740283966e-05, -4.082638770341873e-05, -3.92422080039978e-05, -3.7658028304576874e-05, -3.6073848605155945e-05, -3.4489668905735016e-05, -3.290548920631409e-05, -3.132130950689316e-05, -2.973712980747223e-05, -2.81529501080513e-05, -2.656877040863037e-05, -2.4984590709209442e-05, -2.3400411009788513e-05, -2.1816231310367584e-05, -2.0232051610946655e-05, -1.8647871911525726e-05, -1.7063692212104797e-05, -1.547951251268387e-05, -1.389533281326294e-05, -1.231115311384201e-05, -1.0726973414421082e-05, -9.142793715000153e-06, -7.558614015579224e-06, -5.974434316158295e-06, -4.390254616737366e-06, -2.8060749173164368e-06, -1.2218952178955078e-06, 3.6228448152542114e-07, 1.94646418094635e-06, 3.530643880367279e-06, 5.114823579788208e-06, 6.699003279209137e-06, 8.283182978630066e-06, 9.867362678050995e-06, 1.1451542377471924e-05, 1.3035722076892853e-05, 1.4619901776313782e-05, 1.620408147573471e-05, 1.778826117515564e-05, 1.937244087457657e-05, 2.0956620573997498e-05, 2.2540800273418427e-05, 2.4124979972839355e-05, 2.5709159672260284e-05, 2.7293339371681213e-05, 2.8877519071102142e-05, 3.046169877052307e-05, 3.2045878469944e-05, 3.363005816936493e-05, 3.521423786878586e-05, 3.679841756820679e-05, 3.8382597267627716e-05, 3.9966776967048645e-05, 4.1550956666469574e-05, 4.31351363658905e-05, 4.471931606531143e-05, 4.630349576473236e-05, 4.788767546415329e-05, 4.947185516357422e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 8.0, 7.0, 7.0, 25.0, 17.0, 35.0, 57.0, 134.0, 182.0, 436.0, 766.0, 1974.0, 4981.0, 12595.0, 34213.0, 99751.0, 307494.0, 379770.0, 133978.0, 44871.0, 16498.0, 6239.0, 2493.0, 1066.0, 443.0, 202.0, 117.0, 67.0, 36.0, 35.0, 16.0, 17.0, 8.0, 2.0, 5.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1431884765625, -0.1377086639404297, -0.13222885131835938, -0.12674903869628906, -0.12126922607421875, -0.11578941345214844, -0.11030960083007812, -0.10482978820800781, -0.0993499755859375, -0.09387016296386719, -0.08839035034179688, -0.08291053771972656, -0.07743072509765625, -0.07195091247558594, -0.06647109985351562, -0.06099128723144531, -0.055511474609375, -0.05003166198730469, -0.044551849365234375, -0.03907203674316406, -0.03359222412109375, -0.028112411499023438, -0.022632598876953125, -0.017152786254882812, -0.0116729736328125, -0.0061931610107421875, -0.000713348388671875, 0.0047664642333984375, 0.01024627685546875, 0.015726089477539062, 0.021205902099609375, 0.026685714721679688, 0.03216552734375, 0.03764533996582031, 0.043125152587890625, 0.04860496520996094, 0.05408477783203125, 0.05956459045410156, 0.06504440307617188, 0.07052421569824219, 0.0760040283203125, 0.08148384094238281, 0.08696365356445312, 0.09244346618652344, 0.09792327880859375, 0.10340309143066406, 0.10888290405273438, 0.11436271667480469, 0.119842529296875, 0.1253223419189453, 0.13080215454101562, 0.13628196716308594, 0.14176177978515625, 0.14724159240722656, 0.15272140502929688, 0.1582012176513672, 0.1636810302734375, 0.1691608428955078, 0.17464065551757812, 0.18012046813964844, 0.18560028076171875, 0.19108009338378906, 0.19655990600585938, 0.2020397186279297, 0.20751953125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 1.0, 4.0, 7.0, 5.0, 0.0, 4.0, 4.0, 8.0, 14.0, 17.0, 19.0, 27.0, 27.0, 37.0, 37.0, 54.0, 59.0, 86.0, 87.0, 91.0, 70.0, 54.0, 51.0, 46.0, 29.0, 30.0, 23.0, 22.0, 10.0, 4.0, 18.0, 6.0, 10.0, 5.0, 7.0, 7.0, 4.0, 7.0, 2.0, 2.0, 0.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0], "bins": [-0.154296875, -0.1497211456298828, -0.14514541625976562, -0.14056968688964844, -0.13599395751953125, -0.13141822814941406, -0.12684249877929688, -0.12226676940917969, -0.1176910400390625, -0.11311531066894531, -0.10853958129882812, -0.10396385192871094, -0.09938812255859375, -0.09481239318847656, -0.09023666381835938, -0.08566093444824219, -0.081085205078125, -0.07650947570800781, -0.07193374633789062, -0.06735801696777344, -0.06278228759765625, -0.05820655822753906, -0.053630828857421875, -0.04905509948730469, -0.0444793701171875, -0.03990364074707031, -0.035327911376953125, -0.030752182006835938, -0.02617645263671875, -0.021600723266601562, -0.017024993896484375, -0.012449264526367188, -0.00787353515625, -0.0032978057861328125, 0.001277923583984375, 0.0058536529541015625, 0.01042938232421875, 0.015005111694335938, 0.019580841064453125, 0.024156570434570312, 0.0287322998046875, 0.03330802917480469, 0.037883758544921875, 0.04245948791503906, 0.04703521728515625, 0.05161094665527344, 0.056186676025390625, 0.06076240539550781, 0.065338134765625, 0.06991386413574219, 0.07448959350585938, 0.07906532287597656, 0.08364105224609375, 0.08821678161621094, 0.09279251098632812, 0.09736824035644531, 0.1019439697265625, 0.10651969909667969, 0.11109542846679688, 0.11567115783691406, 0.12024688720703125, 0.12482261657714844, 0.12939834594726562, 0.1339740753173828, 0.1385498046875]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 7.0, 10.0, 13.0, 21.0, 28.0, 36.0, 60.0, 82.0, 78.0, 97.0, 106.0, 98.0, 85.0, 70.0, 57.0, 43.0, 29.0, 29.0, 15.0, 13.0, 6.0, 4.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-1.487866997718811, -1.4422687292099, -1.3966705799102783, -1.3510723114013672, -1.3054741621017456, -1.2598758935928345, -1.214277744293213, -1.1686794757843018, -1.1230813264846802, -1.077483057975769, -1.0318849086761475, -0.9862866997718811, -0.9406884908676147, -0.8950902819633484, -0.849492073059082, -0.8038938045501709, -0.7582955956459045, -0.7126973867416382, -0.6670991778373718, -0.6215009689331055, -0.5759027600288391, -0.5303045511245728, -0.484706312417984, -0.43910810351371765, -0.3935098946094513, -0.34791168570518494, -0.3023134768009186, -0.25671523809432983, -0.21111704409122467, -0.1655188351869583, -0.11992061138153076, -0.0743224024772644, -0.028724193572998047, 0.01687401905655861, 0.062472231686115265, 0.10807044804096222, 0.15366865694522858, 0.19926686584949493, 0.24486508965492249, 0.29046329855918884, 0.3360615074634552, 0.38165971636772156, 0.4272579252719879, 0.47285616397857666, 0.518454372882843, 0.5640525817871094, 0.6096507906913757, 0.6552489995956421, 0.7008472084999084, 0.7464454174041748, 0.7920436263084412, 0.8376418352127075, 0.8832400441169739, 0.9288382530212402, 0.9744365215301514, 1.020034670829773, 1.065632939338684, 1.1112312078475952, 1.1568293571472168, 1.202427625656128, 1.2480257749557495, 1.2936240434646606, 1.3392221927642822, 1.3848204612731934, 1.430418610572815]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 7.0, 3.0, 5.0, 9.0, 5.0, 9.0, 9.0, 11.0, 17.0, 20.0, 19.0, 21.0, 22.0, 30.0, 31.0, 21.0, 29.0, 41.0, 44.0, 42.0, 37.0, 42.0, 39.0, 40.0, 38.0, 34.0, 37.0, 34.0, 42.0, 37.0, 24.0, 32.0, 20.0, 19.0, 22.0, 18.0, 18.0, 12.0, 8.0, 13.0, 13.0, 7.0, 3.0, 8.0, 2.0, 4.0, 0.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.2208900451660156, -1.1810715198516846, -1.1412529945373535, -1.1014344692230225, -1.0616159439086914, -1.02179753780365, -0.9819790124893188, -0.9421604871749878, -0.9023419618606567, -0.8625234365463257, -0.8227049112319946, -0.7828864455223083, -0.7430679202079773, -0.7032493948936462, -0.66343092918396, -0.6236124038696289, -0.5837938785552979, -0.5439753532409668, -0.5041568279266357, -0.46433836221694946, -0.4245198369026184, -0.38470131158828735, -0.3448828160762787, -0.30506432056427, -0.26524579524993896, -0.2254272848367691, -0.18560877442359924, -0.14579026401042938, -0.10597175359725952, -0.06615324318408966, -0.0263347327709198, 0.013483762741088867, 0.05330228805541992, 0.09312079846858978, 0.13293930888175964, 0.1727578192949295, 0.21257632970809937, 0.2523948550224304, 0.2922133505344391, 0.33203184604644775, 0.3718503713607788, 0.41166889667510986, 0.45148739218711853, 0.4913058876991272, 0.5311244130134583, 0.5709429383277893, 0.6107614040374756, 0.6505799293518066, 0.6903984546661377, 0.7302169799804688, 0.7700355052947998, 0.8098539710044861, 0.8496724963188171, 0.8894910216331482, 0.9293094873428345, 0.9691280126571655, 1.0089465379714966, 1.0487650632858276, 1.0885835886001587, 1.1284021139144897, 1.1682205200195312, 1.2080390453338623, 1.2478575706481934, 1.2876760959625244, 1.3274946212768555]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 6.0, 8.0, 12.0, 12.0, 19.0, 26.0, 40.0, 57.0, 59.0, 123.0, 213.0, 368.0, 616.0, 1065.0, 2038.0, 4212.0, 9469.0, 22735.0, 58997.0, 162138.0, 480766.0, 1557352.0, 1289680.0, 386117.0, 132889.0, 49589.0, 19583.0, 8231.0, 3658.0, 1862.0, 991.0, 526.0, 303.0, 179.0, 105.0, 76.0, 49.0, 32.0, 24.0, 14.0, 13.0, 8.0, 3.0, 8.0, 8.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.299560546875, -0.2907257080078125, -0.281890869140625, -0.2730560302734375, -0.26422119140625, -0.2553863525390625, -0.246551513671875, -0.2377166748046875, -0.2288818359375, -0.2200469970703125, -0.211212158203125, -0.2023773193359375, -0.19354248046875, -0.1847076416015625, -0.175872802734375, -0.1670379638671875, -0.158203125, -0.1493682861328125, -0.140533447265625, -0.1316986083984375, -0.12286376953125, -0.1140289306640625, -0.105194091796875, -0.0963592529296875, -0.0875244140625, -0.0786895751953125, -0.069854736328125, -0.0610198974609375, -0.05218505859375, -0.0433502197265625, -0.034515380859375, -0.0256805419921875, -0.016845703125, -0.0080108642578125, 0.000823974609375, 0.0096588134765625, 0.01849365234375, 0.0273284912109375, 0.036163330078125, 0.0449981689453125, 0.0538330078125, 0.0626678466796875, 0.071502685546875, 0.0803375244140625, 0.08917236328125, 0.0980072021484375, 0.106842041015625, 0.1156768798828125, 0.12451171875, 0.1333465576171875, 0.142181396484375, 0.1510162353515625, 0.15985107421875, 0.1686859130859375, 0.177520751953125, 0.1863555908203125, 0.1951904296875, 0.2040252685546875, 0.212860107421875, 0.2216949462890625, 0.23052978515625, 0.2393646240234375, 0.248199462890625, 0.2570343017578125, 0.265869140625]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 5.0, 8.0, 9.0, 13.0, 8.0, 8.0, 17.0, 19.0, 21.0, 12.0, 20.0, 32.0, 32.0, 32.0, 35.0, 29.0, 46.0, 39.0, 50.0, 54.0, 46.0, 55.0, 37.0, 44.0, 27.0, 38.0, 24.0, 20.0, 27.0, 31.0, 30.0, 28.0, 16.0, 17.0, 13.0, 12.0, 10.0, 11.0, 9.0, 6.0, 8.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1734619140625, -0.16794204711914062, -0.16242218017578125, -0.15690231323242188, -0.1513824462890625, -0.14586257934570312, -0.14034271240234375, -0.13482284545898438, -0.129302978515625, -0.12378311157226562, -0.11826324462890625, -0.11274337768554688, -0.1072235107421875, -0.10170364379882812, -0.09618377685546875, -0.09066390991210938, -0.08514404296875, -0.07962417602539062, -0.07410430908203125, -0.06858444213867188, -0.0630645751953125, -0.057544708251953125, -0.05202484130859375, -0.046504974365234375, -0.040985107421875, -0.035465240478515625, -0.02994537353515625, -0.024425506591796875, -0.0189056396484375, -0.013385772705078125, -0.00786590576171875, -0.002346038818359375, 0.003173828125, 0.008693695068359375, 0.01421356201171875, 0.019733428955078125, 0.0252532958984375, 0.030773162841796875, 0.03629302978515625, 0.041812896728515625, 0.047332763671875, 0.052852630615234375, 0.05837249755859375, 0.06389236450195312, 0.0694122314453125, 0.07493209838867188, 0.08045196533203125, 0.08597183227539062, 0.09149169921875, 0.09701156616210938, 0.10253143310546875, 0.10805130004882812, 0.1135711669921875, 0.11909103393554688, 0.12461090087890625, 0.13013076782226562, 0.135650634765625, 0.14117050170898438, 0.14669036865234375, 0.15221023559570312, 0.1577301025390625, 0.16324996948242188, 0.16876983642578125, 0.17428970336914062, 0.1798095703125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 12.0, 22.0, 25.0, 38.0, 69.0, 106.0, 210.0, 347.0, 603.0, 1121.0, 2315.0, 5300.0, 12439.0, 30904.0, 80422.0, 224863.0, 724887.0, 1922541.0, 798914.0, 244773.0, 86920.0, 33410.0, 13356.0, 5571.0, 2460.0, 1229.0, 627.0, 324.0, 187.0, 100.0, 68.0, 48.0, 23.0, 20.0, 16.0, 9.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.37255859375, -0.3623619079589844, -0.35216522216796875, -0.3419685363769531, -0.3317718505859375, -0.3215751647949219, -0.31137847900390625, -0.3011817932128906, -0.290985107421875, -0.2807884216308594, -0.27059173583984375, -0.2603950500488281, -0.2501983642578125, -0.24000167846679688, -0.22980499267578125, -0.21960830688476562, -0.20941162109375, -0.19921493530273438, -0.18901824951171875, -0.17882156372070312, -0.1686248779296875, -0.15842819213867188, -0.14823150634765625, -0.13803482055664062, -0.127838134765625, -0.11764144897460938, -0.10744476318359375, -0.09724807739257812, -0.0870513916015625, -0.07685470581054688, -0.06665802001953125, -0.056461334228515625, -0.0462646484375, -0.036067962646484375, -0.02587127685546875, -0.015674591064453125, -0.0054779052734375, 0.004718780517578125, 0.01491546630859375, 0.025112152099609375, 0.035308837890625, 0.045505523681640625, 0.05570220947265625, 0.06589889526367188, 0.0760955810546875, 0.08629226684570312, 0.09648895263671875, 0.10668563842773438, 0.11688232421875, 0.12707901000976562, 0.13727569580078125, 0.14747238159179688, 0.1576690673828125, 0.16786575317382812, 0.17806243896484375, 0.18825912475585938, 0.198455810546875, 0.20865249633789062, 0.21884918212890625, 0.22904586791992188, 0.2392425537109375, 0.24943923950195312, 0.25963592529296875, 0.2698326110839844, 0.280029296875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 8.0, 11.0, 6.0, 8.0, 22.0, 17.0, 23.0, 52.0, 44.0, 57.0, 60.0, 102.0, 131.0, 154.0, 232.0, 314.0, 450.0, 515.0, 458.0, 353.0, 254.0, 186.0, 133.0, 121.0, 71.0, 81.0, 49.0, 44.0, 38.0, 26.0, 11.0, 15.0, 10.0, 6.0, 4.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.347412109375, -0.3364448547363281, -0.32547760009765625, -0.3145103454589844, -0.3035430908203125, -0.2925758361816406, -0.28160858154296875, -0.2706413269042969, -0.259674072265625, -0.24870681762695312, -0.23773956298828125, -0.22677230834960938, -0.2158050537109375, -0.20483779907226562, -0.19387054443359375, -0.18290328979492188, -0.17193603515625, -0.16096878051757812, -0.15000152587890625, -0.13903427124023438, -0.1280670166015625, -0.11709976196289062, -0.10613250732421875, -0.09516525268554688, -0.084197998046875, -0.07323074340820312, -0.06226348876953125, -0.051296234130859375, -0.0403289794921875, -0.029361724853515625, -0.01839447021484375, -0.007427215576171875, 0.0035400390625, 0.014507293701171875, 0.02547454833984375, 0.036441802978515625, 0.0474090576171875, 0.058376312255859375, 0.06934356689453125, 0.08031082153320312, 0.091278076171875, 0.10224533081054688, 0.11321258544921875, 0.12417984008789062, 0.1351470947265625, 0.14611434936523438, 0.15708160400390625, 0.16804885864257812, 0.17901611328125, 0.18998336791992188, 0.20095062255859375, 0.21191787719726562, 0.2228851318359375, 0.23385238647460938, 0.24481964111328125, 0.2557868957519531, 0.266754150390625, 0.2777214050292969, 0.28868865966796875, 0.2996559143066406, 0.3106231689453125, 0.3215904235839844, 0.33255767822265625, 0.3435249328613281, 0.3544921875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 13.0, 23.0, 34.0, 56.0, 108.0, 135.0, 174.0, 128.0, 99.0, 81.0, 69.0, 33.0, 28.0, 8.0, 3.0, 0.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8676912784576416, -3.770326852798462, -3.6729624271392822, -3.5755980014801025, -3.478233575820923, -3.380869150161743, -3.2835049629211426, -3.186140537261963, -3.088776111602783, -2.9914116859436035, -2.894047260284424, -2.796682834625244, -2.6993184089660645, -2.6019539833068848, -2.504589557647705, -2.4072251319885254, -2.3098607063293457, -2.212496280670166, -2.1151318550109863, -2.0177674293518066, -1.920403003692627, -1.8230385780334473, -1.7256742715835571, -1.6283098459243774, -1.5309454202651978, -1.433580994606018, -1.3362165689468384, -1.2388522624969482, -1.1414878368377686, -1.0441234111785889, -0.9467589855194092, -0.8493945598602295, -0.7520301342010498, -0.6546657085418701, -0.5573012828826904, -0.4599369168281555, -0.36257249116897583, -0.26520806550979614, -0.16784369945526123, -0.07047927379608154, 0.026885151863098145, 0.12424956262111664, 0.22161397337913513, 0.31897836923599243, 0.4163427948951721, 0.5137072205543518, 0.6110715866088867, 0.7084360122680664, 0.8058004379272461, 0.9031648635864258, 1.0005292892456055, 1.0978937149047852, 1.1952581405639648, 1.2926225662231445, 1.3899868726730347, 1.4873512983322144, 1.584715723991394, 1.6820801496505737, 1.7794445753097534, 1.8768088817596436, 1.9741733074188232, 2.071537733078003, 2.1689021587371826, 2.2662665843963623, 2.363631010055542]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 2.0, 2.0, 3.0, 6.0, 6.0, 5.0, 12.0, 15.0, 9.0, 20.0, 15.0, 25.0, 20.0, 30.0, 34.0, 34.0, 35.0, 56.0, 36.0, 43.0, 43.0, 34.0, 45.0, 50.0, 48.0, 50.0, 33.0, 41.0, 30.0, 32.0, 27.0, 25.0, 19.0, 23.0, 17.0, 19.0, 13.0, 11.0, 2.0, 14.0, 2.0, 4.0, 2.0, 3.0, 5.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.1533795595169067, -1.1141748428344727, -1.0749702453613281, -1.035765528678894, -0.99656081199646, -0.9573561549186707, -0.9181514978408813, -0.8789467811584473, -0.839742124080658, -0.8005374670028687, -0.7613327503204346, -0.7221280932426453, -0.682923436164856, -0.6437187194824219, -0.6045140624046326, -0.5653094053268433, -0.5261046886444092, -0.4869000017642975, -0.4476953148841858, -0.4084906578063965, -0.3692859709262848, -0.3300812840461731, -0.2908766269683838, -0.2516719400882721, -0.2124672532081604, -0.1732625663280487, -0.1340578943490982, -0.09485321491956711, -0.05564853549003601, -0.016443848609924316, 0.022760823369026184, 0.061965495347976685, 0.10117030143737793, 0.14037498831748962, 0.17957966029644012, 0.21878433227539062, 0.2579890191555023, 0.297193706035614, 0.3363983631134033, 0.375603049993515, 0.4148077368736267, 0.4540124237537384, 0.4932171106338501, 0.5324217677116394, 0.5716264247894287, 0.6108311414718628, 0.6500357985496521, 0.6892404556274414, 0.7284451723098755, 0.7676498293876648, 0.8068545460700989, 0.8460592031478882, 0.8852639198303223, 0.9244685769081116, 0.9636732339859009, 1.002877950668335, 1.0420825481414795, 1.0812872648239136, 1.120491862297058, 1.1596965789794922, 1.1989012956619263, 1.2381060123443604, 1.2773106098175049, 1.316515326499939, 1.355720043182373]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 5.0, 10.0, 16.0, 39.0, 60.0, 88.0, 141.0, 241.0, 342.0, 515.0, 968.0, 1514.0, 2198.0, 3421.0, 5254.0, 8202.0, 13575.0, 25063.0, 61705.0, 268036.0, 449487.0, 123658.0, 36827.0, 18112.0, 10526.0, 6582.0, 4213.0, 2759.0, 1872.0, 1155.0, 730.0, 482.0, 299.0, 178.0, 109.0, 69.0, 39.0, 28.0, 16.0, 10.0, 7.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4287109375, -0.4158172607421875, -0.402923583984375, -0.3900299072265625, -0.37713623046875, -0.3642425537109375, -0.351348876953125, -0.3384552001953125, -0.3255615234375, -0.3126678466796875, -0.299774169921875, -0.2868804931640625, -0.27398681640625, -0.2610931396484375, -0.248199462890625, -0.2353057861328125, -0.222412109375, -0.2095184326171875, -0.196624755859375, -0.1837310791015625, -0.17083740234375, -0.1579437255859375, -0.145050048828125, -0.1321563720703125, -0.1192626953125, -0.1063690185546875, -0.093475341796875, -0.0805816650390625, -0.06768798828125, -0.0547943115234375, -0.041900634765625, -0.0290069580078125, -0.01611328125, -0.0032196044921875, 0.009674072265625, 0.0225677490234375, 0.03546142578125, 0.0483551025390625, 0.061248779296875, 0.0741424560546875, 0.0870361328125, 0.0999298095703125, 0.112823486328125, 0.1257171630859375, 0.13861083984375, 0.1515045166015625, 0.164398193359375, 0.1772918701171875, 0.190185546875, 0.2030792236328125, 0.215972900390625, 0.2288665771484375, 0.24176025390625, 0.2546539306640625, 0.267547607421875, 0.2804412841796875, 0.2933349609375, 0.3062286376953125, 0.319122314453125, 0.3320159912109375, 0.34490966796875, 0.3578033447265625, 0.370697021484375, 0.3835906982421875, 0.396484375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 5.0, 1.0, 4.0, 3.0, 4.0, 3.0, 2.0, 14.0, 8.0, 5.0, 13.0, 17.0, 17.0, 17.0, 22.0, 26.0, 25.0, 23.0, 32.0, 40.0, 35.0, 40.0, 24.0, 38.0, 44.0, 44.0, 47.0, 32.0, 35.0, 33.0, 22.0, 47.0, 36.0, 23.0, 25.0, 32.0, 30.0, 21.0, 16.0, 15.0, 22.0, 12.0, 8.0, 16.0, 10.0, 7.0, 4.0, 5.0, 6.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.15576171875, -0.15059661865234375, -0.1454315185546875, -0.14026641845703125, -0.135101318359375, -0.12993621826171875, -0.1247711181640625, -0.11960601806640625, -0.11444091796875, -0.10927581787109375, -0.1041107177734375, -0.09894561767578125, -0.093780517578125, -0.08861541748046875, -0.0834503173828125, -0.07828521728515625, -0.0731201171875, -0.06795501708984375, -0.0627899169921875, -0.05762481689453125, -0.052459716796875, -0.04729461669921875, -0.0421295166015625, -0.03696441650390625, -0.03179931640625, -0.02663421630859375, -0.0214691162109375, -0.01630401611328125, -0.011138916015625, -0.00597381591796875, -0.0008087158203125, 0.00435638427734375, 0.009521484375, 0.01468658447265625, 0.0198516845703125, 0.02501678466796875, 0.030181884765625, 0.03534698486328125, 0.0405120849609375, 0.04567718505859375, 0.05084228515625, 0.05600738525390625, 0.0611724853515625, 0.06633758544921875, 0.071502685546875, 0.07666778564453125, 0.0818328857421875, 0.08699798583984375, 0.0921630859375, 0.09732818603515625, 0.1024932861328125, 0.10765838623046875, 0.112823486328125, 0.11798858642578125, 0.1231536865234375, 0.12831878662109375, 0.13348388671875, 0.13864898681640625, 0.1438140869140625, 0.14897918701171875, 0.154144287109375, 0.15930938720703125, 0.1644744873046875, 0.16963958740234375, 0.1748046875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 13.0, 10.0, 16.0, 29.0, 59.0, 66.0, 97.0, 189.0, 347.0, 779.0, 2086.0, 6128.0, 17209.0, 50421.0, 379451.0, 501151.0, 59551.0, 19618.0, 7047.0, 2465.0, 967.0, 358.0, 178.0, 109.0, 74.0, 46.0, 40.0, 17.0, 10.0, 10.0, 6.0, 2.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6044921875, -0.5829544067382812, -0.5614166259765625, -0.5398788452148438, -0.518341064453125, -0.49680328369140625, -0.4752655029296875, -0.45372772216796875, -0.43218994140625, -0.41065216064453125, -0.3891143798828125, -0.36757659912109375, -0.346038818359375, -0.32450103759765625, -0.3029632568359375, -0.28142547607421875, -0.2598876953125, -0.23834991455078125, -0.2168121337890625, -0.19527435302734375, -0.173736572265625, -0.15219879150390625, -0.1306610107421875, -0.10912322998046875, -0.08758544921875, -0.06604766845703125, -0.0445098876953125, -0.02297210693359375, -0.001434326171875, 0.02010345458984375, 0.0416412353515625, 0.06317901611328125, 0.084716796875, 0.10625457763671875, 0.1277923583984375, 0.14933013916015625, 0.170867919921875, 0.19240570068359375, 0.2139434814453125, 0.23548126220703125, 0.25701904296875, 0.27855682373046875, 0.3000946044921875, 0.32163238525390625, 0.343170166015625, 0.36470794677734375, 0.3862457275390625, 0.40778350830078125, 0.4293212890625, 0.45085906982421875, 0.4723968505859375, 0.49393463134765625, 0.515472412109375, 0.5370101928710938, 0.5585479736328125, 0.5800857543945312, 0.60162353515625, 0.6231613159179688, 0.6446990966796875, 0.6662368774414062, 0.687774658203125, 0.7093124389648438, 0.7308502197265625, 0.7523880004882812, 0.77392578125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 6.0, 13.0, 7.0, 12.0, 10.0, 20.0, 17.0, 32.0, 35.0, 43.0, 46.0, 38.0, 40.0, 56.0, 48.0, 50.0, 52.0, 51.0, 60.0, 53.0, 51.0, 46.0, 31.0, 31.0, 24.0, 23.0, 17.0, 20.0, 15.0, 9.0, 13.0, 3.0, 11.0, 6.0, 4.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.65283203125, -0.63427734375, -0.61572265625, -0.59716796875, -0.57861328125, -0.56005859375, -0.54150390625, -0.52294921875, -0.50439453125, -0.48583984375, -0.46728515625, -0.44873046875, -0.43017578125, -0.41162109375, -0.39306640625, -0.37451171875, -0.35595703125, -0.33740234375, -0.31884765625, -0.30029296875, -0.28173828125, -0.26318359375, -0.24462890625, -0.22607421875, -0.20751953125, -0.18896484375, -0.17041015625, -0.15185546875, -0.13330078125, -0.11474609375, -0.09619140625, -0.07763671875, -0.05908203125, -0.04052734375, -0.02197265625, -0.00341796875, 0.01513671875, 0.03369140625, 0.05224609375, 0.07080078125, 0.08935546875, 0.10791015625, 0.12646484375, 0.14501953125, 0.16357421875, 0.18212890625, 0.20068359375, 0.21923828125, 0.23779296875, 0.25634765625, 0.27490234375, 0.29345703125, 0.31201171875, 0.33056640625, 0.34912109375, 0.36767578125, 0.38623046875, 0.40478515625, 0.42333984375, 0.44189453125, 0.46044921875, 0.47900390625, 0.49755859375, 0.51611328125, 0.53466796875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 7.0, 9.0, 10.0, 23.0, 20.0, 35.0, 58.0, 94.0, 158.0, 261.0, 372.0, 576.0, 909.0, 1529.0, 2487.0, 3920.0, 6217.0, 10192.0, 18136.0, 36426.0, 90048.0, 285044.0, 367755.0, 124366.0, 46787.0, 21989.0, 12013.0, 7074.0, 4482.0, 2841.0, 1774.0, 1091.0, 691.0, 420.0, 275.0, 166.0, 97.0, 71.0, 44.0, 29.0, 17.0, 19.0, 4.0, 4.0, 2.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.140625, -0.1361103057861328, -0.13159561157226562, -0.12708091735839844, -0.12256622314453125, -0.11805152893066406, -0.11353683471679688, -0.10902214050292969, -0.1045074462890625, -0.09999275207519531, -0.09547805786132812, -0.09096336364746094, -0.08644866943359375, -0.08193397521972656, -0.07741928100585938, -0.07290458679199219, -0.068389892578125, -0.06387519836425781, -0.059360504150390625, -0.05484580993652344, -0.05033111572265625, -0.04581642150878906, -0.041301727294921875, -0.03678703308105469, -0.0322723388671875, -0.027757644653320312, -0.023242950439453125, -0.018728256225585938, -0.01421356201171875, -0.009698867797851562, -0.005184173583984375, -0.0006694793701171875, 0.00384521484375, 0.008359909057617188, 0.012874603271484375, 0.017389297485351562, 0.02190399169921875, 0.026418685913085938, 0.030933380126953125, 0.03544807434082031, 0.0399627685546875, 0.04447746276855469, 0.048992156982421875, 0.05350685119628906, 0.05802154541015625, 0.06253623962402344, 0.06705093383789062, 0.07156562805175781, 0.076080322265625, 0.08059501647949219, 0.08510971069335938, 0.08962440490722656, 0.09413909912109375, 0.09865379333496094, 0.10316848754882812, 0.10768318176269531, 0.1121978759765625, 0.11671257019042969, 0.12122726440429688, 0.12574195861816406, 0.13025665283203125, 0.13477134704589844, 0.13928604125976562, 0.1438007354736328, 0.1483154296875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 6.0, 5.0, 4.0, 6.0, 9.0, 14.0, 38.0, 43.0, 90.0, 239.0, 270.0, 133.0, 60.0, 26.0, 14.0, 16.0, 10.0, 7.0, 7.0, 3.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.364418029785156e-05, -5.067512392997742e-05, -4.770606756210327e-05, -4.4737011194229126e-05, -4.176795482635498e-05, -3.8798898458480835e-05, -3.582984209060669e-05, -3.2860785722732544e-05, -2.98917293548584e-05, -2.6922672986984253e-05, -2.3953616619110107e-05, -2.0984560251235962e-05, -1.8015503883361816e-05, -1.5046447515487671e-05, -1.2077391147613525e-05, -9.10833477973938e-06, -6.139278411865234e-06, -3.170222043991089e-06, -2.0116567611694336e-07, 2.767890691757202e-06, 5.736947059631348e-06, 8.706003427505493e-06, 1.1675059795379639e-05, 1.4644116163253784e-05, 1.761317253112793e-05, 2.0582228899002075e-05, 2.355128526687622e-05, 2.6520341634750366e-05, 2.9489398002624512e-05, 3.245845437049866e-05, 3.54275107383728e-05, 3.839656710624695e-05, 4.1365623474121094e-05, 4.433467984199524e-05, 4.7303736209869385e-05, 5.027279257774353e-05, 5.3241848945617676e-05, 5.621090531349182e-05, 5.917996168136597e-05, 6.214901804924011e-05, 6.511807441711426e-05, 6.80871307849884e-05, 7.105618715286255e-05, 7.40252435207367e-05, 7.699429988861084e-05, 7.996335625648499e-05, 8.293241262435913e-05, 8.590146899223328e-05, 8.887052536010742e-05, 9.183958172798157e-05, 9.480863809585571e-05, 9.777769446372986e-05, 0.000100746750831604, 0.00010371580719947815, 0.0001066848635673523, 0.00010965391993522644, 0.00011262297630310059, 0.00011559203267097473, 0.00011856108903884888, 0.00012153014540672302, 0.00012449920177459717, 0.0001274682581424713, 0.00013043731451034546, 0.0001334063708782196, 0.00013637542724609375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 2.0, 7.0, 5.0, 1.0, 9.0, 10.0, 17.0, 16.0, 17.0, 31.0, 49.0, 91.0, 119.0, 180.0, 333.0, 630.0, 1154.0, 2135.0, 4157.0, 7887.0, 15911.0, 35095.0, 98927.0, 289115.0, 359993.0, 143137.0, 48401.0, 20288.0, 9936.0, 5080.0, 2674.0, 1397.0, 713.0, 402.0, 240.0, 134.0, 90.0, 53.0, 27.0, 28.0, 22.0, 11.0, 8.0, 10.0, 6.0, 6.0, 5.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1531982421875, -0.14857864379882812, -0.14395904541015625, -0.13933944702148438, -0.1347198486328125, -0.13010025024414062, -0.12548065185546875, -0.12086105346679688, -0.116241455078125, -0.11162185668945312, -0.10700225830078125, -0.10238265991210938, -0.0977630615234375, -0.09314346313476562, -0.08852386474609375, -0.08390426635742188, -0.07928466796875, -0.07466506958007812, -0.07004547119140625, -0.06542587280273438, -0.0608062744140625, -0.056186676025390625, -0.05156707763671875, -0.046947479248046875, -0.042327880859375, -0.037708282470703125, -0.03308868408203125, -0.028469085693359375, -0.0238494873046875, -0.019229888916015625, -0.01461029052734375, -0.009990692138671875, -0.00537109375, -0.000751495361328125, 0.00386810302734375, 0.008487701416015625, 0.0131072998046875, 0.017726898193359375, 0.02234649658203125, 0.026966094970703125, 0.031585693359375, 0.036205291748046875, 0.04082489013671875, 0.045444488525390625, 0.0500640869140625, 0.054683685302734375, 0.05930328369140625, 0.06392288208007812, 0.06854248046875, 0.07316207885742188, 0.07778167724609375, 0.08240127563476562, 0.0870208740234375, 0.09164047241210938, 0.09626007080078125, 0.10087966918945312, 0.105499267578125, 0.11011886596679688, 0.11473846435546875, 0.11935806274414062, 0.1239776611328125, 0.12859725952148438, 0.13321685791015625, 0.13783645629882812, 0.1424560546875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 12.0, 9.0, 12.0, 9.0, 19.0, 15.0, 32.0, 57.0, 91.0, 119.0, 122.0, 134.0, 108.0, 84.0, 50.0, 38.0, 20.0, 16.0, 17.0, 11.0, 9.0, 7.0, 8.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.30419921875, -0.2963905334472656, -0.28858184814453125, -0.2807731628417969, -0.2729644775390625, -0.2651557922363281, -0.25734710693359375, -0.24953842163085938, -0.241729736328125, -0.23392105102539062, -0.22611236572265625, -0.21830368041992188, -0.2104949951171875, -0.20268630981445312, -0.19487762451171875, -0.18706893920898438, -0.17926025390625, -0.17145156860351562, -0.16364288330078125, -0.15583419799804688, -0.1480255126953125, -0.14021682739257812, -0.13240814208984375, -0.12459945678710938, -0.116790771484375, -0.10898208618164062, -0.10117340087890625, -0.09336471557617188, -0.0855560302734375, -0.07774734497070312, -0.06993865966796875, -0.062129974365234375, -0.0543212890625, -0.046512603759765625, -0.03870391845703125, -0.030895233154296875, -0.0230865478515625, -0.015277862548828125, -0.00746917724609375, 0.000339508056640625, 0.008148193359375, 0.015956878662109375, 0.02376556396484375, 0.031574249267578125, 0.0393829345703125, 0.047191619873046875, 0.05500030517578125, 0.06280899047851562, 0.07061767578125, 0.07842636108398438, 0.08623504638671875, 0.09404373168945312, 0.1018524169921875, 0.10966110229492188, 0.11746978759765625, 0.12527847290039062, 0.133087158203125, 0.14089584350585938, 0.14870452880859375, 0.15651321411132812, 0.1643218994140625, 0.17213058471679688, 0.17993927001953125, 0.18774795532226562, 0.195556640625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 4.0, 10.0, 10.0, 22.0, 46.0, 66.0, 84.0, 100.0, 124.0, 119.0, 122.0, 98.0, 79.0, 52.0, 23.0, 18.0, 7.0, 6.0, 6.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3333089351654053, -2.259892463684082, -2.186476230621338, -2.1130597591400146, -2.0396432876586914, -1.9662269353866577, -1.892810583114624, -1.8193941116333008, -1.745977759361267, -1.6725614070892334, -1.5991449356079102, -1.5257285833358765, -1.4523122310638428, -1.3788957595825195, -1.3054794073104858, -1.2320630550384521, -1.158646583557129, -1.0852302312850952, -1.011813759803772, -0.9383974075317383, -0.8649809956550598, -0.7915645837783813, -0.7181482315063477, -0.6447318196296692, -0.5713154077529907, -0.49789899587631226, -0.4244826138019562, -0.3510662317276001, -0.27764981985092163, -0.20423340797424316, -0.13081702589988708, -0.057400643825531006, 0.016016006469726562, 0.08943240344524384, 0.1628488004207611, 0.23626519739627838, 0.30968159437179565, 0.3830980062484741, 0.4565143883228302, 0.5299307703971863, 0.6033471822738647, 0.6767635941505432, 0.7501800060272217, 0.8235963582992554, 0.8970127701759338, 0.9704291820526123, 1.043845534324646, 1.1172618865966797, 1.190678358078003, 1.2640947103500366, 1.3375111818313599, 1.4109275341033936, 1.4843440055847168, 1.5577603578567505, 1.6311767101287842, 1.7045931816101074, 1.7780095338821411, 1.8514258861541748, 1.924842357635498, 1.9982587099075317, 2.0716750621795654, 2.1450915336608887, 2.218508005142212, 2.291924238204956, 2.3653407096862793]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 5.0, 6.0, 13.0, 6.0, 9.0, 12.0, 29.0, 23.0, 26.0, 33.0, 26.0, 32.0, 36.0, 58.0, 41.0, 51.0, 45.0, 43.0, 42.0, 54.0, 49.0, 44.0, 40.0, 45.0, 33.0, 29.0, 33.0, 24.0, 24.0, 21.0, 18.0, 10.0, 19.0, 9.0, 6.0, 7.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.581453800201416, -1.530779242515564, -1.480104684829712, -1.4294301271438599, -1.3787555694580078, -1.3280811309814453, -1.2774064540863037, -1.2267320156097412, -1.1760574579238892, -1.125382900238037, -1.074708342552185, -1.024033784866333, -0.9733592867851257, -0.9226847290992737, -0.8720101714134216, -0.8213356733322144, -0.7706610560417175, -0.7199864983558655, -0.6693119406700134, -0.6186374425888062, -0.5679628849029541, -0.517288327217102, -0.46661376953125, -0.41593924164772034, -0.3652646839618683, -0.31459012627601624, -0.2639155983924866, -0.21324104070663452, -0.16256649792194366, -0.11189195513725281, -0.06121739745140076, -0.010542869567871094, 0.04013168811798096, 0.09080623090267181, 0.14148077368736267, 0.19215533137321472, 0.24282987415790558, 0.29350441694259644, 0.3441789746284485, 0.39485350251197815, 0.4455280601978302, 0.49620261788368225, 0.5468771457672119, 0.597551703453064, 0.648226261138916, 0.6989008188247681, 0.7495753765106201, 0.8002498745918274, 0.8509244322776794, 0.9015989899635315, 0.9522735476493835, 1.0029480457305908, 1.0536226034164429, 1.104297161102295, 1.154971718788147, 1.205646276473999, 1.256320834159851, 1.3069953918457031, 1.3576699495315552, 1.4083445072174072, 1.4590190649032593, 1.5096936225891113, 1.5603680610656738, 1.6110426187515259, 1.661717176437378]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 5.0, 8.0, 10.0, 19.0, 18.0, 32.0, 51.0, 74.0, 125.0, 242.0, 443.0, 912.0, 1710.0, 3462.0, 7276.0, 16248.0, 36820.0, 87767.0, 228454.0, 676062.0, 1662902.0, 953893.0, 312124.0, 117109.0, 48564.0, 21323.0, 9655.0, 4505.0, 2135.0, 1028.0, 551.0, 307.0, 174.0, 89.0, 74.0, 36.0, 29.0, 24.0, 6.0, 6.0, 3.0, 4.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2191162109375, -0.2114696502685547, -0.20382308959960938, -0.19617652893066406, -0.18852996826171875, -0.18088340759277344, -0.17323684692382812, -0.1655902862548828, -0.1579437255859375, -0.1502971649169922, -0.14265060424804688, -0.13500404357910156, -0.12735748291015625, -0.11971092224121094, -0.11206436157226562, -0.10441780090332031, -0.096771240234375, -0.08912467956542969, -0.08147811889648438, -0.07383155822753906, -0.06618499755859375, -0.05853843688964844, -0.050891876220703125, -0.04324531555175781, -0.0355987548828125, -0.027952194213867188, -0.020305633544921875, -0.012659072875976562, -0.00501251220703125, 0.0026340484619140625, 0.010280609130859375, 0.017927169799804688, 0.02557373046875, 0.03322029113769531, 0.040866851806640625, 0.04851341247558594, 0.05615997314453125, 0.06380653381347656, 0.07145309448242188, 0.07909965515136719, 0.0867462158203125, 0.09439277648925781, 0.10203933715820312, 0.10968589782714844, 0.11733245849609375, 0.12497901916503906, 0.13262557983398438, 0.1402721405029297, 0.147918701171875, 0.1555652618408203, 0.16321182250976562, 0.17085838317871094, 0.17850494384765625, 0.18615150451660156, 0.19379806518554688, 0.2014446258544922, 0.2090911865234375, 0.2167377471923828, 0.22438430786132812, 0.23203086853027344, 0.23967742919921875, 0.24732398986816406, 0.2549705505371094, 0.2626171112060547, 0.270263671875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 8.0, 5.0, 6.0, 6.0, 12.0, 12.0, 13.0, 14.0, 10.0, 20.0, 18.0, 21.0, 29.0, 36.0, 32.0, 27.0, 36.0, 38.0, 45.0, 36.0, 40.0, 52.0, 31.0, 45.0, 49.0, 42.0, 38.0, 41.0, 49.0, 25.0, 30.0, 17.0, 18.0, 17.0, 18.0, 12.0, 14.0, 11.0, 7.0, 9.0, 9.0, 7.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1988525390625, -0.19292068481445312, -0.18698883056640625, -0.18105697631835938, -0.1751251220703125, -0.16919326782226562, -0.16326141357421875, -0.15732955932617188, -0.151397705078125, -0.14546585083007812, -0.13953399658203125, -0.13360214233398438, -0.1276702880859375, -0.12173843383789062, -0.11580657958984375, -0.10987472534179688, -0.10394287109375, -0.09801101684570312, -0.09207916259765625, -0.08614730834960938, -0.0802154541015625, -0.07428359985351562, -0.06835174560546875, -0.062419891357421875, -0.056488037109375, -0.050556182861328125, -0.04462432861328125, -0.038692474365234375, -0.0327606201171875, -0.026828765869140625, -0.02089691162109375, -0.014965057373046875, -0.009033203125, -0.003101348876953125, 0.00283050537109375, 0.008762359619140625, 0.0146942138671875, 0.020626068115234375, 0.02655792236328125, 0.032489776611328125, 0.038421630859375, 0.044353485107421875, 0.05028533935546875, 0.056217193603515625, 0.0621490478515625, 0.06808090209960938, 0.07401275634765625, 0.07994461059570312, 0.08587646484375, 0.09180831909179688, 0.09774017333984375, 0.10367202758789062, 0.1096038818359375, 0.11553573608398438, 0.12146759033203125, 0.12739944458007812, 0.133331298828125, 0.13926315307617188, 0.14519500732421875, 0.15112686157226562, 0.1570587158203125, 0.16299057006835938, 0.16892242431640625, 0.17485427856445312, 0.1807861328125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 5.0, 8.0, 5.0, 17.0, 17.0, 26.0, 58.0, 77.0, 120.0, 184.0, 372.0, 694.0, 1445.0, 3206.0, 7440.0, 18580.0, 50851.0, 148085.0, 509774.0, 2029332.0, 1035463.0, 256487.0, 82132.0, 29590.0, 11349.0, 4749.0, 2050.0, 1024.0, 537.0, 245.0, 131.0, 84.0, 40.0, 45.0, 23.0, 15.0, 12.0, 6.0, 3.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.325439453125, -0.3137054443359375, -0.301971435546875, -0.2902374267578125, -0.27850341796875, -0.2667694091796875, -0.255035400390625, -0.2433013916015625, -0.2315673828125, -0.2198333740234375, -0.208099365234375, -0.1963653564453125, -0.18463134765625, -0.1728973388671875, -0.161163330078125, -0.1494293212890625, -0.1376953125, -0.1259613037109375, -0.114227294921875, -0.1024932861328125, -0.09075927734375, -0.0790252685546875, -0.067291259765625, -0.0555572509765625, -0.0438232421875, -0.0320892333984375, -0.020355224609375, -0.0086212158203125, 0.00311279296875, 0.0148468017578125, 0.026580810546875, 0.0383148193359375, 0.050048828125, 0.0617828369140625, 0.073516845703125, 0.0852508544921875, 0.09698486328125, 0.1087188720703125, 0.120452880859375, 0.1321868896484375, 0.1439208984375, 0.1556549072265625, 0.167388916015625, 0.1791229248046875, 0.19085693359375, 0.2025909423828125, 0.214324951171875, 0.2260589599609375, 0.23779296875, 0.2495269775390625, 0.261260986328125, 0.2729949951171875, 0.28472900390625, 0.2964630126953125, 0.308197021484375, 0.3199310302734375, 0.3316650390625, 0.3433990478515625, 0.355133056640625, 0.3668670654296875, 0.37860107421875, 0.3903350830078125, 0.402069091796875, 0.4138031005859375, 0.425537109375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 4.0, 1.0, 5.0, 4.0, 3.0, 9.0, 13.0, 15.0, 22.0, 31.0, 32.0, 34.0, 52.0, 59.0, 81.0, 81.0, 115.0, 146.0, 175.0, 227.0, 301.0, 447.0, 443.0, 396.0, 317.0, 235.0, 204.0, 112.0, 103.0, 77.0, 61.0, 46.0, 51.0, 40.0, 27.0, 12.0, 16.0, 22.0, 10.0, 7.0, 6.0, 7.0, 5.0, 3.0, 8.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0], "bins": [-0.322021484375, -0.31207275390625, -0.3021240234375, -0.29217529296875, -0.2822265625, -0.27227783203125, -0.2623291015625, -0.25238037109375, -0.242431640625, -0.23248291015625, -0.2225341796875, -0.21258544921875, -0.20263671875, -0.19268798828125, -0.1827392578125, -0.17279052734375, -0.162841796875, -0.15289306640625, -0.1429443359375, -0.13299560546875, -0.123046875, -0.11309814453125, -0.1031494140625, -0.09320068359375, -0.083251953125, -0.07330322265625, -0.0633544921875, -0.05340576171875, -0.04345703125, -0.03350830078125, -0.0235595703125, -0.01361083984375, -0.003662109375, 0.00628662109375, 0.0162353515625, 0.02618408203125, 0.0361328125, 0.04608154296875, 0.0560302734375, 0.06597900390625, 0.075927734375, 0.08587646484375, 0.0958251953125, 0.10577392578125, 0.11572265625, 0.12567138671875, 0.1356201171875, 0.14556884765625, 0.155517578125, 0.16546630859375, 0.1754150390625, 0.18536376953125, 0.1953125, 0.20526123046875, 0.2152099609375, 0.22515869140625, 0.235107421875, 0.24505615234375, 0.2550048828125, 0.26495361328125, 0.27490234375, 0.28485107421875, 0.2947998046875, 0.30474853515625, 0.314697265625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 5.0, 10.0, 23.0, 29.0, 43.0, 55.0, 92.0, 117.0, 143.0, 122.0, 108.0, 98.0, 68.0, 39.0, 21.0, 12.0, 8.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.050027847290039, -2.9605612754821777, -2.8710947036743164, -2.781628370285034, -2.692161798477173, -2.6026952266693115, -2.51322865486145, -2.423762321472168, -2.3342957496643066, -2.2448291778564453, -2.155362606048584, -2.0658962726593018, -1.9764297008514404, -1.886963129043579, -1.7974965572357178, -1.708030104637146, -1.6185635328292847, -1.5290969610214233, -1.4396305084228516, -1.3501639366149902, -1.2606974840164185, -1.1712309122085571, -1.0817644596099854, -0.992297887802124, -0.9028313755989075, -0.8133648633956909, -0.7238983511924744, -0.6344318389892578, -0.5449652671813965, -0.4554987847805023, -0.3660322427749634, -0.2765657305717468, -0.18709921836853027, -0.09763269871473312, -0.008166179060935974, 0.08130034804344177, 0.17076686024665833, 0.2602333724498749, 0.3496999144554138, 0.43916642665863037, 0.5286329388618469, 0.6180994510650635, 0.70756596326828, 0.7970324754714966, 0.8864990472793579, 0.9759654998779297, 1.065432071685791, 1.1548986434936523, 1.2443650960922241, 1.3338316679000854, 1.4232981204986572, 1.5127646923065186, 1.6022311449050903, 1.6916977167129517, 1.7811641693115234, 1.8706307411193848, 1.960097312927246, 2.0495638847351074, 2.1390304565429688, 2.228496789932251, 2.3179633617401123, 2.4074299335479736, 2.496896505355835, 2.586362838745117, 2.6758294105529785]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0, 1.0, 2.0, 7.0, 6.0, 6.0, 8.0, 10.0, 19.0, 15.0, 22.0, 23.0, 21.0, 30.0, 32.0, 29.0, 24.0, 31.0, 35.0, 39.0, 45.0, 45.0, 42.0, 41.0, 47.0, 49.0, 40.0, 34.0, 35.0, 32.0, 42.0, 28.0, 25.0, 18.0, 24.0, 18.0, 11.0, 10.0, 16.0, 7.0, 5.0, 12.0, 5.0, 4.0, 3.0, 3.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.2190254926681519, -1.1784169673919678, -1.1378084421157837, -1.0971999168395996, -1.056591272354126, -1.015982747077942, -0.9753742218017578, -0.9347656965255737, -0.8941571712493896, -0.8535486459732056, -0.8129401206970215, -0.7723315358161926, -0.7317230105400085, -0.6911144852638245, -0.6505059003829956, -0.6098973751068115, -0.5692888498306274, -0.5286803245544434, -0.4880717694759369, -0.4474632143974304, -0.40685468912124634, -0.36624616384506226, -0.3256376087665558, -0.2850290536880493, -0.24442052841186523, -0.20381198823451996, -0.16320344805717468, -0.1225949078798294, -0.08198636770248413, -0.041377827525138855, -0.0007692873477935791, 0.03983926773071289, 0.08044791221618652, 0.1210564523935318, 0.16166499257087708, 0.20227353274822235, 0.24288207292556763, 0.2834905982017517, 0.3240991532802582, 0.36470770835876465, 0.40531623363494873, 0.4459247589111328, 0.4865333139896393, 0.5271418690681458, 0.5677503943443298, 0.6083589196205139, 0.6489675045013428, 0.6895760297775269, 0.7301845550537109, 0.770793080329895, 0.8114016056060791, 0.852010190486908, 0.892618715763092, 0.9332272410392761, 0.973835825920105, 1.014444351196289, 1.0550528764724731, 1.0956614017486572, 1.1362699270248413, 1.1768784523010254, 1.217487096786499, 1.258095622062683, 1.2987041473388672, 1.3393126726150513, 1.3799211978912354]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 10.0, 15.0, 20.0, 30.0, 55.0, 83.0, 125.0, 254.0, 397.0, 716.0, 1283.0, 2165.0, 3916.0, 6956.0, 11429.0, 19753.0, 35700.0, 104114.0, 384170.0, 323037.0, 80472.0, 30998.0, 17812.0, 10570.0, 5989.0, 3661.0, 2064.0, 1157.0, 683.0, 336.0, 235.0, 123.0, 68.0, 51.0, 33.0, 27.0, 18.0, 9.0, 6.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.4453125, -0.4329109191894531, -0.42050933837890625, -0.4081077575683594, -0.3957061767578125, -0.3833045959472656, -0.37090301513671875, -0.3585014343261719, -0.346099853515625, -0.3336982727050781, -0.32129669189453125, -0.3088951110839844, -0.2964935302734375, -0.2840919494628906, -0.27169036865234375, -0.2592887878417969, -0.24688720703125, -0.23448562622070312, -0.22208404541015625, -0.20968246459960938, -0.1972808837890625, -0.18487930297851562, -0.17247772216796875, -0.16007614135742188, -0.147674560546875, -0.13527297973632812, -0.12287139892578125, -0.11046981811523438, -0.0980682373046875, -0.08566665649414062, -0.07326507568359375, -0.060863494873046875, -0.0484619140625, -0.036060333251953125, -0.02365875244140625, -0.011257171630859375, 0.0011444091796875, 0.013545989990234375, 0.02594757080078125, 0.038349151611328125, 0.050750732421875, 0.06315231323242188, 0.07555389404296875, 0.08795547485351562, 0.1003570556640625, 0.11275863647460938, 0.12516021728515625, 0.13756179809570312, 0.14996337890625, 0.16236495971679688, 0.17476654052734375, 0.18716812133789062, 0.1995697021484375, 0.21197128295898438, 0.22437286376953125, 0.23677444458007812, 0.249176025390625, 0.2615776062011719, 0.27397918701171875, 0.2863807678222656, 0.2987823486328125, 0.3111839294433594, 0.32358551025390625, 0.3359870910644531, 0.348388671875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 8.0, 6.0, 7.0, 11.0, 5.0, 10.0, 18.0, 19.0, 22.0, 24.0, 22.0, 27.0, 27.0, 37.0, 31.0, 38.0, 41.0, 46.0, 41.0, 33.0, 41.0, 55.0, 27.0, 56.0, 32.0, 23.0, 35.0, 35.0, 39.0, 28.0, 26.0, 27.0, 18.0, 10.0, 16.0, 13.0, 12.0, 7.0, 6.0, 6.0, 5.0, 6.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.178466796875, -0.1726226806640625, -0.166778564453125, -0.1609344482421875, -0.15509033203125, -0.1492462158203125, -0.143402099609375, -0.1375579833984375, -0.1317138671875, -0.1258697509765625, -0.120025634765625, -0.1141815185546875, -0.10833740234375, -0.1024932861328125, -0.096649169921875, -0.0908050537109375, -0.0849609375, -0.0791168212890625, -0.073272705078125, -0.0674285888671875, -0.06158447265625, -0.0557403564453125, -0.049896240234375, -0.0440521240234375, -0.0382080078125, -0.0323638916015625, -0.026519775390625, -0.0206756591796875, -0.01483154296875, -0.0089874267578125, -0.003143310546875, 0.0027008056640625, 0.008544921875, 0.0143890380859375, 0.020233154296875, 0.0260772705078125, 0.03192138671875, 0.0377655029296875, 0.043609619140625, 0.0494537353515625, 0.0552978515625, 0.0611419677734375, 0.066986083984375, 0.0728302001953125, 0.07867431640625, 0.0845184326171875, 0.090362548828125, 0.0962066650390625, 0.10205078125, 0.1078948974609375, 0.113739013671875, 0.1195831298828125, 0.12542724609375, 0.1312713623046875, 0.137115478515625, 0.1429595947265625, 0.1488037109375, 0.1546478271484375, 0.160491943359375, 0.1663360595703125, 0.17218017578125, 0.1780242919921875, 0.183868408203125, 0.1897125244140625, 0.195556640625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 4.0, 2.0, 3.0, 5.0, 6.0, 17.0, 17.0, 26.0, 37.0, 47.0, 93.0, 132.0, 209.0, 368.0, 691.0, 1483.0, 3700.0, 9510.0, 24518.0, 84412.0, 617991.0, 239152.0, 40942.0, 14892.0, 5729.0, 2371.0, 923.0, 511.0, 279.0, 169.0, 109.0, 58.0, 53.0, 33.0, 17.0, 15.0, 14.0, 5.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58740234375, -0.5669631958007812, -0.5465240478515625, -0.5260848999023438, -0.505645751953125, -0.48520660400390625, -0.4647674560546875, -0.44432830810546875, -0.42388916015625, -0.40345001220703125, -0.3830108642578125, -0.36257171630859375, -0.342132568359375, -0.32169342041015625, -0.3012542724609375, -0.28081512451171875, -0.2603759765625, -0.23993682861328125, -0.2194976806640625, -0.19905853271484375, -0.178619384765625, -0.15818023681640625, -0.1377410888671875, -0.11730194091796875, -0.09686279296875, -0.07642364501953125, -0.0559844970703125, -0.03554534912109375, -0.015106201171875, 0.00533294677734375, 0.0257720947265625, 0.04621124267578125, 0.066650390625, 0.08708953857421875, 0.1075286865234375, 0.12796783447265625, 0.148406982421875, 0.16884613037109375, 0.1892852783203125, 0.20972442626953125, 0.23016357421875, 0.25060272216796875, 0.2710418701171875, 0.29148101806640625, 0.311920166015625, 0.33235931396484375, 0.3527984619140625, 0.37323760986328125, 0.3936767578125, 0.41411590576171875, 0.4345550537109375, 0.45499420166015625, 0.475433349609375, 0.49587249755859375, 0.5163116455078125, 0.5367507934570312, 0.55718994140625, 0.5776290893554688, 0.5980682373046875, 0.6185073852539062, 0.638946533203125, 0.6593856811523438, 0.6798248291015625, 0.7002639770507812, 0.720703125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 7.0, 5.0, 8.0, 8.0, 8.0, 15.0, 12.0, 26.0, 24.0, 18.0, 27.0, 27.0, 30.0, 34.0, 43.0, 45.0, 51.0, 53.0, 66.0, 49.0, 41.0, 37.0, 40.0, 38.0, 56.0, 31.0, 31.0, 14.0, 25.0, 20.0, 19.0, 26.0, 16.0, 11.0, 16.0, 4.0, 7.0, 7.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.68798828125, -0.6669692993164062, -0.6459503173828125, -0.6249313354492188, -0.603912353515625, -0.5828933715820312, -0.5618743896484375, -0.5408554077148438, -0.51983642578125, -0.49881744384765625, -0.4777984619140625, -0.45677947998046875, -0.435760498046875, -0.41474151611328125, -0.3937225341796875, -0.37270355224609375, -0.3516845703125, -0.33066558837890625, -0.3096466064453125, -0.28862762451171875, -0.267608642578125, -0.24658966064453125, -0.2255706787109375, -0.20455169677734375, -0.18353271484375, -0.16251373291015625, -0.1414947509765625, -0.12047576904296875, -0.099456787109375, -0.07843780517578125, -0.0574188232421875, -0.03639984130859375, -0.015380859375, 0.00563812255859375, 0.0266571044921875, 0.04767608642578125, 0.068695068359375, 0.08971405029296875, 0.1107330322265625, 0.13175201416015625, 0.15277099609375, 0.17378997802734375, 0.1948089599609375, 0.21582794189453125, 0.236846923828125, 0.25786590576171875, 0.2788848876953125, 0.29990386962890625, 0.3209228515625, 0.34194183349609375, 0.3629608154296875, 0.38397979736328125, 0.404998779296875, 0.42601776123046875, 0.4470367431640625, 0.46805572509765625, 0.48907470703125, 0.5100936889648438, 0.5311126708984375, 0.5521316528320312, 0.573150634765625, 0.5941696166992188, 0.6151885986328125, 0.6362075805664062, 0.6572265625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 11.0, 8.0, 9.0, 17.0, 22.0, 34.0, 49.0, 67.0, 138.0, 194.0, 314.0, 478.0, 780.0, 1313.0, 2166.0, 3579.0, 6277.0, 10668.0, 18666.0, 35865.0, 79751.0, 261599.0, 395131.0, 124835.0, 49126.0, 24668.0, 13501.0, 7985.0, 4531.0, 2706.0, 1573.0, 908.0, 609.0, 344.0, 235.0, 139.0, 91.0, 62.0, 29.0, 31.0, 16.0, 12.0, 6.0, 2.0, 5.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.142333984375, -0.13762283325195312, -0.13291168212890625, -0.12820053100585938, -0.1234893798828125, -0.11877822875976562, -0.11406707763671875, -0.10935592651367188, -0.104644775390625, -0.09993362426757812, -0.09522247314453125, -0.09051132202148438, -0.0858001708984375, -0.08108901977539062, -0.07637786865234375, -0.07166671752929688, -0.06695556640625, -0.062244415283203125, -0.05753326416015625, -0.052822113037109375, -0.0481109619140625, -0.043399810791015625, -0.03868865966796875, -0.033977508544921875, -0.029266357421875, -0.024555206298828125, -0.01984405517578125, -0.015132904052734375, -0.0104217529296875, -0.005710601806640625, -0.00099945068359375, 0.003711700439453125, 0.0084228515625, 0.013134002685546875, 0.01784515380859375, 0.022556304931640625, 0.0272674560546875, 0.031978607177734375, 0.03668975830078125, 0.041400909423828125, 0.046112060546875, 0.050823211669921875, 0.05553436279296875, 0.060245513916015625, 0.0649566650390625, 0.06966781616210938, 0.07437896728515625, 0.07909011840820312, 0.08380126953125, 0.08851242065429688, 0.09322357177734375, 0.09793472290039062, 0.1026458740234375, 0.10735702514648438, 0.11206817626953125, 0.11677932739257812, 0.121490478515625, 0.12620162963867188, 0.13091278076171875, 0.13562393188476562, 0.1403350830078125, 0.14504623413085938, 0.14975738525390625, 0.15446853637695312, 0.1591796875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 0.0, 3.0, 3.0, 4.0, 5.0, 4.0, 6.0, 5.0, 3.0, 3.0, 9.0, 5.0, 11.0, 15.0, 21.0, 35.0, 78.0, 147.0, 192.0, 158.0, 103.0, 50.0, 36.0, 21.0, 16.0, 14.0, 10.0, 17.0, 8.0, 3.0, 6.0, 1.0, 3.0, 6.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.99162483215332e-05, -6.784126162528992e-05, -6.576627492904663e-05, -6.369128823280334e-05, -6.161630153656006e-05, -5.954131484031677e-05, -5.7466328144073486e-05, -5.53913414478302e-05, -5.3316354751586914e-05, -5.124136805534363e-05, -4.916638135910034e-05, -4.7091394662857056e-05, -4.501640796661377e-05, -4.2941421270370483e-05, -4.08664345741272e-05, -3.879144787788391e-05, -3.6716461181640625e-05, -3.464147448539734e-05, -3.256648778915405e-05, -3.0491501092910767e-05, -2.841651439666748e-05, -2.6341527700424194e-05, -2.4266541004180908e-05, -2.2191554307937622e-05, -2.0116567611694336e-05, -1.804158091545105e-05, -1.5966594219207764e-05, -1.3891607522964478e-05, -1.1816620826721191e-05, -9.741634130477905e-06, -7.666647434234619e-06, -5.591660737991333e-06, -3.516674041748047e-06, -1.4416873455047607e-06, 6.332993507385254e-07, 2.7082860469818115e-06, 4.783272743225098e-06, 6.858259439468384e-06, 8.93324613571167e-06, 1.1008232831954956e-05, 1.3083219528198242e-05, 1.5158206224441528e-05, 1.7233192920684814e-05, 1.93081796169281e-05, 2.1383166313171387e-05, 2.3458153009414673e-05, 2.553313970565796e-05, 2.7608126401901245e-05, 2.968311309814453e-05, 3.175809979438782e-05, 3.3833086490631104e-05, 3.590807318687439e-05, 3.7983059883117676e-05, 4.005804657936096e-05, 4.213303327560425e-05, 4.4208019971847534e-05, 4.628300666809082e-05, 4.8357993364334106e-05, 5.043298006057739e-05, 5.250796675682068e-05, 5.4582953453063965e-05, 5.665794014930725e-05, 5.873292684555054e-05, 6.080791354179382e-05, 6.288290023803711e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 5.0, 2.0, 4.0, 4.0, 9.0, 5.0, 21.0, 19.0, 25.0, 18.0, 47.0, 53.0, 68.0, 106.0, 141.0, 227.0, 374.0, 663.0, 1193.0, 2167.0, 4390.0, 8835.0, 18019.0, 38655.0, 90809.0, 265418.0, 370138.0, 142593.0, 54678.0, 25148.0, 12071.0, 5894.0, 3037.0, 1536.0, 778.0, 471.0, 311.0, 174.0, 115.0, 77.0, 65.0, 45.0, 37.0, 40.0, 19.0, 11.0, 14.0, 9.0, 5.0, 5.0, 2.0, 1.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.1522216796875, -0.14749717712402344, -0.14277267456054688, -0.1380481719970703, -0.13332366943359375, -0.1285991668701172, -0.12387466430664062, -0.11915016174316406, -0.1144256591796875, -0.10970115661621094, -0.10497665405273438, -0.10025215148925781, -0.09552764892578125, -0.09080314636230469, -0.08607864379882812, -0.08135414123535156, -0.076629638671875, -0.07190513610839844, -0.06718063354492188, -0.06245613098144531, -0.05773162841796875, -0.05300712585449219, -0.048282623291015625, -0.04355812072753906, -0.0388336181640625, -0.03410911560058594, -0.029384613037109375, -0.024660110473632812, -0.01993560791015625, -0.015211105346679688, -0.010486602783203125, -0.0057621002197265625, -0.00103759765625, 0.0036869049072265625, 0.008411407470703125, 0.013135910034179688, 0.01786041259765625, 0.022584915161132812, 0.027309417724609375, 0.03203392028808594, 0.0367584228515625, 0.04148292541503906, 0.046207427978515625, 0.05093193054199219, 0.05565643310546875, 0.06038093566894531, 0.06510543823242188, 0.06982994079589844, 0.074554443359375, 0.07927894592285156, 0.08400344848632812, 0.08872795104980469, 0.09345245361328125, 0.09817695617675781, 0.10290145874023438, 0.10762596130371094, 0.1123504638671875, 0.11707496643066406, 0.12179946899414062, 0.1265239715576172, 0.13124847412109375, 0.1359729766845703, 0.14069747924804688, 0.14542198181152344, 0.150146484375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 6.0, 8.0, 4.0, 9.0, 10.0, 3.0, 13.0, 14.0, 22.0, 16.0, 15.0, 30.0, 46.0, 52.0, 59.0, 64.0, 69.0, 84.0, 78.0, 63.0, 60.0, 37.0, 32.0, 40.0, 28.0, 19.0, 18.0, 15.0, 12.0, 17.0, 9.0, 9.0, 7.0, 5.0, 3.0, 3.0, 6.0, 3.0, 2.0, 2.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1513671875, -0.1461925506591797, -0.14101791381835938, -0.13584327697753906, -0.13066864013671875, -0.12549400329589844, -0.12031936645507812, -0.11514472961425781, -0.1099700927734375, -0.10479545593261719, -0.09962081909179688, -0.09444618225097656, -0.08927154541015625, -0.08409690856933594, -0.07892227172851562, -0.07374763488769531, -0.068572998046875, -0.06339836120605469, -0.058223724365234375, -0.05304908752441406, -0.04787445068359375, -0.04269981384277344, -0.037525177001953125, -0.03235054016113281, -0.0271759033203125, -0.022001266479492188, -0.016826629638671875, -0.011651992797851562, -0.00647735595703125, -0.0013027191162109375, 0.003871917724609375, 0.009046554565429688, 0.01422119140625, 0.019395828247070312, 0.024570465087890625, 0.029745101928710938, 0.03491973876953125, 0.04009437561035156, 0.045269012451171875, 0.05044364929199219, 0.0556182861328125, 0.06079292297363281, 0.06596755981445312, 0.07114219665527344, 0.07631683349609375, 0.08149147033691406, 0.08666610717773438, 0.09184074401855469, 0.097015380859375, 0.10219001770019531, 0.10736465454101562, 0.11253929138183594, 0.11771392822265625, 0.12288856506347656, 0.12806320190429688, 0.1332378387451172, 0.1384124755859375, 0.1435871124267578, 0.14876174926757812, 0.15393638610839844, 0.15911102294921875, 0.16428565979003906, 0.16946029663085938, 0.1746349334716797, 0.1798095703125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 8.0, 17.0, 80.0, 244.0, 343.0, 203.0, 67.0, 26.0, 6.0, 4.0, 0.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.113089561462402, -8.902769088745117, -8.692448616027832, -8.482129096984863, -8.271808624267578, -8.061488151550293, -7.851167678833008, -7.640847206115723, -7.430527210235596, -7.2202067375183105, -7.009886741638184, -6.799566268920898, -6.589245796203613, -6.378925800323486, -6.168605327606201, -5.958285331726074, -5.747964859008789, -5.537644386291504, -5.327324390411377, -5.117003917694092, -4.906683921813965, -4.69636344909668, -4.4860429763793945, -4.275722503662109, -4.065402507781982, -3.8550822734832764, -3.6447620391845703, -3.434441566467285, -3.224121332168579, -3.013801097869873, -2.803480625152588, -2.593160390853882, -2.3828396797180176, -2.1725194454193115, -1.962199091911316, -1.7518787384033203, -1.5415585041046143, -1.3312382698059082, -1.1209179162979126, -0.910597562789917, -0.7002773284912109, -0.4899570345878601, -0.2796367406845093, -0.06931644678115845, 0.14100384712219238, 0.35132408142089844, 0.561644434928894, 0.7719647884368896, 0.9822850227355957, 1.1926052570343018, 1.4029256105422974, 1.613245964050293, 1.823566198348999, 2.033886432647705, 2.2442069053649902, 2.4545271396636963, 2.6648473739624023, 2.8751676082611084, 3.0854878425598145, 3.2958083152770996, 3.5061285495758057, 3.7164487838745117, 3.926769256591797, 4.137089729309082, 4.347409725189209]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 4.0, 9.0, 7.0, 3.0, 13.0, 11.0, 14.0, 16.0, 22.0, 16.0, 22.0, 16.0, 21.0, 31.0, 36.0, 27.0, 41.0, 33.0, 25.0, 45.0, 43.0, 39.0, 27.0, 28.0, 40.0, 34.0, 49.0, 34.0, 40.0, 22.0, 37.0, 24.0, 23.0, 16.0, 17.0, 22.0, 17.0, 18.0, 10.0, 12.0, 12.0, 15.0, 2.0, 7.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4391809701919556, -1.3924413919448853, -1.345701813697815, -1.2989622354507446, -1.2522226572036743, -1.205483078956604, -1.1587436199188232, -1.112004041671753, -1.0652644634246826, -1.0185248851776123, -0.971785306930542, -0.9250457286834717, -0.8783061504364014, -0.831566572189331, -0.7848270535469055, -0.7380874752998352, -0.6913478374481201, -0.6446082592010498, -0.5978686809539795, -0.5511291027069092, -0.5043895244598389, -0.45764997601509094, -0.410910427570343, -0.3641708493232727, -0.3174312710762024, -0.2706916928291321, -0.22395212948322296, -0.17721256613731384, -0.13047298789024353, -0.08373340964317322, -0.03699386119842529, 0.00974571704864502, 0.05648529529571533, 0.10322486609220505, 0.14996443688869476, 0.19670400023460388, 0.2434435784816742, 0.2901831567287445, 0.33692270517349243, 0.38366228342056274, 0.43040186166763306, 0.47714143991470337, 0.5238810181617737, 0.5706205368041992, 0.6173601150512695, 0.6640996932983398, 0.7108392715454102, 0.7575788497924805, 0.8043184280395508, 0.8510580062866211, 0.8977975845336914, 0.9445371627807617, 0.991276741027832, 1.0380163192749023, 1.0847558975219727, 1.131495475769043, 1.1782350540161133, 1.2249746322631836, 1.271714210510254, 1.3184537887573242, 1.3651933670043945, 1.4119329452514648, 1.4586725234985352, 1.5054121017456055, 1.5521515607833862]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 10.0, 9.0, 16.0, 23.0, 44.0, 73.0, 103.0, 222.0, 381.0, 736.0, 1557.0, 3421.0, 7739.0, 18067.0, 42801.0, 104411.0, 270502.0, 766715.0, 1529957.0, 916559.0, 323111.0, 121743.0, 49215.0, 20599.0, 8939.0, 3876.0, 1675.0, 824.0, 438.0, 238.0, 109.0, 65.0, 46.0, 23.0, 16.0, 11.0, 10.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2376708984375, -0.2301464080810547, -0.22262191772460938, -0.21509742736816406, -0.20757293701171875, -0.20004844665527344, -0.19252395629882812, -0.1849994659423828, -0.1774749755859375, -0.1699504852294922, -0.16242599487304688, -0.15490150451660156, -0.14737701416015625, -0.13985252380371094, -0.13232803344726562, -0.12480354309082031, -0.117279052734375, -0.10975456237792969, -0.10223007202148438, -0.09470558166503906, -0.08718109130859375, -0.07965660095214844, -0.07213211059570312, -0.06460762023925781, -0.0570831298828125, -0.04955863952636719, -0.042034149169921875, -0.03450965881347656, -0.02698516845703125, -0.019460678100585938, -0.011936187744140625, -0.0044116973876953125, 0.00311279296875, 0.010637283325195312, 0.018161773681640625, 0.025686264038085938, 0.03321075439453125, 0.04073524475097656, 0.048259735107421875, 0.05578422546386719, 0.0633087158203125, 0.07083320617675781, 0.07835769653320312, 0.08588218688964844, 0.09340667724609375, 0.10093116760253906, 0.10845565795898438, 0.11598014831542969, 0.123504638671875, 0.1310291290283203, 0.13855361938476562, 0.14607810974121094, 0.15360260009765625, 0.16112709045410156, 0.16865158081054688, 0.1761760711669922, 0.1837005615234375, 0.1912250518798828, 0.19874954223632812, 0.20627403259277344, 0.21379852294921875, 0.22132301330566406, 0.22884750366210938, 0.2363719940185547, 0.243896484375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 5.0, 7.0, 4.0, 18.0, 10.0, 10.0, 18.0, 20.0, 22.0, 29.0, 23.0, 35.0, 34.0, 44.0, 35.0, 42.0, 45.0, 37.0, 46.0, 52.0, 37.0, 43.0, 57.0, 41.0, 39.0, 39.0, 32.0, 29.0, 23.0, 25.0, 21.0, 15.0, 10.0, 9.0, 8.0, 8.0, 9.0, 5.0, 6.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.220458984375, -0.2139759063720703, -0.20749282836914062, -0.20100975036621094, -0.19452667236328125, -0.18804359436035156, -0.18156051635742188, -0.1750774383544922, -0.1685943603515625, -0.1621112823486328, -0.15562820434570312, -0.14914512634277344, -0.14266204833984375, -0.13617897033691406, -0.12969589233398438, -0.12321281433105469, -0.116729736328125, -0.11024665832519531, -0.10376358032226562, -0.09728050231933594, -0.09079742431640625, -0.08431434631347656, -0.07783126831054688, -0.07134819030761719, -0.0648651123046875, -0.05838203430175781, -0.051898956298828125, -0.04541587829589844, -0.03893280029296875, -0.03244972229003906, -0.025966644287109375, -0.019483566284179688, -0.01300048828125, -0.0065174102783203125, -3.4332275390625e-05, 0.0064487457275390625, 0.01293182373046875, 0.019414901733398438, 0.025897979736328125, 0.03238105773925781, 0.0388641357421875, 0.04534721374511719, 0.051830291748046875, 0.05831336975097656, 0.06479644775390625, 0.07127952575683594, 0.07776260375976562, 0.08424568176269531, 0.090728759765625, 0.09721183776855469, 0.10369491577148438, 0.11017799377441406, 0.11666107177734375, 0.12314414978027344, 0.12962722778320312, 0.1361103057861328, 0.1425933837890625, 0.1490764617919922, 0.15555953979492188, 0.16204261779785156, 0.16852569580078125, 0.17500877380371094, 0.18149185180664062, 0.1879749298095703, 0.1944580078125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 11.0, 17.0, 11.0, 23.0, 29.0, 58.0, 70.0, 123.0, 169.0, 287.0, 531.0, 1020.0, 2151.0, 4983.0, 13663.0, 40070.0, 123345.0, 416273.0, 1625186.0, 1437679.0, 363533.0, 108933.0, 35346.0, 12088.0, 4585.0, 1922.0, 898.0, 490.0, 293.0, 186.0, 105.0, 63.0, 41.0, 34.0, 18.0, 16.0, 10.0, 5.0, 8.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.350830078125, -0.3387107849121094, -0.32659149169921875, -0.3144721984863281, -0.3023529052734375, -0.2902336120605469, -0.27811431884765625, -0.2659950256347656, -0.253875732421875, -0.24175643920898438, -0.22963714599609375, -0.21751785278320312, -0.2053985595703125, -0.19327926635742188, -0.18115997314453125, -0.16904067993164062, -0.15692138671875, -0.14480209350585938, -0.13268280029296875, -0.12056350708007812, -0.1084442138671875, -0.09632492065429688, -0.08420562744140625, -0.07208633422851562, -0.059967041015625, -0.047847747802734375, -0.03572845458984375, -0.023609161376953125, -0.0114898681640625, 0.000629425048828125, 0.01274871826171875, 0.024868011474609375, 0.0369873046875, 0.049106597900390625, 0.06122589111328125, 0.07334518432617188, 0.0854644775390625, 0.09758377075195312, 0.10970306396484375, 0.12182235717773438, 0.133941650390625, 0.14606094360351562, 0.15818023681640625, 0.17029953002929688, 0.1824188232421875, 0.19453811645507812, 0.20665740966796875, 0.21877670288085938, 0.23089599609375, 0.24301528930664062, 0.25513458251953125, 0.2672538757324219, 0.2793731689453125, 0.2914924621582031, 0.30361175537109375, 0.3157310485839844, 0.327850341796875, 0.3399696350097656, 0.35208892822265625, 0.3642082214355469, 0.3763275146484375, 0.3884468078613281, 0.40056610107421875, 0.4126853942871094, 0.4248046875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 10.0, 3.0, 6.0, 5.0, 8.0, 16.0, 26.0, 25.0, 31.0, 38.0, 55.0, 68.0, 92.0, 130.0, 160.0, 223.0, 252.0, 427.0, 504.0, 482.0, 377.0, 290.0, 206.0, 148.0, 114.0, 99.0, 57.0, 60.0, 33.0, 42.0, 23.0, 19.0, 16.0, 4.0, 8.0, 9.0, 1.0, 11.0, 4.0, 3.0, 2.0], "bins": [-0.52734375, -0.5148200988769531, -0.5022964477539062, -0.4897727966308594, -0.4772491455078125, -0.4647254943847656, -0.45220184326171875, -0.4396781921386719, -0.427154541015625, -0.4146308898925781, -0.40210723876953125, -0.3895835876464844, -0.3770599365234375, -0.3645362854003906, -0.35201263427734375, -0.3394889831542969, -0.32696533203125, -0.3144416809082031, -0.30191802978515625, -0.2893943786621094, -0.2768707275390625, -0.2643470764160156, -0.25182342529296875, -0.23929977416992188, -0.226776123046875, -0.21425247192382812, -0.20172882080078125, -0.18920516967773438, -0.1766815185546875, -0.16415786743164062, -0.15163421630859375, -0.13911056518554688, -0.1265869140625, -0.11406326293945312, -0.10153961181640625, -0.08901596069335938, -0.0764923095703125, -0.06396865844726562, -0.05144500732421875, -0.038921356201171875, -0.026397705078125, -0.013874053955078125, -0.00135040283203125, 0.011173248291015625, 0.0236968994140625, 0.036220550537109375, 0.04874420166015625, 0.061267852783203125, 0.07379150390625, 0.08631515502929688, 0.09883880615234375, 0.11136245727539062, 0.1238861083984375, 0.13640975952148438, 0.14893341064453125, 0.16145706176757812, 0.173980712890625, 0.18650436401367188, 0.19902801513671875, 0.21155166625976562, 0.2240753173828125, 0.23659896850585938, 0.24912261962890625, 0.2616462707519531, 0.274169921875]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 4.0, 16.0, 35.0, 54.0, 110.0, 135.0, 167.0, 162.0, 131.0, 94.0, 43.0, 21.0, 13.0, 8.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.801357269287109, -4.672770023345947, -4.544182300567627, -4.415595054626465, -4.2870073318481445, -4.158420085906982, -4.02983283996582, -3.901245355606079, -3.772657871246338, -3.6440703868865967, -3.5154829025268555, -3.3868956565856934, -3.258308172225952, -3.129720687866211, -3.001133441925049, -2.8725459575653076, -2.7439584732055664, -2.615370988845825, -2.486783504486084, -2.358196258544922, -2.2296087741851807, -2.1010212898254395, -1.9724339246749878, -1.8438465595245361, -1.715259075164795, -1.5866715908050537, -1.458084225654602, -1.3294968605041504, -1.2009093761444092, -1.072321891784668, -0.9437345266342163, -0.8151471018791199, -0.6865594387054443, -0.5579720139503479, -0.42938458919525146, -0.30079716444015503, -0.1722097396850586, -0.04362231492996216, 0.08496510982513428, 0.2135525345802307, 0.34213995933532715, 0.4707273840904236, 0.59931480884552, 0.7279022336006165, 0.8564896583557129, 0.9850770831108093, 1.1136645078659058, 1.2422518730163574, 1.3708393573760986, 1.4994268417358398, 1.6280142068862915, 1.7566015720367432, 1.8851890563964844, 2.0137765407562256, 2.142364025115967, 2.270951271057129, 2.39953875541687, 2.5281262397766113, 2.6567134857177734, 2.7853009700775146, 2.913888454437256, 3.042475938796997, 3.1710634231567383, 3.2996506690979004, 3.4282381534576416]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 3.0, 7.0, 3.0, 3.0, 4.0, 6.0, 8.0, 2.0, 9.0, 18.0, 13.0, 17.0, 18.0, 13.0, 20.0, 24.0, 37.0, 19.0, 42.0, 36.0, 47.0, 33.0, 38.0, 42.0, 35.0, 47.0, 32.0, 40.0, 37.0, 38.0, 42.0, 40.0, 33.0, 32.0, 34.0, 28.0, 14.0, 21.0, 21.0, 8.0, 9.0, 7.0, 8.0, 8.0, 5.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.369152545928955, -1.3217673301696777, -1.2743819952011108, -1.2269967794418335, -1.1796114444732666, -1.1322262287139893, -1.0848408937454224, -1.037455677986145, -0.9900703430175781, -0.942685067653656, -0.8952997922897339, -0.8479145169258118, -0.8005292415618896, -0.7531439661979675, -0.7057586908340454, -0.6583734750747681, -0.610988199710846, -0.5636029243469238, -0.5162176489830017, -0.4688323736190796, -0.42144709825515747, -0.37406182289123535, -0.3266765773296356, -0.2792913019657135, -0.23190602660179138, -0.18452075123786926, -0.13713547587394714, -0.08975021541118622, -0.0423649400472641, 0.00502033531665802, 0.052405595779418945, 0.09979087114334106, 0.14717614650726318, 0.1945614218711853, 0.24194669723510742, 0.28933197259902954, 0.33671724796295166, 0.3841025233268738, 0.4314877688884735, 0.47887304425239563, 0.5262583494186401, 0.5736436247825623, 0.6210289001464844, 0.6684141755104065, 0.7157994508743286, 0.7631847262382507, 0.8105700016021729, 0.8579552173614502, 0.9053404927253723, 0.9527257680892944, 1.0001109838485718, 1.0474963188171387, 1.094881534576416, 1.142266869544983, 1.1896520853042603, 1.2370374202728271, 1.2844226360321045, 1.3318078517913818, 1.3791931867599487, 1.426578402519226, 1.473963737487793, 1.5213489532470703, 1.5687342882156372, 1.6161195039749146, 1.6635048389434814]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 7.0, 8.0, 10.0, 16.0, 24.0, 34.0, 45.0, 84.0, 160.0, 227.0, 348.0, 583.0, 998.0, 1586.0, 2696.0, 4226.0, 6823.0, 10776.0, 17423.0, 29279.0, 54684.0, 125856.0, 276800.0, 269708.0, 119664.0, 52846.0, 28755.0, 16983.0, 10541.0, 6743.0, 4073.0, 2567.0, 1516.0, 922.0, 597.0, 361.0, 218.0, 140.0, 78.0, 56.0, 47.0, 18.0, 12.0, 13.0, 4.0, 6.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.295166015625, -0.2859344482421875, -0.276702880859375, -0.2674713134765625, -0.25823974609375, -0.2490081787109375, -0.239776611328125, -0.2305450439453125, -0.2213134765625, -0.2120819091796875, -0.202850341796875, -0.1936187744140625, -0.18438720703125, -0.1751556396484375, -0.165924072265625, -0.1566925048828125, -0.1474609375, -0.1382293701171875, -0.128997802734375, -0.1197662353515625, -0.11053466796875, -0.1013031005859375, -0.092071533203125, -0.0828399658203125, -0.0736083984375, -0.0643768310546875, -0.055145263671875, -0.0459136962890625, -0.03668212890625, -0.0274505615234375, -0.018218994140625, -0.0089874267578125, 0.000244140625, 0.0094757080078125, 0.018707275390625, 0.0279388427734375, 0.03717041015625, 0.0464019775390625, 0.055633544921875, 0.0648651123046875, 0.0740966796875, 0.0833282470703125, 0.092559814453125, 0.1017913818359375, 0.11102294921875, 0.1202545166015625, 0.129486083984375, 0.1387176513671875, 0.14794921875, 0.1571807861328125, 0.166412353515625, 0.1756439208984375, 0.18487548828125, 0.1941070556640625, 0.203338623046875, 0.2125701904296875, 0.2218017578125, 0.2310333251953125, 0.240264892578125, 0.2494964599609375, 0.25872802734375, 0.2679595947265625, 0.277191162109375, 0.2864227294921875, 0.295654296875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 6.0, 0.0, 2.0, 6.0, 3.0, 9.0, 7.0, 6.0, 12.0, 14.0, 10.0, 17.0, 15.0, 24.0, 27.0, 30.0, 35.0, 28.0, 23.0, 49.0, 38.0, 47.0, 42.0, 41.0, 39.0, 39.0, 38.0, 40.0, 40.0, 36.0, 29.0, 32.0, 34.0, 28.0, 23.0, 21.0, 14.0, 24.0, 28.0, 14.0, 6.0, 5.0, 10.0, 2.0, 6.0, 2.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1844482421875, -0.17877197265625, -0.173095703125, -0.16741943359375, -0.1617431640625, -0.15606689453125, -0.150390625, -0.14471435546875, -0.1390380859375, -0.13336181640625, -0.127685546875, -0.12200927734375, -0.1163330078125, -0.11065673828125, -0.10498046875, -0.09930419921875, -0.0936279296875, -0.08795166015625, -0.082275390625, -0.07659912109375, -0.0709228515625, -0.06524658203125, -0.0595703125, -0.05389404296875, -0.0482177734375, -0.04254150390625, -0.036865234375, -0.03118896484375, -0.0255126953125, -0.01983642578125, -0.01416015625, -0.00848388671875, -0.0028076171875, 0.00286865234375, 0.008544921875, 0.01422119140625, 0.0198974609375, 0.02557373046875, 0.03125, 0.03692626953125, 0.0426025390625, 0.04827880859375, 0.053955078125, 0.05963134765625, 0.0653076171875, 0.07098388671875, 0.07666015625, 0.08233642578125, 0.0880126953125, 0.09368896484375, 0.099365234375, 0.10504150390625, 0.1107177734375, 0.11639404296875, 0.1220703125, 0.12774658203125, 0.1334228515625, 0.13909912109375, 0.144775390625, 0.15045166015625, 0.1561279296875, 0.16180419921875, 0.16748046875, 0.17315673828125, 0.1788330078125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 4.0, 4.0, 9.0, 6.0, 17.0, 19.0, 31.0, 50.0, 67.0, 92.0, 153.0, 271.0, 484.0, 900.0, 1999.0, 5346.0, 15728.0, 48162.0, 221641.0, 579514.0, 123181.0, 32778.0, 10852.0, 3947.0, 1573.0, 739.0, 385.0, 203.0, 125.0, 94.0, 48.0, 42.0, 29.0, 18.0, 16.0, 4.0, 8.0, 3.0, 0.0, 3.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64111328125, -0.6199798583984375, -0.598846435546875, -0.5777130126953125, -0.55657958984375, -0.5354461669921875, -0.514312744140625, -0.4931793212890625, -0.4720458984375, -0.4509124755859375, -0.429779052734375, -0.4086456298828125, -0.38751220703125, -0.3663787841796875, -0.345245361328125, -0.3241119384765625, -0.302978515625, -0.2818450927734375, -0.260711669921875, -0.2395782470703125, -0.21844482421875, -0.1973114013671875, -0.176177978515625, -0.1550445556640625, -0.1339111328125, -0.1127777099609375, -0.091644287109375, -0.0705108642578125, -0.04937744140625, -0.0282440185546875, -0.007110595703125, 0.0140228271484375, 0.03515625, 0.0562896728515625, 0.077423095703125, 0.0985565185546875, 0.11968994140625, 0.1408233642578125, 0.161956787109375, 0.1830902099609375, 0.2042236328125, 0.2253570556640625, 0.246490478515625, 0.2676239013671875, 0.28875732421875, 0.3098907470703125, 0.331024169921875, 0.3521575927734375, 0.373291015625, 0.3944244384765625, 0.415557861328125, 0.4366912841796875, 0.45782470703125, 0.4789581298828125, 0.500091552734375, 0.5212249755859375, 0.5423583984375, 0.5634918212890625, 0.584625244140625, 0.6057586669921875, 0.62689208984375, 0.6480255126953125, 0.669158935546875, 0.6902923583984375, 0.71142578125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 5.0, 2.0, 2.0, 2.0, 3.0, 4.0, 5.0, 9.0, 5.0, 12.0, 8.0, 20.0, 17.0, 17.0, 20.0, 21.0, 28.0, 25.0, 19.0, 34.0, 28.0, 27.0, 46.0, 43.0, 33.0, 26.0, 37.0, 49.0, 30.0, 47.0, 46.0, 40.0, 28.0, 31.0, 27.0, 26.0, 31.0, 26.0, 20.0, 16.0, 12.0, 10.0, 18.0, 16.0, 8.0, 7.0, 6.0, 9.0, 2.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.480712890625, -0.4645957946777344, -0.44847869873046875, -0.4323616027832031, -0.4162445068359375, -0.4001274108886719, -0.38401031494140625, -0.3678932189941406, -0.351776123046875, -0.3356590270996094, -0.31954193115234375, -0.3034248352050781, -0.2873077392578125, -0.2711906433105469, -0.25507354736328125, -0.23895645141601562, -0.22283935546875, -0.20672225952148438, -0.19060516357421875, -0.17448806762695312, -0.1583709716796875, -0.14225387573242188, -0.12613677978515625, -0.11001968383789062, -0.093902587890625, -0.07778549194335938, -0.06166839599609375, -0.045551300048828125, -0.0294342041015625, -0.013317108154296875, 0.00279998779296875, 0.018917083740234375, 0.0350341796875, 0.051151275634765625, 0.06726837158203125, 0.08338546752929688, 0.0995025634765625, 0.11561965942382812, 0.13173675537109375, 0.14785385131835938, 0.163970947265625, 0.18008804321289062, 0.19620513916015625, 0.21232223510742188, 0.2284393310546875, 0.24455642700195312, 0.26067352294921875, 0.2767906188964844, 0.29290771484375, 0.3090248107910156, 0.32514190673828125, 0.3412590026855469, 0.3573760986328125, 0.3734931945800781, 0.38961029052734375, 0.4057273864746094, 0.421844482421875, 0.4379615783691406, 0.45407867431640625, 0.4701957702636719, 0.4863128662109375, 0.5024299621582031, 0.5185470581054688, 0.5346641540527344, 0.55078125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 2.0, 9.0, 18.0, 17.0, 26.0, 32.0, 49.0, 72.0, 107.0, 176.0, 305.0, 526.0, 874.0, 1552.0, 2537.0, 4346.0, 7652.0, 12986.0, 23065.0, 44165.0, 93843.0, 228065.0, 341752.0, 146549.0, 65436.0, 32502.0, 17354.0, 10109.0, 5934.0, 3462.0, 2058.0, 1199.0, 687.0, 414.0, 242.0, 141.0, 87.0, 73.0, 34.0, 32.0, 17.0, 14.0, 16.0, 2.0, 3.0, 5.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1424560546875, -0.13817405700683594, -0.13389205932617188, -0.1296100616455078, -0.12532806396484375, -0.12104606628417969, -0.11676406860351562, -0.11248207092285156, -0.1082000732421875, -0.10391807556152344, -0.09963607788085938, -0.09535408020019531, -0.09107208251953125, -0.08679008483886719, -0.08250808715820312, -0.07822608947753906, -0.073944091796875, -0.06966209411621094, -0.06538009643554688, -0.06109809875488281, -0.05681610107421875, -0.05253410339355469, -0.048252105712890625, -0.04397010803222656, -0.0396881103515625, -0.03540611267089844, -0.031124114990234375, -0.026842117309570312, -0.02256011962890625, -0.018278121948242188, -0.013996124267578125, -0.009714126586914062, -0.00543212890625, -0.0011501312255859375, 0.003131866455078125, 0.0074138641357421875, 0.01169586181640625, 0.015977859497070312, 0.020259857177734375, 0.024541854858398438, 0.0288238525390625, 0.03310585021972656, 0.037387847900390625, 0.04166984558105469, 0.04595184326171875, 0.05023384094238281, 0.054515838623046875, 0.05879783630371094, 0.063079833984375, 0.06736183166503906, 0.07164382934570312, 0.07592582702636719, 0.08020782470703125, 0.08448982238769531, 0.08877182006835938, 0.09305381774902344, 0.0973358154296875, 0.10161781311035156, 0.10589981079101562, 0.11018180847167969, 0.11446380615234375, 0.11874580383300781, 0.12302780151367188, 0.12730979919433594, 0.131591796875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 5.0, 3.0, 2.0, 4.0, 3.0, 4.0, 3.0, 7.0, 8.0, 10.0, 13.0, 11.0, 13.0, 18.0, 18.0, 44.0, 44.0, 60.0, 91.0, 135.0, 140.0, 98.0, 75.0, 52.0, 33.0, 32.0, 19.0, 14.0, 8.0, 7.0, 10.0, 6.0, 2.0, 4.0, 5.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1140785217285156e-05, -4.9374066293239594e-05, -4.760734736919403e-05, -4.584062844514847e-05, -4.4073909521102905e-05, -4.230719059705734e-05, -4.054047167301178e-05, -3.877375274896622e-05, -3.7007033824920654e-05, -3.524031490087509e-05, -3.347359597682953e-05, -3.1706877052783966e-05, -2.9940158128738403e-05, -2.817343920469284e-05, -2.6406720280647278e-05, -2.4640001356601715e-05, -2.2873282432556152e-05, -2.110656350851059e-05, -1.9339844584465027e-05, -1.7573125660419464e-05, -1.58064067363739e-05, -1.4039687812328339e-05, -1.2272968888282776e-05, -1.0506249964237213e-05, -8.73953104019165e-06, -6.972812116146088e-06, -5.206093192100525e-06, -3.439374268054962e-06, -1.6726553440093994e-06, 9.406358003616333e-08, 1.860782504081726e-06, 3.627501428127289e-06, 5.3942203521728516e-06, 7.160939276218414e-06, 8.927658200263977e-06, 1.069437712430954e-05, 1.2461096048355103e-05, 1.4227814972400665e-05, 1.5994533896446228e-05, 1.776125282049179e-05, 1.9527971744537354e-05, 2.1294690668582916e-05, 2.306140959262848e-05, 2.4828128516674042e-05, 2.6594847440719604e-05, 2.8361566364765167e-05, 3.012828528881073e-05, 3.189500421285629e-05, 3.3661723136901855e-05, 3.542844206094742e-05, 3.719516098499298e-05, 3.8961879909038544e-05, 4.0728598833084106e-05, 4.249531775712967e-05, 4.426203668117523e-05, 4.6028755605220795e-05, 4.779547452926636e-05, 4.956219345331192e-05, 5.132891237735748e-05, 5.3095631301403046e-05, 5.486235022544861e-05, 5.662906914949417e-05, 5.8395788073539734e-05, 6.01625069975853e-05, 6.192922592163086e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 3.0, 5.0, 10.0, 4.0, 13.0, 16.0, 26.0, 31.0, 35.0, 62.0, 105.0, 128.0, 205.0, 345.0, 575.0, 1032.0, 2131.0, 4240.0, 8557.0, 17428.0, 37538.0, 84229.0, 200170.0, 337220.0, 198813.0, 84056.0, 37173.0, 17156.0, 8266.0, 4098.0, 2079.0, 1052.0, 618.0, 376.0, 228.0, 147.0, 103.0, 83.0, 39.0, 42.0, 28.0, 23.0, 21.0, 7.0, 10.0, 10.0, 4.0, 4.0, 4.0, 1.0, 3.0, 2.0, 3.0, 0.0, 2.0, 3.0], "bins": [-0.1298828125, -0.12575912475585938, -0.12163543701171875, -0.11751174926757812, -0.1133880615234375, -0.10926437377929688, -0.10514068603515625, -0.10101699829101562, -0.096893310546875, -0.09276962280273438, -0.08864593505859375, -0.08452224731445312, -0.0803985595703125, -0.07627487182617188, -0.07215118408203125, -0.06802749633789062, -0.06390380859375, -0.059780120849609375, -0.05565643310546875, -0.051532745361328125, -0.0474090576171875, -0.043285369873046875, -0.03916168212890625, -0.035037994384765625, -0.030914306640625, -0.026790618896484375, -0.02266693115234375, -0.018543243408203125, -0.0144195556640625, -0.010295867919921875, -0.00617218017578125, -0.002048492431640625, 0.0020751953125, 0.006198883056640625, 0.01032257080078125, 0.014446258544921875, 0.0185699462890625, 0.022693634033203125, 0.02681732177734375, 0.030941009521484375, 0.035064697265625, 0.039188385009765625, 0.04331207275390625, 0.047435760498046875, 0.0515594482421875, 0.055683135986328125, 0.05980682373046875, 0.06393051147460938, 0.06805419921875, 0.07217788696289062, 0.07630157470703125, 0.08042526245117188, 0.0845489501953125, 0.08867263793945312, 0.09279632568359375, 0.09692001342773438, 0.101043701171875, 0.10516738891601562, 0.10929107666015625, 0.11341476440429688, 0.1175384521484375, 0.12166213989257812, 0.12578582763671875, 0.12990951538085938, 0.134033203125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 7.0, 1.0, 5.0, 4.0, 3.0, 10.0, 8.0, 11.0, 10.0, 12.0, 21.0, 15.0, 22.0, 23.0, 32.0, 35.0, 60.0, 49.0, 63.0, 63.0, 79.0, 71.0, 55.0, 54.0, 52.0, 36.0, 38.0, 30.0, 20.0, 21.0, 17.0, 16.0, 9.0, 11.0, 8.0, 8.0, 4.0, 4.0, 7.0, 6.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.150146484375, -0.1457061767578125, -0.141265869140625, -0.1368255615234375, -0.13238525390625, -0.1279449462890625, -0.123504638671875, -0.1190643310546875, -0.1146240234375, -0.1101837158203125, -0.105743408203125, -0.1013031005859375, -0.09686279296875, -0.0924224853515625, -0.087982177734375, -0.0835418701171875, -0.0791015625, -0.0746612548828125, -0.070220947265625, -0.0657806396484375, -0.06134033203125, -0.0569000244140625, -0.052459716796875, -0.0480194091796875, -0.0435791015625, -0.0391387939453125, -0.034698486328125, -0.0302581787109375, -0.02581787109375, -0.0213775634765625, -0.016937255859375, -0.0124969482421875, -0.008056640625, -0.0036163330078125, 0.000823974609375, 0.0052642822265625, 0.00970458984375, 0.0141448974609375, 0.018585205078125, 0.0230255126953125, 0.0274658203125, 0.0319061279296875, 0.036346435546875, 0.0407867431640625, 0.04522705078125, 0.0496673583984375, 0.054107666015625, 0.0585479736328125, 0.06298828125, 0.0674285888671875, 0.071868896484375, 0.0763092041015625, 0.08074951171875, 0.0851898193359375, 0.089630126953125, 0.0940704345703125, 0.0985107421875, 0.1029510498046875, 0.107391357421875, 0.1118316650390625, 0.11627197265625, 0.1207122802734375, 0.125152587890625, 0.1295928955078125, 0.134033203125]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 1.0, 2.0, 10.0, 12.0, 22.0, 56.0, 99.0, 140.0, 169.0, 171.0, 139.0, 86.0, 44.0, 23.0, 10.0, 6.0, 4.0, 0.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.620044469833374, -3.51045298576355, -3.4008612632751465, -3.2912697792053223, -3.181678295135498, -3.072086811065674, -2.9624950885772705, -2.8529036045074463, -2.743311882019043, -2.6337203979492188, -2.5241286754608154, -2.414537191390991, -2.304945707321167, -2.1953539848327637, -2.0857625007629395, -1.9761710166931152, -1.866579532623291, -1.7569879293441772, -1.647396445274353, -1.5378048419952393, -1.428213357925415, -1.3186217546463013, -1.2090301513671875, -1.0994386672973633, -0.9898470640182495, -0.8802555203437805, -0.7706639766693115, -0.6610723733901978, -0.5514808297157288, -0.44188928604125977, -0.332297682762146, -0.222706139087677, -0.1131143569946289, -0.0035227984189987183, 0.10606876015663147, 0.21566033363342285, 0.32525187730789185, 0.43484342098236084, 0.5444350242614746, 0.6540265679359436, 0.7636181116104126, 0.8732096552848816, 0.9828011989593506, 1.0923928022384644, 1.2019844055175781, 1.3115758895874023, 1.4211674928665161, 1.5307590961456299, 1.640350580215454, 1.7499421834945679, 1.859533667564392, 1.9691252708435059, 2.07871675491333, 2.1883082389831543, 2.2978999614715576, 2.407491445541382, 2.517083168029785, 2.6266746520996094, 2.7362663745880127, 2.845857858657837, 2.955449342727661, 3.0650410652160645, 3.1746325492858887, 3.284224033355713, 3.393815517425537]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 2.0, 4.0, 5.0, 7.0, 6.0, 12.0, 12.0, 19.0, 18.0, 22.0, 19.0, 22.0, 28.0, 30.0, 23.0, 47.0, 28.0, 37.0, 33.0, 43.0, 38.0, 41.0, 32.0, 46.0, 35.0, 33.0, 48.0, 38.0, 29.0, 33.0, 27.0, 31.0, 16.0, 30.0, 20.0, 20.0, 11.0, 13.0, 10.0, 8.0, 6.0, 5.0, 1.0, 4.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.3803519010543823, -1.3370733261108398, -1.293794870376587, -1.2505162954330444, -1.207237720489502, -1.163959264755249, -1.1206806898117065, -1.077402114868164, -1.0341236591339111, -0.9908451437950134, -0.947566568851471, -0.9042880535125732, -0.8610094785690308, -0.8177309632301331, -0.7744524478912354, -0.7311738729476929, -0.6878952980041504, -0.6446167826652527, -0.6013382077217102, -0.5580596923828125, -0.51478111743927, -0.4715026021003723, -0.4282240867614746, -0.3849455416202545, -0.3416669964790344, -0.29838845133781433, -0.25510990619659424, -0.21183139085769653, -0.16855284571647644, -0.12527430057525635, -0.08199578523635864, -0.03871724009513855, 0.004561185836791992, 0.04783972352743149, 0.09111826121807098, 0.13439679145812988, 0.17767533659934998, 0.22095388174057007, 0.2642323970794678, 0.30751094222068787, 0.35078948736190796, 0.39406803250312805, 0.43734657764434814, 0.48062509298324585, 0.5239036083221436, 0.567182183265686, 0.6104606986045837, 0.6537392139434814, 0.6970177888870239, 0.7402963042259216, 0.7835748791694641, 0.8268533945083618, 0.8701319694519043, 0.913410484790802, 0.9566890001296997, 0.9999675750732422, 1.0432460308074951, 1.0865246057510376, 1.1298030614852905, 1.173081636428833, 1.2163602113723755, 1.259638786315918, 1.302917242050171, 1.3461958169937134, 1.3894743919372559]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 7.0, 12.0, 12.0, 15.0, 34.0, 32.0, 67.0, 106.0, 155.0, 212.0, 357.0, 632.0, 1120.0, 1998.0, 3813.0, 7427.0, 15067.0, 30644.0, 63729.0, 138152.0, 321808.0, 789491.0, 1353186.0, 844023.0, 343730.0, 146714.0, 67520.0, 31984.0, 15616.0, 7906.0, 3973.0, 2035.0, 1104.0, 678.0, 366.0, 209.0, 135.0, 79.0, 56.0, 28.0, 21.0, 15.0, 9.0, 5.0, 3.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.208984375, -0.20310401916503906, -0.19722366333007812, -0.1913433074951172, -0.18546295166015625, -0.1795825958251953, -0.17370223999023438, -0.16782188415527344, -0.1619415283203125, -0.15606117248535156, -0.15018081665039062, -0.1443004608154297, -0.13842010498046875, -0.1325397491455078, -0.12665939331054688, -0.12077903747558594, -0.114898681640625, -0.10901832580566406, -0.10313796997070312, -0.09725761413574219, -0.09137725830078125, -0.08549690246582031, -0.07961654663085938, -0.07373619079589844, -0.0678558349609375, -0.06197547912597656, -0.056095123291015625, -0.05021476745605469, -0.04433441162109375, -0.03845405578613281, -0.032573699951171875, -0.026693344116210938, -0.02081298828125, -0.014932632446289062, -0.009052276611328125, -0.0031719207763671875, 0.00270843505859375, 0.008588790893554688, 0.014469146728515625, 0.020349502563476562, 0.0262298583984375, 0.03211021423339844, 0.037990570068359375, 0.04387092590332031, 0.04975128173828125, 0.05563163757324219, 0.061511993408203125, 0.06739234924316406, 0.073272705078125, 0.07915306091308594, 0.08503341674804688, 0.09091377258300781, 0.09679412841796875, 0.10267448425292969, 0.10855484008789062, 0.11443519592285156, 0.1203155517578125, 0.12619590759277344, 0.13207626342773438, 0.1379566192626953, 0.14383697509765625, 0.1497173309326172, 0.15559768676757812, 0.16147804260253906, 0.1673583984375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 9.0, 8.0, 5.0, 12.0, 10.0, 27.0, 17.0, 25.0, 18.0, 21.0, 23.0, 34.0, 34.0, 36.0, 43.0, 46.0, 30.0, 46.0, 34.0, 43.0, 42.0, 40.0, 47.0, 46.0, 41.0, 21.0, 33.0, 32.0, 24.0, 17.0, 18.0, 27.0, 18.0, 15.0, 8.0, 9.0, 7.0, 13.0, 7.0, 4.0, 4.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1658935546875, -0.16040420532226562, -0.15491485595703125, -0.14942550659179688, -0.1439361572265625, -0.13844680786132812, -0.13295745849609375, -0.12746810913085938, -0.121978759765625, -0.11648941040039062, -0.11100006103515625, -0.10551071166992188, -0.1000213623046875, -0.09453201293945312, -0.08904266357421875, -0.08355331420898438, -0.07806396484375, -0.07257461547851562, -0.06708526611328125, -0.061595916748046875, -0.0561065673828125, -0.050617218017578125, -0.04512786865234375, -0.039638519287109375, -0.034149169921875, -0.028659820556640625, -0.02317047119140625, -0.017681121826171875, -0.0121917724609375, -0.006702423095703125, -0.00121307373046875, 0.004276275634765625, 0.009765625, 0.015254974365234375, 0.02074432373046875, 0.026233673095703125, 0.0317230224609375, 0.037212371826171875, 0.04270172119140625, 0.048191070556640625, 0.053680419921875, 0.059169769287109375, 0.06465911865234375, 0.07014846801757812, 0.0756378173828125, 0.08112716674804688, 0.08661651611328125, 0.09210586547851562, 0.09759521484375, 0.10308456420898438, 0.10857391357421875, 0.11406326293945312, 0.1195526123046875, 0.12504196166992188, 0.13053131103515625, 0.13602066040039062, 0.141510009765625, 0.14699935913085938, 0.15248870849609375, 0.15797805786132812, 0.1634674072265625, 0.16895675659179688, 0.17444610595703125, 0.17993545532226562, 0.1854248046875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 6.0, 15.0, 17.0, 18.0, 32.0, 54.0, 81.0, 157.0, 266.0, 451.0, 784.0, 1457.0, 2910.0, 6531.0, 16628.0, 47014.0, 141810.0, 475629.0, 1865893.0, 1189216.0, 297775.0, 93949.0, 31883.0, 12048.0, 4802.0, 2261.0, 1109.0, 635.0, 323.0, 195.0, 118.0, 74.0, 51.0, 33.0, 17.0, 11.0, 11.0, 9.0, 1.0, 6.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.413818359375, -0.4022636413574219, -0.39070892333984375, -0.3791542053222656, -0.3675994873046875, -0.3560447692871094, -0.34449005126953125, -0.3329353332519531, -0.321380615234375, -0.3098258972167969, -0.29827117919921875, -0.2867164611816406, -0.2751617431640625, -0.2636070251464844, -0.25205230712890625, -0.24049758911132812, -0.22894287109375, -0.21738815307617188, -0.20583343505859375, -0.19427871704101562, -0.1827239990234375, -0.17116928100585938, -0.15961456298828125, -0.14805984497070312, -0.136505126953125, -0.12495040893554688, -0.11339569091796875, -0.10184097290039062, -0.0902862548828125, -0.07873153686523438, -0.06717681884765625, -0.055622100830078125, -0.0440673828125, -0.032512664794921875, -0.02095794677734375, -0.009403228759765625, 0.0021514892578125, 0.013706207275390625, 0.02526092529296875, 0.036815643310546875, 0.048370361328125, 0.059925079345703125, 0.07147979736328125, 0.08303451538085938, 0.0945892333984375, 0.10614395141601562, 0.11769866943359375, 0.12925338745117188, 0.14080810546875, 0.15236282348632812, 0.16391754150390625, 0.17547225952148438, 0.1870269775390625, 0.19858169555664062, 0.21013641357421875, 0.22169113159179688, 0.233245849609375, 0.24480056762695312, 0.25635528564453125, 0.2679100036621094, 0.2794647216796875, 0.2910194396972656, 0.30257415771484375, 0.3141288757324219, 0.32568359375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 8.0, 5.0, 6.0, 6.0, 13.0, 15.0, 20.0, 30.0, 24.0, 40.0, 43.0, 56.0, 75.0, 95.0, 111.0, 149.0, 199.0, 275.0, 380.0, 455.0, 427.0, 334.0, 269.0, 221.0, 159.0, 134.0, 107.0, 94.0, 63.0, 54.0, 48.0, 40.0, 33.0, 19.0, 18.0, 15.0, 17.0, 9.0, 5.0, 2.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.301025390625, -0.2910041809082031, -0.28098297119140625, -0.2709617614746094, -0.2609405517578125, -0.2509193420410156, -0.24089813232421875, -0.23087692260742188, -0.220855712890625, -0.21083450317382812, -0.20081329345703125, -0.19079208374023438, -0.1807708740234375, -0.17074966430664062, -0.16072845458984375, -0.15070724487304688, -0.14068603515625, -0.13066482543945312, -0.12064361572265625, -0.11062240600585938, -0.1006011962890625, -0.09057998657226562, -0.08055877685546875, -0.07053756713867188, -0.060516357421875, -0.050495147705078125, -0.04047393798828125, -0.030452728271484375, -0.0204315185546875, -0.010410308837890625, -0.00038909912109375, 0.009632110595703125, 0.0196533203125, 0.029674530029296875, 0.03969573974609375, 0.049716949462890625, 0.0597381591796875, 0.06975936889648438, 0.07978057861328125, 0.08980178833007812, 0.099822998046875, 0.10984420776367188, 0.11986541748046875, 0.12988662719726562, 0.1399078369140625, 0.14992904663085938, 0.15995025634765625, 0.16997146606445312, 0.17999267578125, 0.19001388549804688, 0.20003509521484375, 0.21005630493164062, 0.2200775146484375, 0.23009872436523438, 0.24011993408203125, 0.2501411437988281, 0.260162353515625, 0.2701835632324219, 0.28020477294921875, 0.2902259826660156, 0.3002471923828125, 0.3102684020996094, 0.32028961181640625, 0.3303108215332031, 0.34033203125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 8.0, 25.0, 41.0, 99.0, 158.0, 190.0, 170.0, 129.0, 91.0, 44.0, 20.0, 5.0, 4.0, 2.0, 3.0, 2.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2965497970581055, -4.160928249359131, -4.0253071784973145, -3.88968563079834, -3.7540643215179443, -3.618443012237549, -3.482821464538574, -3.3472001552581787, -3.211578845977783, -3.0759575366973877, -2.940335988998413, -2.8047146797180176, -2.669093370437622, -2.5334720611572266, -2.397850513458252, -2.2622292041778564, -2.126607656478882, -1.9909862279891968, -1.8553649187088013, -1.7197434902191162, -1.5841221809387207, -1.4485007524490356, -1.3128793239593506, -1.177258014678955, -1.04163658618927, -0.9060152173042297, -0.7703938484191895, -0.6347724199295044, -0.4991510510444641, -0.36352968215942383, -0.22790825366973877, -0.09228688478469849, 0.0433344841003418, 0.17895586788654327, 0.31457725167274475, 0.4501986503601074, 0.5858200192451477, 0.721441388130188, 0.857062816619873, 0.9926841855049133, 1.1283055543899536, 1.2639269828796387, 1.3995482921600342, 1.5351697206497192, 1.6707911491394043, 1.8064124584197998, 1.9420338869094849, 2.07765531539917, 2.2132766246795654, 2.348897933959961, 2.4845194816589355, 2.620140790939331, 2.7557621002197266, 2.891383647918701, 3.0270049571990967, 3.162626266479492, 3.298247814178467, 3.4338691234588623, 3.569490671157837, 3.7051119804382324, 3.840733289718628, 3.9763545989990234, 4.111976146697998, 4.247597694396973, 4.383218765258789]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 8.0, 7.0, 4.0, 2.0, 6.0, 8.0, 12.0, 16.0, 13.0, 25.0, 16.0, 21.0, 34.0, 23.0, 29.0, 27.0, 28.0, 37.0, 28.0, 36.0, 23.0, 29.0, 45.0, 49.0, 45.0, 42.0, 34.0, 43.0, 36.0, 37.0, 44.0, 30.0, 25.0, 16.0, 23.0, 18.0, 16.0, 11.0, 10.0, 12.0, 7.0, 8.0, 5.0, 7.0, 5.0, 1.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1318919658660889, -1.0941553115844727, -1.0564186573028564, -1.0186818838119507, -0.9809452295303345, -0.9432085752487183, -0.9054718613624573, -0.8677351474761963, -0.8299984931945801, -0.7922618389129639, -0.7545251250267029, -0.7167884111404419, -0.6790517568588257, -0.6413151025772095, -0.6035783886909485, -0.5658416748046875, -0.5281050205230713, -0.4903683364391327, -0.4526316523551941, -0.4148949682712555, -0.3771582841873169, -0.3394216001033783, -0.3016849160194397, -0.2639482319355011, -0.2262115478515625, -0.1884748637676239, -0.1507381796836853, -0.1130014955997467, -0.0752648115158081, -0.03752812743186951, 0.0002085566520690918, 0.03794524073600769, 0.07568204402923584, 0.11341872811317444, 0.15115541219711304, 0.18889209628105164, 0.22662878036499023, 0.26436546444892883, 0.30210214853286743, 0.33983883261680603, 0.37757551670074463, 0.4153122007846832, 0.4530488848686218, 0.4907855689525604, 0.528522253036499, 0.5662589073181152, 0.6039956212043762, 0.6417323350906372, 0.6794689893722534, 0.7172056436538696, 0.7549423575401306, 0.7926790714263916, 0.8304157257080078, 0.868152379989624, 0.905889093875885, 0.943625807762146, 0.9813624620437622, 1.0190991163253784, 1.0568358898162842, 1.0945725440979004, 1.1323091983795166, 1.1700458526611328, 1.207782506942749, 1.2455192804336548, 1.283255934715271]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 1.0, 5.0, 2.0, 6.0, 5.0, 9.0, 24.0, 29.0, 44.0, 75.0, 118.0, 176.0, 275.0, 472.0, 706.0, 1189.0, 1962.0, 3244.0, 5487.0, 10520.0, 21100.0, 48176.0, 106037.0, 195253.0, 248292.0, 198750.0, 109464.0, 49979.0, 22163.0, 10614.0, 5755.0, 3279.0, 2021.0, 1298.0, 773.0, 456.0, 295.0, 175.0, 125.0, 75.0, 35.0, 45.0, 11.0, 18.0, 11.0, 5.0, 1.0, 2.0, 6.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.24365234375, -0.2361602783203125, -0.228668212890625, -0.2211761474609375, -0.21368408203125, -0.2061920166015625, -0.198699951171875, -0.1912078857421875, -0.1837158203125, -0.1762237548828125, -0.168731689453125, -0.1612396240234375, -0.15374755859375, -0.1462554931640625, -0.138763427734375, -0.1312713623046875, -0.123779296875, -0.1162872314453125, -0.108795166015625, -0.1013031005859375, -0.09381103515625, -0.0863189697265625, -0.078826904296875, -0.0713348388671875, -0.0638427734375, -0.0563507080078125, -0.048858642578125, -0.0413665771484375, -0.03387451171875, -0.0263824462890625, -0.018890380859375, -0.0113983154296875, -0.00390625, 0.0035858154296875, 0.011077880859375, 0.0185699462890625, 0.02606201171875, 0.0335540771484375, 0.041046142578125, 0.0485382080078125, 0.0560302734375, 0.0635223388671875, 0.071014404296875, 0.0785064697265625, 0.08599853515625, 0.0934906005859375, 0.100982666015625, 0.1084747314453125, 0.115966796875, 0.1234588623046875, 0.130950927734375, 0.1384429931640625, 0.14593505859375, 0.1534271240234375, 0.160919189453125, 0.1684112548828125, 0.1759033203125, 0.1833953857421875, 0.190887451171875, 0.1983795166015625, 0.20587158203125, 0.2133636474609375, 0.220855712890625, 0.2283477783203125, 0.23583984375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 6.0, 7.0, 7.0, 8.0, 11.0, 16.0, 13.0, 22.0, 22.0, 25.0, 16.0, 28.0, 22.0, 32.0, 41.0, 27.0, 44.0, 33.0, 55.0, 42.0, 49.0, 34.0, 43.0, 34.0, 35.0, 40.0, 37.0, 42.0, 24.0, 35.0, 23.0, 26.0, 21.0, 12.0, 15.0, 7.0, 13.0, 7.0, 3.0, 9.0, 4.0, 4.0, 5.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1746826171875, -0.1691436767578125, -0.163604736328125, -0.1580657958984375, -0.15252685546875, -0.1469879150390625, -0.141448974609375, -0.1359100341796875, -0.13037109375, -0.1248321533203125, -0.119293212890625, -0.1137542724609375, -0.10821533203125, -0.1026763916015625, -0.097137451171875, -0.0915985107421875, -0.0860595703125, -0.0805206298828125, -0.074981689453125, -0.0694427490234375, -0.06390380859375, -0.0583648681640625, -0.052825927734375, -0.0472869873046875, -0.041748046875, -0.0362091064453125, -0.030670166015625, -0.0251312255859375, -0.01959228515625, -0.0140533447265625, -0.008514404296875, -0.0029754638671875, 0.0025634765625, 0.0081024169921875, 0.013641357421875, 0.0191802978515625, 0.02471923828125, 0.0302581787109375, 0.035797119140625, 0.0413360595703125, 0.046875, 0.0524139404296875, 0.057952880859375, 0.0634918212890625, 0.06903076171875, 0.0745697021484375, 0.080108642578125, 0.0856475830078125, 0.0911865234375, 0.0967254638671875, 0.102264404296875, 0.1078033447265625, 0.11334228515625, 0.1188812255859375, 0.124420166015625, 0.1299591064453125, 0.135498046875, 0.1410369873046875, 0.146575927734375, 0.1521148681640625, 0.15765380859375, 0.1631927490234375, 0.168731689453125, 0.1742706298828125, 0.1798095703125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 4.0, 8.0, 5.0, 7.0, 10.0, 25.0, 17.0, 21.0, 25.0, 27.0, 58.0, 110.0, 106.0, 215.0, 343.0, 681.0, 1323.0, 2722.0, 5777.0, 14529.0, 43472.0, 145423.0, 340033.0, 313771.0, 121037.0, 36131.0, 12298.0, 5255.0, 2496.0, 1210.0, 536.0, 324.0, 182.0, 120.0, 74.0, 53.0, 34.0, 24.0, 27.0, 15.0, 7.0, 13.0, 4.0, 4.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31103515625, -0.3006401062011719, -0.29024505615234375, -0.2798500061035156, -0.2694549560546875, -0.2590599060058594, -0.24866485595703125, -0.23826980590820312, -0.227874755859375, -0.21747970581054688, -0.20708465576171875, -0.19668960571289062, -0.1862945556640625, -0.17589950561523438, -0.16550445556640625, -0.15510940551757812, -0.14471435546875, -0.13431930541992188, -0.12392425537109375, -0.11352920532226562, -0.1031341552734375, -0.09273910522460938, -0.08234405517578125, -0.07194900512695312, -0.061553955078125, -0.051158905029296875, -0.04076385498046875, -0.030368804931640625, -0.0199737548828125, -0.009578704833984375, 0.00081634521484375, 0.011211395263671875, 0.0216064453125, 0.032001495361328125, 0.04239654541015625, 0.052791595458984375, 0.0631866455078125, 0.07358169555664062, 0.08397674560546875, 0.09437179565429688, 0.104766845703125, 0.11516189575195312, 0.12555694580078125, 0.13595199584960938, 0.1463470458984375, 0.15674209594726562, 0.16713714599609375, 0.17753219604492188, 0.18792724609375, 0.19832229614257812, 0.20871734619140625, 0.21911239624023438, 0.2295074462890625, 0.23990249633789062, 0.25029754638671875, 0.2606925964355469, 0.271087646484375, 0.2814826965332031, 0.29187774658203125, 0.3022727966308594, 0.3126678466796875, 0.3230628967285156, 0.33345794677734375, 0.3438529968261719, 0.354248046875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 3.0, 7.0, 7.0, 9.0, 6.0, 8.0, 12.0, 21.0, 23.0, 20.0, 23.0, 25.0, 34.0, 30.0, 48.0, 48.0, 48.0, 39.0, 48.0, 41.0, 41.0, 36.0, 45.0, 48.0, 42.0, 45.0, 39.0, 43.0, 20.0, 19.0, 26.0, 18.0, 18.0, 18.0, 5.0, 9.0, 11.0, 8.0, 0.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5009765625, -0.48424530029296875, -0.4675140380859375, -0.45078277587890625, -0.434051513671875, -0.41732025146484375, -0.4005889892578125, -0.38385772705078125, -0.36712646484375, -0.35039520263671875, -0.3336639404296875, -0.31693267822265625, -0.300201416015625, -0.28347015380859375, -0.2667388916015625, -0.25000762939453125, -0.2332763671875, -0.21654510498046875, -0.1998138427734375, -0.18308258056640625, -0.166351318359375, -0.14962005615234375, -0.1328887939453125, -0.11615753173828125, -0.09942626953125, -0.08269500732421875, -0.0659637451171875, -0.04923248291015625, -0.032501220703125, -0.01576995849609375, 0.0009613037109375, 0.01769256591796875, 0.034423828125, 0.05115509033203125, 0.0678863525390625, 0.08461761474609375, 0.101348876953125, 0.11808013916015625, 0.1348114013671875, 0.15154266357421875, 0.16827392578125, 0.18500518798828125, 0.2017364501953125, 0.21846771240234375, 0.235198974609375, 0.25193023681640625, 0.2686614990234375, 0.28539276123046875, 0.3021240234375, 0.31885528564453125, 0.3355865478515625, 0.35231781005859375, 0.369049072265625, 0.38578033447265625, 0.4025115966796875, 0.41924285888671875, 0.43597412109375, 0.45270538330078125, 0.4694366455078125, 0.48616790771484375, 0.502899169921875, 0.5196304321289062, 0.5363616943359375, 0.5530929565429688, 0.56982421875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 16.0, 6.0, 10.0, 18.0, 25.0, 51.0, 67.0, 107.0, 142.0, 234.0, 424.0, 741.0, 1110.0, 2087.0, 3671.0, 6627.0, 12212.0, 23590.0, 48673.0, 100749.0, 186035.0, 243697.0, 197496.0, 110815.0, 53758.0, 26374.0, 13383.0, 7045.0, 3923.0, 2275.0, 1273.0, 747.0, 424.0, 266.0, 183.0, 95.0, 69.0, 53.0, 28.0, 21.0, 13.0, 5.0, 4.0, 7.0, 4.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.10748291015625, -0.10396671295166016, -0.10045051574707031, -0.09693431854248047, -0.09341812133789062, -0.08990192413330078, -0.08638572692871094, -0.0828695297241211, -0.07935333251953125, -0.0758371353149414, -0.07232093811035156, -0.06880474090576172, -0.06528854370117188, -0.06177234649658203, -0.05825614929199219, -0.054739952087402344, -0.0512237548828125, -0.047707557678222656, -0.04419136047363281, -0.04067516326904297, -0.037158966064453125, -0.03364276885986328, -0.030126571655273438, -0.026610374450683594, -0.02309417724609375, -0.019577980041503906, -0.016061782836914062, -0.012545585632324219, -0.009029388427734375, -0.005513191223144531, -0.0019969940185546875, 0.0015192031860351562, 0.005035400390625, 0.008551597595214844, 0.012067794799804688, 0.015583992004394531, 0.019100189208984375, 0.02261638641357422, 0.026132583618164062, 0.029648780822753906, 0.03316497802734375, 0.036681175231933594, 0.04019737243652344, 0.04371356964111328, 0.047229766845703125, 0.05074596405029297, 0.05426216125488281, 0.057778358459472656, 0.0612945556640625, 0.06481075286865234, 0.06832695007324219, 0.07184314727783203, 0.07535934448242188, 0.07887554168701172, 0.08239173889160156, 0.0859079360961914, 0.08942413330078125, 0.0929403305053711, 0.09645652770996094, 0.09997272491455078, 0.10348892211914062, 0.10700511932373047, 0.11052131652832031, 0.11403751373291016, 0.1175537109375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 6.0, 7.0, 20.0, 22.0, 33.0, 38.0, 43.0, 57.0, 82.0, 67.0, 85.0, 80.0, 83.0, 76.0, 75.0, 47.0, 49.0, 19.0, 17.0, 18.0, 18.0, 13.0, 10.0, 4.0, 3.0, 3.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 2.0], "bins": [-4.589557647705078e-05, -4.462432116270065e-05, -4.3353065848350525e-05, -4.20818105340004e-05, -4.081055521965027e-05, -3.953929990530014e-05, -3.826804459095001e-05, -3.6996789276599884e-05, -3.5725533962249756e-05, -3.445427864789963e-05, -3.31830233335495e-05, -3.191176801919937e-05, -3.064051270484924e-05, -2.9369257390499115e-05, -2.8098002076148987e-05, -2.682674676179886e-05, -2.555549144744873e-05, -2.4284236133098602e-05, -2.3012980818748474e-05, -2.1741725504398346e-05, -2.0470470190048218e-05, -1.919921487569809e-05, -1.792795956134796e-05, -1.6656704246997833e-05, -1.5385448932647705e-05, -1.4114193618297577e-05, -1.2842938303947449e-05, -1.157168298959732e-05, -1.0300427675247192e-05, -9.029172360897064e-06, -7.757917046546936e-06, -6.486661732196808e-06, -5.21540641784668e-06, -3.9441511034965515e-06, -2.6728957891464233e-06, -1.4016404747962952e-06, -1.30385160446167e-07, 1.1408701539039612e-06, 2.4121254682540894e-06, 3.6833807826042175e-06, 4.954636096954346e-06, 6.225891411304474e-06, 7.497146725654602e-06, 8.76840204000473e-06, 1.0039657354354858e-05, 1.1310912668704987e-05, 1.2582167983055115e-05, 1.3853423297405243e-05, 1.5124678611755371e-05, 1.63959339261055e-05, 1.7667189240455627e-05, 1.8938444554805756e-05, 2.0209699869155884e-05, 2.1480955183506012e-05, 2.275221049785614e-05, 2.402346581220627e-05, 2.5294721126556396e-05, 2.6565976440906525e-05, 2.7837231755256653e-05, 2.910848706960678e-05, 3.037974238395691e-05, 3.165099769830704e-05, 3.2922253012657166e-05, 3.4193508327007294e-05, 3.546476364135742e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 9.0, 13.0, 31.0, 69.0, 136.0, 346.0, 1075.0, 4424.0, 20275.0, 106555.0, 413507.0, 385044.0, 93729.0, 17945.0, 3882.0, 975.0, 307.0, 137.0, 57.0, 28.0, 9.0, 7.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2354736328125, -0.2273426055908203, -0.21921157836914062, -0.21108055114746094, -0.20294952392578125, -0.19481849670410156, -0.18668746948242188, -0.1785564422607422, -0.1704254150390625, -0.1622943878173828, -0.15416336059570312, -0.14603233337402344, -0.13790130615234375, -0.12977027893066406, -0.12163925170898438, -0.11350822448730469, -0.105377197265625, -0.09724617004394531, -0.08911514282226562, -0.08098411560058594, -0.07285308837890625, -0.06472206115722656, -0.056591033935546875, -0.04846000671386719, -0.0403289794921875, -0.03219795227050781, -0.024066925048828125, -0.015935897827148438, -0.00780487060546875, 0.0003261566162109375, 0.008457183837890625, 0.016588211059570312, 0.02471923828125, 0.03285026550292969, 0.040981292724609375, 0.04911231994628906, 0.05724334716796875, 0.06537437438964844, 0.07350540161132812, 0.08163642883300781, 0.0897674560546875, 0.09789848327636719, 0.10602951049804688, 0.11416053771972656, 0.12229156494140625, 0.13042259216308594, 0.13855361938476562, 0.1466846466064453, 0.154815673828125, 0.1629467010498047, 0.17107772827148438, 0.17920875549316406, 0.18733978271484375, 0.19547080993652344, 0.20360183715820312, 0.2117328643798828, 0.2198638916015625, 0.2279949188232422, 0.23612594604492188, 0.24425697326660156, 0.25238800048828125, 0.26051902770996094, 0.2686500549316406, 0.2767810821533203, 0.284912109375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 2.0, 3.0, 3.0, 8.0, 3.0, 8.0, 9.0, 16.0, 19.0, 13.0, 35.0, 38.0, 36.0, 50.0, 62.0, 73.0, 68.0, 78.0, 58.0, 86.0, 63.0, 43.0, 47.0, 31.0, 31.0, 27.0, 23.0, 13.0, 10.0, 11.0, 6.0, 4.0, 5.0, 4.0, 5.0, 3.0, 2.0, 7.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.136474609375, -0.13218307495117188, -0.12789154052734375, -0.12360000610351562, -0.1193084716796875, -0.11501693725585938, -0.11072540283203125, -0.10643386840820312, -0.102142333984375, -0.09785079956054688, -0.09355926513671875, -0.08926773071289062, -0.0849761962890625, -0.08068466186523438, -0.07639312744140625, -0.07210159301757812, -0.06781005859375, -0.06351852416992188, -0.05922698974609375, -0.054935455322265625, -0.0506439208984375, -0.046352386474609375, -0.04206085205078125, -0.037769317626953125, -0.033477783203125, -0.029186248779296875, -0.02489471435546875, -0.020603179931640625, -0.0163116455078125, -0.012020111083984375, -0.00772857666015625, -0.003437042236328125, 0.0008544921875, 0.005146026611328125, 0.00943756103515625, 0.013729095458984375, 0.0180206298828125, 0.022312164306640625, 0.02660369873046875, 0.030895233154296875, 0.035186767578125, 0.039478302001953125, 0.04376983642578125, 0.048061370849609375, 0.0523529052734375, 0.056644439697265625, 0.06093597412109375, 0.06522750854492188, 0.06951904296875, 0.07381057739257812, 0.07810211181640625, 0.08239364624023438, 0.0866851806640625, 0.09097671508789062, 0.09526824951171875, 0.09955978393554688, 0.103851318359375, 0.10814285278320312, 0.11243438720703125, 0.11672592163085938, 0.1210174560546875, 0.12530899047851562, 0.12960052490234375, 0.13389205932617188, 0.13818359375]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 7.0, 7.0, 14.0, 44.0, 62.0, 90.0, 139.0, 178.0, 157.0, 138.0, 77.0, 41.0, 22.0, 10.0, 8.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.9208884239196777, -2.8411672115325928, -2.761446237564087, -2.681725025177002, -2.602003812789917, -2.522282600402832, -2.442561626434326, -2.362840414047241, -2.2831192016601562, -2.2033979892730713, -2.1236770153045654, -2.0439558029174805, -1.9642345905303955, -1.8845134973526, -1.8047924041748047, -1.7250711917877197, -1.6453502178192139, -1.5656291246414185, -1.4859079122543335, -1.406186819076538, -1.3264656066894531, -1.2467445135116577, -1.1670234203338623, -1.0873022079467773, -1.007581114768982, -0.9278599619865417, -0.8481388092041016, -0.7684177160263062, -0.688696563243866, -0.6089754104614258, -0.5292543172836304, -0.4495331645011902, -0.3698122501373291, -0.2900910973548889, -0.21036997437477112, -0.13064883649349213, -0.050927698612213135, 0.02879345417022705, 0.10851457715034485, 0.18823570013046265, 0.26795685291290283, 0.347678005695343, 0.4273991286754608, 0.5071202516555786, 0.5868414044380188, 0.666562557220459, 0.7462836503982544, 0.8260048031806946, 0.9057259559631348, 0.985447108745575, 1.0651682615280151, 1.1448893547058105, 1.2246105670928955, 1.304331660270691, 1.3840527534484863, 1.4637739658355713, 1.5434950590133667, 1.623216152191162, 1.702937364578247, 1.7826584577560425, 1.862379550933838, 1.9421007633209229, 2.021821975708008, 2.1015429496765137, 2.1812641620635986]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 7.0, 5.0, 8.0, 9.0, 8.0, 7.0, 15.0, 19.0, 15.0, 21.0, 18.0, 18.0, 32.0, 24.0, 34.0, 41.0, 36.0, 36.0, 43.0, 44.0, 46.0, 51.0, 37.0, 41.0, 44.0, 44.0, 23.0, 29.0, 25.0, 37.0, 23.0, 27.0, 19.0, 19.0, 19.0, 15.0, 13.0, 22.0, 5.0, 8.0, 8.0, 5.0, 7.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.236580729484558, -1.1948776245117188, -1.1531745195388794, -1.11147141456604, -1.0697681903839111, -1.0280650854110718, -0.9863619804382324, -0.9446588754653931, -0.9029557704925537, -0.8612526655197144, -0.819549560546875, -0.7778463959693909, -0.7361432909965515, -0.6944401860237122, -0.652737021446228, -0.6110339164733887, -0.5693308115005493, -0.52762770652771, -0.4859245717525482, -0.4442214369773865, -0.4025183320045471, -0.36081522703170776, -0.319112092256546, -0.2774089574813843, -0.23570585250854492, -0.19400273263454437, -0.15229961276054382, -0.11059649288654327, -0.06889337301254272, -0.027190253138542175, 0.014512866735458374, 0.05621600151062012, 0.09791910648345947, 0.13962222635746002, 0.18132534623146057, 0.22302846610546112, 0.26473158597946167, 0.306434690952301, 0.34813782572746277, 0.3898409605026245, 0.43154406547546387, 0.4732471704483032, 0.5149502754211426, 0.5566534399986267, 0.5983565449714661, 0.6400596499443054, 0.6817628145217896, 0.7234659194946289, 0.7651690244674683, 0.8068721294403076, 0.848575234413147, 0.8902783989906311, 0.9319815039634705, 0.9736846089363098, 1.015387773513794, 1.0570908784866333, 1.0987939834594727, 1.140497088432312, 1.1822001934051514, 1.2239032983779907, 1.26560640335083, 1.307309627532959, 1.3490127325057983, 1.3907158374786377, 1.432418942451477]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 6.0, 4.0, 6.0, 5.0, 11.0, 19.0, 13.0, 26.0, 42.0, 72.0, 118.0, 165.0, 244.0, 413.0, 734.0, 1306.0, 2479.0, 4879.0, 9989.0, 22194.0, 51033.0, 124553.0, 327599.0, 892225.0, 1506460.0, 771961.0, 285670.0, 109533.0, 44720.0, 19661.0, 9014.0, 4281.0, 2128.0, 1138.0, 652.0, 363.0, 237.0, 122.0, 67.0, 54.0, 37.0, 26.0, 14.0, 3.0, 6.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.229248046875, -0.22295379638671875, -0.2166595458984375, -0.21036529541015625, -0.204071044921875, -0.19777679443359375, -0.1914825439453125, -0.18518829345703125, -0.17889404296875, -0.17259979248046875, -0.1663055419921875, -0.16001129150390625, -0.153717041015625, -0.14742279052734375, -0.1411285400390625, -0.13483428955078125, -0.1285400390625, -0.12224578857421875, -0.1159515380859375, -0.10965728759765625, -0.103363037109375, -0.09706878662109375, -0.0907745361328125, -0.08448028564453125, -0.07818603515625, -0.07189178466796875, -0.0655975341796875, -0.05930328369140625, -0.053009033203125, -0.04671478271484375, -0.0404205322265625, -0.03412628173828125, -0.02783203125, -0.02153778076171875, -0.0152435302734375, -0.00894927978515625, -0.002655029296875, 0.00363922119140625, 0.0099334716796875, 0.01622772216796875, 0.02252197265625, 0.02881622314453125, 0.0351104736328125, 0.04140472412109375, 0.047698974609375, 0.05399322509765625, 0.0602874755859375, 0.06658172607421875, 0.0728759765625, 0.07917022705078125, 0.0854644775390625, 0.09175872802734375, 0.098052978515625, 0.10434722900390625, 0.1106414794921875, 0.11693572998046875, 0.12322998046875, 0.12952423095703125, 0.1358184814453125, 0.14211273193359375, 0.148406982421875, 0.15470123291015625, 0.1609954833984375, 0.16728973388671875, 0.173583984375]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 3.0, 3.0, 4.0, 2.0, 2.0, 7.0, 8.0, 11.0, 12.0, 15.0, 17.0, 26.0, 22.0, 18.0, 33.0, 20.0, 28.0, 51.0, 41.0, 26.0, 45.0, 40.0, 50.0, 59.0, 66.0, 54.0, 33.0, 41.0, 34.0, 38.0, 25.0, 24.0, 23.0, 28.0, 18.0, 13.0, 17.0, 13.0, 11.0, 6.0, 9.0, 7.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2071533203125, -0.20105552673339844, -0.19495773315429688, -0.1888599395751953, -0.18276214599609375, -0.1766643524169922, -0.17056655883789062, -0.16446876525878906, -0.1583709716796875, -0.15227317810058594, -0.14617538452148438, -0.1400775909423828, -0.13397979736328125, -0.1278820037841797, -0.12178421020507812, -0.11568641662597656, -0.109588623046875, -0.10349082946777344, -0.09739303588867188, -0.09129524230957031, -0.08519744873046875, -0.07909965515136719, -0.07300186157226562, -0.06690406799316406, -0.0608062744140625, -0.05470848083496094, -0.048610687255859375, -0.04251289367675781, -0.03641510009765625, -0.030317306518554688, -0.024219512939453125, -0.018121719360351562, -0.01202392578125, -0.0059261322021484375, 0.000171661376953125, 0.0062694549560546875, 0.01236724853515625, 0.018465042114257812, 0.024562835693359375, 0.030660629272460938, 0.0367584228515625, 0.04285621643066406, 0.048954010009765625, 0.05505180358886719, 0.06114959716796875, 0.06724739074707031, 0.07334518432617188, 0.07944297790527344, 0.085540771484375, 0.09163856506347656, 0.09773635864257812, 0.10383415222167969, 0.10993194580078125, 0.11602973937988281, 0.12212753295898438, 0.12822532653808594, 0.1343231201171875, 0.14042091369628906, 0.14651870727539062, 0.1526165008544922, 0.15871429443359375, 0.1648120880126953, 0.17090988159179688, 0.17700767517089844, 0.18310546875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 8.0, 11.0, 12.0, 13.0, 17.0, 36.0, 38.0, 59.0, 126.0, 161.0, 354.0, 542.0, 1043.0, 1993.0, 4167.0, 9187.0, 21528.0, 53772.0, 142332.0, 428945.0, 1529831.0, 1394673.0, 388352.0, 131044.0, 49484.0, 19927.0, 8584.0, 3856.0, 1932.0, 976.0, 508.0, 290.0, 193.0, 105.0, 65.0, 39.0, 16.0, 18.0, 14.0, 7.0, 8.0, 5.0, 3.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2469482421875, -0.2381153106689453, -0.22928237915039062, -0.22044944763183594, -0.21161651611328125, -0.20278358459472656, -0.19395065307617188, -0.1851177215576172, -0.1762847900390625, -0.1674518585205078, -0.15861892700195312, -0.14978599548339844, -0.14095306396484375, -0.13212013244628906, -0.12328720092773438, -0.11445426940917969, -0.105621337890625, -0.09678840637207031, -0.08795547485351562, -0.07912254333496094, -0.07028961181640625, -0.06145668029785156, -0.052623748779296875, -0.04379081726074219, -0.0349578857421875, -0.026124954223632812, -0.017292022705078125, -0.008459091186523438, 0.00037384033203125, 0.009206771850585938, 0.018039703369140625, 0.026872634887695312, 0.03570556640625, 0.04453849792480469, 0.053371429443359375, 0.06220436096191406, 0.07103729248046875, 0.07987022399902344, 0.08870315551757812, 0.09753608703613281, 0.1063690185546875, 0.11520195007324219, 0.12403488159179688, 0.13286781311035156, 0.14170074462890625, 0.15053367614746094, 0.15936660766601562, 0.1681995391845703, 0.177032470703125, 0.1858654022216797, 0.19469833374023438, 0.20353126525878906, 0.21236419677734375, 0.22119712829589844, 0.23003005981445312, 0.2388629913330078, 0.2476959228515625, 0.2565288543701172, 0.2653617858886719, 0.27419471740722656, 0.28302764892578125, 0.29186058044433594, 0.3006935119628906, 0.3095264434814453, 0.318359375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 4.0, 9.0, 4.0, 11.0, 17.0, 12.0, 13.0, 19.0, 29.0, 34.0, 47.0, 60.0, 89.0, 100.0, 140.0, 160.0, 231.0, 279.0, 416.0, 480.0, 458.0, 359.0, 259.0, 181.0, 138.0, 117.0, 87.0, 67.0, 49.0, 42.0, 29.0, 32.0, 29.0, 17.0, 10.0, 9.0, 11.0, 3.0, 5.0, 9.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2861328125, -0.2771148681640625, -0.268096923828125, -0.2590789794921875, -0.25006103515625, -0.2410430908203125, -0.232025146484375, -0.2230072021484375, -0.2139892578125, -0.2049713134765625, -0.195953369140625, -0.1869354248046875, -0.17791748046875, -0.1688995361328125, -0.159881591796875, -0.1508636474609375, -0.141845703125, -0.1328277587890625, -0.123809814453125, -0.1147918701171875, -0.10577392578125, -0.0967559814453125, -0.087738037109375, -0.0787200927734375, -0.0697021484375, -0.0606842041015625, -0.051666259765625, -0.0426483154296875, -0.03363037109375, -0.0246124267578125, -0.015594482421875, -0.0065765380859375, 0.00244140625, 0.0114593505859375, 0.020477294921875, 0.0294952392578125, 0.03851318359375, 0.0475311279296875, 0.056549072265625, 0.0655670166015625, 0.0745849609375, 0.0836029052734375, 0.092620849609375, 0.1016387939453125, 0.11065673828125, 0.1196746826171875, 0.128692626953125, 0.1377105712890625, 0.146728515625, 0.1557464599609375, 0.164764404296875, 0.1737823486328125, 0.18280029296875, 0.1918182373046875, 0.200836181640625, 0.2098541259765625, 0.2188720703125, 0.2278900146484375, 0.236907958984375, 0.2459259033203125, 0.25494384765625, 0.2639617919921875, 0.272979736328125, 0.2819976806640625, 0.291015625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 5.0, 1.0, 4.0, 8.0, 10.0, 11.0, 17.0, 22.0, 45.0, 45.0, 67.0, 85.0, 110.0, 114.0, 109.0, 87.0, 64.0, 76.0, 48.0, 31.0, 19.0, 11.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.359570264816284, -2.2967381477355957, -2.233905792236328, -2.1710736751556396, -2.108241558074951, -2.0454092025756836, -1.9825770854949951, -1.919744849205017, -1.856912612915039, -1.794080376625061, -1.7312482595443726, -1.6684160232543945, -1.6055837869644165, -1.5427515506744385, -1.47991943359375, -1.417087197303772, -1.3542550802230835, -1.2914228439331055, -1.228590726852417, -1.165758490562439, -1.102926254272461, -1.0400941371917725, -0.9772619009017944, -0.9144296646118164, -0.8515974879264832, -0.7887653112411499, -0.7259330749511719, -0.6631008982658386, -0.6002687215805054, -0.5374364852905273, -0.4746043086051941, -0.41177210211753845, -0.3489398956298828, -0.2861076891422272, -0.22327549755573273, -0.16044330596923828, -0.09761109948158264, -0.034778892993927, 0.02805328369140625, 0.09088549017906189, 0.15371769666671753, 0.21654990315437317, 0.2793821096420288, 0.34221428632736206, 0.4050464928150177, 0.46787869930267334, 0.5307108759880066, 0.5935430526733398, 0.6563752889633179, 0.7192074656486511, 0.7820397019386292, 0.8448718786239624, 0.9077041149139404, 0.9705362915992737, 1.033368468284607, 1.096200704574585, 1.1590328216552734, 1.2218650579452515, 1.28469717502594, 1.347529411315918, 1.410361647605896, 1.473193883895874, 1.5360260009765625, 1.5988582372665405, 1.6616904735565186]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 3.0, 4.0, 2.0, 6.0, 5.0, 1.0, 8.0, 15.0, 12.0, 15.0, 11.0, 21.0, 23.0, 37.0, 17.0, 29.0, 35.0, 31.0, 37.0, 48.0, 48.0, 45.0, 36.0, 45.0, 43.0, 51.0, 40.0, 41.0, 32.0, 38.0, 25.0, 17.0, 22.0, 23.0, 24.0, 24.0, 17.0, 11.0, 13.0, 11.0, 7.0, 13.0, 8.0, 5.0, 2.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.9790079593658447, -0.9467331767082214, -0.9144583940505981, -0.8821836709976196, -0.8499088883399963, -0.817634105682373, -0.7853593826293945, -0.7530845999717712, -0.720809817314148, -0.6885350346565247, -0.6562602519989014, -0.6239855289459229, -0.5917107462882996, -0.5594359636306763, -0.5271612405776978, -0.49488645792007446, -0.46261167526245117, -0.4303368926048279, -0.398062139749527, -0.3657873868942261, -0.3335126042366028, -0.3012378215789795, -0.2689630687236786, -0.2366883009672165, -0.2044135332107544, -0.1721387654542923, -0.1398639976978302, -0.1075892299413681, -0.075314462184906, -0.04303969442844391, -0.010764926671981812, 0.021509841084480286, 0.053784728050231934, 0.08605949580669403, 0.11833426356315613, 0.15060903131961823, 0.18288379907608032, 0.21515856683254242, 0.24743333458900452, 0.2797080874443054, 0.3119828701019287, 0.344257652759552, 0.3765324056148529, 0.4088071584701538, 0.4410819411277771, 0.4733567237854004, 0.5056314468383789, 0.5379062294960022, 0.5701810121536255, 0.6024557948112488, 0.6347305774688721, 0.6670053005218506, 0.6992800831794739, 0.7315548658370972, 0.7638295888900757, 0.796104371547699, 0.8283791542053223, 0.8606539368629456, 0.8929287195205688, 0.9252034425735474, 0.9574782252311707, 0.989753007888794, 1.0220277309417725, 1.0543025732040405, 1.086577296257019]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 3.0, 3.0, 12.0, 5.0, 18.0, 13.0, 19.0, 43.0, 43.0, 71.0, 99.0, 168.0, 306.0, 457.0, 755.0, 1326.0, 2278.0, 4061.0, 7288.0, 14374.0, 31695.0, 84459.0, 214990.0, 326806.0, 213049.0, 83522.0, 31760.0, 14234.0, 7165.0, 3930.0, 2295.0, 1359.0, 729.0, 455.0, 254.0, 171.0, 107.0, 72.0, 60.0, 23.0, 22.0, 18.0, 6.0, 13.0, 6.0, 8.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.306396484375, -0.29634857177734375, -0.2863006591796875, -0.27625274658203125, -0.266204833984375, -0.25615692138671875, -0.2461090087890625, -0.23606109619140625, -0.22601318359375, -0.21596527099609375, -0.2059173583984375, -0.19586944580078125, -0.185821533203125, -0.17577362060546875, -0.1657257080078125, -0.15567779541015625, -0.1456298828125, -0.13558197021484375, -0.1255340576171875, -0.11548614501953125, -0.105438232421875, -0.09539031982421875, -0.0853424072265625, -0.07529449462890625, -0.06524658203125, -0.05519866943359375, -0.0451507568359375, -0.03510284423828125, -0.025054931640625, -0.01500701904296875, -0.0049591064453125, 0.00508880615234375, 0.01513671875, 0.02518463134765625, 0.0352325439453125, 0.04528045654296875, 0.055328369140625, 0.06537628173828125, 0.0754241943359375, 0.08547210693359375, 0.09552001953125, 0.10556793212890625, 0.1156158447265625, 0.12566375732421875, 0.135711669921875, 0.14575958251953125, 0.1558074951171875, 0.16585540771484375, 0.1759033203125, 0.18595123291015625, 0.1959991455078125, 0.20604705810546875, 0.216094970703125, 0.22614288330078125, 0.2361907958984375, 0.24623870849609375, 0.25628662109375, 0.26633453369140625, 0.2763824462890625, 0.28643035888671875, 0.296478271484375, 0.30652618408203125, 0.3165740966796875, 0.32662200927734375, 0.336669921875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 7.0, 6.0, 11.0, 8.0, 11.0, 16.0, 17.0, 20.0, 30.0, 19.0, 26.0, 42.0, 38.0, 28.0, 32.0, 35.0, 37.0, 40.0, 43.0, 32.0, 44.0, 43.0, 47.0, 33.0, 48.0, 41.0, 31.0, 36.0, 28.0, 26.0, 19.0, 15.0, 18.0, 16.0, 8.0, 14.0, 8.0, 7.0, 7.0, 2.0, 1.0, 2.0, 7.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.2005615234375, -0.1947784423828125, -0.188995361328125, -0.1832122802734375, -0.17742919921875, -0.1716461181640625, -0.165863037109375, -0.1600799560546875, -0.154296875, -0.1485137939453125, -0.142730712890625, -0.1369476318359375, -0.13116455078125, -0.1253814697265625, -0.119598388671875, -0.1138153076171875, -0.1080322265625, -0.1022491455078125, -0.096466064453125, -0.0906829833984375, -0.08489990234375, -0.0791168212890625, -0.073333740234375, -0.0675506591796875, -0.061767578125, -0.0559844970703125, -0.050201416015625, -0.0444183349609375, -0.03863525390625, -0.0328521728515625, -0.027069091796875, -0.0212860107421875, -0.0155029296875, -0.0097198486328125, -0.003936767578125, 0.0018463134765625, 0.00762939453125, 0.0134124755859375, 0.019195556640625, 0.0249786376953125, 0.03076171875, 0.0365447998046875, 0.042327880859375, 0.0481109619140625, 0.05389404296875, 0.0596771240234375, 0.065460205078125, 0.0712432861328125, 0.0770263671875, 0.0828094482421875, 0.088592529296875, 0.0943756103515625, 0.10015869140625, 0.1059417724609375, 0.111724853515625, 0.1175079345703125, 0.123291015625, 0.1290740966796875, 0.134857177734375, 0.1406402587890625, 0.14642333984375, 0.1522064208984375, 0.157989501953125, 0.1637725830078125, 0.1695556640625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 12.0, 9.0, 16.0, 21.0, 35.0, 43.0, 91.0, 149.0, 294.0, 539.0, 1030.0, 2112.0, 4016.0, 8497.0, 19695.0, 59063.0, 209817.0, 418023.0, 223544.0, 63101.0, 20883.0, 8859.0, 4269.0, 2112.0, 1077.0, 545.0, 328.0, 145.0, 81.0, 49.0, 37.0, 18.0, 12.0, 15.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.349853515625, -0.33800506591796875, -0.3261566162109375, -0.31430816650390625, -0.302459716796875, -0.29061126708984375, -0.2787628173828125, -0.26691436767578125, -0.25506591796875, -0.24321746826171875, -0.2313690185546875, -0.21952056884765625, -0.207672119140625, -0.19582366943359375, -0.1839752197265625, -0.17212677001953125, -0.1602783203125, -0.14842987060546875, -0.1365814208984375, -0.12473297119140625, -0.112884521484375, -0.10103607177734375, -0.0891876220703125, -0.07733917236328125, -0.06549072265625, -0.05364227294921875, -0.0417938232421875, -0.02994537353515625, -0.018096923828125, -0.00624847412109375, 0.0055999755859375, 0.01744842529296875, 0.029296875, 0.04114532470703125, 0.0529937744140625, 0.06484222412109375, 0.076690673828125, 0.08853912353515625, 0.1003875732421875, 0.11223602294921875, 0.12408447265625, 0.13593292236328125, 0.1477813720703125, 0.15962982177734375, 0.171478271484375, 0.18332672119140625, 0.1951751708984375, 0.20702362060546875, 0.2188720703125, 0.23072052001953125, 0.2425689697265625, 0.25441741943359375, 0.266265869140625, 0.27811431884765625, 0.2899627685546875, 0.30181121826171875, 0.31365966796875, 0.32550811767578125, 0.3373565673828125, 0.34920501708984375, 0.361053466796875, 0.37290191650390625, 0.3847503662109375, 0.39659881591796875, 0.408447265625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 12.0, 10.0, 8.0, 12.0, 17.0, 16.0, 27.0, 19.0, 20.0, 35.0, 34.0, 44.0, 43.0, 37.0, 53.0, 44.0, 46.0, 67.0, 43.0, 50.0, 48.0, 48.0, 39.0, 39.0, 32.0, 28.0, 22.0, 20.0, 18.0, 10.0, 16.0, 4.0, 10.0, 8.0, 10.0, 2.0, 5.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.66943359375, -0.6508560180664062, -0.6322784423828125, -0.6137008666992188, -0.595123291015625, -0.5765457153320312, -0.5579681396484375, -0.5393905639648438, -0.52081298828125, -0.5022354125976562, -0.4836578369140625, -0.46508026123046875, -0.446502685546875, -0.42792510986328125, -0.4093475341796875, -0.39076995849609375, -0.3721923828125, -0.35361480712890625, -0.3350372314453125, -0.31645965576171875, -0.297882080078125, -0.27930450439453125, -0.2607269287109375, -0.24214935302734375, -0.22357177734375, -0.20499420166015625, -0.1864166259765625, -0.16783905029296875, -0.149261474609375, -0.13068389892578125, -0.1121063232421875, -0.09352874755859375, -0.074951171875, -0.05637359619140625, -0.0377960205078125, -0.01921844482421875, -0.000640869140625, 0.01793670654296875, 0.0365142822265625, 0.05509185791015625, 0.07366943359375, 0.09224700927734375, 0.1108245849609375, 0.12940216064453125, 0.147979736328125, 0.16655731201171875, 0.1851348876953125, 0.20371246337890625, 0.2222900390625, 0.24086761474609375, 0.2594451904296875, 0.27802276611328125, 0.296600341796875, 0.31517791748046875, 0.3337554931640625, 0.35233306884765625, 0.37091064453125, 0.38948822021484375, 0.4080657958984375, 0.42664337158203125, 0.445220947265625, 0.46379852294921875, 0.4823760986328125, 0.5009536743164062, 0.51953125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 7.0, 9.0, 17.0, 28.0, 47.0, 52.0, 113.0, 196.0, 308.0, 516.0, 710.0, 1292.0, 2089.0, 3404.0, 5709.0, 9849.0, 17936.0, 35089.0, 78501.0, 172347.0, 281881.0, 225050.0, 109847.0, 49427.0, 23679.0, 12588.0, 7191.0, 4229.0, 2517.0, 1573.0, 886.0, 573.0, 366.0, 204.0, 121.0, 71.0, 53.0, 33.0, 17.0, 19.0, 5.0, 4.0, 2.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1212158203125, -0.11772346496582031, -0.11423110961914062, -0.11073875427246094, -0.10724639892578125, -0.10375404357910156, -0.10026168823242188, -0.09676933288574219, -0.0932769775390625, -0.08978462219238281, -0.08629226684570312, -0.08279991149902344, -0.07930755615234375, -0.07581520080566406, -0.07232284545898438, -0.06883049011230469, -0.065338134765625, -0.06184577941894531, -0.058353424072265625, -0.05486106872558594, -0.05136871337890625, -0.04787635803222656, -0.044384002685546875, -0.04089164733886719, -0.0373992919921875, -0.03390693664550781, -0.030414581298828125, -0.026922225952148438, -0.02342987060546875, -0.019937515258789062, -0.016445159912109375, -0.012952804565429688, -0.00946044921875, -0.0059680938720703125, -0.002475738525390625, 0.0010166168212890625, 0.00450897216796875, 0.008001327514648438, 0.011493682861328125, 0.014986038208007812, 0.0184783935546875, 0.021970748901367188, 0.025463104248046875, 0.028955459594726562, 0.03244781494140625, 0.03594017028808594, 0.039432525634765625, 0.04292488098144531, 0.046417236328125, 0.04990959167480469, 0.053401947021484375, 0.05689430236816406, 0.06038665771484375, 0.06387901306152344, 0.06737136840820312, 0.07086372375488281, 0.0743560791015625, 0.07784843444824219, 0.08134078979492188, 0.08483314514160156, 0.08832550048828125, 0.09181785583496094, 0.09531021118164062, 0.09880256652832031, 0.102294921875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 1.0, 3.0, 3.0, 4.0, 6.0, 6.0, 8.0, 14.0, 20.0, 26.0, 38.0, 51.0, 56.0, 68.0, 94.0, 97.0, 90.0, 87.0, 69.0, 59.0, 41.0, 40.0, 26.0, 19.0, 15.0, 11.0, 7.0, 11.0, 7.0, 6.0, 3.0, 1.0, 2.0, 5.0, 0.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.451108932495117e-05, -3.31830233335495e-05, -3.185495734214783e-05, -3.0526891350746155e-05, -2.9198825359344482e-05, -2.787075936794281e-05, -2.6542693376541138e-05, -2.5214627385139465e-05, -2.3886561393737793e-05, -2.255849540233612e-05, -2.1230429410934448e-05, -1.9902363419532776e-05, -1.8574297428131104e-05, -1.724623143672943e-05, -1.591816544532776e-05, -1.4590099453926086e-05, -1.3262033462524414e-05, -1.1933967471122742e-05, -1.060590147972107e-05, -9.277835488319397e-06, -7.949769496917725e-06, -6.621703505516052e-06, -5.29363751411438e-06, -3.9655715227127075e-06, -2.637505531311035e-06, -1.3094395399093628e-06, 1.862645149230957e-08, 1.346692442893982e-06, 2.6747584342956543e-06, 4.002824425697327e-06, 5.330890417098999e-06, 6.658956408500671e-06, 7.987022399902344e-06, 9.315088391304016e-06, 1.0643154382705688e-05, 1.197122037410736e-05, 1.3299286365509033e-05, 1.4627352356910706e-05, 1.5955418348312378e-05, 1.728348433971405e-05, 1.8611550331115723e-05, 1.9939616322517395e-05, 2.1267682313919067e-05, 2.259574830532074e-05, 2.3923814296722412e-05, 2.5251880288124084e-05, 2.6579946279525757e-05, 2.790801227092743e-05, 2.92360782623291e-05, 3.0564144253730774e-05, 3.1892210245132446e-05, 3.322027623653412e-05, 3.454834222793579e-05, 3.587640821933746e-05, 3.7204474210739136e-05, 3.853254020214081e-05, 3.986060619354248e-05, 4.118867218494415e-05, 4.2516738176345825e-05, 4.38448041677475e-05, 4.517287015914917e-05, 4.650093615055084e-05, 4.7829002141952515e-05, 4.915706813335419e-05, 5.048513412475586e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 2.0, 3.0, 4.0, 4.0, 17.0, 12.0, 16.0, 25.0, 43.0, 67.0, 118.0, 163.0, 293.0, 464.0, 816.0, 1375.0, 2319.0, 3963.0, 7287.0, 12682.0, 23523.0, 43793.0, 83034.0, 148409.0, 213471.0, 207067.0, 136061.0, 75682.0, 39616.0, 20969.0, 11724.0, 6559.0, 3723.0, 2156.0, 1238.0, 751.0, 415.0, 260.0, 155.0, 100.0, 55.0, 45.0, 23.0, 16.0, 15.0, 10.0, 5.0, 4.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0831298828125, -0.08015251159667969, -0.07717514038085938, -0.07419776916503906, -0.07122039794921875, -0.06824302673339844, -0.06526565551757812, -0.06228828430175781, -0.0593109130859375, -0.05633354187011719, -0.053356170654296875, -0.05037879943847656, -0.04740142822265625, -0.04442405700683594, -0.041446685791015625, -0.03846931457519531, -0.035491943359375, -0.03251457214355469, -0.029537200927734375, -0.026559829711914062, -0.02358245849609375, -0.020605087280273438, -0.017627716064453125, -0.014650344848632812, -0.0116729736328125, -0.008695602416992188, -0.005718231201171875, -0.0027408599853515625, 0.00023651123046875, 0.0032138824462890625, 0.006191253662109375, 0.009168624877929688, 0.01214599609375, 0.015123367309570312, 0.018100738525390625, 0.021078109741210938, 0.02405548095703125, 0.027032852172851562, 0.030010223388671875, 0.03298759460449219, 0.0359649658203125, 0.03894233703613281, 0.041919708251953125, 0.04489707946777344, 0.04787445068359375, 0.05085182189941406, 0.053829193115234375, 0.05680656433105469, 0.059783935546875, 0.06276130676269531, 0.06573867797851562, 0.06871604919433594, 0.07169342041015625, 0.07467079162597656, 0.07764816284179688, 0.08062553405761719, 0.0836029052734375, 0.08658027648925781, 0.08955764770507812, 0.09253501892089844, 0.09551239013671875, 0.09848976135253906, 0.10146713256835938, 0.10444450378417969, 0.107421875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 5.0, 5.0, 3.0, 8.0, 4.0, 14.0, 17.0, 15.0, 32.0, 46.0, 48.0, 70.0, 89.0, 96.0, 109.0, 78.0, 93.0, 71.0, 45.0, 49.0, 17.0, 22.0, 17.0, 5.0, 11.0, 11.0, 5.0, 3.0, 9.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.2010498046875, -0.1955108642578125, -0.189971923828125, -0.1844329833984375, -0.17889404296875, -0.1733551025390625, -0.167816162109375, -0.1622772216796875, -0.15673828125, -0.1511993408203125, -0.145660400390625, -0.1401214599609375, -0.13458251953125, -0.1290435791015625, -0.123504638671875, -0.1179656982421875, -0.1124267578125, -0.1068878173828125, -0.101348876953125, -0.0958099365234375, -0.09027099609375, -0.0847320556640625, -0.079193115234375, -0.0736541748046875, -0.068115234375, -0.0625762939453125, -0.057037353515625, -0.0514984130859375, -0.04595947265625, -0.0404205322265625, -0.034881591796875, -0.0293426513671875, -0.0238037109375, -0.0182647705078125, -0.012725830078125, -0.0071868896484375, -0.00164794921875, 0.0038909912109375, 0.009429931640625, 0.0149688720703125, 0.0205078125, 0.0260467529296875, 0.031585693359375, 0.0371246337890625, 0.04266357421875, 0.0482025146484375, 0.053741455078125, 0.0592803955078125, 0.0648193359375, 0.0703582763671875, 0.075897216796875, 0.0814361572265625, 0.08697509765625, 0.0925140380859375, 0.098052978515625, 0.1035919189453125, 0.109130859375, 0.1146697998046875, 0.120208740234375, 0.1257476806640625, 0.13128662109375, 0.1368255615234375, 0.142364501953125, 0.1479034423828125, 0.1534423828125]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 5.0, 15.0, 31.0, 67.0, 128.0, 244.0, 227.0, 137.0, 75.0, 43.0, 17.0, 4.0, 4.0, 3.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3535819053649902, -2.236393690109253, -2.1192054748535156, -2.002017021179199, -1.884828805923462, -1.7676405906677246, -1.6504523754119873, -1.5332640409469604, -1.4160757064819336, -1.2988874912261963, -1.1816991567611694, -1.0645109415054321, -0.9473226070404053, -0.830134391784668, -0.7129461169242859, -0.5957578420639038, -0.4785696268081665, -0.3613813519477844, -0.24419309198856354, -0.12700483202934265, -0.009816557168960571, 0.10737168788909912, 0.2245599627494812, 0.3417482376098633, 0.45893651247024536, 0.5761247873306274, 0.6933130621910095, 0.8105013370513916, 0.9276895523071289, 1.0448777675628662, 1.162066102027893, 1.27925443649292, 1.3964426517486572, 1.5136308670043945, 1.6308192014694214, 1.7480074167251587, 1.8651957511901855, 1.9823839664459229, 2.09957218170166, 2.2167606353759766, 2.333948850631714, 2.451137065887451, 2.5683252811431885, 2.685513734817505, 2.802701950073242, 2.9198901653289795, 3.037078380584717, 3.154266834259033, 3.2714548110961914, 3.3886430263519287, 3.505831241607666, 3.6230196952819824, 3.7402079105377197, 3.857396125793457, 3.9745843410491943, 4.091772556304932, 4.208961009979248, 4.3261494636535645, 4.443337440490723, 4.560525894165039, 4.677713871002197, 4.794902324676514, 4.91209077835083, 5.029278755187988, 5.146467208862305]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 2.0, 7.0, 7.0, 9.0, 11.0, 16.0, 12.0, 24.0, 25.0, 23.0, 37.0, 44.0, 42.0, 36.0, 43.0, 37.0, 46.0, 62.0, 51.0, 36.0, 46.0, 53.0, 42.0, 47.0, 45.0, 28.0, 26.0, 21.0, 21.0, 18.0, 19.0, 13.0, 12.0, 9.0, 7.0, 12.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4980342388153076, -1.451537847518921, -1.4050415754318237, -1.358545184135437, -1.3120489120483398, -1.2655525207519531, -1.2190561294555664, -1.1725598573684692, -1.1260634660720825, -1.0795670747756958, -1.0330708026885986, -0.9865744113922119, -0.94007807970047, -0.893581748008728, -0.8470854163169861, -0.8005890846252441, -0.7540927529335022, -0.7075964212417603, -0.6611000895500183, -0.6146037578582764, -0.5681073665618896, -0.5216110348701477, -0.47511470317840576, -0.42861834168434143, -0.3821220099925995, -0.33562567830085754, -0.2891293168067932, -0.24263298511505127, -0.19613663852214813, -0.149640291929245, -0.10314396023750305, -0.05664759874343872, -0.010151267051696777, 0.03634507581591606, 0.0828414186835289, 0.12933775782585144, 0.17583410441875458, 0.22233045101165771, 0.26882678270339966, 0.315323144197464, 0.36181947588920593, 0.4083158075809479, 0.4548121690750122, 0.5013085007667542, 0.5478048324584961, 0.5943012237548828, 0.64079749584198, 0.6872938871383667, 0.7337902188301086, 0.7802865505218506, 0.8267828822135925, 0.8732792139053345, 0.9197756052017212, 0.9662719368934631, 1.012768268585205, 1.0592646598815918, 1.105760931968689, 1.1522573232650757, 1.1987535953521729, 1.2452499866485596, 1.2917462587356567, 1.3382426500320435, 1.3847389221191406, 1.4312353134155273, 1.477731704711914]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 7.0, 1.0, 11.0, 8.0, 12.0, 12.0, 24.0, 25.0, 43.0, 86.0, 159.0, 238.0, 403.0, 730.0, 1298.0, 2472.0, 5242.0, 11496.0, 26838.0, 67211.0, 179277.0, 492965.0, 1177434.0, 1288945.0, 586655.0, 215196.0, 80096.0, 32135.0, 13377.0, 5978.0, 2798.0, 1393.0, 716.0, 415.0, 212.0, 144.0, 81.0, 50.0, 37.0, 27.0, 16.0, 5.0, 5.0, 3.0, 5.0, 3.0, 0.0, 0.0, 1.0, 3.0, 1.0], "bins": [-0.2415771484375, -0.23488235473632812, -0.22818756103515625, -0.22149276733398438, -0.2147979736328125, -0.20810317993164062, -0.20140838623046875, -0.19471359252929688, -0.188018798828125, -0.18132400512695312, -0.17462921142578125, -0.16793441772460938, -0.1612396240234375, -0.15454483032226562, -0.14785003662109375, -0.14115524291992188, -0.13446044921875, -0.12776565551757812, -0.12107086181640625, -0.11437606811523438, -0.1076812744140625, -0.10098648071289062, -0.09429168701171875, -0.08759689331054688, -0.080902099609375, -0.07420730590820312, -0.06751251220703125, -0.060817718505859375, -0.0541229248046875, -0.047428131103515625, -0.04073333740234375, -0.034038543701171875, -0.02734375, -0.020648956298828125, -0.01395416259765625, -0.007259368896484375, -0.0005645751953125, 0.006130218505859375, 0.01282501220703125, 0.019519805908203125, 0.026214599609375, 0.032909393310546875, 0.03960418701171875, 0.046298980712890625, 0.0529937744140625, 0.059688568115234375, 0.06638336181640625, 0.07307815551757812, 0.07977294921875, 0.08646774291992188, 0.09316253662109375, 0.09985733032226562, 0.1065521240234375, 0.11324691772460938, 0.11994171142578125, 0.12663650512695312, 0.133331298828125, 0.14002609252929688, 0.14672088623046875, 0.15341567993164062, 0.1601104736328125, 0.16680526733398438, 0.17350006103515625, 0.18019485473632812, 0.1868896484375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 1.0, 2.0, 6.0, 4.0, 6.0, 6.0, 13.0, 17.0, 8.0, 19.0, 30.0, 22.0, 29.0, 26.0, 33.0, 37.0, 33.0, 54.0, 31.0, 31.0, 45.0, 49.0, 51.0, 36.0, 58.0, 37.0, 43.0, 43.0, 36.0, 40.0, 27.0, 19.0, 26.0, 18.0, 18.0, 14.0, 9.0, 5.0, 6.0, 4.0, 5.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2078857421875, -0.2017078399658203, -0.19552993774414062, -0.18935203552246094, -0.18317413330078125, -0.17699623107910156, -0.17081832885742188, -0.1646404266357422, -0.1584625244140625, -0.1522846221923828, -0.14610671997070312, -0.13992881774902344, -0.13375091552734375, -0.12757301330566406, -0.12139511108398438, -0.11521720886230469, -0.109039306640625, -0.10286140441894531, -0.09668350219726562, -0.09050559997558594, -0.08432769775390625, -0.07814979553222656, -0.07197189331054688, -0.06579399108886719, -0.0596160888671875, -0.05343818664550781, -0.047260284423828125, -0.04108238220214844, -0.03490447998046875, -0.028726577758789062, -0.022548675537109375, -0.016370773315429688, -0.01019287109375, -0.0040149688720703125, 0.002162933349609375, 0.008340835571289062, 0.01451873779296875, 0.020696640014648438, 0.026874542236328125, 0.03305244445800781, 0.0392303466796875, 0.04540824890136719, 0.051586151123046875, 0.05776405334472656, 0.06394195556640625, 0.07011985778808594, 0.07629776000976562, 0.08247566223144531, 0.088653564453125, 0.09483146667480469, 0.10100936889648438, 0.10718727111816406, 0.11336517333984375, 0.11954307556152344, 0.12572097778320312, 0.1318988800048828, 0.1380767822265625, 0.1442546844482422, 0.15043258666992188, 0.15661048889160156, 0.16278839111328125, 0.16896629333496094, 0.17514419555664062, 0.1813220977783203, 0.1875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 7.0, 8.0, 8.0, 12.0, 10.0, 23.0, 31.0, 53.0, 75.0, 85.0, 135.0, 213.0, 348.0, 561.0, 1049.0, 1935.0, 3744.0, 7582.0, 15524.0, 35040.0, 82108.0, 207316.0, 576024.0, 1475307.0, 1131031.0, 396553.0, 148531.0, 60373.0, 26014.0, 12118.0, 5723.0, 2933.0, 1543.0, 854.0, 532.0, 318.0, 201.0, 122.0, 74.0, 44.0, 28.0, 25.0, 25.0, 14.0, 11.0, 6.0, 4.0, 0.0, 5.0, 1.0, 3.0, 2.0, 2.0, 1.0], "bins": [-0.260498046875, -0.2527961730957031, -0.24509429931640625, -0.23739242553710938, -0.2296905517578125, -0.22198867797851562, -0.21428680419921875, -0.20658493041992188, -0.198883056640625, -0.19118118286132812, -0.18347930908203125, -0.17577743530273438, -0.1680755615234375, -0.16037368774414062, -0.15267181396484375, -0.14496994018554688, -0.13726806640625, -0.12956619262695312, -0.12186431884765625, -0.11416244506835938, -0.1064605712890625, -0.09875869750976562, -0.09105682373046875, -0.08335494995117188, -0.075653076171875, -0.06795120239257812, -0.06024932861328125, -0.052547454833984375, -0.0448455810546875, -0.037143707275390625, -0.02944183349609375, -0.021739959716796875, -0.0140380859375, -0.006336212158203125, 0.00136566162109375, 0.009067535400390625, 0.0167694091796875, 0.024471282958984375, 0.03217315673828125, 0.039875030517578125, 0.047576904296875, 0.055278778076171875, 0.06298065185546875, 0.07068252563476562, 0.0783843994140625, 0.08608627319335938, 0.09378814697265625, 0.10149002075195312, 0.10919189453125, 0.11689376831054688, 0.12459564208984375, 0.13229751586914062, 0.1399993896484375, 0.14770126342773438, 0.15540313720703125, 0.16310501098632812, 0.170806884765625, 0.17850875854492188, 0.18621063232421875, 0.19391250610351562, 0.2016143798828125, 0.20931625366210938, 0.21701812744140625, 0.22472000122070312, 0.232421875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 3.0, 3.0, 9.0, 6.0, 9.0, 13.0, 14.0, 19.0, 25.0, 33.0, 36.0, 54.0, 83.0, 89.0, 116.0, 144.0, 203.0, 219.0, 290.0, 376.0, 435.0, 402.0, 337.0, 221.0, 198.0, 175.0, 126.0, 99.0, 66.0, 63.0, 54.0, 46.0, 22.0, 22.0, 14.0, 13.0, 12.0, 6.0, 7.0, 4.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.30419921875, -0.2951469421386719, -0.28609466552734375, -0.2770423889160156, -0.2679901123046875, -0.2589378356933594, -0.24988555908203125, -0.24083328247070312, -0.231781005859375, -0.22272872924804688, -0.21367645263671875, -0.20462417602539062, -0.1955718994140625, -0.18651962280273438, -0.17746734619140625, -0.16841506958007812, -0.15936279296875, -0.15031051635742188, -0.14125823974609375, -0.13220596313476562, -0.1231536865234375, -0.11410140991210938, -0.10504913330078125, -0.09599685668945312, -0.086944580078125, -0.07789230346679688, -0.06884002685546875, -0.059787750244140625, -0.0507354736328125, -0.041683197021484375, -0.03263092041015625, -0.023578643798828125, -0.0145263671875, -0.005474090576171875, 0.00357818603515625, 0.012630462646484375, 0.0216827392578125, 0.030735015869140625, 0.03978729248046875, 0.048839569091796875, 0.057891845703125, 0.06694412231445312, 0.07599639892578125, 0.08504867553710938, 0.0941009521484375, 0.10315322875976562, 0.11220550537109375, 0.12125778198242188, 0.13031005859375, 0.13936233520507812, 0.14841461181640625, 0.15746688842773438, 0.1665191650390625, 0.17557144165039062, 0.18462371826171875, 0.19367599487304688, 0.202728271484375, 0.21178054809570312, 0.22083282470703125, 0.22988510131835938, 0.2389373779296875, 0.24798965454101562, 0.25704193115234375, 0.2660942077636719, 0.275146484375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 4.0, 7.0, 18.0, 36.0, 50.0, 80.0, 158.0, 180.0, 144.0, 120.0, 86.0, 51.0, 32.0, 20.0, 7.0, 7.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3948707580566406, -3.294560194015503, -3.194249391555786, -3.0939388275146484, -2.9936280250549316, -2.893317461013794, -2.7930068969726562, -2.6926960945129395, -2.5923855304718018, -2.492074966430664, -2.3917641639709473, -2.2914535999298096, -2.191143035888672, -2.090832233428955, -1.9905216693878174, -1.8902109861373901, -1.789900302886963, -1.6895896196365356, -1.5892789363861084, -1.4889683723449707, -1.3886576890945435, -1.2883470058441162, -1.1880364418029785, -1.0877257585525513, -0.987415075302124, -0.8871043920516968, -0.7867937684059143, -0.6864831447601318, -0.5861724615097046, -0.48586177825927734, -0.3855511546134949, -0.2852405309677124, -0.18492984771728516, -0.0846191942691803, 0.01569145917892456, 0.11600211262702942, 0.21631276607513428, 0.3166234493255615, 0.416934072971344, 0.5172446966171265, 0.6175553798675537, 0.717866063117981, 0.8181766867637634, 0.9184873104095459, 1.0187979936599731, 1.1191086769104004, 1.219419240951538, 1.3197299242019653, 1.4200406074523926, 1.5203512907028198, 1.620661973953247, 1.7209725379943848, 1.821283221244812, 1.9215939044952393, 2.021904468536377, 2.1222152709960938, 2.2225258350372314, 2.322836399078369, 2.423147201538086, 2.5234577655792236, 2.6237683296203613, 2.724079132080078, 2.824389696121216, 2.9247002601623535, 3.0250110626220703]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 5.0, 10.0, 6.0, 14.0, 11.0, 13.0, 14.0, 19.0, 22.0, 30.0, 26.0, 31.0, 34.0, 32.0, 43.0, 42.0, 48.0, 36.0, 49.0, 44.0, 43.0, 49.0, 53.0, 28.0, 42.0, 36.0, 24.0, 30.0, 21.0, 22.0, 19.0, 17.0, 17.0, 20.0, 16.0, 12.0, 3.0, 5.0, 5.0, 5.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.2589434385299683, -1.224161148071289, -1.1893788576126099, -1.1545965671539307, -1.119814157485962, -1.0850318670272827, -1.0502495765686035, -1.0154672861099243, -0.9806849956512451, -0.9459027051925659, -0.9111204147338867, -0.8763380646705627, -0.8415557742118835, -0.8067734837532043, -0.7719911336898804, -0.7372088432312012, -0.702426552772522, -0.6676442623138428, -0.6328619718551636, -0.5980796217918396, -0.5632973313331604, -0.5285150408744812, -0.4937327206134796, -0.458950400352478, -0.42416810989379883, -0.38938581943511963, -0.35460349917411804, -0.31982117891311646, -0.28503888845443726, -0.25025659799575806, -0.21547427773475647, -0.18069197237491608, -0.14590954780578613, -0.11112724244594574, -0.07634493708610535, -0.041562631726264954, -0.0067803263664245605, 0.028001978993415833, 0.06278428435325623, 0.09756658971309662, 0.132348895072937, 0.1671312004327774, 0.2019135057926178, 0.2366958111524582, 0.2714781165122986, 0.3062604069709778, 0.34104272723197937, 0.37582504749298096, 0.41060733795166016, 0.44538962841033936, 0.48017194867134094, 0.5149542689323425, 0.5497365593910217, 0.5845188498497009, 0.6193011999130249, 0.6540834903717041, 0.6888657808303833, 0.7236480712890625, 0.7584303617477417, 0.7932127118110657, 0.8279950022697449, 0.8627772927284241, 0.897559642791748, 0.9323419332504272, 0.9671242237091064]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 2.0, 3.0, 6.0, 7.0, 8.0, 18.0, 31.0, 48.0, 100.0, 135.0, 243.0, 475.0, 813.0, 1434.0, 2665.0, 4708.0, 8041.0, 14829.0, 33353.0, 108472.0, 303342.0, 345095.0, 143502.0, 42951.0, 16998.0, 9136.0, 5237.0, 3054.0, 1708.0, 907.0, 519.0, 289.0, 174.0, 97.0, 52.0, 30.0, 34.0, 19.0, 15.0, 7.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.465087890625, -0.45145416259765625, -0.4378204345703125, -0.42418670654296875, -0.410552978515625, -0.39691925048828125, -0.3832855224609375, -0.36965179443359375, -0.35601806640625, -0.34238433837890625, -0.3287506103515625, -0.31511688232421875, -0.301483154296875, -0.28784942626953125, -0.2742156982421875, -0.26058197021484375, -0.2469482421875, -0.23331451416015625, -0.2196807861328125, -0.20604705810546875, -0.192413330078125, -0.17877960205078125, -0.1651458740234375, -0.15151214599609375, -0.13787841796875, -0.12424468994140625, -0.1106109619140625, -0.09697723388671875, -0.083343505859375, -0.06970977783203125, -0.0560760498046875, -0.04244232177734375, -0.02880859375, -0.01517486572265625, -0.0015411376953125, 0.01209259033203125, 0.025726318359375, 0.03936004638671875, 0.0529937744140625, 0.06662750244140625, 0.08026123046875, 0.09389495849609375, 0.1075286865234375, 0.12116241455078125, 0.134796142578125, 0.14842987060546875, 0.1620635986328125, 0.17569732666015625, 0.1893310546875, 0.20296478271484375, 0.2165985107421875, 0.23023223876953125, 0.243865966796875, 0.25749969482421875, 0.2711334228515625, 0.28476715087890625, 0.29840087890625, 0.31203460693359375, 0.3256683349609375, 0.33930206298828125, 0.352935791015625, 0.36656951904296875, 0.3802032470703125, 0.39383697509765625, 0.407470703125]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 5.0, 4.0, 7.0, 6.0, 7.0, 11.0, 16.0, 19.0, 25.0, 19.0, 31.0, 35.0, 30.0, 34.0, 45.0, 42.0, 52.0, 35.0, 57.0, 54.0, 54.0, 48.0, 44.0, 38.0, 50.0, 41.0, 35.0, 38.0, 17.0, 24.0, 18.0, 21.0, 9.0, 10.0, 9.0, 2.0, 7.0, 2.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.190673828125, -0.18371963500976562, -0.17676544189453125, -0.16981124877929688, -0.1628570556640625, -0.15590286254882812, -0.14894866943359375, -0.14199447631835938, -0.135040283203125, -0.12808609008789062, -0.12113189697265625, -0.11417770385742188, -0.1072235107421875, -0.10026931762695312, -0.09331512451171875, -0.08636093139648438, -0.07940673828125, -0.07245254516601562, -0.06549835205078125, -0.058544158935546875, -0.0515899658203125, -0.044635772705078125, -0.03768157958984375, -0.030727386474609375, -0.023773193359375, -0.016819000244140625, -0.00986480712890625, -0.002910614013671875, 0.0040435791015625, 0.010997772216796875, 0.01795196533203125, 0.024906158447265625, 0.0318603515625, 0.038814544677734375, 0.04576873779296875, 0.052722930908203125, 0.0596771240234375, 0.06663131713867188, 0.07358551025390625, 0.08053970336914062, 0.087493896484375, 0.09444808959960938, 0.10140228271484375, 0.10835647583007812, 0.1153106689453125, 0.12226486206054688, 0.12921905517578125, 0.13617324829101562, 0.14312744140625, 0.15008163452148438, 0.15703582763671875, 0.16399002075195312, 0.1709442138671875, 0.17789840698242188, 0.18485260009765625, 0.19180679321289062, 0.198760986328125, 0.20571517944335938, 0.21266937255859375, 0.21962356567382812, 0.2265777587890625, 0.23353195190429688, 0.24048614501953125, 0.24744033813476562, 0.25439453125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 8.0, 9.0, 2.0, 10.0, 8.0, 13.0, 13.0, 27.0, 56.0, 90.0, 134.0, 227.0, 434.0, 823.0, 1470.0, 2864.0, 5566.0, 11034.0, 24355.0, 74657.0, 265422.0, 408794.0, 170452.0, 46765.0, 17434.0, 8563.0, 4345.0, 2264.0, 1195.0, 649.0, 370.0, 180.0, 118.0, 76.0, 34.0, 32.0, 21.0, 19.0, 14.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.413818359375, -0.3997001647949219, -0.38558197021484375, -0.3714637756347656, -0.3573455810546875, -0.3432273864746094, -0.32910919189453125, -0.3149909973144531, -0.300872802734375, -0.2867546081542969, -0.27263641357421875, -0.2585182189941406, -0.2444000244140625, -0.23028182983398438, -0.21616363525390625, -0.20204544067382812, -0.18792724609375, -0.17380905151367188, -0.15969085693359375, -0.14557266235351562, -0.1314544677734375, -0.11733627319335938, -0.10321807861328125, -0.08909988403320312, -0.074981689453125, -0.060863494873046875, -0.04674530029296875, -0.032627105712890625, -0.0185089111328125, -0.004390716552734375, 0.00972747802734375, 0.023845672607421875, 0.0379638671875, 0.052082061767578125, 0.06620025634765625, 0.08031845092773438, 0.0944366455078125, 0.10855484008789062, 0.12267303466796875, 0.13679122924804688, 0.150909423828125, 0.16502761840820312, 0.17914581298828125, 0.19326400756835938, 0.2073822021484375, 0.22150039672851562, 0.23561859130859375, 0.24973678588867188, 0.26385498046875, 0.2779731750488281, 0.29209136962890625, 0.3062095642089844, 0.3203277587890625, 0.3344459533691406, 0.34856414794921875, 0.3626823425292969, 0.376800537109375, 0.3909187316894531, 0.40503692626953125, 0.4191551208496094, 0.4332733154296875, 0.4473915100097656, 0.46150970458984375, 0.4756278991699219, 0.48974609375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 6.0, 4.0, 5.0, 9.0, 15.0, 9.0, 14.0, 16.0, 21.0, 23.0, 26.0, 32.0, 33.0, 43.0, 35.0, 40.0, 50.0, 49.0, 43.0, 39.0, 51.0, 45.0, 47.0, 43.0, 33.0, 34.0, 31.0, 28.0, 22.0, 28.0, 25.0, 21.0, 19.0, 14.0, 13.0, 11.0, 10.0, 8.0, 2.0, 4.0, 3.0, 0.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.63134765625, -0.6118698120117188, -0.5923919677734375, -0.5729141235351562, -0.553436279296875, -0.5339584350585938, -0.5144805908203125, -0.49500274658203125, -0.47552490234375, -0.45604705810546875, -0.4365692138671875, -0.41709136962890625, -0.397613525390625, -0.37813568115234375, -0.3586578369140625, -0.33917999267578125, -0.3197021484375, -0.30022430419921875, -0.2807464599609375, -0.26126861572265625, -0.241790771484375, -0.22231292724609375, -0.2028350830078125, -0.18335723876953125, -0.16387939453125, -0.14440155029296875, -0.1249237060546875, -0.10544586181640625, -0.085968017578125, -0.06649017333984375, -0.0470123291015625, -0.02753448486328125, -0.008056640625, 0.01142120361328125, 0.0308990478515625, 0.05037689208984375, 0.069854736328125, 0.08933258056640625, 0.1088104248046875, 0.12828826904296875, 0.14776611328125, 0.16724395751953125, 0.1867218017578125, 0.20619964599609375, 0.225677490234375, 0.24515533447265625, 0.2646331787109375, 0.28411102294921875, 0.3035888671875, 0.32306671142578125, 0.3425445556640625, 0.36202239990234375, 0.381500244140625, 0.40097808837890625, 0.4204559326171875, 0.43993377685546875, 0.45941162109375, 0.47888946533203125, 0.4983673095703125, 0.5178451538085938, 0.537322998046875, 0.5568008422851562, 0.5762786865234375, 0.5957565307617188, 0.615234375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 4.0, 3.0, 7.0, 13.0, 12.0, 22.0, 32.0, 65.0, 112.0, 167.0, 314.0, 522.0, 930.0, 1712.0, 2972.0, 5288.0, 9678.0, 17374.0, 34634.0, 78971.0, 194254.0, 317407.0, 214715.0, 89042.0, 37887.0, 19041.0, 10099.0, 5797.0, 3159.0, 1875.0, 1043.0, 602.0, 327.0, 194.0, 102.0, 72.0, 40.0, 24.0, 17.0, 13.0, 9.0, 4.0, 3.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.1558837890625, -0.15150070190429688, -0.14711761474609375, -0.14273452758789062, -0.1383514404296875, -0.13396835327148438, -0.12958526611328125, -0.12520217895507812, -0.120819091796875, -0.11643600463867188, -0.11205291748046875, -0.10766983032226562, -0.1032867431640625, -0.09890365600585938, -0.09452056884765625, -0.09013748168945312, -0.08575439453125, -0.08137130737304688, -0.07698822021484375, -0.07260513305664062, -0.0682220458984375, -0.06383895874023438, -0.05945587158203125, -0.055072784423828125, -0.050689697265625, -0.046306610107421875, -0.04192352294921875, -0.037540435791015625, -0.0331573486328125, -0.028774261474609375, -0.02439117431640625, -0.020008087158203125, -0.015625, -0.011241912841796875, -0.00685882568359375, -0.002475738525390625, 0.0019073486328125, 0.006290435791015625, 0.01067352294921875, 0.015056610107421875, 0.019439697265625, 0.023822784423828125, 0.02820587158203125, 0.032588958740234375, 0.0369720458984375, 0.041355133056640625, 0.04573822021484375, 0.050121307373046875, 0.05450439453125, 0.058887481689453125, 0.06327056884765625, 0.06765365600585938, 0.0720367431640625, 0.07641983032226562, 0.08080291748046875, 0.08518600463867188, 0.089569091796875, 0.09395217895507812, 0.09833526611328125, 0.10271835327148438, 0.1071014404296875, 0.11148452758789062, 0.11586761474609375, 0.12025070190429688, 0.1246337890625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 8.0, 6.0, 2.0, 7.0, 4.0, 13.0, 18.0, 13.0, 29.0, 41.0, 51.0, 78.0, 92.0, 115.0, 100.0, 101.0, 87.0, 53.0, 59.0, 49.0, 11.0, 16.0, 10.0, 8.0, 2.0, 6.0, 2.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.4286251068115234e-05, -4.24729660153389e-05, -4.065968096256256e-05, -3.8846395909786224e-05, -3.703311085700989e-05, -3.521982580423355e-05, -3.3406540751457214e-05, -3.159325569868088e-05, -2.977997064590454e-05, -2.7966685593128204e-05, -2.6153400540351868e-05, -2.434011548757553e-05, -2.2526830434799194e-05, -2.0713545382022858e-05, -1.890026032924652e-05, -1.7086975276470184e-05, -1.5273690223693848e-05, -1.3460405170917511e-05, -1.1647120118141174e-05, -9.833835065364838e-06, -8.020550012588501e-06, -6.207264959812164e-06, -4.393979907035828e-06, -2.580694854259491e-06, -7.674098014831543e-07, 1.0458752512931824e-06, 2.859160304069519e-06, 4.672445356845856e-06, 6.485730409622192e-06, 8.299015462398529e-06, 1.0112300515174866e-05, 1.1925585567951202e-05, 1.3738870620727539e-05, 1.5552155673503876e-05, 1.7365440726280212e-05, 1.917872577905655e-05, 2.0992010831832886e-05, 2.2805295884609222e-05, 2.461858093738556e-05, 2.6431865990161896e-05, 2.8245151042938232e-05, 3.005843609571457e-05, 3.1871721148490906e-05, 3.368500620126724e-05, 3.549829125404358e-05, 3.7311576306819916e-05, 3.912486135959625e-05, 4.093814641237259e-05, 4.2751431465148926e-05, 4.456471651792526e-05, 4.63780015707016e-05, 4.8191286623477936e-05, 5.000457167625427e-05, 5.181785672903061e-05, 5.3631141781806946e-05, 5.544442683458328e-05, 5.725771188735962e-05, 5.9070996940135956e-05, 6.088428199291229e-05, 6.269756704568863e-05, 6.451085209846497e-05, 6.63241371512413e-05, 6.813742220401764e-05, 6.995070725679398e-05, 7.176399230957031e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 4.0, 3.0, 3.0, 10.0, 6.0, 8.0, 12.0, 23.0, 39.0, 45.0, 68.0, 98.0, 143.0, 257.0, 404.0, 642.0, 1110.0, 1972.0, 3616.0, 6955.0, 13243.0, 26626.0, 58146.0, 127831.0, 237337.0, 262619.0, 162409.0, 74945.0, 34372.0, 16714.0, 8629.0, 4335.0, 2443.0, 1350.0, 814.0, 462.0, 298.0, 190.0, 130.0, 80.0, 48.0, 35.0, 23.0, 19.0, 14.0, 9.0, 10.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.1407470703125, -0.13674449920654297, -0.13274192810058594, -0.1287393569946289, -0.12473678588867188, -0.12073421478271484, -0.11673164367675781, -0.11272907257080078, -0.10872650146484375, -0.10472393035888672, -0.10072135925292969, -0.09671878814697266, -0.09271621704101562, -0.0887136459350586, -0.08471107482910156, -0.08070850372314453, -0.0767059326171875, -0.07270336151123047, -0.06870079040527344, -0.0646982192993164, -0.060695648193359375, -0.056693077087402344, -0.05269050598144531, -0.04868793487548828, -0.04468536376953125, -0.04068279266357422, -0.03668022155761719, -0.032677650451660156, -0.028675079345703125, -0.024672508239746094, -0.020669937133789062, -0.01666736602783203, -0.012664794921875, -0.008662223815917969, -0.0046596527099609375, -0.0006570816040039062, 0.003345489501953125, 0.007348060607910156, 0.011350631713867188, 0.015353202819824219, 0.01935577392578125, 0.02335834503173828, 0.027360916137695312, 0.031363487243652344, 0.035366058349609375, 0.039368629455566406, 0.04337120056152344, 0.04737377166748047, 0.0513763427734375, 0.05537891387939453, 0.05938148498535156, 0.0633840560913086, 0.06738662719726562, 0.07138919830322266, 0.07539176940917969, 0.07939434051513672, 0.08339691162109375, 0.08739948272705078, 0.09140205383300781, 0.09540462493896484, 0.09940719604492188, 0.1034097671508789, 0.10741233825683594, 0.11141490936279297, 0.11541748046875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 5.0, 4.0, 8.0, 8.0, 12.0, 10.0, 13.0, 20.0, 32.0, 24.0, 51.0, 56.0, 54.0, 57.0, 72.0, 76.0, 73.0, 58.0, 72.0, 56.0, 54.0, 36.0, 36.0, 32.0, 20.0, 12.0, 13.0, 7.0, 8.0, 8.0, 7.0, 1.0, 2.0, 0.0, 6.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13671875, -0.1314239501953125, -0.126129150390625, -0.1208343505859375, -0.11553955078125, -0.1102447509765625, -0.104949951171875, -0.0996551513671875, -0.0943603515625, -0.0890655517578125, -0.083770751953125, -0.0784759521484375, -0.07318115234375, -0.0678863525390625, -0.062591552734375, -0.0572967529296875, -0.052001953125, -0.0467071533203125, -0.041412353515625, -0.0361175537109375, -0.03082275390625, -0.0255279541015625, -0.020233154296875, -0.0149383544921875, -0.0096435546875, -0.0043487548828125, 0.000946044921875, 0.0062408447265625, 0.01153564453125, 0.0168304443359375, 0.022125244140625, 0.0274200439453125, 0.03271484375, 0.0380096435546875, 0.043304443359375, 0.0485992431640625, 0.05389404296875, 0.0591888427734375, 0.064483642578125, 0.0697784423828125, 0.0750732421875, 0.0803680419921875, 0.085662841796875, 0.0909576416015625, 0.09625244140625, 0.1015472412109375, 0.106842041015625, 0.1121368408203125, 0.117431640625, 0.1227264404296875, 0.128021240234375, 0.1333160400390625, 0.13861083984375, 0.1439056396484375, 0.149200439453125, 0.1544952392578125, 0.1597900390625, 0.1650848388671875, 0.170379638671875, 0.1756744384765625, 0.18096923828125, 0.1862640380859375, 0.191558837890625, 0.1968536376953125, 0.2021484375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 0.0, 2.0, 0.0, 3.0, 5.0, 23.0, 52.0, 71.0, 120.0, 199.0, 222.0, 140.0, 75.0, 50.0, 21.0, 10.0, 6.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.524312496185303, -5.396092891693115, -5.267873764038086, -5.139654159545898, -5.011434555053711, -4.883215427398682, -4.754995822906494, -4.626776695251465, -4.498557090759277, -4.37033748626709, -4.2421183586120605, -4.113898754119873, -3.9856793880462646, -3.8574600219726562, -3.7292404174804688, -3.6010210514068604, -3.472801685333252, -3.3445823192596436, -3.216362953186035, -3.0881433486938477, -2.9599239826202393, -2.831704616546631, -2.7034850120544434, -2.575265645980835, -2.4470462799072266, -2.318826913833618, -2.1906075477600098, -2.0623879432678223, -1.9341685771942139, -1.8059492111206055, -1.6777297258377075, -1.5495102405548096, -1.421290397644043, -1.2930710315704346, -1.1648515462875366, -1.0366320610046387, -0.9084126949310303, -0.7801932692527771, -0.6519738435745239, -0.5237544178962708, -0.3955349922180176, -0.2673155665397644, -0.13909614086151123, -0.010876715183258057, 0.11734271049499512, 0.2455621361732483, 0.37378156185150146, 0.5020009875297546, 0.6302204132080078, 0.758439838886261, 0.8866592645645142, 1.014878749847412, 1.1430981159210205, 1.271317481994629, 1.3995369672775269, 1.5277564525604248, 1.6559758186340332, 1.7841951847076416, 1.9124146699905396, 2.0406341552734375, 2.168853521347046, 2.2970728874206543, 2.425292491912842, 2.55351185798645, 2.6817312240600586]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 5.0, 9.0, 8.0, 9.0, 7.0, 14.0, 14.0, 16.0, 25.0, 20.0, 30.0, 27.0, 26.0, 38.0, 43.0, 38.0, 42.0, 39.0, 36.0, 49.0, 50.0, 50.0, 39.0, 38.0, 34.0, 31.0, 32.0, 37.0, 26.0, 26.0, 23.0, 25.0, 20.0, 13.0, 12.0, 16.0, 6.0, 7.0, 6.0, 5.0, 4.0, 3.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.4765243530273438, -1.4304780960083008, -1.3844318389892578, -1.3383855819702148, -1.2923392057418823, -1.2462929487228394, -1.2002466917037964, -1.1542004346847534, -1.1081541776657104, -1.0621079206466675, -1.0160616636276245, -0.9700153470039368, -0.9239690899848938, -0.877922773361206, -0.8318765163421631, -0.7858302593231201, -0.7397839426994324, -0.6937376856803894, -0.6476913690567017, -0.6016451120376587, -0.5555988550186157, -0.5095525979995728, -0.463506281375885, -0.41746002435684204, -0.3714137375354767, -0.32536745071411133, -0.27932119369506836, -0.233274906873703, -0.18722863495349884, -0.14118236303329468, -0.09513607621192932, -0.04908981919288635, -0.003043532371520996, 0.043002743273973465, 0.08904901891946793, 0.13509529829025269, 0.18114157021045685, 0.227187842130661, 0.27323412895202637, 0.31928038597106934, 0.3653266727924347, 0.41137295961380005, 0.457419216632843, 0.5034655332565308, 0.5495117902755737, 0.5955580472946167, 0.6416043043136597, 0.6876505613327026, 0.7336968779563904, 0.7797431349754333, 0.8257894515991211, 0.8718357086181641, 0.917881965637207, 0.96392822265625, 1.009974479675293, 1.056020736694336, 1.1020671129226685, 1.1481133699417114, 1.1941596269607544, 1.240206003189087, 1.2862522602081299, 1.3322985172271729, 1.3783447742462158, 1.4243910312652588, 1.4704372882843018]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 9.0, 12.0, 12.0, 22.0, 25.0, 51.0, 98.0, 141.0, 248.0, 550.0, 936.0, 1949.0, 4189.0, 9724.0, 23898.0, 63975.0, 184410.0, 533329.0, 1246127.0, 1259219.0, 557699.0, 196498.0, 67608.0, 25173.0, 10126.0, 4364.0, 1945.0, 905.0, 464.0, 261.0, 116.0, 73.0, 48.0, 30.0, 16.0, 16.0, 8.0, 6.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.241943359375, -0.23438644409179688, -0.22682952880859375, -0.21927261352539062, -0.2117156982421875, -0.20415878295898438, -0.19660186767578125, -0.18904495239257812, -0.181488037109375, -0.17393112182617188, -0.16637420654296875, -0.15881729125976562, -0.1512603759765625, -0.14370346069335938, -0.13614654541015625, -0.12858963012695312, -0.12103271484375, -0.11347579956054688, -0.10591888427734375, -0.09836196899414062, -0.0908050537109375, -0.08324813842773438, -0.07569122314453125, -0.06813430786132812, -0.060577392578125, -0.053020477294921875, -0.04546356201171875, -0.037906646728515625, -0.0303497314453125, -0.022792816162109375, -0.01523590087890625, -0.007678985595703125, -0.0001220703125, 0.007434844970703125, 0.01499176025390625, 0.022548675537109375, 0.0301055908203125, 0.037662506103515625, 0.04521942138671875, 0.052776336669921875, 0.060333251953125, 0.06789016723632812, 0.07544708251953125, 0.08300399780273438, 0.0905609130859375, 0.09811782836914062, 0.10567474365234375, 0.11323165893554688, 0.12078857421875, 0.12834548950195312, 0.13590240478515625, 0.14345932006835938, 0.1510162353515625, 0.15857315063476562, 0.16613006591796875, 0.17368698120117188, 0.181243896484375, 0.18880081176757812, 0.19635772705078125, 0.20391464233398438, 0.2114715576171875, 0.21902847290039062, 0.22658538818359375, 0.23414230346679688, 0.24169921875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 5.0, 3.0, 2.0, 6.0, 6.0, 6.0, 7.0, 9.0, 12.0, 8.0, 13.0, 15.0, 14.0, 26.0, 15.0, 21.0, 29.0, 33.0, 35.0, 29.0, 38.0, 36.0, 42.0, 39.0, 40.0, 38.0, 40.0, 30.0, 37.0, 50.0, 50.0, 36.0, 22.0, 34.0, 32.0, 20.0, 26.0, 19.0, 18.0, 13.0, 12.0, 7.0, 7.0, 5.0, 10.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.171142578125, -0.16509437561035156, -0.15904617309570312, -0.1529979705810547, -0.14694976806640625, -0.1409015655517578, -0.13485336303710938, -0.12880516052246094, -0.1227569580078125, -0.11670875549316406, -0.11066055297851562, -0.10461235046386719, -0.09856414794921875, -0.09251594543457031, -0.08646774291992188, -0.08041954040527344, -0.074371337890625, -0.06832313537597656, -0.062274932861328125, -0.05622673034667969, -0.05017852783203125, -0.04413032531738281, -0.038082122802734375, -0.03203392028808594, -0.0259857177734375, -0.019937515258789062, -0.013889312744140625, -0.007841110229492188, -0.00179290771484375, 0.0042552947998046875, 0.010303497314453125, 0.016351699829101562, 0.02239990234375, 0.028448104858398438, 0.034496307373046875, 0.04054450988769531, 0.04659271240234375, 0.05264091491699219, 0.058689117431640625, 0.06473731994628906, 0.0707855224609375, 0.07683372497558594, 0.08288192749023438, 0.08893013000488281, 0.09497833251953125, 0.10102653503417969, 0.10707473754882812, 0.11312294006347656, 0.119171142578125, 0.12521934509277344, 0.13126754760742188, 0.1373157501220703, 0.14336395263671875, 0.1494121551513672, 0.15546035766601562, 0.16150856018066406, 0.1675567626953125, 0.17360496520996094, 0.17965316772460938, 0.1857013702392578, 0.19174957275390625, 0.1977977752685547, 0.20384597778320312, 0.20989418029785156, 0.2159423828125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 6.0, 9.0, 15.0, 22.0, 31.0, 44.0, 77.0, 120.0, 206.0, 406.0, 736.0, 1319.0, 2905.0, 6544.0, 15581.0, 41145.0, 120312.0, 397323.0, 1430059.0, 1535291.0, 437175.0, 130052.0, 44665.0, 17007.0, 6867.0, 3066.0, 1468.0, 799.0, 439.0, 250.0, 134.0, 79.0, 44.0, 36.0, 14.0, 12.0, 8.0, 3.0, 8.0, 6.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.390380859375, -0.38038063049316406, -0.3703804016113281, -0.3603801727294922, -0.35037994384765625, -0.3403797149658203, -0.3303794860839844, -0.32037925720214844, -0.3103790283203125, -0.30037879943847656, -0.2903785705566406, -0.2803783416748047, -0.27037811279296875, -0.2603778839111328, -0.2503776550292969, -0.24037742614746094, -0.230377197265625, -0.22037696838378906, -0.21037673950195312, -0.2003765106201172, -0.19037628173828125, -0.1803760528564453, -0.17037582397460938, -0.16037559509277344, -0.1503753662109375, -0.14037513732910156, -0.13037490844726562, -0.12037467956542969, -0.11037445068359375, -0.10037422180175781, -0.09037399291992188, -0.08037376403808594, -0.07037353515625, -0.06037330627441406, -0.050373077392578125, -0.04037284851074219, -0.03037261962890625, -0.020372390747070312, -0.010372161865234375, -0.0003719329833984375, 0.0096282958984375, 0.019628524780273438, 0.029628753662109375, 0.03962898254394531, 0.04962921142578125, 0.05962944030761719, 0.06962966918945312, 0.07962989807128906, 0.089630126953125, 0.09963035583496094, 0.10963058471679688, 0.11963081359863281, 0.12963104248046875, 0.1396312713623047, 0.14963150024414062, 0.15963172912597656, 0.1696319580078125, 0.17963218688964844, 0.18963241577148438, 0.1996326446533203, 0.20963287353515625, 0.2196331024169922, 0.22963333129882812, 0.23963356018066406, 0.2496337890625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 7.0, 6.0, 14.0, 16.0, 15.0, 29.0, 29.0, 36.0, 57.0, 60.0, 98.0, 129.0, 166.0, 213.0, 289.0, 367.0, 478.0, 475.0, 382.0, 302.0, 232.0, 184.0, 126.0, 82.0, 73.0, 48.0, 40.0, 39.0, 14.0, 16.0, 12.0, 14.0, 9.0, 5.0, 8.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.35498046875, -0.3438911437988281, -0.33280181884765625, -0.3217124938964844, -0.3106231689453125, -0.2995338439941406, -0.28844451904296875, -0.2773551940917969, -0.266265869140625, -0.2551765441894531, -0.24408721923828125, -0.23299789428710938, -0.2219085693359375, -0.21081924438476562, -0.19972991943359375, -0.18864059448242188, -0.17755126953125, -0.16646194458007812, -0.15537261962890625, -0.14428329467773438, -0.1331939697265625, -0.12210464477539062, -0.11101531982421875, -0.09992599487304688, -0.088836669921875, -0.07774734497070312, -0.06665802001953125, -0.055568695068359375, -0.0444793701171875, -0.033390045166015625, -0.02230072021484375, -0.011211395263671875, -0.0001220703125, 0.010967254638671875, 0.02205657958984375, 0.033145904541015625, 0.0442352294921875, 0.055324554443359375, 0.06641387939453125, 0.07750320434570312, 0.088592529296875, 0.09968185424804688, 0.11077117919921875, 0.12186050415039062, 0.1329498291015625, 0.14403915405273438, 0.15512847900390625, 0.16621780395507812, 0.17730712890625, 0.18839645385742188, 0.19948577880859375, 0.21057510375976562, 0.2216644287109375, 0.23275375366210938, 0.24384307861328125, 0.2549324035644531, 0.266021728515625, 0.2771110534667969, 0.28820037841796875, 0.2992897033691406, 0.3103790283203125, 0.3214683532714844, 0.33255767822265625, 0.3436470031738281, 0.354736328125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 6.0, 16.0, 50.0, 102.0, 115.0, 169.0, 169.0, 155.0, 90.0, 70.0, 30.0, 14.0, 4.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6586127281188965, -3.5374972820281982, -3.416381597518921, -3.2952661514282227, -3.1741507053375244, -3.053035020828247, -2.931919574737549, -2.8108038902282715, -2.6896884441375732, -2.568572998046875, -2.4474573135375977, -2.3263418674468994, -2.205226421356201, -2.084110736846924, -1.9629952907562256, -1.8418797254562378, -1.7207642793655396, -1.5996487140655518, -1.4785332679748535, -1.3574177026748657, -1.236302137374878, -1.1151866912841797, -0.9940711259841919, -0.8729555606842041, -0.7518400549888611, -0.6307245492935181, -0.5096089839935303, -0.38849347829818726, -0.26737794280052185, -0.14626240730285645, -0.025146901607513428, 0.09596866369247437, 0.21708416938781738, 0.3381997048854828, 0.4593152403831482, 0.5804307460784912, 0.701546311378479, 0.822661817073822, 0.943777322769165, 1.0648928880691528, 1.1860084533691406, 1.3071240186691284, 1.4282394647598267, 1.5493550300598145, 1.6704705953598022, 1.79158616065979, 1.9127016067504883, 2.0338172912597656, 2.1549324989318848, 2.276047945022583, 2.3971636295318604, 2.5182790756225586, 2.639394521713257, 2.760510206222534, 2.8816256523132324, 3.0027413368225098, 3.123856782913208, 3.2449722290039062, 3.3660879135131836, 3.487203359603882, 3.60831880569458, 3.7294344902038574, 3.8505499362945557, 3.971665382385254, 4.092781066894531]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 10.0, 4.0, 6.0, 6.0, 6.0, 16.0, 17.0, 14.0, 17.0, 25.0, 20.0, 26.0, 26.0, 26.0, 30.0, 42.0, 41.0, 42.0, 50.0, 47.0, 41.0, 34.0, 28.0, 43.0, 31.0, 35.0, 36.0, 29.0, 27.0, 33.0, 30.0, 26.0, 22.0, 23.0, 16.0, 12.0, 8.0, 6.0, 13.0, 8.0, 8.0, 6.0, 4.0, 8.0, 3.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.1304309368133545, -1.0955514907836914, -1.0606721639633179, -1.0257927179336548, -0.9909133911132812, -0.9560339450836182, -0.9211545586585999, -0.8862751722335815, -0.8513957858085632, -0.8165163993835449, -0.7816370129585266, -0.7467576265335083, -0.7118781805038452, -0.6769988536834717, -0.6421194076538086, -0.6072400212287903, -0.572360634803772, -0.5374812483787537, -0.5026018619537354, -0.46772244572639465, -0.43284305930137634, -0.39796367287635803, -0.36308425664901733, -0.328204870223999, -0.2933254837989807, -0.2584460973739624, -0.2235666960477829, -0.1886872947216034, -0.15380790829658508, -0.11892852187156677, -0.08404912054538727, -0.049169719219207764, -0.014290213584899902, 0.020589180290699005, 0.05546857416629791, 0.09034796804189682, 0.12522736191749573, 0.16010674834251404, 0.19498614966869354, 0.22986555099487305, 0.26474493741989136, 0.29962432384490967, 0.334503710269928, 0.3693831264972687, 0.404262512922287, 0.4391418993473053, 0.474021315574646, 0.5089007019996643, 0.5437800884246826, 0.5786594748497009, 0.6135388612747192, 0.6484182476997375, 0.6832976341247559, 0.718177080154419, 0.7530564665794373, 0.7879358530044556, 0.8228152394294739, 0.8576946258544922, 0.8925740122795105, 0.9274533987045288, 0.9623328447341919, 0.9972121715545654, 1.0320916175842285, 1.0669710636138916, 1.1018503904342651]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 2.0, 2.0, 3.0, 9.0, 9.0, 14.0, 21.0, 31.0, 43.0, 61.0, 126.0, 192.0, 253.0, 396.0, 556.0, 801.0, 1291.0, 1946.0, 3206.0, 5814.0, 12506.0, 34283.0, 108853.0, 276705.0, 337145.0, 171471.0, 55436.0, 18625.0, 7727.0, 3983.0, 2415.0, 1551.0, 987.0, 678.0, 453.0, 308.0, 225.0, 118.0, 103.0, 74.0, 42.0, 35.0, 23.0, 12.0, 8.0, 9.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.3671875, -0.3554229736328125, -0.343658447265625, -0.3318939208984375, -0.32012939453125, -0.3083648681640625, -0.296600341796875, -0.2848358154296875, -0.2730712890625, -0.2613067626953125, -0.249542236328125, -0.2377777099609375, -0.22601318359375, -0.2142486572265625, -0.202484130859375, -0.1907196044921875, -0.178955078125, -0.1671905517578125, -0.155426025390625, -0.1436614990234375, -0.13189697265625, -0.1201324462890625, -0.108367919921875, -0.0966033935546875, -0.0848388671875, -0.0730743408203125, -0.061309814453125, -0.0495452880859375, -0.03778076171875, -0.0260162353515625, -0.014251708984375, -0.0024871826171875, 0.00927734375, 0.0210418701171875, 0.032806396484375, 0.0445709228515625, 0.05633544921875, 0.0680999755859375, 0.079864501953125, 0.0916290283203125, 0.1033935546875, 0.1151580810546875, 0.126922607421875, 0.1386871337890625, 0.15045166015625, 0.1622161865234375, 0.173980712890625, 0.1857452392578125, 0.197509765625, 0.2092742919921875, 0.221038818359375, 0.2328033447265625, 0.24456787109375, 0.2563323974609375, 0.268096923828125, 0.2798614501953125, 0.2916259765625, 0.3033905029296875, 0.315155029296875, 0.3269195556640625, 0.33868408203125, 0.3504486083984375, 0.362213134765625, 0.3739776611328125, 0.3857421875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 8.0, 4.0, 9.0, 11.0, 11.0, 11.0, 13.0, 22.0, 23.0, 22.0, 26.0, 35.0, 39.0, 41.0, 34.0, 46.0, 41.0, 33.0, 56.0, 45.0, 48.0, 41.0, 41.0, 39.0, 52.0, 47.0, 31.0, 23.0, 30.0, 26.0, 13.0, 21.0, 13.0, 8.0, 12.0, 5.0, 5.0, 4.0, 3.0, 1.0, 4.0, 3.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2021484375, -0.1941070556640625, -0.186065673828125, -0.1780242919921875, -0.16998291015625, -0.1619415283203125, -0.153900146484375, -0.1458587646484375, -0.1378173828125, -0.1297760009765625, -0.121734619140625, -0.1136932373046875, -0.10565185546875, -0.0976104736328125, -0.089569091796875, -0.0815277099609375, -0.073486328125, -0.0654449462890625, -0.057403564453125, -0.0493621826171875, -0.04132080078125, -0.0332794189453125, -0.025238037109375, -0.0171966552734375, -0.0091552734375, -0.0011138916015625, 0.006927490234375, 0.0149688720703125, 0.02301025390625, 0.0310516357421875, 0.039093017578125, 0.0471343994140625, 0.05517578125, 0.0632171630859375, 0.071258544921875, 0.0792999267578125, 0.08734130859375, 0.0953826904296875, 0.103424072265625, 0.1114654541015625, 0.1195068359375, 0.1275482177734375, 0.135589599609375, 0.1436309814453125, 0.15167236328125, 0.1597137451171875, 0.167755126953125, 0.1757965087890625, 0.183837890625, 0.1918792724609375, 0.199920654296875, 0.2079620361328125, 0.21600341796875, 0.2240447998046875, 0.232086181640625, 0.2401275634765625, 0.2481689453125, 0.2562103271484375, 0.264251708984375, 0.2722930908203125, 0.28033447265625, 0.2883758544921875, 0.296417236328125, 0.3044586181640625, 0.3125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 3.0, 7.0, 16.0, 18.0, 43.0, 84.0, 185.0, 350.0, 750.0, 1660.0, 3846.0, 10619.0, 42374.0, 229640.0, 512386.0, 195208.0, 35659.0, 9370.0, 3530.0, 1465.0, 713.0, 313.0, 156.0, 86.0, 41.0, 17.0, 7.0, 5.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5390625, -0.5229454040527344, -0.5068283081054688, -0.4907112121582031, -0.4745941162109375, -0.4584770202636719, -0.44235992431640625, -0.4262428283691406, -0.410125732421875, -0.3940086364746094, -0.37789154052734375, -0.3617744445800781, -0.3456573486328125, -0.3295402526855469, -0.31342315673828125, -0.2973060607910156, -0.28118896484375, -0.2650718688964844, -0.24895477294921875, -0.23283767700195312, -0.2167205810546875, -0.20060348510742188, -0.18448638916015625, -0.16836929321289062, -0.152252197265625, -0.13613510131835938, -0.12001800537109375, -0.10390090942382812, -0.0877838134765625, -0.07166671752929688, -0.05554962158203125, -0.039432525634765625, -0.0233154296875, -0.007198333740234375, 0.00891876220703125, 0.025035858154296875, 0.0411529541015625, 0.057270050048828125, 0.07338714599609375, 0.08950424194335938, 0.105621337890625, 0.12173843383789062, 0.13785552978515625, 0.15397262573242188, 0.1700897216796875, 0.18620681762695312, 0.20232391357421875, 0.21844100952148438, 0.23455810546875, 0.2506752014160156, 0.26679229736328125, 0.2829093933105469, 0.2990264892578125, 0.3151435852050781, 0.33126068115234375, 0.3473777770996094, 0.363494873046875, 0.3796119689941406, 0.39572906494140625, 0.4118461608886719, 0.4279632568359375, 0.4440803527832031, 0.46019744873046875, 0.4763145446777344, 0.492431640625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 4.0, 5.0, 6.0, 9.0, 13.0, 20.0, 13.0, 9.0, 18.0, 21.0, 25.0, 33.0, 24.0, 26.0, 27.0, 29.0, 43.0, 36.0, 32.0, 48.0, 44.0, 33.0, 27.0, 46.0, 37.0, 26.0, 31.0, 28.0, 45.0, 24.0, 20.0, 36.0, 28.0, 26.0, 16.0, 16.0, 18.0, 18.0, 7.0, 5.0, 5.0, 5.0, 10.0, 3.0, 1.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.58984375, -0.57183837890625, -0.5538330078125, -0.53582763671875, -0.517822265625, -0.49981689453125, -0.4818115234375, -0.46380615234375, -0.44580078125, -0.42779541015625, -0.4097900390625, -0.39178466796875, -0.373779296875, -0.35577392578125, -0.3377685546875, -0.31976318359375, -0.3017578125, -0.28375244140625, -0.2657470703125, -0.24774169921875, -0.229736328125, -0.21173095703125, -0.1937255859375, -0.17572021484375, -0.15771484375, -0.13970947265625, -0.1217041015625, -0.10369873046875, -0.085693359375, -0.06768798828125, -0.0496826171875, -0.03167724609375, -0.013671875, 0.00433349609375, 0.0223388671875, 0.04034423828125, 0.058349609375, 0.07635498046875, 0.0943603515625, 0.11236572265625, 0.13037109375, 0.14837646484375, 0.1663818359375, 0.18438720703125, 0.202392578125, 0.22039794921875, 0.2384033203125, 0.25640869140625, 0.2744140625, 0.29241943359375, 0.3104248046875, 0.32843017578125, 0.346435546875, 0.36444091796875, 0.3824462890625, 0.40045166015625, 0.41845703125, 0.43646240234375, 0.4544677734375, 0.47247314453125, 0.490478515625, 0.50848388671875, 0.5264892578125, 0.54449462890625, 0.5625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 5.0, 7.0, 5.0, 15.0, 24.0, 25.0, 41.0, 46.0, 92.0, 114.0, 195.0, 310.0, 415.0, 607.0, 985.0, 1412.0, 2385.0, 3665.0, 6300.0, 11058.0, 19729.0, 36780.0, 69347.0, 127625.0, 200146.0, 219034.0, 155594.0, 88011.0, 46305.0, 24628.0, 13705.0, 7675.0, 4452.0, 2796.0, 1723.0, 1092.0, 732.0, 481.0, 313.0, 234.0, 163.0, 86.0, 69.0, 40.0, 32.0, 25.0, 13.0, 7.0, 10.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.06842041015625, -0.06607627868652344, -0.06373214721679688, -0.06138801574707031, -0.05904388427734375, -0.05669975280761719, -0.054355621337890625, -0.05201148986816406, -0.0496673583984375, -0.04732322692871094, -0.044979095458984375, -0.04263496398925781, -0.04029083251953125, -0.03794670104980469, -0.035602569580078125, -0.03325843811035156, -0.030914306640625, -0.028570175170898438, -0.026226043701171875, -0.023881912231445312, -0.02153778076171875, -0.019193649291992188, -0.016849517822265625, -0.014505386352539062, -0.0121612548828125, -0.009817123413085938, -0.007472991943359375, -0.0051288604736328125, -0.00278472900390625, -0.0004405975341796875, 0.001903533935546875, 0.0042476654052734375, 0.006591796875, 0.008935928344726562, 0.011280059814453125, 0.013624191284179688, 0.01596832275390625, 0.018312454223632812, 0.020656585693359375, 0.023000717163085938, 0.0253448486328125, 0.027688980102539062, 0.030033111572265625, 0.03237724304199219, 0.03472137451171875, 0.03706550598144531, 0.039409637451171875, 0.04175376892089844, 0.044097900390625, 0.04644203186035156, 0.048786163330078125, 0.05113029479980469, 0.05347442626953125, 0.05581855773925781, 0.058162689208984375, 0.06050682067871094, 0.0628509521484375, 0.06519508361816406, 0.06753921508789062, 0.06988334655761719, 0.07222747802734375, 0.07457160949707031, 0.07691574096679688, 0.07925987243652344, 0.08160400390625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 4.0, 3.0, 4.0, 18.0, 20.0, 16.0, 25.0, 59.0, 80.0, 75.0, 131.0, 139.0, 129.0, 89.0, 50.0, 51.0, 32.0, 26.0, 17.0, 9.0, 4.0, 3.0, 4.0, 6.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.990266799926758e-05, -5.811639130115509e-05, -5.63301146030426e-05, -5.4543837904930115e-05, -5.275756120681763e-05, -5.097128450870514e-05, -4.918500781059265e-05, -4.7398731112480164e-05, -4.5612454414367676e-05, -4.382617771625519e-05, -4.20399010181427e-05, -4.025362432003021e-05, -3.8467347621917725e-05, -3.668107092380524e-05, -3.489479422569275e-05, -3.310851752758026e-05, -3.1322240829467773e-05, -2.9535964131355286e-05, -2.7749687433242798e-05, -2.596341073513031e-05, -2.4177134037017822e-05, -2.2390857338905334e-05, -2.0604580640792847e-05, -1.881830394268036e-05, -1.703202724456787e-05, -1.5245750546455383e-05, -1.3459473848342896e-05, -1.1673197150230408e-05, -9.88692045211792e-06, -8.100643754005432e-06, -6.314367055892944e-06, -4.5280903577804565e-06, -2.7418136596679688e-06, -9.55536961555481e-07, 8.307397365570068e-07, 2.6170164346694946e-06, 4.403293132781982e-06, 6.18956983089447e-06, 7.975846529006958e-06, 9.762123227119446e-06, 1.1548399925231934e-05, 1.3334676623344421e-05, 1.512095332145691e-05, 1.6907230019569397e-05, 1.8693506717681885e-05, 2.0479783415794373e-05, 2.226606011390686e-05, 2.4052336812019348e-05, 2.5838613510131836e-05, 2.7624890208244324e-05, 2.941116690635681e-05, 3.11974436044693e-05, 3.298372030258179e-05, 3.4769997000694275e-05, 3.655627369880676e-05, 3.834255039691925e-05, 4.012882709503174e-05, 4.1915103793144226e-05, 4.3701380491256714e-05, 4.54876571893692e-05, 4.727393388748169e-05, 4.906021058559418e-05, 5.0846487283706665e-05, 5.263276398181915e-05, 5.441904067993164e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 7.0, 8.0, 5.0, 30.0, 33.0, 51.0, 78.0, 118.0, 194.0, 292.0, 467.0, 799.0, 1256.0, 2055.0, 3547.0, 5704.0, 10099.0, 17552.0, 31339.0, 55386.0, 94887.0, 150718.0, 192933.0, 179056.0, 125269.0, 75776.0, 43179.0, 24402.0, 13764.0, 8002.0, 4599.0, 2714.0, 1598.0, 990.0, 613.0, 363.0, 228.0, 153.0, 114.0, 60.0, 42.0, 24.0, 21.0, 13.0, 3.0, 9.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06866455078125, -0.06643390655517578, -0.06420326232910156, -0.061972618103027344, -0.059741973876953125, -0.057511329650878906, -0.05528068542480469, -0.05305004119873047, -0.05081939697265625, -0.04858875274658203, -0.04635810852050781, -0.044127464294433594, -0.041896820068359375, -0.039666175842285156, -0.03743553161621094, -0.03520488739013672, -0.0329742431640625, -0.03074359893798828, -0.028512954711914062, -0.026282310485839844, -0.024051666259765625, -0.021821022033691406, -0.019590377807617188, -0.01735973358154297, -0.01512908935546875, -0.012898445129394531, -0.010667800903320312, -0.008437156677246094, -0.006206512451171875, -0.003975868225097656, -0.0017452239990234375, 0.00048542022705078125, 0.002716064453125, 0.004946708679199219, 0.0071773529052734375, 0.009407997131347656, 0.011638641357421875, 0.013869285583496094, 0.016099929809570312, 0.01833057403564453, 0.02056121826171875, 0.02279186248779297, 0.025022506713867188, 0.027253150939941406, 0.029483795166015625, 0.031714439392089844, 0.03394508361816406, 0.03617572784423828, 0.0384063720703125, 0.04063701629638672, 0.04286766052246094, 0.045098304748535156, 0.047328948974609375, 0.049559593200683594, 0.05179023742675781, 0.05402088165283203, 0.05625152587890625, 0.05848217010498047, 0.06071281433105469, 0.0629434585571289, 0.06517410278320312, 0.06740474700927734, 0.06963539123535156, 0.07186603546142578, 0.0740966796875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 4.0, 8.0, 8.0, 7.0, 8.0, 10.0, 11.0, 12.0, 26.0, 38.0, 32.0, 29.0, 30.0, 40.0, 50.0, 44.0, 57.0, 57.0, 56.0, 60.0, 61.0, 51.0, 44.0, 33.0, 32.0, 26.0, 24.0, 20.0, 17.0, 23.0, 12.0, 14.0, 6.0, 12.0, 6.0, 7.0, 8.0, 5.0, 2.0, 7.0, 6.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.12274169921875, -0.11921215057373047, -0.11568260192871094, -0.1121530532836914, -0.10862350463867188, -0.10509395599365234, -0.10156440734863281, -0.09803485870361328, -0.09450531005859375, -0.09097576141357422, -0.08744621276855469, -0.08391666412353516, -0.08038711547851562, -0.0768575668334961, -0.07332801818847656, -0.06979846954345703, -0.0662689208984375, -0.06273937225341797, -0.05920982360839844, -0.055680274963378906, -0.052150726318359375, -0.048621177673339844, -0.04509162902832031, -0.04156208038330078, -0.03803253173828125, -0.03450298309326172, -0.030973434448242188, -0.027443885803222656, -0.023914337158203125, -0.020384788513183594, -0.016855239868164062, -0.013325691223144531, -0.009796142578125, -0.006266593933105469, -0.0027370452880859375, 0.0007925033569335938, 0.004322052001953125, 0.007851600646972656, 0.011381149291992188, 0.014910697937011719, 0.01844024658203125, 0.02196979522705078, 0.025499343872070312, 0.029028892517089844, 0.032558441162109375, 0.036087989807128906, 0.03961753845214844, 0.04314708709716797, 0.0466766357421875, 0.05020618438720703, 0.05373573303222656, 0.057265281677246094, 0.060794830322265625, 0.06432437896728516, 0.06785392761230469, 0.07138347625732422, 0.07491302490234375, 0.07844257354736328, 0.08197212219238281, 0.08550167083740234, 0.08903121948242188, 0.0925607681274414, 0.09609031677246094, 0.09961986541748047, 0.1031494140625]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 8.0, 5.0, 11.0, 17.0, 27.0, 33.0, 60.0, 90.0, 125.0, 119.0, 125.0, 97.0, 87.0, 66.0, 40.0, 27.0, 16.0, 12.0, 7.0, 7.0, 3.0, 2.0, 5.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.7611908912658691, -1.6923216581344604, -1.6234524250030518, -1.5545833110809326, -1.485714077949524, -1.4168448448181152, -1.347975730895996, -1.2791064977645874, -1.2102372646331787, -1.14136803150177, -1.0724987983703613, -1.0036296844482422, -0.9347604513168335, -0.8658912181854248, -0.7970220446586609, -0.728152871131897, -0.6592836380004883, -0.5904144048690796, -0.5215452313423157, -0.45267602801322937, -0.38380682468414307, -0.31493762135505676, -0.24606841802597046, -0.17719921469688416, -0.10833001136779785, -0.03946080803871155, 0.029408395290374756, 0.09827759861946106, 0.16714680194854736, 0.23601600527763367, 0.30488520860671997, 0.3737544119358063, 0.4426236152648926, 0.5114928483963013, 0.5803620219230652, 0.6492311954498291, 0.7181004285812378, 0.7869696617126465, 0.8558388352394104, 0.9247080087661743, 0.993577241897583, 1.0624464750289917, 1.1313157081604004, 1.2001848220825195, 1.2690540552139282, 1.337923288345337, 1.406792402267456, 1.4756616353988647, 1.5445308685302734, 1.6134001016616821, 1.6822693347930908, 1.75113844871521, 1.8200076818466187, 1.8888769149780273, 1.9577460289001465, 2.0266153812408447, 2.095484495162964, 2.164353609085083, 2.2332229614257812, 2.3020920753479004, 2.3709611892700195, 2.4398305416107178, 2.508699655532837, 2.577569007873535, 2.6464381217956543]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 3.0, 6.0, 4.0, 10.0, 9.0, 5.0, 10.0, 7.0, 10.0, 17.0, 24.0, 24.0, 36.0, 39.0, 26.0, 31.0, 43.0, 41.0, 43.0, 35.0, 40.0, 43.0, 41.0, 46.0, 49.0, 38.0, 39.0, 28.0, 25.0, 27.0, 28.0, 28.0, 19.0, 23.0, 25.0, 19.0, 15.0, 13.0, 11.0, 10.0, 7.0, 2.0, 5.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.6595165729522705, -1.610802173614502, -1.5620877742767334, -1.5133733749389648, -1.4646589756011963, -1.4159444570541382, -1.3672300577163696, -1.318515658378601, -1.2698012590408325, -1.221086859703064, -1.1723724603652954, -1.1236580610275269, -1.0749435424804688, -1.0262291431427002, -0.9775147438049316, -0.9288003444671631, -0.8800859451293945, -0.831371545791626, -0.7826571464538574, -0.7339426875114441, -0.6852282881736755, -0.636513888835907, -0.5877994298934937, -0.5390850305557251, -0.49037063121795654, -0.441656231880188, -0.39294180274009705, -0.3442273736000061, -0.29551297426223755, -0.2467985600233078, -0.19808414578437805, -0.1493697166442871, -0.1006554365158081, -0.05194102227687836, -0.0032266080379486084, 0.04548780620098114, 0.09420222043991089, 0.14291663467884064, 0.19163104891777039, 0.24034547805786133, 0.2890598773956299, 0.33777427673339844, 0.3864887058734894, 0.4352031350135803, 0.4839175343513489, 0.5326319336891174, 0.5813463926315308, 0.6300607919692993, 0.6787751913070679, 0.7274895906448364, 0.776203989982605, 0.8249184489250183, 0.8736328482627869, 0.9223472476005554, 0.9710617065429688, 1.0197761058807373, 1.0684905052185059, 1.1172049045562744, 1.165919303894043, 1.2146337032318115, 1.26334810256958, 1.3120626211166382, 1.3607770204544067, 1.4094914197921753, 1.4582058191299438]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 5.0, 4.0, 7.0, 13.0, 14.0, 24.0, 27.0, 45.0, 59.0, 79.0, 137.0, 221.0, 334.0, 705.0, 1320.0, 2692.0, 6467.0, 17142.0, 53217.0, 200571.0, 778026.0, 1776200.0, 990195.0, 263287.0, 68149.0, 21012.0, 7699.0, 3278.0, 1568.0, 721.0, 421.0, 240.0, 135.0, 84.0, 61.0, 42.0, 24.0, 18.0, 16.0, 18.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.324951171875, -0.3149833679199219, -0.30501556396484375, -0.2950477600097656, -0.2850799560546875, -0.2751121520996094, -0.26514434814453125, -0.2551765441894531, -0.245208740234375, -0.23524093627929688, -0.22527313232421875, -0.21530532836914062, -0.2053375244140625, -0.19536972045898438, -0.18540191650390625, -0.17543411254882812, -0.16546630859375, -0.15549850463867188, -0.14553070068359375, -0.13556289672851562, -0.1255950927734375, -0.11562728881835938, -0.10565948486328125, -0.09569168090820312, -0.085723876953125, -0.07575607299804688, -0.06578826904296875, -0.055820465087890625, -0.0458526611328125, -0.035884857177734375, -0.02591705322265625, -0.015949249267578125, -0.0059814453125, 0.003986358642578125, 0.01395416259765625, 0.023921966552734375, 0.0338897705078125, 0.043857574462890625, 0.05382537841796875, 0.06379318237304688, 0.073760986328125, 0.08372879028320312, 0.09369659423828125, 0.10366439819335938, 0.1136322021484375, 0.12360000610351562, 0.13356781005859375, 0.14353561401367188, 0.15350341796875, 0.16347122192382812, 0.17343902587890625, 0.18340682983398438, 0.1933746337890625, 0.20334243774414062, 0.21331024169921875, 0.22327804565429688, 0.233245849609375, 0.24321365356445312, 0.25318145751953125, 0.2631492614746094, 0.2731170654296875, 0.2830848693847656, 0.29305267333984375, 0.3030204772949219, 0.31298828125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 3.0, 4.0, 11.0, 9.0, 3.0, 14.0, 22.0, 21.0, 25.0, 21.0, 26.0, 29.0, 36.0, 38.0, 33.0, 50.0, 38.0, 46.0, 46.0, 51.0, 46.0, 52.0, 45.0, 34.0, 44.0, 47.0, 39.0, 42.0, 23.0, 20.0, 16.0, 19.0, 12.0, 12.0, 3.0, 11.0, 7.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.288818359375, -0.2810802459716797, -0.2733421325683594, -0.26560401916503906, -0.25786590576171875, -0.25012779235839844, -0.24238967895507812, -0.2346515655517578, -0.2269134521484375, -0.2191753387451172, -0.21143722534179688, -0.20369911193847656, -0.19596099853515625, -0.18822288513183594, -0.18048477172851562, -0.1727466583251953, -0.165008544921875, -0.1572704315185547, -0.14953231811523438, -0.14179420471191406, -0.13405609130859375, -0.12631797790527344, -0.11857986450195312, -0.11084175109863281, -0.1031036376953125, -0.09536552429199219, -0.08762741088867188, -0.07988929748535156, -0.07215118408203125, -0.06441307067871094, -0.056674957275390625, -0.04893684387207031, -0.04119873046875, -0.03346061706542969, -0.025722503662109375, -0.017984390258789062, -0.01024627685546875, -0.0025081634521484375, 0.005229949951171875, 0.012968063354492188, 0.0207061767578125, 0.028444290161132812, 0.036182403564453125, 0.04392051696777344, 0.05165863037109375, 0.05939674377441406, 0.06713485717773438, 0.07487297058105469, 0.082611083984375, 0.09034919738769531, 0.09808731079101562, 0.10582542419433594, 0.11356353759765625, 0.12130165100097656, 0.12903976440429688, 0.1367778778076172, 0.1445159912109375, 0.1522541046142578, 0.15999221801757812, 0.16773033142089844, 0.17546844482421875, 0.18320655822753906, 0.19094467163085938, 0.1986827850341797, 0.2064208984375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 6.0, 5.0, 8.0, 18.0, 19.0, 28.0, 57.0, 72.0, 116.0, 190.0, 303.0, 539.0, 866.0, 1481.0, 2732.0, 4891.0, 9577.0, 19612.0, 44972.0, 112813.0, 331645.0, 1140929.0, 1680551.0, 550151.0, 172971.0, 65059.0, 27397.0, 12779.0, 6407.0, 3355.0, 1919.0, 1139.0, 653.0, 370.0, 237.0, 150.0, 89.0, 68.0, 43.0, 30.0, 16.0, 15.0, 5.0, 3.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.2332763671875, -0.2247028350830078, -0.21612930297851562, -0.20755577087402344, -0.19898223876953125, -0.19040870666503906, -0.18183517456054688, -0.1732616424560547, -0.1646881103515625, -0.1561145782470703, -0.14754104614257812, -0.13896751403808594, -0.13039398193359375, -0.12182044982910156, -0.11324691772460938, -0.10467338562011719, -0.096099853515625, -0.08752632141113281, -0.07895278930664062, -0.07037925720214844, -0.06180572509765625, -0.05323219299316406, -0.044658660888671875, -0.03608512878417969, -0.0275115966796875, -0.018938064575195312, -0.010364532470703125, -0.0017910003662109375, 0.00678253173828125, 0.015356063842773438, 0.023929595947265625, 0.03250312805175781, 0.04107666015625, 0.04965019226074219, 0.058223724365234375, 0.06679725646972656, 0.07537078857421875, 0.08394432067871094, 0.09251785278320312, 0.10109138488769531, 0.1096649169921875, 0.11823844909667969, 0.12681198120117188, 0.13538551330566406, 0.14395904541015625, 0.15253257751464844, 0.16110610961914062, 0.1696796417236328, 0.178253173828125, 0.1868267059326172, 0.19540023803710938, 0.20397377014160156, 0.21254730224609375, 0.22112083435058594, 0.22969436645507812, 0.2382678985595703, 0.2468414306640625, 0.2554149627685547, 0.2639884948730469, 0.27256202697753906, 0.28113555908203125, 0.28970909118652344, 0.2982826232910156, 0.3068561553955078, 0.3154296875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 0.0, 3.0, 1.0, 4.0, 7.0, 2.0, 8.0, 6.0, 13.0, 16.0, 19.0, 15.0, 30.0, 56.0, 49.0, 76.0, 81.0, 114.0, 146.0, 212.0, 266.0, 382.0, 470.0, 450.0, 408.0, 300.0, 243.0, 149.0, 141.0, 92.0, 70.0, 55.0, 46.0, 38.0, 31.0, 15.0, 22.0, 13.0, 12.0, 6.0, 5.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.372802734375, -0.3615531921386719, -0.35030364990234375, -0.3390541076660156, -0.3278045654296875, -0.3165550231933594, -0.30530548095703125, -0.2940559387207031, -0.282806396484375, -0.2715568542480469, -0.26030731201171875, -0.24905776977539062, -0.2378082275390625, -0.22655868530273438, -0.21530914306640625, -0.20405960083007812, -0.19281005859375, -0.18156051635742188, -0.17031097412109375, -0.15906143188476562, -0.1478118896484375, -0.13656234741210938, -0.12531280517578125, -0.11406326293945312, -0.102813720703125, -0.09156417846679688, -0.08031463623046875, -0.06906509399414062, -0.0578155517578125, -0.046566009521484375, -0.03531646728515625, -0.024066925048828125, -0.0128173828125, -0.001567840576171875, 0.00968170166015625, 0.020931243896484375, 0.0321807861328125, 0.043430328369140625, 0.05467987060546875, 0.06592941284179688, 0.077178955078125, 0.08842849731445312, 0.09967803955078125, 0.11092758178710938, 0.1221771240234375, 0.13342666625976562, 0.14467620849609375, 0.15592575073242188, 0.16717529296875, 0.17842483520507812, 0.18967437744140625, 0.20092391967773438, 0.2121734619140625, 0.22342300415039062, 0.23467254638671875, 0.24592208862304688, 0.257171630859375, 0.2684211730957031, 0.27967071533203125, 0.2909202575683594, 0.3021697998046875, 0.3134193420410156, 0.32466888427734375, 0.3359184265136719, 0.34716796875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 2.0, 6.0, 6.0, 7.0, 15.0, 19.0, 59.0, 73.0, 120.0, 135.0, 145.0, 148.0, 119.0, 57.0, 43.0, 14.0, 9.0, 8.0, 4.0, 0.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6599502563476562, -2.5545105934143066, -2.449071168899536, -2.3436315059661865, -2.238192081451416, -2.1327524185180664, -2.027312755584717, -1.9218733310699463, -1.8164336681365967, -1.7109941244125366, -1.6055545806884766, -1.500114917755127, -1.394675374031067, -1.2892358303070068, -1.1837962865829468, -1.0783567428588867, -0.9729171991348267, -0.8674776554107666, -0.7620380520820618, -0.6565985083580017, -0.5511589050292969, -0.4457193613052368, -0.34027981758117676, -0.23484021425247192, -0.12940067052841187, -0.023961104452610016, 0.08147846162319183, 0.18691802024841309, 0.29235759377479553, 0.397797167301178, 0.503236711025238, 0.6086763143539429, 0.7141158580780029, 0.819555401802063, 0.9249950051307678, 1.0304346084594727, 1.1358741521835327, 1.2413136959075928, 1.3467532396316528, 1.452192783355713, 1.5576324462890625, 1.6630719900131226, 1.7685115337371826, 1.8739511966705322, 1.9793907403945923, 2.0848302841186523, 2.190269947052002, 2.2957093715667725, 2.401148796081543, 2.5065884590148926, 2.612027883529663, 2.7174675464630127, 2.822906970977783, 2.928346633911133, 3.0337862968444824, 3.139225721359253, 3.2446653842926025, 3.350105047225952, 3.4555444717407227, 3.5609841346740723, 3.6664235591888428, 3.7718632221221924, 3.877302646636963, 3.9827423095703125, 4.088181972503662]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 3.0, 5.0, 5.0, 8.0, 9.0, 5.0, 18.0, 12.0, 16.0, 18.0, 20.0, 21.0, 23.0, 31.0, 34.0, 30.0, 45.0, 40.0, 53.0, 57.0, 51.0, 35.0, 46.0, 34.0, 43.0, 39.0, 37.0, 35.0, 33.0, 40.0, 25.0, 29.0, 22.0, 22.0, 13.0, 13.0, 10.0, 5.0, 7.0, 3.0, 6.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.3149120807647705, -1.2741389274597168, -1.233365774154663, -1.1925926208496094, -1.1518194675445557, -1.111046314239502, -1.0702731609344482, -1.0295000076293945, -0.9887268543243408, -0.9479537010192871, -0.9071805477142334, -0.8664073944091797, -0.825634241104126, -0.7848610877990723, -0.7440879344940186, -0.7033147811889648, -0.6625416278839111, -0.6217684745788574, -0.5809953212738037, -0.54022216796875, -0.4994490146636963, -0.4586758613586426, -0.41790270805358887, -0.37712955474853516, -0.33635640144348145, -0.29558324813842773, -0.254810094833374, -0.2140369415283203, -0.1732637882232666, -0.1324906349182129, -0.09171748161315918, -0.05094432830810547, -0.010171175003051758, 0.030601978302001953, 0.07137513160705566, 0.11214828491210938, 0.15292143821716309, 0.1936945915222168, 0.2344677448272705, 0.2752408981323242, 0.31601405143737793, 0.35678720474243164, 0.39756035804748535, 0.43833351135253906, 0.4791066646575928, 0.5198798179626465, 0.5606529712677002, 0.6014261245727539, 0.6421992778778076, 0.6829724311828613, 0.723745584487915, 0.7645187377929688, 0.8052918910980225, 0.8460650444030762, 0.8868381977081299, 0.9276113510131836, 0.9683845043182373, 1.009157657623291, 1.0499308109283447, 1.0907039642333984, 1.1314771175384521, 1.1722502708435059, 1.2130234241485596, 1.2537965774536133, 1.294569730758667]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 13.0, 13.0, 14.0, 33.0, 36.0, 77.0, 119.0, 177.0, 277.0, 481.0, 775.0, 1299.0, 2161.0, 3722.0, 6530.0, 11664.0, 20255.0, 37044.0, 64697.0, 106053.0, 154547.0, 182148.0, 165249.0, 118848.0, 74618.0, 42599.0, 23858.0, 13310.0, 7532.0, 4254.0, 2453.0, 1387.0, 803.0, 556.0, 341.0, 224.0, 129.0, 87.0, 59.0, 36.0, 28.0, 15.0, 16.0, 6.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.1868896484375, -0.18164443969726562, -0.17639923095703125, -0.17115402221679688, -0.1659088134765625, -0.16066360473632812, -0.15541839599609375, -0.15017318725585938, -0.144927978515625, -0.13968276977539062, -0.13443756103515625, -0.12919235229492188, -0.1239471435546875, -0.11870193481445312, -0.11345672607421875, -0.10821151733398438, -0.10296630859375, -0.09772109985351562, -0.09247589111328125, -0.08723068237304688, -0.0819854736328125, -0.07674026489257812, -0.07149505615234375, -0.06624984741210938, -0.061004638671875, -0.055759429931640625, -0.05051422119140625, -0.045269012451171875, -0.0400238037109375, -0.034778594970703125, -0.02953338623046875, -0.024288177490234375, -0.01904296875, -0.013797760009765625, -0.00855255126953125, -0.003307342529296875, 0.0019378662109375, 0.007183074951171875, 0.01242828369140625, 0.017673492431640625, 0.022918701171875, 0.028163909912109375, 0.03340911865234375, 0.038654327392578125, 0.0438995361328125, 0.049144744873046875, 0.05438995361328125, 0.059635162353515625, 0.06488037109375, 0.07012557983398438, 0.07537078857421875, 0.08061599731445312, 0.0858612060546875, 0.09110641479492188, 0.09635162353515625, 0.10159683227539062, 0.106842041015625, 0.11208724975585938, 0.11733245849609375, 0.12257766723632812, 0.1278228759765625, 0.13306808471679688, 0.13831329345703125, 0.14355850219726562, 0.1488037109375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 6.0, 3.0, 7.0, 7.0, 4.0, 10.0, 12.0, 11.0, 14.0, 16.0, 17.0, 26.0, 24.0, 17.0, 35.0, 20.0, 37.0, 35.0, 32.0, 26.0, 41.0, 33.0, 39.0, 50.0, 28.0, 35.0, 36.0, 32.0, 26.0, 37.0, 44.0, 31.0, 22.0, 20.0, 27.0, 20.0, 20.0, 23.0, 14.0, 7.0, 12.0, 5.0, 12.0, 1.0, 7.0, 4.0, 6.0, 1.0, 3.0, 2.0, 6.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.202392578125, -0.19571685791015625, -0.1890411376953125, -0.18236541748046875, -0.175689697265625, -0.16901397705078125, -0.1623382568359375, -0.15566253662109375, -0.14898681640625, -0.14231109619140625, -0.1356353759765625, -0.12895965576171875, -0.122283935546875, -0.11560821533203125, -0.1089324951171875, -0.10225677490234375, -0.0955810546875, -0.08890533447265625, -0.0822296142578125, -0.07555389404296875, -0.068878173828125, -0.06220245361328125, -0.0555267333984375, -0.04885101318359375, -0.04217529296875, -0.03549957275390625, -0.0288238525390625, -0.02214813232421875, -0.015472412109375, -0.00879669189453125, -0.0021209716796875, 0.00455474853515625, 0.01123046875, 0.01790618896484375, 0.0245819091796875, 0.03125762939453125, 0.037933349609375, 0.04460906982421875, 0.0512847900390625, 0.05796051025390625, 0.06463623046875, 0.07131195068359375, 0.0779876708984375, 0.08466339111328125, 0.091339111328125, 0.09801483154296875, 0.1046905517578125, 0.11136627197265625, 0.1180419921875, 0.12471771240234375, 0.1313934326171875, 0.13806915283203125, 0.144744873046875, 0.15142059326171875, 0.1580963134765625, 0.16477203369140625, 0.17144775390625, 0.17812347412109375, 0.1847991943359375, 0.19147491455078125, 0.198150634765625, 0.20482635498046875, 0.2115020751953125, 0.21817779541015625, 0.224853515625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 2.0, 4.0, 6.0, 10.0, 14.0, 17.0, 18.0, 54.0, 108.0, 259.0, 516.0, 1144.0, 2920.0, 7325.0, 20613.0, 59165.0, 161828.0, 350187.0, 267785.0, 113549.0, 40330.0, 13915.0, 5072.0, 2008.0, 902.0, 365.0, 186.0, 91.0, 61.0, 36.0, 29.0, 9.0, 18.0, 7.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.30029296875, -0.291412353515625, -0.28253173828125, -0.273651123046875, -0.2647705078125, -0.255889892578125, -0.24700927734375, -0.238128662109375, -0.229248046875, -0.220367431640625, -0.21148681640625, -0.202606201171875, -0.1937255859375, -0.184844970703125, -0.17596435546875, -0.167083740234375, -0.158203125, -0.149322509765625, -0.14044189453125, -0.131561279296875, -0.1226806640625, -0.113800048828125, -0.10491943359375, -0.096038818359375, -0.087158203125, -0.078277587890625, -0.06939697265625, -0.060516357421875, -0.0516357421875, -0.042755126953125, -0.03387451171875, -0.024993896484375, -0.01611328125, -0.007232666015625, 0.00164794921875, 0.010528564453125, 0.0194091796875, 0.028289794921875, 0.03717041015625, 0.046051025390625, 0.054931640625, 0.063812255859375, 0.07269287109375, 0.081573486328125, 0.0904541015625, 0.099334716796875, 0.10821533203125, 0.117095947265625, 0.1259765625, 0.134857177734375, 0.14373779296875, 0.152618408203125, 0.1614990234375, 0.170379638671875, 0.17926025390625, 0.188140869140625, 0.197021484375, 0.205902099609375, 0.21478271484375, 0.223663330078125, 0.2325439453125, 0.241424560546875, 0.25030517578125, 0.259185791015625, 0.26806640625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 2.0, 3.0, 5.0, 3.0, 5.0, 13.0, 10.0, 12.0, 15.0, 14.0, 21.0, 23.0, 26.0, 32.0, 45.0, 42.0, 47.0, 43.0, 51.0, 41.0, 50.0, 58.0, 56.0, 47.0, 52.0, 38.0, 36.0, 38.0, 30.0, 27.0, 20.0, 18.0, 14.0, 25.0, 10.0, 10.0, 10.0, 2.0, 4.0, 3.0, 3.0, 6.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.734375, -0.7115554809570312, -0.6887359619140625, -0.6659164428710938, -0.643096923828125, -0.6202774047851562, -0.5974578857421875, -0.5746383666992188, -0.55181884765625, -0.5289993286132812, -0.5061798095703125, -0.48336029052734375, -0.460540771484375, -0.43772125244140625, -0.4149017333984375, -0.39208221435546875, -0.3692626953125, -0.34644317626953125, -0.3236236572265625, -0.30080413818359375, -0.277984619140625, -0.25516510009765625, -0.2323455810546875, -0.20952606201171875, -0.18670654296875, -0.16388702392578125, -0.1410675048828125, -0.11824798583984375, -0.095428466796875, -0.07260894775390625, -0.0497894287109375, -0.02696990966796875, -0.004150390625, 0.01866912841796875, 0.0414886474609375, 0.06430816650390625, 0.087127685546875, 0.10994720458984375, 0.1327667236328125, 0.15558624267578125, 0.17840576171875, 0.20122528076171875, 0.2240447998046875, 0.24686431884765625, 0.269683837890625, 0.29250335693359375, 0.3153228759765625, 0.33814239501953125, 0.3609619140625, 0.38378143310546875, 0.4066009521484375, 0.42942047119140625, 0.452239990234375, 0.47505950927734375, 0.4978790283203125, 0.5206985473632812, 0.54351806640625, 0.5663375854492188, 0.5891571044921875, 0.6119766235351562, 0.634796142578125, 0.6576156616210938, 0.6804351806640625, 0.7032546997070312, 0.72607421875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 4.0, 5.0, 7.0, 15.0, 15.0, 18.0, 18.0, 46.0, 61.0, 84.0, 123.0, 190.0, 304.0, 447.0, 752.0, 1314.0, 2553.0, 6072.0, 16226.0, 49999.0, 158745.0, 400020.0, 270446.0, 93557.0, 29104.0, 9816.0, 4078.0, 1840.0, 1008.0, 592.0, 359.0, 233.0, 169.0, 121.0, 64.0, 41.0, 39.0, 22.0, 15.0, 11.0, 10.0, 6.0, 2.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0811767578125, -0.07844924926757812, -0.07572174072265625, -0.07299423217773438, -0.0702667236328125, -0.06753921508789062, -0.06481170654296875, -0.062084197998046875, -0.059356689453125, -0.056629180908203125, -0.05390167236328125, -0.051174163818359375, -0.0484466552734375, -0.045719146728515625, -0.04299163818359375, -0.040264129638671875, -0.03753662109375, -0.034809112548828125, -0.03208160400390625, -0.029354095458984375, -0.0266265869140625, -0.023899078369140625, -0.02117156982421875, -0.018444061279296875, -0.015716552734375, -0.012989044189453125, -0.01026153564453125, -0.007534027099609375, -0.0048065185546875, -0.002079010009765625, 0.00064849853515625, 0.003376007080078125, 0.006103515625, 0.008831024169921875, 0.01155853271484375, 0.014286041259765625, 0.0170135498046875, 0.019741058349609375, 0.02246856689453125, 0.025196075439453125, 0.027923583984375, 0.030651092529296875, 0.03337860107421875, 0.036106109619140625, 0.0388336181640625, 0.041561126708984375, 0.04428863525390625, 0.047016143798828125, 0.04974365234375, 0.052471160888671875, 0.05519866943359375, 0.057926177978515625, 0.0606536865234375, 0.06338119506835938, 0.06610870361328125, 0.06883621215820312, 0.071563720703125, 0.07429122924804688, 0.07701873779296875, 0.07974624633789062, 0.0824737548828125, 0.08520126342773438, 0.08792877197265625, 0.09065628051757812, 0.0933837890625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 6.0, 3.0, 6.0, 10.0, 19.0, 16.0, 34.0, 39.0, 46.0, 81.0, 116.0, 115.0, 97.0, 101.0, 69.0, 79.0, 48.0, 31.0, 22.0, 18.0, 15.0, 12.0, 11.0, 1.0, 6.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.987550735473633e-05, -3.870762884616852e-05, -3.753975033760071e-05, -3.63718718290329e-05, -3.520399332046509e-05, -3.403611481189728e-05, -3.286823630332947e-05, -3.170035779476166e-05, -3.053247928619385e-05, -2.9364600777626038e-05, -2.8196722269058228e-05, -2.7028843760490417e-05, -2.5860965251922607e-05, -2.4693086743354797e-05, -2.3525208234786987e-05, -2.2357329726219177e-05, -2.1189451217651367e-05, -2.0021572709083557e-05, -1.8853694200515747e-05, -1.7685815691947937e-05, -1.6517937183380127e-05, -1.5350058674812317e-05, -1.4182180166244507e-05, -1.3014301657676697e-05, -1.1846423149108887e-05, -1.0678544640541077e-05, -9.510666131973267e-06, -8.342787623405457e-06, -7.1749091148376465e-06, -6.0070306062698364e-06, -4.839152097702026e-06, -3.6712735891342163e-06, -2.5033950805664062e-06, -1.3355165719985962e-06, -1.6763806343078613e-07, 1.000240445137024e-06, 2.168118953704834e-06, 3.335997462272644e-06, 4.503875970840454e-06, 5.671754479408264e-06, 6.839632987976074e-06, 8.007511496543884e-06, 9.175390005111694e-06, 1.0343268513679504e-05, 1.1511147022247314e-05, 1.2679025530815125e-05, 1.3846904039382935e-05, 1.5014782547950745e-05, 1.6182661056518555e-05, 1.7350539565086365e-05, 1.8518418073654175e-05, 1.9686296582221985e-05, 2.0854175090789795e-05, 2.2022053599357605e-05, 2.3189932107925415e-05, 2.4357810616493225e-05, 2.5525689125061035e-05, 2.6693567633628845e-05, 2.7861446142196655e-05, 2.9029324650764465e-05, 3.0197203159332275e-05, 3.1365081667900085e-05, 3.2532960176467896e-05, 3.3700838685035706e-05, 3.4868717193603516e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 2.0, 1.0, 3.0, 5.0, 13.0, 14.0, 15.0, 28.0, 32.0, 42.0, 53.0, 64.0, 83.0, 122.0, 150.0, 224.0, 318.0, 370.0, 581.0, 885.0, 1391.0, 2495.0, 4512.0, 9091.0, 18706.0, 40835.0, 89735.0, 185861.0, 310748.0, 198409.0, 97411.0, 44145.0, 20176.0, 9779.0, 4950.0, 2625.0, 1473.0, 978.0, 595.0, 454.0, 312.0, 244.0, 152.0, 111.0, 91.0, 72.0, 57.0, 46.0, 29.0, 15.0, 14.0, 13.0, 11.0, 9.0, 7.0, 3.0, 0.0, 3.0, 5.0, 1.0, 1.0], "bins": [-0.06878662109375, -0.06660652160644531, -0.06442642211914062, -0.06224632263183594, -0.06006622314453125, -0.05788612365722656, -0.055706024169921875, -0.05352592468261719, -0.0513458251953125, -0.04916572570800781, -0.046985626220703125, -0.04480552673339844, -0.04262542724609375, -0.04044532775878906, -0.038265228271484375, -0.03608512878417969, -0.033905029296875, -0.03172492980957031, -0.029544830322265625, -0.027364730834960938, -0.02518463134765625, -0.023004531860351562, -0.020824432373046875, -0.018644332885742188, -0.0164642333984375, -0.014284133911132812, -0.012104034423828125, -0.009923934936523438, -0.00774383544921875, -0.0055637359619140625, -0.003383636474609375, -0.0012035369873046875, 0.0009765625, 0.0031566619873046875, 0.005336761474609375, 0.0075168609619140625, 0.00969696044921875, 0.011877059936523438, 0.014057159423828125, 0.016237258911132812, 0.0184173583984375, 0.020597457885742188, 0.022777557373046875, 0.024957656860351562, 0.02713775634765625, 0.029317855834960938, 0.031497955322265625, 0.03367805480957031, 0.035858154296875, 0.03803825378417969, 0.040218353271484375, 0.04239845275878906, 0.04457855224609375, 0.04675865173339844, 0.048938751220703125, 0.05111885070800781, 0.0532989501953125, 0.05547904968261719, 0.057659149169921875, 0.05983924865722656, 0.06201934814453125, 0.06419944763183594, 0.06637954711914062, 0.06855964660644531, 0.07073974609375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 4.0, 11.0, 8.0, 12.0, 18.0, 13.0, 26.0, 32.0, 42.0, 50.0, 37.0, 49.0, 55.0, 60.0, 62.0, 73.0, 85.0, 61.0, 51.0, 44.0, 31.0, 36.0, 41.0, 19.0, 20.0, 16.0, 8.0, 5.0, 10.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.09063720703125, -0.08763694763183594, -0.08463668823242188, -0.08163642883300781, -0.07863616943359375, -0.07563591003417969, -0.07263565063476562, -0.06963539123535156, -0.0666351318359375, -0.06363487243652344, -0.060634613037109375, -0.05763435363769531, -0.05463409423828125, -0.05163383483886719, -0.048633575439453125, -0.04563331604003906, -0.042633056640625, -0.03963279724121094, -0.036632537841796875, -0.03363227844238281, -0.03063201904296875, -0.027631759643554688, -0.024631500244140625, -0.021631240844726562, -0.0186309814453125, -0.015630722045898438, -0.012630462646484375, -0.009630203247070312, -0.00662994384765625, -0.0036296844482421875, -0.000629425048828125, 0.0023708343505859375, 0.00537109375, 0.008371353149414062, 0.011371612548828125, 0.014371871948242188, 0.01737213134765625, 0.020372390747070312, 0.023372650146484375, 0.026372909545898438, 0.0293731689453125, 0.03237342834472656, 0.035373687744140625, 0.03837394714355469, 0.04137420654296875, 0.04437446594238281, 0.047374725341796875, 0.05037498474121094, 0.053375244140625, 0.05637550354003906, 0.059375762939453125, 0.06237602233886719, 0.06537628173828125, 0.06837654113769531, 0.07137680053710938, 0.07437705993652344, 0.0773773193359375, 0.08037757873535156, 0.08337783813476562, 0.08637809753417969, 0.08937835693359375, 0.09237861633300781, 0.09537887573242188, 0.09837913513183594, 0.10137939453125]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 3.0, 3.0, 10.0, 12.0, 17.0, 22.0, 35.0, 53.0, 71.0, 89.0, 110.0, 111.0, 115.0, 97.0, 75.0, 70.0, 39.0, 25.0, 14.0, 8.0, 6.0, 4.0, 5.0, 2.0, 1.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.2833003997802734, -2.224071979522705, -2.164843797683716, -2.1056153774261475, -2.046387195587158, -1.9871587753295898, -1.927930474281311, -1.8687021732330322, -1.8094737529754639, -1.750245451927185, -1.6910171508789062, -1.631788730621338, -1.572560429573059, -1.5133321285247803, -1.4541038274765015, -1.3948755264282227, -1.3356472253799438, -1.276418924331665, -1.2171906232833862, -1.1579623222351074, -1.098733901977539, -1.0395056009292603, -0.9802772998809814, -0.9210489988327026, -0.861820638179779, -0.8025923371315002, -0.7433639764785767, -0.6841356754302979, -0.624907374382019, -0.5656790137290955, -0.5064507126808167, -0.44722238183021545, -0.38799405097961426, -0.32876572012901306, -0.26953738927841187, -0.21030908823013306, -0.15108075737953186, -0.09185242652893066, -0.032624125480651855, 0.02660420536994934, 0.08583253622055054, 0.14506086707115173, 0.20428918302059174, 0.26351749897003174, 0.32274582982063293, 0.38197416067123413, 0.44120246171951294, 0.5004308223724365, 0.5596591234207153, 0.6188874244689941, 0.6781157851219177, 0.7373440861701965, 0.7965724468231201, 0.8558007478713989, 0.9150290489196777, 0.9742573499679565, 1.0334856510162354, 1.0927139520645142, 1.151942253112793, 1.2111706733703613, 1.2703989744186401, 1.329627275466919, 1.3888555765151978, 1.4480838775634766, 1.507312297821045]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 5.0, 6.0, 6.0, 11.0, 13.0, 13.0, 16.0, 21.0, 30.0, 24.0, 29.0, 32.0, 34.0, 40.0, 30.0, 48.0, 60.0, 62.0, 54.0, 62.0, 48.0, 42.0, 46.0, 42.0, 31.0, 38.0, 24.0, 28.0, 20.0, 17.0, 16.0, 11.0, 9.0, 10.0, 9.0, 7.0, 2.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7964046001434326, -1.7404115200042725, -1.6844185590744019, -1.6284254789352417, -1.5724323987960815, -1.516439437866211, -1.4604463577270508, -1.4044532775878906, -1.34846031665802, -1.2924672365188599, -1.2364742755889893, -1.180481195449829, -1.124488115310669, -1.0684951543807983, -1.0125020742416382, -0.9565090537071228, -0.9005159735679626, -0.8445229530334473, -0.7885298728942871, -0.7325368523597717, -0.6765438318252563, -0.6205507516860962, -0.5645577311515808, -0.5085647106170654, -0.45257166028022766, -0.3965786099433899, -0.3405855894088745, -0.28459253907203674, -0.22859950363636017, -0.1726064682006836, -0.11661341786384583, -0.060620397329330444, -0.004627346992492676, 0.0513656921684742, 0.10735873132944107, 0.16335177421569824, 0.21934480965137482, 0.2753378450870514, 0.33133089542388916, 0.38732391595840454, 0.4433169662952423, 0.4993100166320801, 0.5553030371665955, 0.6112960577011108, 0.667289137840271, 0.7232821583747864, 0.7792751789093018, 0.8352682590484619, 0.8912612795829773, 0.9472543001174927, 1.0032473802566528, 1.0592403411865234, 1.1152334213256836, 1.1712265014648438, 1.227219581604004, 1.2832125425338745, 1.3392056226730347, 1.3951987028121948, 1.4511916637420654, 1.5071847438812256, 1.5631778240203857, 1.6191707849502563, 1.6751638650894165, 1.731156826019287, 1.7871499061584473]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 2.0, 8.0, 17.0, 17.0, 27.0, 40.0, 60.0, 62.0, 122.0, 196.0, 266.0, 387.0, 629.0, 1048.0, 1882.0, 3237.0, 6296.0, 12935.0, 29020.0, 67835.0, 157941.0, 334733.0, 599211.0, 816193.0, 826522.0, 628971.0, 377530.0, 187137.0, 80792.0, 32708.0, 14072.0, 6406.0, 3259.0, 1876.0, 1078.0, 674.0, 394.0, 249.0, 154.0, 84.0, 65.0, 42.0, 32.0, 28.0, 15.0, 11.0, 8.0, 4.0, 3.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.1812744140625, -0.1756153106689453, -0.16995620727539062, -0.16429710388183594, -0.15863800048828125, -0.15297889709472656, -0.14731979370117188, -0.1416606903076172, -0.1360015869140625, -0.1303424835205078, -0.12468338012695312, -0.11902427673339844, -0.11336517333984375, -0.10770606994628906, -0.10204696655273438, -0.09638786315917969, -0.090728759765625, -0.08506965637207031, -0.07941055297851562, -0.07375144958496094, -0.06809234619140625, -0.06243324279785156, -0.056774139404296875, -0.05111503601074219, -0.0454559326171875, -0.03979682922363281, -0.034137725830078125, -0.028478622436523438, -0.02281951904296875, -0.017160415649414062, -0.011501312255859375, -0.0058422088623046875, -0.00018310546875, 0.0054759979248046875, 0.011135101318359375, 0.016794204711914062, 0.02245330810546875, 0.028112411499023438, 0.033771514892578125, 0.03943061828613281, 0.0450897216796875, 0.05074882507324219, 0.056407928466796875, 0.06206703186035156, 0.06772613525390625, 0.07338523864746094, 0.07904434204101562, 0.08470344543457031, 0.090362548828125, 0.09602165222167969, 0.10168075561523438, 0.10733985900878906, 0.11299896240234375, 0.11865806579589844, 0.12431716918945312, 0.1299762725830078, 0.1356353759765625, 0.1412944793701172, 0.14695358276367188, 0.15261268615722656, 0.15827178955078125, 0.16393089294433594, 0.16958999633789062, 0.1752490997314453, 0.180908203125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 4.0, 4.0, 7.0, 7.0, 7.0, 15.0, 8.0, 13.0, 11.0, 16.0, 24.0, 22.0, 22.0, 19.0, 24.0, 27.0, 23.0, 31.0, 31.0, 24.0, 41.0, 36.0, 33.0, 39.0, 32.0, 41.0, 40.0, 39.0, 35.0, 42.0, 26.0, 36.0, 39.0, 25.0, 27.0, 23.0, 17.0, 20.0, 17.0, 12.0, 9.0, 4.0, 3.0, 6.0, 8.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1925048828125, -0.18637847900390625, -0.1802520751953125, -0.17412567138671875, -0.167999267578125, -0.16187286376953125, -0.1557464599609375, -0.14962005615234375, -0.14349365234375, -0.13736724853515625, -0.1312408447265625, -0.12511444091796875, -0.118988037109375, -0.11286163330078125, -0.1067352294921875, -0.10060882568359375, -0.094482421875, -0.08835601806640625, -0.0822296142578125, -0.07610321044921875, -0.069976806640625, -0.06385040283203125, -0.0577239990234375, -0.05159759521484375, -0.04547119140625, -0.03934478759765625, -0.0332183837890625, -0.02709197998046875, -0.020965576171875, -0.01483917236328125, -0.0087127685546875, -0.00258636474609375, 0.0035400390625, 0.00966644287109375, 0.0157928466796875, 0.02191925048828125, 0.028045654296875, 0.03417205810546875, 0.0402984619140625, 0.04642486572265625, 0.05255126953125, 0.05867767333984375, 0.0648040771484375, 0.07093048095703125, 0.077056884765625, 0.08318328857421875, 0.0893096923828125, 0.09543609619140625, 0.1015625, 0.10768890380859375, 0.1138153076171875, 0.11994171142578125, 0.126068115234375, 0.13219451904296875, 0.1383209228515625, 0.14444732666015625, 0.15057373046875, 0.15670013427734375, 0.1628265380859375, 0.16895294189453125, 0.175079345703125, 0.18120574951171875, 0.1873321533203125, 0.19345855712890625, 0.1995849609375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 4.0, 2.0, 8.0, 12.0, 12.0, 21.0, 39.0, 43.0, 56.0, 118.0, 170.0, 278.0, 458.0, 1022.0, 2201.0, 6310.0, 26908.0, 190291.0, 1936695.0, 1816867.0, 177206.0, 25428.0, 6001.0, 1998.0, 880.0, 487.0, 269.0, 178.0, 113.0, 69.0, 44.0, 29.0, 18.0, 20.0, 13.0, 8.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5009765625, -0.4842681884765625, -0.467559814453125, -0.4508514404296875, -0.43414306640625, -0.4174346923828125, -0.400726318359375, -0.3840179443359375, -0.3673095703125, -0.3506011962890625, -0.333892822265625, -0.3171844482421875, -0.30047607421875, -0.2837677001953125, -0.267059326171875, -0.2503509521484375, -0.233642578125, -0.2169342041015625, -0.200225830078125, -0.1835174560546875, -0.16680908203125, -0.1501007080078125, -0.133392333984375, -0.1166839599609375, -0.0999755859375, -0.0832672119140625, -0.066558837890625, -0.0498504638671875, -0.03314208984375, -0.0164337158203125, 0.000274658203125, 0.0169830322265625, 0.03369140625, 0.0503997802734375, 0.067108154296875, 0.0838165283203125, 0.10052490234375, 0.1172332763671875, 0.133941650390625, 0.1506500244140625, 0.1673583984375, 0.1840667724609375, 0.200775146484375, 0.2174835205078125, 0.23419189453125, 0.2509002685546875, 0.267608642578125, 0.2843170166015625, 0.301025390625, 0.3177337646484375, 0.334442138671875, 0.3511505126953125, 0.36785888671875, 0.3845672607421875, 0.401275634765625, 0.4179840087890625, 0.4346923828125, 0.4514007568359375, 0.468109130859375, 0.4848175048828125, 0.50152587890625, 0.5182342529296875, 0.534942626953125, 0.5516510009765625, 0.568359375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 7.0, 6.0, 6.0, 18.0, 22.0, 22.0, 26.0, 45.0, 55.0, 75.0, 93.0, 138.0, 178.0, 214.0, 321.0, 363.0, 400.0, 395.0, 353.0, 308.0, 292.0, 190.0, 152.0, 115.0, 91.0, 46.0, 49.0, 25.0, 19.0, 16.0, 11.0, 5.0, 7.0, 4.0, 3.0, 1.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.451904296875, -0.4368400573730469, -0.42177581787109375, -0.4067115783691406, -0.3916473388671875, -0.3765830993652344, -0.36151885986328125, -0.3464546203613281, -0.331390380859375, -0.3163261413574219, -0.30126190185546875, -0.2861976623535156, -0.2711334228515625, -0.2560691833496094, -0.24100494384765625, -0.22594070434570312, -0.21087646484375, -0.19581222534179688, -0.18074798583984375, -0.16568374633789062, -0.1506195068359375, -0.13555526733398438, -0.12049102783203125, -0.10542678833007812, -0.090362548828125, -0.07529830932617188, -0.06023406982421875, -0.045169830322265625, -0.0301055908203125, -0.015041351318359375, 2.288818359375e-05, 0.015087127685546875, 0.0301513671875, 0.045215606689453125, 0.06027984619140625, 0.07534408569335938, 0.0904083251953125, 0.10547256469726562, 0.12053680419921875, 0.13560104370117188, 0.150665283203125, 0.16572952270507812, 0.18079376220703125, 0.19585800170898438, 0.2109222412109375, 0.22598648071289062, 0.24105072021484375, 0.2561149597167969, 0.27117919921875, 0.2862434387207031, 0.30130767822265625, 0.3163719177246094, 0.3314361572265625, 0.3465003967285156, 0.36156463623046875, 0.3766288757324219, 0.391693115234375, 0.4067573547363281, 0.42182159423828125, 0.4368858337402344, 0.4519500732421875, 0.4670143127441406, 0.48207855224609375, 0.4971427917480469, 0.51220703125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 3.0, 2.0, 9.0, 4.0, 5.0, 14.0, 18.0, 27.0, 61.0, 69.0, 117.0, 123.0, 138.0, 122.0, 101.0, 71.0, 47.0, 19.0, 17.0, 10.0, 12.0, 6.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4623613357543945, -3.2829596996307373, -3.10355806350708, -2.9241561889648438, -2.7447547912597656, -2.5653529167175293, -2.385951280593872, -2.206549644470215, -2.0271480083465576, -1.8477463722229004, -1.6683447360992432, -1.4889429807662964, -1.3095413446426392, -1.130139708518982, -0.9507379531860352, -0.7713363170623779, -0.5919346809387207, -0.4125330150127411, -0.23313134908676147, -0.05372965335845947, 0.12567198276519775, 0.305073618888855, 0.48447537422180176, 0.663877010345459, 0.8432786464691162, 1.0226802825927734, 1.2020819187164307, 1.3814836740493774, 1.5608853101730347, 1.740286946296692, 1.9196887016296387, 2.099090337753296, 2.278491973876953, 2.4578936100006104, 2.6372952461242676, 2.816697120666504, 2.996098518371582, 3.1755003929138184, 3.3549020290374756, 3.534303665161133, 3.71370530128479, 3.8931069374084473, 4.072508811950684, 4.251910209655762, 4.431312084197998, 4.610713481903076, 4.7901153564453125, 4.969516754150391, 5.148918628692627, 5.328320503234863, 5.507721900939941, 5.687123775482178, 5.866525173187256, 6.045927047729492, 6.22532844543457, 6.404730319976807, 6.584132194519043, 6.763534069061279, 6.942935466766357, 7.122337341308594, 7.301738739013672, 7.481140613555908, 7.6605424880981445, 7.839943885803223, 8.0193452835083]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 4.0, 4.0, 1.0, 4.0, 4.0, 4.0, 6.0, 7.0, 12.0, 16.0, 17.0, 16.0, 13.0, 20.0, 19.0, 26.0, 40.0, 26.0, 41.0, 36.0, 31.0, 43.0, 54.0, 47.0, 44.0, 30.0, 48.0, 31.0, 36.0, 44.0, 33.0, 36.0, 32.0, 38.0, 19.0, 24.0, 16.0, 16.0, 12.0, 10.0, 8.0, 8.0, 5.0, 1.0, 10.0, 7.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.815579891204834, -1.752791166305542, -1.6900023221969604, -1.6272135972976685, -1.5644248723983765, -1.501636028289795, -1.438847303390503, -1.376058578491211, -1.313269853591919, -1.250481128692627, -1.1876922845840454, -1.1249035596847534, -1.0621148347854614, -0.9993260502815247, -0.9365372657775879, -0.8737485408782959, -0.8109596967697144, -0.7481709122657776, -0.6853821873664856, -0.6225934028625488, -0.5598046779632568, -0.49701589345932007, -0.4342271089553833, -0.3714383542537689, -0.30864959955215454, -0.24586084485054016, -0.1830720752477646, -0.12028330564498901, -0.057494550943374634, 0.005294203758239746, 0.06808298826217651, 0.1308717429637909, 0.19366049766540527, 0.25644925236701965, 0.31923800706863403, 0.3820267915725708, 0.4448155462741852, 0.5076043009757996, 0.5703930854797363, 0.6331818103790283, 0.6959705948829651, 0.7587593793869019, 0.8215481042861938, 0.8843368887901306, 0.9471256732940674, 1.0099143981933594, 1.0727031230926514, 1.135491967201233, 1.198280692100525, 1.261069416999817, 1.3238582611083984, 1.3866469860076904, 1.4494357109069824, 1.5122244358062744, 1.575013279914856, 1.637802004814148, 1.7005908489227295, 1.7633795738220215, 1.826168417930603, 1.888957142829895, 1.951745867729187, 2.0145347118377686, 2.0773234367370605, 2.1401121616363525, 2.2029008865356445]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 6.0, 8.0, 13.0, 30.0, 30.0, 40.0, 59.0, 89.0, 115.0, 208.0, 271.0, 467.0, 758.0, 1228.0, 2127.0, 3909.0, 7292.0, 14769.0, 31612.0, 74056.0, 176935.0, 308155.0, 236582.0, 104924.0, 43706.0, 19803.0, 9637.0, 4904.0, 2762.0, 1567.0, 897.0, 557.0, 320.0, 251.0, 159.0, 86.0, 56.0, 58.0, 34.0, 19.0, 11.0, 14.0, 9.0, 7.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1610107421875, -0.15576553344726562, -0.15052032470703125, -0.14527511596679688, -0.1400299072265625, -0.13478469848632812, -0.12953948974609375, -0.12429428100585938, -0.119049072265625, -0.11380386352539062, -0.10855865478515625, -0.10331344604492188, -0.0980682373046875, -0.09282302856445312, -0.08757781982421875, -0.08233261108398438, -0.07708740234375, -0.07184219360351562, -0.06659698486328125, -0.061351776123046875, -0.0561065673828125, -0.050861358642578125, -0.04561614990234375, -0.040370941162109375, -0.035125732421875, -0.029880523681640625, -0.02463531494140625, -0.019390106201171875, -0.0141448974609375, -0.008899688720703125, -0.00365447998046875, 0.001590728759765625, 0.0068359375, 0.012081146240234375, 0.01732635498046875, 0.022571563720703125, 0.0278167724609375, 0.033061981201171875, 0.03830718994140625, 0.043552398681640625, 0.048797607421875, 0.054042816162109375, 0.05928802490234375, 0.06453323364257812, 0.0697784423828125, 0.07502365112304688, 0.08026885986328125, 0.08551406860351562, 0.09075927734375, 0.09600448608398438, 0.10124969482421875, 0.10649490356445312, 0.1117401123046875, 0.11698532104492188, 0.12223052978515625, 0.12747573852539062, 0.132720947265625, 0.13796615600585938, 0.14321136474609375, 0.14845657348632812, 0.1537017822265625, 0.15894699096679688, 0.16419219970703125, 0.16943740844726562, 0.1746826171875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 9.0, 10.0, 9.0, 13.0, 16.0, 17.0, 32.0, 41.0, 39.0, 46.0, 49.0, 46.0, 38.0, 59.0, 46.0, 51.0, 57.0, 50.0, 45.0, 46.0, 55.0, 41.0, 33.0, 28.0, 29.0, 21.0, 17.0, 7.0, 10.0, 6.0, 8.0, 7.0, 3.0, 2.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34423828125, -0.3320579528808594, -0.31987762451171875, -0.3076972961425781, -0.2955169677734375, -0.2833366394042969, -0.27115631103515625, -0.2589759826660156, -0.246795654296875, -0.23461532592773438, -0.22243499755859375, -0.21025466918945312, -0.1980743408203125, -0.18589401245117188, -0.17371368408203125, -0.16153335571289062, -0.14935302734375, -0.13717269897460938, -0.12499237060546875, -0.11281204223632812, -0.1006317138671875, -0.08845138549804688, -0.07627105712890625, -0.06409072875976562, -0.051910400390625, -0.039730072021484375, -0.02754974365234375, -0.015369415283203125, -0.0031890869140625, 0.008991241455078125, 0.02117156982421875, 0.033351898193359375, 0.0455322265625, 0.057712554931640625, 0.06989288330078125, 0.08207321166992188, 0.0942535400390625, 0.10643386840820312, 0.11861419677734375, 0.13079452514648438, 0.142974853515625, 0.15515518188476562, 0.16733551025390625, 0.17951583862304688, 0.1916961669921875, 0.20387649536132812, 0.21605682373046875, 0.22823715209960938, 0.24041748046875, 0.2525978088378906, 0.26477813720703125, 0.2769584655761719, 0.2891387939453125, 0.3013191223144531, 0.31349945068359375, 0.3256797790527344, 0.337860107421875, 0.3500404357910156, 0.36222076416015625, 0.3744010925292969, 0.3865814208984375, 0.3987617492675781, 0.41094207763671875, 0.4231224060058594, 0.435302734375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 2.0, 8.0, 8.0, 13.0, 6.0, 15.0, 18.0, 34.0, 47.0, 61.0, 105.0, 147.0, 235.0, 373.0, 641.0, 1149.0, 2053.0, 4297.0, 9511.0, 25990.0, 85367.0, 396552.0, 393107.0, 84097.0, 25972.0, 9783.0, 4212.0, 2040.0, 1042.0, 615.0, 378.0, 217.0, 158.0, 97.0, 60.0, 46.0, 27.0, 19.0, 23.0, 9.0, 11.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2459716796875, -0.23851776123046875, -0.2310638427734375, -0.22360992431640625, -0.216156005859375, -0.20870208740234375, -0.2012481689453125, -0.19379425048828125, -0.18634033203125, -0.17888641357421875, -0.1714324951171875, -0.16397857666015625, -0.156524658203125, -0.14907073974609375, -0.1416168212890625, -0.13416290283203125, -0.126708984375, -0.11925506591796875, -0.1118011474609375, -0.10434722900390625, -0.096893310546875, -0.08943939208984375, -0.0819854736328125, -0.07453155517578125, -0.06707763671875, -0.05962371826171875, -0.0521697998046875, -0.04471588134765625, -0.037261962890625, -0.02980804443359375, -0.0223541259765625, -0.01490020751953125, -0.0074462890625, 7.62939453125e-06, 0.0074615478515625, 0.01491546630859375, 0.022369384765625, 0.02982330322265625, 0.0372772216796875, 0.04473114013671875, 0.05218505859375, 0.05963897705078125, 0.0670928955078125, 0.07454681396484375, 0.082000732421875, 0.08945465087890625, 0.0969085693359375, 0.10436248779296875, 0.11181640625, 0.11927032470703125, 0.1267242431640625, 0.13417816162109375, 0.141632080078125, 0.14908599853515625, 0.1565399169921875, 0.16399383544921875, 0.17144775390625, 0.17890167236328125, 0.1863555908203125, 0.19380950927734375, 0.201263427734375, 0.20871734619140625, 0.2161712646484375, 0.22362518310546875, 0.2310791015625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 8.0, 9.0, 12.0, 19.0, 28.0, 24.0, 35.0, 60.0, 91.0, 81.0, 103.0, 104.0, 96.0, 77.0, 71.0, 49.0, 30.0, 25.0, 14.0, 18.0, 13.0, 13.0, 4.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3095703125, -1.26458740234375, -1.2196044921875, -1.17462158203125, -1.129638671875, -1.08465576171875, -1.0396728515625, -0.99468994140625, -0.94970703125, -0.90472412109375, -0.8597412109375, -0.81475830078125, -0.769775390625, -0.72479248046875, -0.6798095703125, -0.63482666015625, -0.58984375, -0.54486083984375, -0.4998779296875, -0.45489501953125, -0.409912109375, -0.36492919921875, -0.3199462890625, -0.27496337890625, -0.22998046875, -0.18499755859375, -0.1400146484375, -0.09503173828125, -0.050048828125, -0.00506591796875, 0.0399169921875, 0.08489990234375, 0.1298828125, 0.17486572265625, 0.2198486328125, 0.26483154296875, 0.309814453125, 0.35479736328125, 0.3997802734375, 0.44476318359375, 0.48974609375, 0.53472900390625, 0.5797119140625, 0.62469482421875, 0.669677734375, 0.71466064453125, 0.7596435546875, 0.80462646484375, 0.849609375, 0.89459228515625, 0.9395751953125, 0.98455810546875, 1.029541015625, 1.07452392578125, 1.1195068359375, 1.16448974609375, 1.20947265625, 1.25445556640625, 1.2994384765625, 1.34442138671875, 1.389404296875, 1.43438720703125, 1.4793701171875, 1.52435302734375, 1.5693359375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 1.0, 2.0, 5.0, 2.0, 7.0, 2.0, 5.0, 1.0, 7.0, 4.0, 12.0, 13.0, 21.0, 34.0, 57.0, 115.0, 225.0, 418.0, 1032.0, 3630.0, 55540.0, 902027.0, 79269.0, 4001.0, 1065.0, 440.0, 284.0, 127.0, 65.0, 30.0, 30.0, 16.0, 15.0, 9.0, 10.0, 6.0, 11.0, 6.0, 6.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.1646728515625, -0.15909957885742188, -0.15352630615234375, -0.14795303344726562, -0.1423797607421875, -0.13680648803710938, -0.13123321533203125, -0.12565994262695312, -0.120086669921875, -0.11451339721679688, -0.10894012451171875, -0.10336685180664062, -0.0977935791015625, -0.09222030639648438, -0.08664703369140625, -0.08107376098632812, -0.07550048828125, -0.06992721557617188, -0.06435394287109375, -0.058780670166015625, -0.0532073974609375, -0.047634124755859375, -0.04206085205078125, -0.036487579345703125, -0.030914306640625, -0.025341033935546875, -0.01976776123046875, -0.014194488525390625, -0.0086212158203125, -0.003047943115234375, 0.00252532958984375, 0.008098602294921875, 0.013671875, 0.019245147705078125, 0.02481842041015625, 0.030391693115234375, 0.0359649658203125, 0.041538238525390625, 0.04711151123046875, 0.052684783935546875, 0.058258056640625, 0.06383132934570312, 0.06940460205078125, 0.07497787475585938, 0.0805511474609375, 0.08612442016601562, 0.09169769287109375, 0.09727096557617188, 0.10284423828125, 0.10841751098632812, 0.11399078369140625, 0.11956405639648438, 0.1251373291015625, 0.13071060180664062, 0.13628387451171875, 0.14185714721679688, 0.147430419921875, 0.15300369262695312, 0.15857696533203125, 0.16415023803710938, 0.1697235107421875, 0.17529678344726562, 0.18087005615234375, 0.18644332885742188, 0.1920166015625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 5.0, 1.0, 7.0, 7.0, 12.0, 17.0, 24.0, 28.0, 26.0, 42.0, 59.0, 74.0, 93.0, 85.0, 89.0, 107.0, 76.0, 64.0, 56.0, 36.0, 20.0, 18.0, 20.0, 14.0, 5.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.3603439331054688e-05, -2.2950582206249237e-05, -2.2297725081443787e-05, -2.1644867956638336e-05, -2.0992010831832886e-05, -2.0339153707027435e-05, -1.9686296582221985e-05, -1.9033439457416534e-05, -1.8380582332611084e-05, -1.7727725207805634e-05, -1.7074868083000183e-05, -1.6422010958194733e-05, -1.5769153833389282e-05, -1.5116296708583832e-05, -1.4463439583778381e-05, -1.3810582458972931e-05, -1.315772533416748e-05, -1.250486820936203e-05, -1.185201108455658e-05, -1.1199153959751129e-05, -1.0546296834945679e-05, -9.893439710140228e-06, -9.240582585334778e-06, -8.587725460529327e-06, -7.934868335723877e-06, -7.2820112109184265e-06, -6.629154086112976e-06, -5.976296961307526e-06, -5.323439836502075e-06, -4.670582711696625e-06, -4.017725586891174e-06, -3.364868462085724e-06, -2.7120113372802734e-06, -2.059154212474823e-06, -1.4062970876693726e-06, -7.534399628639221e-07, -1.0058283805847168e-07, 5.522742867469788e-07, 1.2051314115524292e-06, 1.8579885363578796e-06, 2.51084566116333e-06, 3.1637027859687805e-06, 3.816559910774231e-06, 4.469417035579681e-06, 5.122274160385132e-06, 5.775131285190582e-06, 6.427988409996033e-06, 7.080845534801483e-06, 7.733702659606934e-06, 8.386559784412384e-06, 9.039416909217834e-06, 9.692274034023285e-06, 1.0345131158828735e-05, 1.0997988283634186e-05, 1.1650845408439636e-05, 1.2303702533245087e-05, 1.2956559658050537e-05, 1.3609416782855988e-05, 1.4262273907661438e-05, 1.4915131032466888e-05, 1.556798815727234e-05, 1.622084528207779e-05, 1.687370240688324e-05, 1.752655953168869e-05, 1.817941665649414e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 3.0, 2.0, 3.0, 4.0, 7.0, 3.0, 6.0, 11.0, 6.0, 8.0, 12.0, 37.0, 29.0, 44.0, 80.0, 122.0, 173.0, 305.0, 681.0, 1852.0, 6935.0, 38978.0, 337944.0, 587399.0, 60009.0, 9765.0, 2389.0, 797.0, 387.0, 189.0, 124.0, 76.0, 55.0, 42.0, 19.0, 19.0, 12.0, 13.0, 7.0, 3.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.162353515625, -0.1584033966064453, -0.15445327758789062, -0.15050315856933594, -0.14655303955078125, -0.14260292053222656, -0.13865280151367188, -0.1347026824951172, -0.1307525634765625, -0.1268024444580078, -0.12285232543945312, -0.11890220642089844, -0.11495208740234375, -0.11100196838378906, -0.10705184936523438, -0.10310173034667969, -0.099151611328125, -0.09520149230957031, -0.09125137329101562, -0.08730125427246094, -0.08335113525390625, -0.07940101623535156, -0.07545089721679688, -0.07150077819824219, -0.0675506591796875, -0.06360054016113281, -0.059650421142578125, -0.05570030212402344, -0.05175018310546875, -0.04780006408691406, -0.043849945068359375, -0.03989982604980469, -0.03594970703125, -0.03199958801269531, -0.028049468994140625, -0.024099349975585938, -0.02014923095703125, -0.016199111938476562, -0.012248992919921875, -0.008298873901367188, -0.0043487548828125, -0.0003986358642578125, 0.003551483154296875, 0.0075016021728515625, 0.01145172119140625, 0.015401840209960938, 0.019351959228515625, 0.023302078247070312, 0.027252197265625, 0.031202316284179688, 0.035152435302734375, 0.03910255432128906, 0.04305267333984375, 0.04700279235839844, 0.050952911376953125, 0.05490303039550781, 0.0588531494140625, 0.06280326843261719, 0.06675338745117188, 0.07070350646972656, 0.07465362548828125, 0.07860374450683594, 0.08255386352539062, 0.08650398254394531, 0.0904541015625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 6.0, 20.0, 19.0, 26.0, 39.0, 45.0, 54.0, 81.0, 105.0, 131.0, 124.0, 113.0, 68.0, 48.0, 25.0, 27.0, 19.0, 18.0, 7.0, 7.0, 6.0, 6.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28271484375, -0.27582359313964844, -0.2689323425292969, -0.2620410919189453, -0.25514984130859375, -0.2482585906982422, -0.24136734008789062, -0.23447608947753906, -0.2275848388671875, -0.22069358825683594, -0.21380233764648438, -0.2069110870361328, -0.20001983642578125, -0.1931285858154297, -0.18623733520507812, -0.17934608459472656, -0.172454833984375, -0.16556358337402344, -0.15867233276367188, -0.1517810821533203, -0.14488983154296875, -0.1379985809326172, -0.13110733032226562, -0.12421607971191406, -0.1173248291015625, -0.11043357849121094, -0.10354232788085938, -0.09665107727050781, -0.08975982666015625, -0.08286857604980469, -0.07597732543945312, -0.06908607482910156, -0.06219482421875, -0.05530357360839844, -0.048412322998046875, -0.04152107238769531, -0.03462982177734375, -0.027738571166992188, -0.020847320556640625, -0.013956069946289062, -0.0070648193359375, -0.0001735687255859375, 0.006717681884765625, 0.013608932495117188, 0.02050018310546875, 0.027391433715820312, 0.034282684326171875, 0.04117393493652344, 0.048065185546875, 0.05495643615722656, 0.061847686767578125, 0.06873893737792969, 0.07563018798828125, 0.08252143859863281, 0.08941268920898438, 0.09630393981933594, 0.1031951904296875, 0.11008644104003906, 0.11697769165039062, 0.12386894226074219, 0.13076019287109375, 0.1376514434814453, 0.14454269409179688, 0.15143394470214844, 0.1583251953125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 8.0, 11.0, 22.0, 37.0, 98.0, 175.0, 243.0, 201.0, 117.0, 48.0, 20.0, 6.0, 5.0, 4.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.990947961807251, -3.857576847076416, -3.72420597076416, -3.590834856033325, -3.4574637413024902, -3.3240928649902344, -3.1907217502593994, -3.0573506355285645, -2.9239797592163086, -2.7906086444854736, -2.6572377681732178, -2.523866653442383, -2.390495777130127, -2.257124662399292, -2.123753547668457, -1.9903825521469116, -1.8570115566253662, -1.7236405611038208, -1.5902695655822754, -1.4568984508514404, -1.323527455329895, -1.1901564598083496, -1.0567853450775146, -0.9234143495559692, -0.7900433540344238, -0.6566723585128784, -0.5233013033866882, -0.38993027806282043, -0.25655925273895264, -0.12318825721740723, 0.010182797908782959, 0.14355385303497314, 0.27692461013793945, 0.41029563546180725, 0.543666660785675, 0.6770377159118652, 0.8104087114334106, 0.943779706954956, 1.077150821685791, 1.2105218172073364, 1.3438928127288818, 1.4772638082504272, 1.6106348037719727, 1.7440059185028076, 1.877376914024353, 2.0107479095458984, 2.1441190242767334, 2.2774901390075684, 2.410861015319824, 2.544232130050659, 2.677603006362915, 2.81097412109375, 2.944344997406006, 3.077716112136841, 3.211087226867676, 3.3444581031799316, 3.4778292179107666, 3.6112003326416016, 3.7445712089538574, 3.8779423236846924, 4.011313438415527, 4.144684314727783, 4.278055191040039, 4.411426544189453, 4.544797420501709]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 7.0, 6.0, 6.0, 20.0, 27.0, 44.0, 60.0, 84.0, 98.0, 132.0, 148.0, 131.0, 69.0, 72.0, 38.0, 22.0, 17.0, 12.0, 6.0, 3.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8151190280914307, -3.604804515838623, -3.3944902420043945, -3.184175729751587, -2.9738612174987793, -2.763546943664551, -2.553232431411743, -2.3429179191589355, -2.132603645324707, -1.922289252281189, -1.7119747400283813, -1.5016603469848633, -1.2913458347320557, -1.0810314416885376, -0.8707170486450195, -0.6604025363922119, -0.4500880241394043, -0.23977358639240265, -0.029459148645401, 0.18085527420043945, 0.3911697268486023, 0.6014841794967651, 0.8117985725402832, 1.0221130847930908, 1.2324274778366089, 1.442741870880127, 1.6530563831329346, 1.8633707761764526, 2.0736851692199707, 2.2839996814727783, 2.494314193725586, 2.7046284675598145, 2.914943218231201, 3.125257730484009, 3.3355720043182373, 3.545886516571045, 3.7562010288238525, 3.96651554107666, 4.176829814910889, 4.387144088745117, 4.597458839416504, 4.807773113250732, 5.018087863922119, 5.228402137756348, 5.438716411590576, 5.649031162261963, 5.859345436096191, 6.069660186767578, 6.279973983764648, 6.490288257598877, 6.700603008270264, 6.910917282104492, 7.121231555938721, 7.331546306610107, 7.541860580444336, 7.752175331115723, 7.962489604949951, 8.17280387878418, 8.383118629455566, 8.593433380126953, 8.803747177124023, 9.01406192779541, 9.224376678466797, 9.434690475463867, 9.645005226135254]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 9.0, 4.0, 11.0, 14.0, 16.0, 40.0, 53.0, 85.0, 291.0, 277.0, 63.0, 50.0, 32.0, 18.0, 16.0, 17.0, 6.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.433837890625, -0.4048271179199219, -0.37581634521484375, -0.3468055725097656, -0.3177947998046875, -0.2887840270996094, -0.25977325439453125, -0.23076248168945312, -0.201751708984375, -0.17274093627929688, -0.14373016357421875, -0.11471939086914062, -0.0857086181640625, -0.056697845458984375, -0.02768707275390625, 0.001323699951171875, 0.03033447265625, 0.059345245361328125, 0.08835601806640625, 0.11736679077148438, 0.1463775634765625, 0.17538833618164062, 0.20439910888671875, 0.23340988159179688, 0.262420654296875, 0.2914314270019531, 0.32044219970703125, 0.3494529724121094, 0.3784637451171875, 0.4074745178222656, 0.43648529052734375, 0.4654960632324219, 0.4945068359375, 0.5235176086425781, 0.5525283813476562, 0.5815391540527344, 0.6105499267578125, 0.6395606994628906, 0.6685714721679688, 0.6975822448730469, 0.726593017578125, 0.7556037902832031, 0.7846145629882812, 0.8136253356933594, 0.8426361083984375, 0.8716468811035156, 0.9006576538085938, 0.9296684265136719, 0.95867919921875, 0.9876899719238281, 1.0167007446289062, 1.0457115173339844, 1.0747222900390625, 1.1037330627441406, 1.1327438354492188, 1.1617546081542969, 1.190765380859375, 1.2197761535644531, 1.2487869262695312, 1.2777976989746094, 1.3068084716796875, 1.3358192443847656, 1.3648300170898438, 1.3938407897949219, 1.4228515625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 2.0, 8.0, 8.0, 11.0, 12.0, 13.0, 26.0, 25.0, 42.0, 59.0, 99.0, 134.0, 214.0, 316.0, 690.0, 1329.0, 3099.0, 8935.0, 49167.0, 8267784.0, 43449.0, 8082.0, 2674.0, 1133.0, 554.0, 286.0, 152.0, 89.0, 52.0, 56.0, 27.0, 20.0, 12.0, 6.0, 7.0, 7.0, 4.0, 2.0, 4.0, 3.0, 2.0, 0.0, 1.0], "bins": [-1.5676206350326538, -1.5289087295532227, -1.4901968240737915, -1.4514849185943604, -1.4127731323242188, -1.3740612268447876, -1.3353493213653564, -1.2966374158859253, -1.2579255104064941, -1.219213604927063, -1.1805016994476318, -1.1417899131774902, -1.103078007698059, -1.064366102218628, -1.0256541967391968, -0.9869422912597656, -0.9482304453849792, -0.9095185399055481, -0.8708066940307617, -0.8320947885513306, -0.7933828830718994, -0.7546709775924683, -0.7159591317176819, -0.6772472262382507, -0.6385353803634644, -0.5998234748840332, -0.5611116290092468, -0.5223997235298157, -0.4836878180503845, -0.44497594237327576, -0.406264066696167, -0.36755216121673584, -0.3288401961326599, -0.29012832045555115, -0.25141641497612, -0.21270453929901123, -0.17399264872074127, -0.1352807581424713, -0.09656888246536255, -0.057856976985931396, -0.019145101308822632, 0.019566785544157028, 0.05827867239713669, 0.09699055552482605, 0.135702446103096, 0.17441433668136597, 0.21312621235847473, 0.2518381178379059, 0.29054999351501465, 0.3292618691921234, 0.36797377467155457, 0.40668565034866333, 0.4453975558280945, 0.48410943150520325, 0.522821307182312, 0.5615332126617432, 0.6002451181411743, 0.6389570236206055, 0.6776688694953918, 0.716380774974823, 0.7550926804542542, 0.7938045263290405, 0.8325164318084717, 0.8712283372879028, 0.9099401831626892]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 4.0, 1.0, 4.0, 3.0, 3.0, 0.0, 4.0, 5.0, 1.0, 5.0, 2.0, 3.0, 1.0, 0.0, 4.0, 6.0, 2.0, 6.0, 3.0, 2.0, 1.0, 4.0, 5.0, 6.0, 2.0, 5.0, 3.0, 2.0, 3.0, 0.0, 2.0, 4.0, 0.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.59829843044281, -1.550153374671936, -1.5020081996917725, -1.4538631439208984, -1.4057179689407349, -1.3575729131698608, -1.3094277381896973, -1.2612826824188232, -1.2131376266479492, -1.1649925708770752, -1.1168473958969116, -1.0687023401260376, -1.020557165145874, -0.972412109375, -0.9242669939994812, -0.8761218786239624, -0.8279767632484436, -0.7798316478729248, -0.731686532497406, -0.6835414171218872, -0.6353963613510132, -0.5872512459754944, -0.5391061305999756, -0.4909610450267792, -0.4428159296512604, -0.3946708142757416, -0.34652572870254517, -0.29838061332702637, -0.25023549795150757, -0.20209041237831116, -0.15394529700279236, -0.10580021142959595, -0.05765509605407715, -0.009509991854429245, 0.03863511234521866, 0.08678022027015686, 0.13492532074451447, 0.18307042121887207, 0.23121553659439087, 0.2793606221675873, 0.3275057375431061, 0.3756508529186249, 0.4237959384918213, 0.4719410538673401, 0.5200861692428589, 0.5682312250137329, 0.6163763999938965, 0.6645214557647705, 0.7126665711402893, 0.7608116865158081, 0.8089568018913269, 0.8571019172668457, 0.9052469730377197, 0.9533920884132385, 1.0015372037887573, 1.0496822595596313, 1.097827434539795, 1.145972490310669, 1.1941176652908325, 1.2422627210617065, 1.2904078960418701, 1.3385529518127441, 1.3866980075836182, 1.4348431825637817, 1.4829882383346558]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 6.0, 16.0, 28.0, 26.0, 36.0, 51.0, 73.0, 68.0, 80.0, 75.0, 83.0, 70.0, 66.0, 54.0, 56.0, 57.0, 38.0, 29.0, 26.0, 17.0, 11.0, 8.0, 11.0, 2.0, 5.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2230224609375, -0.21202659606933594, -0.20103073120117188, -0.1900348663330078, -0.17903900146484375, -0.1680431365966797, -0.15704727172851562, -0.14605140686035156, -0.1350555419921875, -0.12405967712402344, -0.11306381225585938, -0.10206794738769531, -0.09107208251953125, -0.08007621765136719, -0.06908035278320312, -0.05808448791503906, -0.047088623046875, -0.03609275817871094, -0.025096893310546875, -0.014101028442382812, -0.00310516357421875, 0.007890701293945312, 0.018886566162109375, 0.029882431030273438, 0.0408782958984375, 0.05187416076660156, 0.06287002563476562, 0.07386589050292969, 0.08486175537109375, 0.09585762023925781, 0.10685348510742188, 0.11784934997558594, 0.12884521484375, 0.13984107971191406, 0.15083694458007812, 0.1618328094482422, 0.17282867431640625, 0.1838245391845703, 0.19482040405273438, 0.20581626892089844, 0.2168121337890625, 0.22780799865722656, 0.23880386352539062, 0.2497997283935547, 0.26079559326171875, 0.2717914581298828, 0.2827873229980469, 0.29378318786621094, 0.304779052734375, 0.31577491760253906, 0.3267707824707031, 0.3377666473388672, 0.34876251220703125, 0.3597583770751953, 0.3707542419433594, 0.38175010681152344, 0.3927459716796875, 0.40374183654785156, 0.4147377014160156, 0.4257335662841797, 0.43672943115234375, 0.4477252960205078, 0.4587211608886719, 0.46971702575683594, 0.480712890625]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 8.0, 11.0, 8.0, 23.0, 22.0, 57.0, 83.0, 112.0, 175.0, 238.0, 327.0, 514.0, 789.0, 1363.0, 2220.0, 3937.0, 7053.0, 13373.0, 28373.0, 73390.0, 172369.0, 128649.0, 47028.0, 20292.0, 10237.0, 5552.0, 3061.0, 1885.0, 1085.0, 690.0, 456.0, 304.0, 177.0, 116.0, 86.0, 64.0, 53.0, 26.0, 24.0, 15.0, 13.0, 10.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2578125, -2.17352294921875, -2.0892333984375, -2.00494384765625, -1.920654296875, -1.83636474609375, -1.7520751953125, -1.66778564453125, -1.58349609375, -1.49920654296875, -1.4149169921875, -1.33062744140625, -1.246337890625, -1.16204833984375, -1.0777587890625, -0.99346923828125, -0.9091796875, -0.82489013671875, -0.7406005859375, -0.65631103515625, -0.572021484375, -0.48773193359375, -0.4034423828125, -0.31915283203125, -0.23486328125, -0.15057373046875, -0.0662841796875, 0.01800537109375, 0.102294921875, 0.18658447265625, 0.2708740234375, 0.35516357421875, 0.439453125, 0.52374267578125, 0.6080322265625, 0.69232177734375, 0.776611328125, 0.86090087890625, 0.9451904296875, 1.02947998046875, 1.11376953125, 1.19805908203125, 1.2823486328125, 1.36663818359375, 1.450927734375, 1.53521728515625, 1.6195068359375, 1.70379638671875, 1.7880859375, 1.87237548828125, 1.9566650390625, 2.04095458984375, 2.125244140625, 2.20953369140625, 2.2938232421875, 2.37811279296875, 2.46240234375, 2.54669189453125, 2.6309814453125, 2.71527099609375, 2.799560546875, 2.88385009765625, 2.9681396484375, 3.05242919921875, 3.13671875]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 6.0, 6.0, 9.0, 7.0, 6.0, 16.0, 19.0, 18.0, 19.0, 21.0, 36.0, 29.0, 29.0, 45.0, 48.0, 48.0, 50.0, 50.0, 47.0, 59.0, 55.0, 54.0, 33.0, 39.0, 36.0, 29.0, 23.0, 27.0, 32.0, 19.0, 17.0, 10.0, 12.0, 6.0, 11.0, 9.0, 4.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.289794921875, -0.27982330322265625, -0.2698516845703125, -0.25988006591796875, -0.249908447265625, -0.23993682861328125, -0.2299652099609375, -0.21999359130859375, -0.21002197265625, -0.20005035400390625, -0.1900787353515625, -0.18010711669921875, -0.170135498046875, -0.16016387939453125, -0.1501922607421875, -0.14022064208984375, -0.1302490234375, -0.12027740478515625, -0.1103057861328125, -0.10033416748046875, -0.090362548828125, -0.08039093017578125, -0.0704193115234375, -0.06044769287109375, -0.05047607421875, -0.04050445556640625, -0.0305328369140625, -0.02056121826171875, -0.010589599609375, -0.00061798095703125, 0.0093536376953125, 0.01932525634765625, 0.029296875, 0.03926849365234375, 0.0492401123046875, 0.05921173095703125, 0.069183349609375, 0.07915496826171875, 0.0891265869140625, 0.09909820556640625, 0.10906982421875, 0.11904144287109375, 0.1290130615234375, 0.13898468017578125, 0.148956298828125, 0.15892791748046875, 0.1688995361328125, 0.17887115478515625, 0.1888427734375, 0.19881439208984375, 0.2087860107421875, 0.21875762939453125, 0.228729248046875, 0.23870086669921875, 0.2486724853515625, 0.25864410400390625, 0.26861572265625, 0.27858734130859375, 0.2885589599609375, 0.29853057861328125, 0.308502197265625, 0.31847381591796875, 0.3284454345703125, 0.33841705322265625, 0.348388671875]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 3.0, 2.0, 11.0, 7.0, 5.0, 4.0, 6.0, 13.0, 10.0, 12.0, 19.0, 21.0, 42.0, 39.0, 47.0, 49.0, 37.0, 28.0, 26.0, 17.0, 22.0, 11.0, 13.0, 14.0, 6.0, 6.0, 5.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.9147651791572571, -0.8852911591529846, -0.8558171391487122, -0.8263431191444397, -0.796869158744812, -0.7673951387405396, -0.7379211187362671, -0.7084470987319946, -0.6789730787277222, -0.6494990587234497, -0.6200250387191772, -0.5905510187149048, -0.5610769987106323, -0.5316029787063599, -0.5021290183067322, -0.4726549983024597, -0.44318097829818726, -0.4137069582939148, -0.38423293828964233, -0.35475894808769226, -0.3252849280834198, -0.29581090807914734, -0.26633691787719727, -0.2368628978729248, -0.20738887786865234, -0.17791485786437988, -0.14844085276126862, -0.11896684020757675, -0.08949282765388489, -0.06001880764961243, -0.03054480254650116, -0.0010707974433898926, 0.02840322256088257, 0.05787723511457443, 0.0873512476682663, 0.11682526022195816, 0.14629927277565002, 0.17577329277992249, 0.20524729788303375, 0.23472130298614502, 0.2641953229904175, 0.29366934299468994, 0.3231433629989624, 0.3526173532009125, 0.38209137320518494, 0.4115653932094574, 0.44103938341140747, 0.47051340341567993, 0.4999874234199524, 0.5294614434242249, 0.5589354634284973, 0.5884094834327698, 0.6178834438323975, 0.6473574638366699, 0.6768314838409424, 0.7063055038452148, 0.7357795238494873, 0.7652535438537598, 0.7947275638580322, 0.8242015838623047, 0.8536756038665771, 0.8831496238708496, 0.9126235842704773, 0.9420976042747498, 0.9715716242790222]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 0.0, 8.0, 2.0, 5.0, 6.0, 11.0, 6.0, 9.0, 18.0, 21.0, 46.0, 69.0, 97.0, 58.0, 34.0, 17.0, 7.0, 14.0, 7.0, 10.0, 10.0, 7.0, 5.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.169240951538086, -2.112114191055298, -2.0549871921539307, -1.9978604316711426, -1.9407336711883545, -1.8836067914962769, -1.8264799118041992, -1.7693531513214111, -1.7122262716293335, -1.6550993919372559, -1.5979726314544678, -1.5408457517623901, -1.4837188720703125, -1.4265921115875244, -1.3694652318954468, -1.3123383522033691, -1.255211591720581, -1.1980847120285034, -1.1409579515457153, -1.0838310718536377, -1.0267043113708496, -0.969577431678772, -0.9124505519866943, -0.8553237318992615, -0.7981969118118286, -0.7410700917243958, -0.6839432716369629, -0.6268163919448853, -0.5696895718574524, -0.5125627517700195, -0.4554359018802643, -0.39830905199050903, -0.34118223190307617, -0.2840554118156433, -0.22692856192588806, -0.169801726937294, -0.11267489194869995, -0.05554807186126709, 0.0015787780284881592, 0.05870562791824341, 0.11583244800567627, 0.17295928299427032, 0.23008611798286438, 0.28721296787261963, 0.3443397879600525, 0.40146660804748535, 0.4585934579372406, 0.5157203078269958, 0.5728471279144287, 0.6299739480018616, 0.6871007680892944, 0.7442276477813721, 0.8013544678688049, 0.8584812879562378, 0.9156081676483154, 0.9727349877357483, 1.0298618078231812, 1.0869886875152588, 1.1441154479980469, 1.2012423276901245, 1.2583692073822021, 1.3154959678649902, 1.3726228475570679, 1.4297497272491455, 1.4868764877319336]}, "eval/loss": 1.776824951171875, "eval/bleu": 1.3741745601573323e-19, "eval/runtime": 2494.6636, "eval/samples_per_second": 5.917, "eval/steps_per_second": 0.74} \ No newline at end of file +{"train/loss": 0.4551, "train/learning_rate": 4.81651376146789e-07, "train/epoch": 3.0, "train/global_step": 4860, "_runtime": 68105, "_timestamp": 1651840403, "_step": 4869, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 8.0, 24.0, 77.0, 200.0, 276.0, 254.0, 130.0, 42.0, 4.0, 3.0], "bins": [-13.15886116027832, -12.93422794342041, -12.709595680236816, -12.484962463378906, -12.260329246520996, -12.035696029663086, -11.811063766479492, -11.586430549621582, -11.361797332763672, -11.137164115905762, -10.912531852722168, -10.687898635864258, -10.463265419006348, -10.238632202148438, -10.013999938964844, -9.789366722106934, -9.564733505249023, -9.340100288391113, -9.11546802520752, -8.89083480834961, -8.6662015914917, -8.441568374633789, -8.216936111450195, -7.992302894592285, -7.767670154571533, -7.543037414550781, -7.318404197692871, -7.093771457672119, -6.869138240814209, -6.644505500793457, -6.419872283935547, -6.195239543914795, -5.970605850219727, -5.745973110198975, -5.5213398933410645, -5.2967071533203125, -5.072073936462402, -4.84744119644165, -4.62280797958374, -4.398175239562988, -4.173542499542236, -3.9489095211029053, -3.724276542663574, -3.499643564224243, -3.275010585784912, -3.05037784576416, -2.82574462890625, -2.601111888885498, -2.376478672027588, -2.151845693588257, -1.9272127151489258, -1.7025797367095947, -1.4779467582702637, -1.2533138990402222, -1.0286809206008911, -0.8040479421615601, -0.579414963722229, -0.35478198528289795, -0.13014903664588928, 0.09448391199111938, 0.31911689043045044, 0.5437498092651367, 0.7683827877044678, 0.9930157661437988, 1.2176487445831299]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 1.0, 3.0, 2.0, 7.0, 3.0, 5.0, 8.0, 7.0, 10.0, 7.0, 18.0, 16.0, 18.0, 17.0, 24.0, 28.0, 27.0, 25.0, 26.0, 35.0, 41.0, 41.0, 37.0, 31.0, 27.0, 41.0, 43.0, 30.0, 34.0, 42.0, 36.0, 29.0, 32.0, 24.0, 23.0, 34.0, 31.0, 18.0, 18.0, 15.0, 16.0, 15.0, 10.0, 13.0, 10.0, 12.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0], "bins": [-1.609847068786621, -1.5599985122680664, -1.5101499557495117, -1.460301399230957, -1.4104528427124023, -1.3606042861938477, -1.310755729675293, -1.2609070539474487, -1.211058497428894, -1.1612099409103394, -1.1113613843917847, -1.06151282787323, -1.0116642713546753, -0.9618156552314758, -0.9119670987129211, -0.8621184825897217, -0.8122699856758118, -0.7624214291572571, -0.7125728726387024, -0.6627242565155029, -0.6128756999969482, -0.5630271434783936, -0.5131785869598389, -0.4633300006389618, -0.4134814441204071, -0.3636328876018524, -0.31378430128097534, -0.26393574476242065, -0.21408717334270477, -0.1642386019229889, -0.1143900454044342, -0.06454145908355713, -0.014692902565002441, 0.03515566512942314, 0.08500423282384872, 0.134852796792984, 0.1847013682126999, 0.23454993963241577, 0.28439849615097046, 0.33424708247184753, 0.3840956389904022, 0.4339441955089569, 0.483792781829834, 0.5336413383483887, 0.5834898948669434, 0.633338451385498, 0.6831870079040527, 0.7330356240272522, 0.7828841805458069, 0.8327327370643616, 0.8825812935829163, 0.9324299097061157, 0.9822784662246704, 1.032127022743225, 1.0819755792617798, 1.1318241357803345, 1.1816726922988892, 1.2315212488174438, 1.2813698053359985, 1.3312183618545532, 1.381066918373108, 1.4309155941009521, 1.4807641506195068, 1.5306127071380615, 1.5804612636566162]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 9.0, 5.0, 8.0, 16.0, 28.0, 46.0, 40.0, 73.0, 102.0, 134.0, 157.0, 293.0, 338.0, 546.0, 749.0, 1176.0, 1810.0, 2857.0, 4651.0, 8396.0, 16287.0, 37908.0, 115356.0, 476382.0, 2094334.0, 1074426.0, 235549.0, 68808.0, 25514.0, 11907.0, 6186.0, 3737.0, 2177.0, 1404.0, 914.0, 626.0, 409.0, 273.0, 170.0, 153.0, 96.0, 76.0, 47.0, 39.0, 14.0, 24.0, 11.0, 7.0, 5.0, 5.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0], "bins": [-3.22265625, -3.124267578125, -3.02587890625, -2.927490234375, -2.8291015625, -2.730712890625, -2.63232421875, -2.533935546875, -2.435546875, -2.337158203125, -2.23876953125, -2.140380859375, -2.0419921875, -1.943603515625, -1.84521484375, -1.746826171875, -1.6484375, -1.550048828125, -1.45166015625, -1.353271484375, -1.2548828125, -1.156494140625, -1.05810546875, -0.959716796875, -0.861328125, -0.762939453125, -0.66455078125, -0.566162109375, -0.4677734375, -0.369384765625, -0.27099609375, -0.172607421875, -0.07421875, 0.024169921875, 0.12255859375, 0.220947265625, 0.3193359375, 0.417724609375, 0.51611328125, 0.614501953125, 0.712890625, 0.811279296875, 0.90966796875, 1.008056640625, 1.1064453125, 1.204833984375, 1.30322265625, 1.401611328125, 1.5, 1.598388671875, 1.69677734375, 1.795166015625, 1.8935546875, 1.991943359375, 2.09033203125, 2.188720703125, 2.287109375, 2.385498046875, 2.48388671875, 2.582275390625, 2.6806640625, 2.779052734375, 2.87744140625, 2.975830078125, 3.07421875]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 7.0, 4.0, 9.0, 9.0, 6.0, 5.0, 11.0, 10.0, 10.0, 14.0, 12.0, 18.0, 24.0, 17.0, 24.0, 24.0, 32.0, 28.0, 37.0, 46.0, 35.0, 32.0, 50.0, 41.0, 46.0, 41.0, 41.0, 36.0, 38.0, 34.0, 37.0, 31.0, 21.0, 23.0, 15.0, 20.0, 20.0, 24.0, 11.0, 14.0, 10.0, 7.0, 13.0, 2.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0], "bins": [-2.61328125, -2.533538818359375, -2.45379638671875, -2.374053955078125, -2.2943115234375, -2.214569091796875, -2.13482666015625, -2.055084228515625, -1.975341796875, -1.895599365234375, -1.81585693359375, -1.736114501953125, -1.6563720703125, -1.576629638671875, -1.49688720703125, -1.417144775390625, -1.33740234375, -1.257659912109375, -1.17791748046875, -1.098175048828125, -1.0184326171875, -0.938690185546875, -0.85894775390625, -0.779205322265625, -0.699462890625, -0.619720458984375, -0.53997802734375, -0.460235595703125, -0.3804931640625, -0.300750732421875, -0.22100830078125, -0.141265869140625, -0.0615234375, 0.018218994140625, 0.09796142578125, 0.177703857421875, 0.2574462890625, 0.337188720703125, 0.41693115234375, 0.496673583984375, 0.576416015625, 0.656158447265625, 0.73590087890625, 0.815643310546875, 0.8953857421875, 0.975128173828125, 1.05487060546875, 1.134613037109375, 1.21435546875, 1.294097900390625, 1.37384033203125, 1.453582763671875, 1.5333251953125, 1.613067626953125, 1.69281005859375, 1.772552490234375, 1.852294921875, 1.932037353515625, 2.01177978515625, 2.091522216796875, 2.1712646484375, 2.251007080078125, 2.33074951171875, 2.410491943359375, 2.490234375]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 0.0, 9.0, 3.0, 9.0, 3.0, 20.0, 10.0, 30.0, 38.0, 50.0, 90.0, 134.0, 227.0, 728.0, 22791.0, 4165919.0, 3273.0, 468.0, 165.0, 101.0, 53.0, 50.0, 19.0, 22.0, 20.0, 17.0, 8.0, 10.0, 4.0, 2.0, 3.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.875, -25.67041015625, -24.4658203125, -23.26123046875, -22.056640625, -20.85205078125, -19.6474609375, -18.44287109375, -17.23828125, -16.03369140625, -14.8291015625, -13.62451171875, -12.419921875, -11.21533203125, -10.0107421875, -8.80615234375, -7.6015625, -6.39697265625, -5.1923828125, -3.98779296875, -2.783203125, -1.57861328125, -0.3740234375, 0.83056640625, 2.03515625, 3.23974609375, 4.4443359375, 5.64892578125, 6.853515625, 8.05810546875, 9.2626953125, 10.46728515625, 11.671875, 12.87646484375, 14.0810546875, 15.28564453125, 16.490234375, 17.69482421875, 18.8994140625, 20.10400390625, 21.30859375, 22.51318359375, 23.7177734375, 24.92236328125, 26.126953125, 27.33154296875, 28.5361328125, 29.74072265625, 30.9453125, 32.14990234375, 33.3544921875, 34.55908203125, 35.763671875, 36.96826171875, 38.1728515625, 39.37744140625, 40.58203125, 41.78662109375, 42.9912109375, 44.19580078125, 45.400390625, 46.60498046875, 47.8095703125, 49.01416015625, 50.21875]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 5.0, 5.0, 4.0, 7.0, 13.0, 21.0, 30.0, 30.0, 60.0, 78.0, 135.0, 195.0, 464.0, 1137.0, 958.0, 399.0, 182.0, 110.0, 63.0, 54.0, 22.0, 27.0, 20.0, 15.0, 10.0, 10.0, 8.0, 6.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.234375, -1.180572509765625, -1.12677001953125, -1.072967529296875, -1.0191650390625, -0.965362548828125, -0.91156005859375, -0.857757568359375, -0.803955078125, -0.750152587890625, -0.69635009765625, -0.642547607421875, -0.5887451171875, -0.534942626953125, -0.48114013671875, -0.427337646484375, -0.37353515625, -0.319732666015625, -0.26593017578125, -0.212127685546875, -0.1583251953125, -0.104522705078125, -0.05072021484375, 0.003082275390625, 0.056884765625, 0.110687255859375, 0.16448974609375, 0.218292236328125, 0.2720947265625, 0.325897216796875, 0.37969970703125, 0.433502197265625, 0.4873046875, 0.541107177734375, 0.59490966796875, 0.648712158203125, 0.7025146484375, 0.756317138671875, 0.81011962890625, 0.863922119140625, 0.917724609375, 0.971527099609375, 1.02532958984375, 1.079132080078125, 1.1329345703125, 1.186737060546875, 1.24053955078125, 1.294342041015625, 1.34814453125, 1.401947021484375, 1.45574951171875, 1.509552001953125, 1.5633544921875, 1.617156982421875, 1.67095947265625, 1.724761962890625, 1.778564453125, 1.832366943359375, 1.88616943359375, 1.939971923828125, 1.9937744140625, 2.047576904296875, 2.10137939453125, 2.155181884765625, 2.208984375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 17.0, 17.0, 29.0, 43.0, 65.0, 67.0, 100.0, 113.0, 111.0, 131.0, 89.0, 71.0, 55.0, 39.0, 24.0, 15.0, 7.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.697394847869873, -5.486917972564697, -5.276440620422363, -5.0659637451171875, -4.855486869812012, -4.645009517669678, -4.434532642364502, -4.224055290222168, -4.013578414916992, -3.8031013011932373, -3.5926244258880615, -3.3821473121643066, -3.1716701984405518, -2.961193084716797, -2.750716209411621, -2.540239095687866, -2.3297622203826904, -2.1192851066589355, -1.9088081121444702, -1.6983311176300049, -1.48785400390625, -1.2773770093917847, -1.0669000148773193, -0.8564229011535645, -0.6459459066390991, -0.435468852519989, -0.2249918282032013, -0.014514803886413574, 0.19596225023269653, 0.40643930435180664, 0.616916298866272, 0.8273934125900269, 1.0378704071044922, 1.2483474016189575, 1.4588245153427124, 1.6693015098571777, 1.8797786235809326, 2.0902557373046875, 2.3007326126098633, 2.511209726333618, 2.721686840057373, 2.932163953781128, 3.1426408290863037, 3.3531179428100586, 3.5635950565338135, 3.7740721702575684, 3.984549045562744, 4.195026397705078, 4.405503273010254, 4.61598014831543, 4.826457500457764, 5.0369343757629395, 5.247411251068115, 5.457888603210449, 5.668365478515625, 5.878842353820801, 6.089319229125977, 6.299796104431152, 6.510273456573486, 6.720750331878662, 6.931227207183838, 7.141704559326172, 7.352181434631348, 7.562658309936523, 7.773135662078857]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 8.0, 4.0, 4.0, 13.0, 11.0, 11.0, 17.0, 10.0, 19.0, 13.0, 21.0, 16.0, 34.0, 20.0, 34.0, 46.0, 37.0, 46.0, 64.0, 46.0, 42.0, 37.0, 36.0, 55.0, 34.0, 28.0, 40.0, 34.0, 38.0, 27.0, 21.0, 18.0, 15.0, 14.0, 18.0, 20.0, 12.0, 10.0, 12.0, 3.0, 2.0, 3.0, 4.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9105145931243896, -2.8235185146331787, -2.736522674560547, -2.649526596069336, -2.562530517578125, -2.475534677505493, -2.3885385990142822, -2.3015427589416504, -2.2145466804504395, -2.1275506019592285, -2.0405547618865967, -1.9535586833953857, -1.8665627241134644, -1.779566764831543, -1.692570686340332, -1.6055747270584106, -1.5185787677764893, -1.4315828084945679, -1.3445868492126465, -1.2575907707214355, -1.1705948114395142, -1.0835988521575928, -0.9966028332710266, -0.9096068143844604, -0.8226108551025391, -0.7356148958206177, -0.6486188769340515, -0.5616228580474854, -0.47462689876556396, -0.3876309096813202, -0.3006349205970764, -0.21363890171051025, -0.12664294242858887, -0.03964695334434509, 0.04734903573989868, 0.13434502482414246, 0.22134101390838623, 0.30833700299263, 0.3953329920768738, 0.48232901096343994, 0.5693249702453613, 0.6563209295272827, 0.7433169484138489, 0.830312967300415, 0.9173089265823364, 1.0043048858642578, 1.0913009643554688, 1.1782969236373901, 1.2652928829193115, 1.352288842201233, 1.4392848014831543, 1.5262808799743652, 1.6132768392562866, 1.700272798538208, 1.787268877029419, 1.8742648363113403, 1.9612607955932617, 2.0482568740844727, 2.1352527141571045, 2.2222487926483154, 2.3092446327209473, 2.396240711212158, 2.483236789703369, 2.57023286819458, 2.657228708267212]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 7.0, 9.0, 13.0, 22.0, 30.0, 37.0, 44.0, 61.0, 79.0, 121.0, 165.0, 288.0, 364.0, 566.0, 780.0, 1253.0, 2011.0, 3341.0, 5704.0, 10887.0, 21374.0, 46147.0, 102860.0, 211023.0, 286573.0, 186015.0, 87086.0, 39820.0, 18798.0, 9522.0, 5223.0, 2990.0, 1854.0, 1112.0, 738.0, 480.0, 329.0, 216.0, 188.0, 141.0, 88.0, 52.0, 41.0, 32.0, 23.0, 16.0, 10.0, 8.0, 4.0, 6.0, 5.0, 3.0, 3.0], "bins": [-1.197265625, -1.1634445190429688, -1.1296234130859375, -1.0958023071289062, -1.061981201171875, -1.0281600952148438, -0.9943389892578125, -0.9605178833007812, -0.92669677734375, -0.8928756713867188, -0.8590545654296875, -0.8252334594726562, -0.791412353515625, -0.7575912475585938, -0.7237701416015625, -0.6899490356445312, -0.6561279296875, -0.6223068237304688, -0.5884857177734375, -0.5546646118164062, -0.520843505859375, -0.48702239990234375, -0.4532012939453125, -0.41938018798828125, -0.38555908203125, -0.35173797607421875, -0.3179168701171875, -0.28409576416015625, -0.250274658203125, -0.21645355224609375, -0.1826324462890625, -0.14881134033203125, -0.114990234375, -0.08116912841796875, -0.0473480224609375, -0.01352691650390625, 0.020294189453125, 0.05411529541015625, 0.0879364013671875, 0.12175750732421875, 0.15557861328125, 0.18939971923828125, 0.2232208251953125, 0.25704193115234375, 0.290863037109375, 0.32468414306640625, 0.3585052490234375, 0.39232635498046875, 0.4261474609375, 0.45996856689453125, 0.4937896728515625, 0.5276107788085938, 0.561431884765625, 0.5952529907226562, 0.6290740966796875, 0.6628952026367188, 0.69671630859375, 0.7305374145507812, 0.7643585205078125, 0.7981796264648438, 0.832000732421875, 0.8658218383789062, 0.8996429443359375, 0.9334640502929688, 0.96728515625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 4.0, 3.0, 7.0, 8.0, 6.0, 12.0, 19.0, 9.0, 13.0, 25.0, 27.0, 29.0, 29.0, 40.0, 47.0, 39.0, 58.0, 59.0, 56.0, 50.0, 54.0, 43.0, 48.0, 43.0, 43.0, 32.0, 38.0, 42.0, 21.0, 13.0, 15.0, 19.0, 17.0, 16.0, 7.0, 5.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.751953125, -2.6737060546875, -2.595458984375, -2.5172119140625, -2.43896484375, -2.3607177734375, -2.282470703125, -2.2042236328125, -2.1259765625, -2.0477294921875, -1.969482421875, -1.8912353515625, -1.81298828125, -1.7347412109375, -1.656494140625, -1.5782470703125, -1.5, -1.4217529296875, -1.343505859375, -1.2652587890625, -1.18701171875, -1.1087646484375, -1.030517578125, -0.9522705078125, -0.8740234375, -0.7957763671875, -0.717529296875, -0.6392822265625, -0.56103515625, -0.4827880859375, -0.404541015625, -0.3262939453125, -0.248046875, -0.1697998046875, -0.091552734375, -0.0133056640625, 0.06494140625, 0.1431884765625, 0.221435546875, 0.2996826171875, 0.3779296875, 0.4561767578125, 0.534423828125, 0.6126708984375, 0.69091796875, 0.7691650390625, 0.847412109375, 0.9256591796875, 1.00390625, 1.0821533203125, 1.160400390625, 1.2386474609375, 1.31689453125, 1.3951416015625, 1.473388671875, 1.5516357421875, 1.6298828125, 1.7081298828125, 1.786376953125, 1.8646240234375, 1.94287109375, 2.0211181640625, 2.099365234375, 2.1776123046875, 2.255859375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 5.0, 5.0, 4.0, 8.0, 3.0, 10.0, 11.0, 20.0, 19.0, 11.0, 26.0, 23.0, 41.0, 66.0, 76.0, 129.0, 235.0, 372.0, 602.0, 1326.0, 2806.0, 7404.0, 23825.0, 111714.0, 541590.0, 287292.0, 49553.0, 12720.0, 4499.0, 1983.0, 875.0, 468.0, 275.0, 153.0, 113.0, 65.0, 53.0, 39.0, 32.0, 26.0, 19.0, 16.0, 18.0, 9.0, 2.0, 7.0, 3.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.8359375, -1.7781219482421875, -1.720306396484375, -1.6624908447265625, -1.60467529296875, -1.5468597412109375, -1.489044189453125, -1.4312286376953125, -1.3734130859375, -1.3155975341796875, -1.257781982421875, -1.1999664306640625, -1.14215087890625, -1.0843353271484375, -1.026519775390625, -0.9687042236328125, -0.910888671875, -0.8530731201171875, -0.795257568359375, -0.7374420166015625, -0.67962646484375, -0.6218109130859375, -0.563995361328125, -0.5061798095703125, -0.4483642578125, -0.3905487060546875, -0.332733154296875, -0.2749176025390625, -0.21710205078125, -0.1592864990234375, -0.101470947265625, -0.0436553955078125, 0.01416015625, 0.0719757080078125, 0.129791259765625, 0.1876068115234375, 0.24542236328125, 0.3032379150390625, 0.361053466796875, 0.4188690185546875, 0.4766845703125, 0.5345001220703125, 0.592315673828125, 0.6501312255859375, 0.70794677734375, 0.7657623291015625, 0.823577880859375, 0.8813934326171875, 0.939208984375, 0.9970245361328125, 1.054840087890625, 1.1126556396484375, 1.17047119140625, 1.2282867431640625, 1.286102294921875, 1.3439178466796875, 1.4017333984375, 1.4595489501953125, 1.517364501953125, 1.5751800537109375, 1.63299560546875, 1.6908111572265625, 1.748626708984375, 1.8064422607421875, 1.8642578125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 3.0, 5.0, 8.0, 7.0, 13.0, 11.0, 23.0, 13.0, 25.0, 34.0, 24.0, 33.0, 31.0, 25.0, 29.0, 47.0, 46.0, 46.0, 55.0, 45.0, 34.0, 45.0, 42.0, 33.0, 40.0, 42.0, 39.0, 30.0, 26.0, 29.0, 27.0, 18.0, 11.0, 18.0, 16.0, 11.0, 6.0, 2.0, 6.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.76953125, -4.61285400390625, -4.4561767578125, -4.29949951171875, -4.142822265625, -3.98614501953125, -3.8294677734375, -3.67279052734375, -3.51611328125, -3.35943603515625, -3.2027587890625, -3.04608154296875, -2.889404296875, -2.73272705078125, -2.5760498046875, -2.41937255859375, -2.2626953125, -2.10601806640625, -1.9493408203125, -1.79266357421875, -1.635986328125, -1.47930908203125, -1.3226318359375, -1.16595458984375, -1.00927734375, -0.85260009765625, -0.6959228515625, -0.53924560546875, -0.382568359375, -0.22589111328125, -0.0692138671875, 0.08746337890625, 0.244140625, 0.40081787109375, 0.5574951171875, 0.71417236328125, 0.870849609375, 1.02752685546875, 1.1842041015625, 1.34088134765625, 1.49755859375, 1.65423583984375, 1.8109130859375, 1.96759033203125, 2.124267578125, 2.28094482421875, 2.4376220703125, 2.59429931640625, 2.7509765625, 2.90765380859375, 3.0643310546875, 3.22100830078125, 3.377685546875, 3.53436279296875, 3.6910400390625, 3.84771728515625, 4.00439453125, 4.16107177734375, 4.3177490234375, 4.47442626953125, 4.631103515625, 4.78778076171875, 4.9444580078125, 5.10113525390625, 5.2578125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 4.0, 7.0, 11.0, 8.0, 12.0, 14.0, 15.0, 27.0, 36.0, 62.0, 98.0, 149.0, 276.0, 495.0, 1059.0, 2594.0, 9546.0, 77971.0, 830079.0, 109062.0, 11599.0, 2931.0, 1213.0, 533.0, 276.0, 164.0, 89.0, 67.0, 35.0, 33.0, 22.0, 15.0, 14.0, 12.0, 5.0, 6.0, 2.0, 3.0, 3.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1875, -1.1444091796875, -1.101318359375, -1.0582275390625, -1.01513671875, -0.9720458984375, -0.928955078125, -0.8858642578125, -0.8427734375, -0.7996826171875, -0.756591796875, -0.7135009765625, -0.67041015625, -0.6273193359375, -0.584228515625, -0.5411376953125, -0.498046875, -0.4549560546875, -0.411865234375, -0.3687744140625, -0.32568359375, -0.2825927734375, -0.239501953125, -0.1964111328125, -0.1533203125, -0.1102294921875, -0.067138671875, -0.0240478515625, 0.01904296875, 0.0621337890625, 0.105224609375, 0.1483154296875, 0.19140625, 0.2344970703125, 0.277587890625, 0.3206787109375, 0.36376953125, 0.4068603515625, 0.449951171875, 0.4930419921875, 0.5361328125, 0.5792236328125, 0.622314453125, 0.6654052734375, 0.70849609375, 0.7515869140625, 0.794677734375, 0.8377685546875, 0.880859375, 0.9239501953125, 0.967041015625, 1.0101318359375, 1.05322265625, 1.0963134765625, 1.139404296875, 1.1824951171875, 1.2255859375, 1.2686767578125, 1.311767578125, 1.3548583984375, 1.39794921875, 1.4410400390625, 1.484130859375, 1.5272216796875, 1.5703125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 6.0, 3.0, 3.0, 7.0, 13.0, 16.0, 21.0, 40.0, 47.0, 74.0, 107.0, 135.0, 151.0, 114.0, 80.0, 50.0, 43.0, 23.0, 17.0, 12.0, 14.0, 12.0, 2.0, 4.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006003379821777344, -0.0005841776728630066, -0.0005680173635482788, -0.000551857054233551, -0.0005356967449188232, -0.0005195364356040955, -0.0005033761262893677, -0.0004872158169746399, -0.0004710555076599121, -0.0004548951983451843, -0.00043873488903045654, -0.00042257457971572876, -0.000406414270401001, -0.0003902539610862732, -0.0003740936517715454, -0.0003579333424568176, -0.00034177303314208984, -0.00032561272382736206, -0.0003094524145126343, -0.0002932921051979065, -0.0002771317958831787, -0.00026097148656845093, -0.00024481117725372314, -0.00022865086793899536, -0.00021249055862426758, -0.0001963302493095398, -0.000180169939994812, -0.00016400963068008423, -0.00014784932136535645, -0.00013168901205062866, -0.00011552870273590088, -9.93683934211731e-05, -8.320808410644531e-05, -6.704777479171753e-05, -5.0887465476989746e-05, -3.472715616226196e-05, -1.856684684753418e-05, -2.4065375328063965e-06, 1.3753771781921387e-05, 2.991408109664917e-05, 4.607439041137695e-05, 6.223469972610474e-05, 7.839500904083252e-05, 9.45553183555603e-05, 0.00011071562767028809, 0.00012687593698501587, 0.00014303624629974365, 0.00015919655561447144, 0.00017535686492919922, 0.000191517174243927, 0.00020767748355865479, 0.00022383779287338257, 0.00023999810218811035, 0.00025615841150283813, 0.0002723187208175659, 0.0002884790301322937, 0.0003046393394470215, 0.00032079964876174927, 0.00033695995807647705, 0.00035312026739120483, 0.0003692805767059326, 0.0003854408860206604, 0.0004016011953353882, 0.00041776150465011597, 0.00043392181396484375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 8.0, 7.0, 14.0, 14.0, 33.0, 62.0, 158.0, 367.0, 1184.0, 5107.0, 136965.0, 883438.0, 17829.0, 2272.0, 648.0, 234.0, 86.0, 49.0, 24.0, 11.0, 13.0, 7.0, 7.0, 3.0, 3.0, 2.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.439453125, -2.356048583984375, -2.27264404296875, -2.189239501953125, -2.1058349609375, -2.022430419921875, -1.93902587890625, -1.855621337890625, -1.772216796875, -1.688812255859375, -1.60540771484375, -1.522003173828125, -1.4385986328125, -1.355194091796875, -1.27178955078125, -1.188385009765625, -1.10498046875, -1.021575927734375, -0.93817138671875, -0.854766845703125, -0.7713623046875, -0.687957763671875, -0.60455322265625, -0.521148681640625, -0.437744140625, -0.354339599609375, -0.27093505859375, -0.187530517578125, -0.1041259765625, -0.020721435546875, 0.06268310546875, 0.146087646484375, 0.2294921875, 0.312896728515625, 0.39630126953125, 0.479705810546875, 0.5631103515625, 0.646514892578125, 0.72991943359375, 0.813323974609375, 0.896728515625, 0.980133056640625, 1.06353759765625, 1.146942138671875, 1.2303466796875, 1.313751220703125, 1.39715576171875, 1.480560302734375, 1.56396484375, 1.647369384765625, 1.73077392578125, 1.814178466796875, 1.8975830078125, 1.980987548828125, 2.06439208984375, 2.147796630859375, 2.231201171875, 2.314605712890625, 2.39801025390625, 2.481414794921875, 2.5648193359375, 2.648223876953125, 2.73162841796875, 2.815032958984375, 2.8984375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 11.0, 11.0, 10.0, 20.0, 25.0, 34.0, 47.0, 86.0, 116.0, 109.0, 121.0, 130.0, 80.0, 60.0, 35.0, 23.0, 23.0, 14.0, 11.0, 9.0, 5.0, 3.0, 2.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.31298828125, -0.3026008605957031, -0.29221343994140625, -0.2818260192871094, -0.2714385986328125, -0.2610511779785156, -0.25066375732421875, -0.24027633666992188, -0.229888916015625, -0.21950149536132812, -0.20911407470703125, -0.19872665405273438, -0.1883392333984375, -0.17795181274414062, -0.16756439208984375, -0.15717697143554688, -0.14678955078125, -0.13640213012695312, -0.12601470947265625, -0.11562728881835938, -0.1052398681640625, -0.09485244750976562, -0.08446502685546875, -0.07407760620117188, -0.063690185546875, -0.053302764892578125, -0.04291534423828125, -0.032527923583984375, -0.0221405029296875, -0.011753082275390625, -0.00136566162109375, 0.009021759033203125, 0.0194091796875, 0.029796600341796875, 0.04018402099609375, 0.050571441650390625, 0.0609588623046875, 0.07134628295898438, 0.08173370361328125, 0.09212112426757812, 0.102508544921875, 0.11289596557617188, 0.12328338623046875, 0.13367080688476562, 0.1440582275390625, 0.15444564819335938, 0.16483306884765625, 0.17522048950195312, 0.18560791015625, 0.19599533081054688, 0.20638275146484375, 0.21677017211914062, 0.2271575927734375, 0.23754501342773438, 0.24793243408203125, 0.2583198547363281, 0.268707275390625, 0.2790946960449219, 0.28948211669921875, 0.2998695373535156, 0.3102569580078125, 0.3206443786621094, 0.33103179931640625, 0.3414192199707031, 0.351806640625]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 13.0, 22.0, 64.0, 103.0, 159.0, 217.0, 195.0, 117.0, 55.0, 34.0, 12.0, 5.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.632196426391602, -8.367332458496094, -8.102468490600586, -7.83760404586792, -7.572740077972412, -7.307876110076904, -7.043011665344238, -6.7781476974487305, -6.513283729553223, -6.248419761657715, -5.983555793762207, -5.718691349029541, -5.453827381134033, -5.188963413238525, -4.924098968505859, -4.659235000610352, -4.394371032714844, -4.129507064819336, -3.864642858505249, -3.599778652191162, -3.3349146842956543, -3.0700507164001465, -2.8051865100860596, -2.5403223037719727, -2.275458335876465, -2.010594367980957, -1.7457301616668701, -1.4808660745620728, -1.2160019874572754, -0.951137900352478, -0.6862738132476807, -0.4214097261428833, -0.15654659271240234, 0.10831749439239502, 0.3731815814971924, 0.6380456686019897, 0.9029097557067871, 1.1677738428115845, 1.4326379299163818, 1.6975020170211792, 1.9623661041259766, 2.2272300720214844, 2.4920942783355713, 2.756958484649658, 3.021822452545166, 3.286686420440674, 3.5515506267547607, 3.8164148330688477, 4.0812788009643555, 4.346142768859863, 4.611006736755371, 4.875871181488037, 5.140735149383545, 5.405599117279053, 5.670463562011719, 5.935327529907227, 6.200191497802734, 6.465055465698242, 6.72991943359375, 6.994783878326416, 7.259647846221924, 7.524511814117432, 7.789376258850098, 8.054240226745605, 8.319104194641113]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 6.0, 7.0, 5.0, 0.0, 7.0, 8.0, 13.0, 10.0, 15.0, 16.0, 17.0, 17.0, 31.0, 28.0, 34.0, 36.0, 33.0, 44.0, 30.0, 39.0, 59.0, 40.0, 49.0, 40.0, 48.0, 39.0, 36.0, 29.0, 38.0, 25.0, 27.0, 30.0, 20.0, 25.0, 13.0, 15.0, 5.0, 9.0, 18.0, 10.0, 6.0, 10.0, 2.0, 7.0, 0.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0750010013580322, -2.010267734527588, -1.945534348487854, -1.8808010816574097, -1.8160676956176758, -1.7513344287872314, -1.686601161956787, -1.6218678951263428, -1.5571345090866089, -1.4924012422561646, -1.4276678562164307, -1.3629345893859863, -1.298201322555542, -1.233467936515808, -1.1687346696853638, -1.1040012836456299, -1.0392680168151855, -0.9745346903800964, -0.9098013639450073, -0.845068097114563, -0.7803347706794739, -0.7156014442443848, -0.6508681774139404, -0.5861348509788513, -0.5214015245437622, -0.4566681981086731, -0.39193490147590637, -0.32720160484313965, -0.26246827840805054, -0.19773495197296143, -0.1330016553401947, -0.06826835870742798, -0.0035352706909179688, 0.06119804084300995, 0.12593135237693787, 0.19066466391086578, 0.2553979754447937, 0.3201313018798828, 0.38486459851264954, 0.44959789514541626, 0.5143312215805054, 0.5790645480155945, 0.6437978744506836, 0.7085311412811279, 0.773264467716217, 0.8379977941513062, 0.9027310609817505, 0.9674643874168396, 1.0321977138519287, 1.096930980682373, 1.161664366722107, 1.2263976335525513, 1.2911310195922852, 1.3558642864227295, 1.4205975532531738, 1.4853308200836182, 1.550064206123352, 1.6147974729537964, 1.6795308589935303, 1.7442641258239746, 1.808997392654419, 1.8737307786941528, 1.9384640455245972, 2.003197431564331, 2.0679306983947754]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 4.0, 5.0, 9.0, 11.0, 17.0, 33.0, 37.0, 33.0, 50.0, 73.0, 116.0, 127.0, 192.0, 274.0, 414.0, 574.0, 929.0, 1416.0, 2283.0, 3933.0, 6969.0, 13413.0, 26953.0, 57350.0, 124815.0, 235287.0, 267219.0, 158783.0, 74891.0, 34452.0, 16715.0, 8731.0, 4815.0, 2633.0, 1681.0, 1066.0, 741.0, 457.0, 305.0, 201.0, 150.0, 102.0, 78.0, 52.0, 51.0, 27.0, 29.0, 22.0, 13.0, 10.0, 4.0, 5.0, 3.0, 4.0, 3.0, 1.0, 3.0], "bins": [-0.970703125, -0.941436767578125, -0.91217041015625, -0.882904052734375, -0.8536376953125, -0.824371337890625, -0.79510498046875, -0.765838623046875, -0.736572265625, -0.707305908203125, -0.67803955078125, -0.648773193359375, -0.6195068359375, -0.590240478515625, -0.56097412109375, -0.531707763671875, -0.50244140625, -0.473175048828125, -0.44390869140625, -0.414642333984375, -0.3853759765625, -0.356109619140625, -0.32684326171875, -0.297576904296875, -0.268310546875, -0.239044189453125, -0.20977783203125, -0.180511474609375, -0.1512451171875, -0.121978759765625, -0.09271240234375, -0.063446044921875, -0.0341796875, -0.004913330078125, 0.02435302734375, 0.053619384765625, 0.0828857421875, 0.112152099609375, 0.14141845703125, 0.170684814453125, 0.199951171875, 0.229217529296875, 0.25848388671875, 0.287750244140625, 0.3170166015625, 0.346282958984375, 0.37554931640625, 0.404815673828125, 0.43408203125, 0.463348388671875, 0.49261474609375, 0.521881103515625, 0.5511474609375, 0.580413818359375, 0.60968017578125, 0.638946533203125, 0.668212890625, 0.697479248046875, 0.72674560546875, 0.756011962890625, 0.7852783203125, 0.814544677734375, 0.84381103515625, 0.873077392578125, 0.90234375]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 3.0, 4.0, 1.0, 2.0, 5.0, 7.0, 10.0, 9.0, 23.0, 14.0, 18.0, 25.0, 19.0, 35.0, 22.0, 28.0, 36.0, 39.0, 48.0, 51.0, 50.0, 48.0, 61.0, 44.0, 46.0, 41.0, 36.0, 38.0, 33.0, 37.0, 28.0, 19.0, 20.0, 20.0, 15.0, 8.0, 14.0, 13.0, 10.0, 6.0, 5.0, 2.0, 7.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.84375, -8.5592041015625, -8.274658203125, -7.9901123046875, -7.70556640625, -7.4210205078125, -7.136474609375, -6.8519287109375, -6.5673828125, -6.2828369140625, -5.998291015625, -5.7137451171875, -5.42919921875, -5.1446533203125, -4.860107421875, -4.5755615234375, -4.291015625, -4.0064697265625, -3.721923828125, -3.4373779296875, -3.15283203125, -2.8682861328125, -2.583740234375, -2.2991943359375, -2.0146484375, -1.7301025390625, -1.445556640625, -1.1610107421875, -0.87646484375, -0.5919189453125, -0.307373046875, -0.0228271484375, 0.26171875, 0.5462646484375, 0.830810546875, 1.1153564453125, 1.39990234375, 1.6844482421875, 1.968994140625, 2.2535400390625, 2.5380859375, 2.8226318359375, 3.107177734375, 3.3917236328125, 3.67626953125, 3.9608154296875, 4.245361328125, 4.5299072265625, 4.814453125, 5.0989990234375, 5.383544921875, 5.6680908203125, 5.95263671875, 6.2371826171875, 6.521728515625, 6.8062744140625, 7.0908203125, 7.3753662109375, 7.659912109375, 7.9444580078125, 8.22900390625, 8.5135498046875, 8.798095703125, 9.0826416015625, 9.3671875]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 3.0, 3.0, 4.0, 6.0, 4.0, 17.0, 24.0, 22.0, 28.0, 34.0, 49.0, 70.0, 102.0, 138.0, 194.0, 328.0, 619.0, 2391.0, 87776.0, 929600.0, 24263.0, 1424.0, 524.0, 272.0, 179.0, 120.0, 78.0, 72.0, 54.0, 31.0, 36.0, 20.0, 17.0, 20.0, 9.0, 4.0, 7.0, 6.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.60546875, -4.4371337890625, -4.268798828125, -4.1004638671875, -3.93212890625, -3.7637939453125, -3.595458984375, -3.4271240234375, -3.2587890625, -3.0904541015625, -2.922119140625, -2.7537841796875, -2.58544921875, -2.4171142578125, -2.248779296875, -2.0804443359375, -1.912109375, -1.7437744140625, -1.575439453125, -1.4071044921875, -1.23876953125, -1.0704345703125, -0.902099609375, -0.7337646484375, -0.5654296875, -0.3970947265625, -0.228759765625, -0.0604248046875, 0.10791015625, 0.2762451171875, 0.444580078125, 0.6129150390625, 0.78125, 0.9495849609375, 1.117919921875, 1.2862548828125, 1.45458984375, 1.6229248046875, 1.791259765625, 1.9595947265625, 2.1279296875, 2.2962646484375, 2.464599609375, 2.6329345703125, 2.80126953125, 2.9696044921875, 3.137939453125, 3.3062744140625, 3.474609375, 3.6429443359375, 3.811279296875, 3.9796142578125, 4.14794921875, 4.3162841796875, 4.484619140625, 4.6529541015625, 4.8212890625, 4.9896240234375, 5.157958984375, 5.3262939453125, 5.49462890625, 5.6629638671875, 5.831298828125, 5.9996337890625, 6.16796875]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 6.0, 9.0, 9.0, 15.0, 15.0, 16.0, 28.0, 26.0, 29.0, 32.0, 43.0, 49.0, 44.0, 56.0, 63.0, 62.0, 66.0, 66.0, 52.0, 48.0, 48.0, 36.0, 28.0, 28.0, 16.0, 25.0, 19.0, 19.0, 11.0, 5.0, 11.0, 6.0, 7.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.21875, -8.8961181640625, -8.573486328125, -8.2508544921875, -7.92822265625, -7.6055908203125, -7.282958984375, -6.9603271484375, -6.6376953125, -6.3150634765625, -5.992431640625, -5.6697998046875, -5.34716796875, -5.0245361328125, -4.701904296875, -4.3792724609375, -4.056640625, -3.7340087890625, -3.411376953125, -3.0887451171875, -2.76611328125, -2.4434814453125, -2.120849609375, -1.7982177734375, -1.4755859375, -1.1529541015625, -0.830322265625, -0.5076904296875, -0.18505859375, 0.1375732421875, 0.460205078125, 0.7828369140625, 1.10546875, 1.4281005859375, 1.750732421875, 2.0733642578125, 2.39599609375, 2.7186279296875, 3.041259765625, 3.3638916015625, 3.6865234375, 4.0091552734375, 4.331787109375, 4.6544189453125, 4.97705078125, 5.2996826171875, 5.622314453125, 5.9449462890625, 6.267578125, 6.5902099609375, 6.912841796875, 7.2354736328125, 7.55810546875, 7.8807373046875, 8.203369140625, 8.5260009765625, 8.8486328125, 9.1712646484375, 9.493896484375, 9.8165283203125, 10.13916015625, 10.4617919921875, 10.784423828125, 11.1070556640625, 11.4296875]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 3.0, 5.0, 6.0, 5.0, 11.0, 17.0, 40.0, 57.0, 81.0, 128.0, 215.0, 357.0, 778.0, 1941.0, 6420.0, 27492.0, 259357.0, 682348.0, 54009.0, 10172.0, 2902.0, 1108.0, 465.0, 219.0, 144.0, 96.0, 59.0, 48.0, 17.0, 20.0, 5.0, 8.0, 5.0, 4.0, 3.0, 4.0, 6.0, 5.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.51513671875, -0.5016441345214844, -0.48815155029296875, -0.4746589660644531, -0.4611663818359375, -0.4476737976074219, -0.43418121337890625, -0.4206886291503906, -0.407196044921875, -0.3937034606933594, -0.38021087646484375, -0.3667182922363281, -0.3532257080078125, -0.3397331237792969, -0.32624053955078125, -0.3127479553222656, -0.29925537109375, -0.2857627868652344, -0.27227020263671875, -0.2587776184082031, -0.2452850341796875, -0.23179244995117188, -0.21829986572265625, -0.20480728149414062, -0.191314697265625, -0.17782211303710938, -0.16432952880859375, -0.15083694458007812, -0.1373443603515625, -0.12385177612304688, -0.11035919189453125, -0.09686660766601562, -0.0833740234375, -0.06988143920898438, -0.05638885498046875, -0.042896270751953125, -0.0294036865234375, -0.015911102294921875, -0.00241851806640625, 0.011074066162109375, 0.024566650390625, 0.038059234619140625, 0.05155181884765625, 0.06504440307617188, 0.0785369873046875, 0.09202957153320312, 0.10552215576171875, 0.11901473999023438, 0.13250732421875, 0.14599990844726562, 0.15949249267578125, 0.17298507690429688, 0.1864776611328125, 0.19997024536132812, 0.21346282958984375, 0.22695541381835938, 0.240447998046875, 0.2539405822753906, 0.26743316650390625, 0.2809257507324219, 0.2944183349609375, 0.3079109191894531, 0.32140350341796875, 0.3348960876464844, 0.348388671875]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 5.0, 7.0, 5.0, 4.0, 9.0, 5.0, 6.0, 10.0, 13.0, 13.0, 19.0, 14.0, 40.0, 46.0, 44.0, 90.0, 114.0, 119.0, 109.0, 79.0, 74.0, 43.0, 20.0, 32.0, 18.0, 15.0, 12.0, 11.0, 6.0, 3.0, 2.0, 4.0, 2.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.7637691497802734e-05, -5.581323057413101e-05, -5.398876965045929e-05, -5.216430872678757e-05, -5.0339847803115845e-05, -4.851538687944412e-05, -4.66909259557724e-05, -4.486646503210068e-05, -4.3042004108428955e-05, -4.121754318475723e-05, -3.939308226108551e-05, -3.756862133741379e-05, -3.5744160413742065e-05, -3.391969949007034e-05, -3.209523856639862e-05, -3.0270777642726898e-05, -2.8446316719055176e-05, -2.6621855795383453e-05, -2.479739487171173e-05, -2.297293394804001e-05, -2.1148473024368286e-05, -1.9324012100696564e-05, -1.749955117702484e-05, -1.567509025335312e-05, -1.3850629329681396e-05, -1.2026168406009674e-05, -1.0201707482337952e-05, -8.37724655866623e-06, -6.552785634994507e-06, -4.7283247113227844e-06, -2.903863787651062e-06, -1.0794028639793396e-06, 7.450580596923828e-07, 2.5695189833641052e-06, 4.393979907035828e-06, 6.21844083070755e-06, 8.042901754379272e-06, 9.867362678050995e-06, 1.1691823601722717e-05, 1.351628452539444e-05, 1.5340745449066162e-05, 1.7165206372737885e-05, 1.8989667296409607e-05, 2.081412822008133e-05, 2.2638589143753052e-05, 2.4463050067424774e-05, 2.6287510991096497e-05, 2.811197191476822e-05, 2.993643283843994e-05, 3.1760893762111664e-05, 3.3585354685783386e-05, 3.540981560945511e-05, 3.723427653312683e-05, 3.9058737456798553e-05, 4.0883198380470276e-05, 4.2707659304142e-05, 4.453212022781372e-05, 4.635658115148544e-05, 4.8181042075157166e-05, 5.000550299882889e-05, 5.182996392250061e-05, 5.365442484617233e-05, 5.5478885769844055e-05, 5.730334669351578e-05, 5.91278076171875e-05]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 5.0, 2.0, 5.0, 16.0, 8.0, 28.0, 35.0, 68.0, 135.0, 260.0, 662.0, 1912.0, 7228.0, 43435.0, 748919.0, 220296.0, 19330.0, 4045.0, 1254.0, 439.0, 188.0, 99.0, 72.0, 42.0, 20.0, 14.0, 11.0, 9.0, 3.0, 1.0, 8.0, 0.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.405517578125, -0.3884773254394531, -0.37143707275390625, -0.3543968200683594, -0.3373565673828125, -0.3203163146972656, -0.30327606201171875, -0.2862358093261719, -0.269195556640625, -0.2521553039550781, -0.23511505126953125, -0.21807479858398438, -0.2010345458984375, -0.18399429321289062, -0.16695404052734375, -0.14991378784179688, -0.13287353515625, -0.11583328247070312, -0.09879302978515625, -0.08175277709960938, -0.0647125244140625, -0.047672271728515625, -0.03063201904296875, -0.013591766357421875, 0.003448486328125, 0.020488739013671875, 0.03752899169921875, 0.054569244384765625, 0.0716094970703125, 0.08864974975585938, 0.10569000244140625, 0.12273025512695312, 0.1397705078125, 0.15681076049804688, 0.17385101318359375, 0.19089126586914062, 0.2079315185546875, 0.22497177124023438, 0.24201202392578125, 0.2590522766113281, 0.276092529296875, 0.2931327819824219, 0.31017303466796875, 0.3272132873535156, 0.3442535400390625, 0.3612937927246094, 0.37833404541015625, 0.3953742980957031, 0.41241455078125, 0.4294548034667969, 0.44649505615234375, 0.4635353088378906, 0.4805755615234375, 0.4976158142089844, 0.5146560668945312, 0.5316963195800781, 0.548736572265625, 0.5657768249511719, 0.5828170776367188, 0.5998573303222656, 0.6168975830078125, 0.6339378356933594, 0.6509780883789062, 0.6680183410644531, 0.68505859375]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 1.0, 7.0, 3.0, 4.0, 7.0, 8.0, 11.0, 18.0, 27.0, 34.0, 66.0, 86.0, 104.0, 149.0, 163.0, 108.0, 63.0, 44.0, 23.0, 15.0, 15.0, 12.0, 10.0, 3.0, 4.0, 5.0, 3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.131591796875, -0.1257648468017578, -0.11993789672851562, -0.11411094665527344, -0.10828399658203125, -0.10245704650878906, -0.09663009643554688, -0.09080314636230469, -0.0849761962890625, -0.07914924621582031, -0.07332229614257812, -0.06749534606933594, -0.06166839599609375, -0.05584144592285156, -0.050014495849609375, -0.04418754577636719, -0.038360595703125, -0.03253364562988281, -0.026706695556640625, -0.020879745483398438, -0.01505279541015625, -0.009225845336914062, -0.003398895263671875, 0.0024280548095703125, 0.0082550048828125, 0.014081954956054688, 0.019908905029296875, 0.025735855102539062, 0.03156280517578125, 0.03738975524902344, 0.043216705322265625, 0.04904365539550781, 0.05487060546875, 0.06069755554199219, 0.06652450561523438, 0.07235145568847656, 0.07817840576171875, 0.08400535583496094, 0.08983230590820312, 0.09565925598144531, 0.1014862060546875, 0.10731315612792969, 0.11314010620117188, 0.11896705627441406, 0.12479400634765625, 0.13062095642089844, 0.13644790649414062, 0.1422748565673828, 0.148101806640625, 0.1539287567138672, 0.15975570678710938, 0.16558265686035156, 0.17140960693359375, 0.17723655700683594, 0.18306350708007812, 0.1888904571533203, 0.1947174072265625, 0.2005443572998047, 0.20637130737304688, 0.21219825744628906, 0.21802520751953125, 0.22385215759277344, 0.22967910766601562, 0.2355060577392578, 0.2413330078125]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 5.0, 6.0, 6.0, 17.0, 24.0, 30.0, 34.0, 52.0, 49.0, 60.0, 86.0, 75.0, 95.0, 89.0, 85.0, 71.0, 51.0, 49.0, 31.0, 25.0, 16.0, 15.0, 13.0, 5.0, 6.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-7.336471080780029, -7.15939998626709, -6.98232889175415, -6.805257797241211, -6.62818717956543, -6.45111608505249, -6.274044990539551, -6.096973896026611, -5.919902801513672, -5.742831707000732, -5.565760612487793, -5.388689994812012, -5.211618900299072, -5.034547805786133, -4.857476711273193, -4.680405616760254, -4.503334999084473, -4.326263904571533, -4.149192810058594, -3.9721219539642334, -3.795051097869873, -3.6179800033569336, -3.440908908843994, -3.2638378143310547, -3.0867669582366943, -2.909695863723755, -2.7326250076293945, -2.555553913116455, -2.3784828186035156, -2.2014119625091553, -2.024340867996216, -1.847269892692566, -1.6701984405517578, -1.493127465248108, -1.316056489944458, -1.1389853954315186, -0.9619144201278687, -0.7848434448242188, -0.6077723503112793, -0.4307013750076294, -0.2536303997039795, -0.0765593945980072, 0.10051161050796509, 0.27758264541625977, 0.45465362071990967, 0.6317245960235596, 0.808795690536499, 0.9858666658401489, 1.1629376411437988, 1.3400086164474487, 1.5170795917510986, 1.694150686264038, 1.871221661567688, 2.048292636871338, 2.2253637313842773, 2.402434825897217, 2.579505681991577, 2.7565767765045166, 2.933647632598877, 3.1107187271118164, 3.287789821624756, 3.464860677719116, 3.6419317722320557, 3.819002628326416, 3.9960737228393555]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 6.0, 2.0, 0.0, 4.0, 5.0, 12.0, 6.0, 5.0, 8.0, 15.0, 17.0, 17.0, 15.0, 29.0, 21.0, 25.0, 24.0, 28.0, 28.0, 29.0, 42.0, 37.0, 40.0, 38.0, 32.0, 49.0, 36.0, 38.0, 41.0, 32.0, 30.0, 33.0, 33.0, 36.0, 28.0, 25.0, 21.0, 14.0, 15.0, 10.0, 17.0, 11.0, 16.0, 15.0, 6.0, 3.0, 3.0, 3.0, 5.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-12.357428550720215, -11.960549354553223, -11.56367015838623, -11.166790008544922, -10.76991081237793, -10.373031616210938, -9.976152420043945, -9.579273223876953, -9.182394027709961, -8.785514831542969, -8.388635635375977, -7.991755962371826, -7.594876289367676, -7.197997093200684, -6.801117897033691, -6.404238700866699, -6.007358551025391, -5.610479354858398, -5.213599681854248, -4.816720485687256, -4.4198408126831055, -4.022961616516113, -3.626082420349121, -3.22920298576355, -2.8323235511779785, -2.4354441165924072, -2.038564682006836, -1.6416854858398438, -1.2448060512542725, -0.8479266166687012, -0.451047420501709, -0.054167985916137695, 0.3427114486694336, 0.7395908236503601, 1.1364701986312866, 1.5333495140075684, 1.9302289485931396, 2.327108383178711, 2.723987579345703, 3.1208670139312744, 3.5177464485168457, 3.914625883102417, 4.311505317687988, 4.7083845138549805, 5.105263710021973, 5.502143383026123, 5.899022579193115, 6.295902252197266, 6.692781448364258, 7.08966064453125, 7.4865403175354, 7.883419513702393, 8.280299186706543, 8.677178382873535, 9.074057579040527, 9.47093677520752, 9.867816925048828, 10.26469612121582, 10.661575317382812, 11.058454513549805, 11.455334663391113, 11.852213859558105, 12.249093055725098, 12.64597225189209, 13.042851448059082]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 6.0, 3.0, 2.0, 8.0, 12.0, 15.0, 22.0, 31.0, 41.0, 62.0, 74.0, 154.0, 210.0, 355.0, 606.0, 1259.0, 2690.0, 6355.0, 17323.0, 71951.0, 648958.0, 2897034.0, 461135.0, 59984.0, 15174.0, 5584.0, 2465.0, 1180.0, 595.0, 347.0, 246.0, 152.0, 81.0, 56.0, 42.0, 27.0, 17.0, 8.0, 5.0, 6.0, 7.0, 3.0, 1.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.28125, -4.15692138671875, -4.0325927734375, -3.90826416015625, -3.783935546875, -3.65960693359375, -3.5352783203125, -3.41094970703125, -3.28662109375, -3.16229248046875, -3.0379638671875, -2.91363525390625, -2.789306640625, -2.66497802734375, -2.5406494140625, -2.41632080078125, -2.2919921875, -2.16766357421875, -2.0433349609375, -1.91900634765625, -1.794677734375, -1.67034912109375, -1.5460205078125, -1.42169189453125, -1.29736328125, -1.17303466796875, -1.0487060546875, -0.92437744140625, -0.800048828125, -0.67572021484375, -0.5513916015625, -0.42706298828125, -0.302734375, -0.17840576171875, -0.0540771484375, 0.07025146484375, 0.194580078125, 0.31890869140625, 0.4432373046875, 0.56756591796875, 0.69189453125, 0.81622314453125, 0.9405517578125, 1.06488037109375, 1.189208984375, 1.31353759765625, 1.4378662109375, 1.56219482421875, 1.6865234375, 1.81085205078125, 1.9351806640625, 2.05950927734375, 2.183837890625, 2.30816650390625, 2.4324951171875, 2.55682373046875, 2.68115234375, 2.80548095703125, 2.9298095703125, 3.05413818359375, 3.178466796875, 3.30279541015625, 3.4271240234375, 3.55145263671875, 3.67578125]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 4.0, 1.0, 4.0, 7.0, 4.0, 7.0, 14.0, 9.0, 14.0, 13.0, 11.0, 21.0, 22.0, 34.0, 25.0, 50.0, 33.0, 34.0, 48.0, 55.0, 50.0, 45.0, 48.0, 57.0, 49.0, 46.0, 45.0, 36.0, 34.0, 25.0, 25.0, 25.0, 28.0, 15.0, 11.0, 14.0, 5.0, 11.0, 6.0, 6.0, 7.0, 1.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.71875, -2.642333984375, -2.56591796875, -2.489501953125, -2.4130859375, -2.336669921875, -2.26025390625, -2.183837890625, -2.107421875, -2.031005859375, -1.95458984375, -1.878173828125, -1.8017578125, -1.725341796875, -1.64892578125, -1.572509765625, -1.49609375, -1.419677734375, -1.34326171875, -1.266845703125, -1.1904296875, -1.114013671875, -1.03759765625, -0.961181640625, -0.884765625, -0.808349609375, -0.73193359375, -0.655517578125, -0.5791015625, -0.502685546875, -0.42626953125, -0.349853515625, -0.2734375, -0.197021484375, -0.12060546875, -0.044189453125, 0.0322265625, 0.108642578125, 0.18505859375, 0.261474609375, 0.337890625, 0.414306640625, 0.49072265625, 0.567138671875, 0.6435546875, 0.719970703125, 0.79638671875, 0.872802734375, 0.94921875, 1.025634765625, 1.10205078125, 1.178466796875, 1.2548828125, 1.331298828125, 1.40771484375, 1.484130859375, 1.560546875, 1.636962890625, 1.71337890625, 1.789794921875, 1.8662109375, 1.942626953125, 2.01904296875, 2.095458984375, 2.171875]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 2.0, 6.0, 13.0, 31.0, 103.0, 374.0, 4190474.0, 3047.0, 160.0, 48.0, 12.0, 7.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-79.8125, -77.515625, -75.21875, -72.921875, -70.625, -68.328125, -66.03125, -63.734375, -61.4375, -59.140625, -56.84375, -54.546875, -52.25, -49.953125, -47.65625, -45.359375, -43.0625, -40.765625, -38.46875, -36.171875, -33.875, -31.578125, -29.28125, -26.984375, -24.6875, -22.390625, -20.09375, -17.796875, -15.5, -13.203125, -10.90625, -8.609375, -6.3125, -4.015625, -1.71875, 0.578125, 2.875, 5.171875, 7.46875, 9.765625, 12.0625, 14.359375, 16.65625, 18.953125, 21.25, 23.546875, 25.84375, 28.140625, 30.4375, 32.734375, 35.03125, 37.328125, 39.625, 41.921875, 44.21875, 46.515625, 48.8125, 51.109375, 53.40625, 55.703125, 58.0, 60.296875, 62.59375, 64.890625, 67.1875]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0, 4.0, 6.0, 8.0, 5.0, 19.0, 29.0, 36.0, 51.0, 77.0, 114.0, 224.0, 437.0, 838.0, 1042.0, 548.0, 248.0, 150.0, 81.0, 63.0, 30.0, 21.0, 14.0, 13.0, 4.0, 6.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.873046875, -1.827545166015625, -1.78204345703125, -1.736541748046875, -1.6910400390625, -1.645538330078125, -1.60003662109375, -1.554534912109375, -1.509033203125, -1.463531494140625, -1.41802978515625, -1.372528076171875, -1.3270263671875, -1.281524658203125, -1.23602294921875, -1.190521240234375, -1.14501953125, -1.099517822265625, -1.05401611328125, -1.008514404296875, -0.9630126953125, -0.917510986328125, -0.87200927734375, -0.826507568359375, -0.781005859375, -0.735504150390625, -0.69000244140625, -0.644500732421875, -0.5989990234375, -0.553497314453125, -0.50799560546875, -0.462493896484375, -0.4169921875, -0.371490478515625, -0.32598876953125, -0.280487060546875, -0.2349853515625, -0.189483642578125, -0.14398193359375, -0.098480224609375, -0.052978515625, -0.007476806640625, 0.03802490234375, 0.083526611328125, 0.1290283203125, 0.174530029296875, 0.22003173828125, 0.265533447265625, 0.31103515625, 0.356536865234375, 0.40203857421875, 0.447540283203125, 0.4930419921875, 0.538543701171875, 0.58404541015625, 0.629547119140625, 0.675048828125, 0.720550537109375, 0.76605224609375, 0.811553955078125, 0.8570556640625, 0.902557373046875, 0.94805908203125, 0.993560791015625, 1.0390625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 7.0, 9.0, 7.0, 17.0, 21.0, 36.0, 62.0, 84.0, 114.0, 114.0, 136.0, 110.0, 97.0, 62.0, 52.0, 34.0, 20.0, 13.0, 7.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.53286600112915, -6.346932411193848, -6.160998344421387, -5.975064754486084, -5.789131164550781, -5.60319709777832, -5.417263507843018, -5.231329917907715, -5.045395851135254, -4.859462261199951, -4.67352819442749, -4.4875946044921875, -4.301661014556885, -4.115727424621582, -3.929793357849121, -3.7438597679138184, -3.5579261779785156, -3.371992349624634, -3.186058759689331, -3.000124931335449, -2.8141913414001465, -2.6282575130462646, -2.442323684692383, -2.25639009475708, -2.0704562664031982, -1.884522557258606, -1.6985888481140137, -1.5126550197601318, -1.3267213106155396, -1.1407876014709473, -0.9548537731170654, -0.7689200639724731, -0.5829858779907227, -0.397052139043808, -0.2111184000968933, -0.02518463134765625, 0.16074907779693604, 0.3466827869415283, 0.5326166152954102, 0.7185503244400024, 0.9044840335845947, 1.090417742729187, 1.2763514518737793, 1.4622852802276611, 1.6482189893722534, 1.8341526985168457, 2.0200865268707275, 2.2060203552246094, 2.391953945159912, 2.577887773513794, 2.7638213634490967, 2.9497551918029785, 3.1356887817382812, 3.321622610092163, 3.507556438446045, 3.6934900283813477, 3.8794238567352295, 4.065357685089111, 4.251291275024414, 4.437225341796875, 4.623158931732178, 4.8090925216674805, 4.995026588439941, 5.180960178375244, 5.366893768310547]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 5.0, 2.0, 4.0, 4.0, 3.0, 6.0, 6.0, 10.0, 11.0, 14.0, 13.0, 14.0, 11.0, 25.0, 21.0, 30.0, 38.0, 25.0, 51.0, 35.0, 41.0, 41.0, 41.0, 44.0, 40.0, 37.0, 34.0, 47.0, 48.0, 41.0, 31.0, 27.0, 31.0, 33.0, 30.0, 19.0, 22.0, 13.0, 12.0, 13.0, 6.0, 10.0, 5.0, 4.0, 3.0, 5.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3284897804260254, -2.2530298233032227, -2.177569627761841, -2.102109670639038, -2.0266494750976562, -1.9511895179748535, -1.8757294416427612, -1.800269365310669, -1.7248094081878662, -1.649349331855774, -1.5738892555236816, -1.498429298400879, -1.4229692220687866, -1.3475091457366943, -1.272049069404602, -1.1965889930725098, -1.1211289167404175, -1.0456688404083252, -0.9702088236808777, -0.8947487473487854, -0.8192887306213379, -0.7438286542892456, -0.6683685779571533, -0.5929085612297058, -0.5174484848976135, -0.44198843836784363, -0.36652839183807373, -0.29106831550598145, -0.21560826897621155, -0.14014822244644165, -0.06468814611434937, 0.010771870613098145, 0.08623194694519043, 0.16169199347496033, 0.23715205490589142, 0.3126121163368225, 0.3880721628665924, 0.4635322093963623, 0.5389922857284546, 0.6144523024559021, 0.6899123787879944, 0.7653724551200867, 0.8408324718475342, 0.9162925481796265, 0.9917526245117188, 1.0672125816345215, 1.1426727771759033, 1.218132734298706, 1.2935928106307983, 1.3690528869628906, 1.444512963294983, 1.5199730396270752, 1.595432996749878, 1.6708930730819702, 1.7463531494140625, 1.8218131065368652, 1.897273302078247, 1.9727333784103394, 2.0481934547424316, 2.1236534118652344, 2.199113607406616, 2.274573564529419, 2.350033760070801, 2.4254937171936035, 2.5009536743164062]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 2.0, 10.0, 9.0, 9.0, 13.0, 20.0, 23.0, 59.0, 66.0, 95.0, 144.0, 181.0, 270.0, 393.0, 582.0, 854.0, 1344.0, 2151.0, 3673.0, 6349.0, 11770.0, 23389.0, 49980.0, 113669.0, 251035.0, 306714.0, 146844.0, 65096.0, 29668.0, 14724.0, 7758.0, 4382.0, 2592.0, 1544.0, 1015.0, 669.0, 441.0, 321.0, 195.0, 152.0, 108.0, 65.0, 49.0, 35.0, 25.0, 13.0, 13.0, 12.0, 11.0, 9.0, 6.0, 2.0, 1.0, 1.0, 4.0], "bins": [-0.96875, -0.9403915405273438, -0.9120330810546875, -0.8836746215820312, -0.855316162109375, -0.8269577026367188, -0.7985992431640625, -0.7702407836914062, -0.74188232421875, -0.7135238647460938, -0.6851654052734375, -0.6568069458007812, -0.628448486328125, -0.6000900268554688, -0.5717315673828125, -0.5433731079101562, -0.5150146484375, -0.48665618896484375, -0.4582977294921875, -0.42993927001953125, -0.401580810546875, -0.37322235107421875, -0.3448638916015625, -0.31650543212890625, -0.28814697265625, -0.25978851318359375, -0.2314300537109375, -0.20307159423828125, -0.174713134765625, -0.14635467529296875, -0.1179962158203125, -0.08963775634765625, -0.061279296875, -0.03292083740234375, -0.0045623779296875, 0.02379608154296875, 0.052154541015625, 0.08051300048828125, 0.1088714599609375, 0.13722991943359375, 0.16558837890625, 0.19394683837890625, 0.2223052978515625, 0.25066375732421875, 0.279022216796875, 0.30738067626953125, 0.3357391357421875, 0.36409759521484375, 0.3924560546875, 0.42081451416015625, 0.4491729736328125, 0.47753143310546875, 0.505889892578125, 0.5342483520507812, 0.5626068115234375, 0.5909652709960938, 0.61932373046875, 0.6476821899414062, 0.6760406494140625, 0.7043991088867188, 0.732757568359375, 0.7611160278320312, 0.7894744873046875, 0.8178329467773438, 0.84619140625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 7.0, 6.0, 5.0, 12.0, 13.0, 26.0, 12.0, 25.0, 29.0, 40.0, 44.0, 53.0, 46.0, 60.0, 63.0, 70.0, 51.0, 38.0, 73.0, 62.0, 53.0, 33.0, 38.0, 41.0, 31.0, 25.0, 14.0, 6.0, 6.0, 4.0, 6.0, 6.0, 3.0, 6.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.42578125, -2.35614013671875, -2.2864990234375, -2.21685791015625, -2.147216796875, -2.07757568359375, -2.0079345703125, -1.93829345703125, -1.86865234375, -1.79901123046875, -1.7293701171875, -1.65972900390625, -1.590087890625, -1.52044677734375, -1.4508056640625, -1.38116455078125, -1.3115234375, -1.24188232421875, -1.1722412109375, -1.10260009765625, -1.032958984375, -0.96331787109375, -0.8936767578125, -0.82403564453125, -0.75439453125, -0.68475341796875, -0.6151123046875, -0.54547119140625, -0.475830078125, -0.40618896484375, -0.3365478515625, -0.26690673828125, -0.197265625, -0.12762451171875, -0.0579833984375, 0.01165771484375, 0.081298828125, 0.15093994140625, 0.2205810546875, 0.29022216796875, 0.35986328125, 0.42950439453125, 0.4991455078125, 0.56878662109375, 0.638427734375, 0.70806884765625, 0.7777099609375, 0.84735107421875, 0.9169921875, 0.98663330078125, 1.0562744140625, 1.12591552734375, 1.195556640625, 1.26519775390625, 1.3348388671875, 1.40447998046875, 1.47412109375, 1.54376220703125, 1.6134033203125, 1.68304443359375, 1.752685546875, 1.82232666015625, 1.8919677734375, 1.96160888671875, 2.03125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 3.0, 0.0, 6.0, 6.0, 1.0, 2.0, 7.0, 7.0, 6.0, 15.0, 16.0, 21.0, 43.0, 68.0, 115.0, 220.0, 403.0, 792.0, 1897.0, 5374.0, 22281.0, 171598.0, 709402.0, 112140.0, 16634.0, 4443.0, 1569.0, 703.0, 327.0, 176.0, 106.0, 52.0, 43.0, 17.0, 9.0, 9.0, 13.0, 4.0, 8.0, 2.0, 5.0, 7.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.8671875, -1.8095703125, -1.751953125, -1.6943359375, -1.63671875, -1.5791015625, -1.521484375, -1.4638671875, -1.40625, -1.3486328125, -1.291015625, -1.2333984375, -1.17578125, -1.1181640625, -1.060546875, -1.0029296875, -0.9453125, -0.8876953125, -0.830078125, -0.7724609375, -0.71484375, -0.6572265625, -0.599609375, -0.5419921875, -0.484375, -0.4267578125, -0.369140625, -0.3115234375, -0.25390625, -0.1962890625, -0.138671875, -0.0810546875, -0.0234375, 0.0341796875, 0.091796875, 0.1494140625, 0.20703125, 0.2646484375, 0.322265625, 0.3798828125, 0.4375, 0.4951171875, 0.552734375, 0.6103515625, 0.66796875, 0.7255859375, 0.783203125, 0.8408203125, 0.8984375, 0.9560546875, 1.013671875, 1.0712890625, 1.12890625, 1.1865234375, 1.244140625, 1.3017578125, 1.359375, 1.4169921875, 1.474609375, 1.5322265625, 1.58984375, 1.6474609375, 1.705078125, 1.7626953125, 1.8203125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 6.0, 7.0, 3.0, 3.0, 4.0, 10.0, 11.0, 10.0, 12.0, 18.0, 20.0, 19.0, 33.0, 35.0, 35.0, 40.0, 38.0, 49.0, 41.0, 47.0, 53.0, 49.0, 42.0, 37.0, 44.0, 49.0, 36.0, 36.0, 31.0, 27.0, 21.0, 19.0, 18.0, 14.0, 14.0, 16.0, 10.0, 6.0, 10.0, 10.0, 4.0, 3.0, 3.0, 1.0, 6.0, 5.0, 1.0, 3.0, 2.0, 1.0, 2.0], "bins": [-3.54296875, -3.439208984375, -3.33544921875, -3.231689453125, -3.1279296875, -3.024169921875, -2.92041015625, -2.816650390625, -2.712890625, -2.609130859375, -2.50537109375, -2.401611328125, -2.2978515625, -2.194091796875, -2.09033203125, -1.986572265625, -1.8828125, -1.779052734375, -1.67529296875, -1.571533203125, -1.4677734375, -1.364013671875, -1.26025390625, -1.156494140625, -1.052734375, -0.948974609375, -0.84521484375, -0.741455078125, -0.6376953125, -0.533935546875, -0.43017578125, -0.326416015625, -0.22265625, -0.118896484375, -0.01513671875, 0.088623046875, 0.1923828125, 0.296142578125, 0.39990234375, 0.503662109375, 0.607421875, 0.711181640625, 0.81494140625, 0.918701171875, 1.0224609375, 1.126220703125, 1.22998046875, 1.333740234375, 1.4375, 1.541259765625, 1.64501953125, 1.748779296875, 1.8525390625, 1.956298828125, 2.06005859375, 2.163818359375, 2.267578125, 2.371337890625, 2.47509765625, 2.578857421875, 2.6826171875, 2.786376953125, 2.89013671875, 2.993896484375, 3.09765625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 5.0, 5.0, 6.0, 9.0, 13.0, 24.0, 39.0, 64.0, 89.0, 153.0, 300.0, 652.0, 1536.0, 4102.0, 15013.0, 102833.0, 750743.0, 146532.0, 18512.0, 4678.0, 1700.0, 768.0, 347.0, 180.0, 109.0, 50.0, 31.0, 23.0, 17.0, 12.0, 6.0, 7.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53759765625, -0.515716552734375, -0.49383544921875, -0.471954345703125, -0.4500732421875, -0.428192138671875, -0.40631103515625, -0.384429931640625, -0.362548828125, -0.340667724609375, -0.31878662109375, -0.296905517578125, -0.2750244140625, -0.253143310546875, -0.23126220703125, -0.209381103515625, -0.1875, -0.165618896484375, -0.14373779296875, -0.121856689453125, -0.0999755859375, -0.078094482421875, -0.05621337890625, -0.034332275390625, -0.012451171875, 0.009429931640625, 0.03131103515625, 0.053192138671875, 0.0750732421875, 0.096954345703125, 0.11883544921875, 0.140716552734375, 0.16259765625, 0.184478759765625, 0.20635986328125, 0.228240966796875, 0.2501220703125, 0.272003173828125, 0.29388427734375, 0.315765380859375, 0.337646484375, 0.359527587890625, 0.38140869140625, 0.403289794921875, 0.4251708984375, 0.447052001953125, 0.46893310546875, 0.490814208984375, 0.5126953125, 0.534576416015625, 0.55645751953125, 0.578338623046875, 0.6002197265625, 0.622100830078125, 0.64398193359375, 0.665863037109375, 0.687744140625, 0.709625244140625, 0.73150634765625, 0.753387451171875, 0.7752685546875, 0.797149658203125, 0.81903076171875, 0.840911865234375, 0.86279296875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 5.0, 3.0, 13.0, 35.0, 51.0, 61.0, 101.0, 144.0, 147.0, 141.0, 93.0, 67.0, 40.0, 37.0, 13.0, 11.0, 8.0, 9.0, 4.0, 2.0, 5.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000568389892578125, -0.0005540400743484497, -0.0005396902561187744, -0.0005253404378890991, -0.0005109906196594238, -0.0004966408014297485, -0.00048229098320007324, -0.00046794116497039795, -0.00045359134674072266, -0.00043924152851104736, -0.00042489171028137207, -0.0004105418920516968, -0.0003961920738220215, -0.0003818422555923462, -0.0003674924373626709, -0.0003531426191329956, -0.0003387928009033203, -0.000324442982673645, -0.0003100931644439697, -0.00029574334621429443, -0.00028139352798461914, -0.00026704370975494385, -0.00025269389152526855, -0.00023834407329559326, -0.00022399425506591797, -0.00020964443683624268, -0.00019529461860656738, -0.0001809448003768921, -0.0001665949821472168, -0.0001522451639175415, -0.0001378953456878662, -0.00012354552745819092, -0.00010919570922851562, -9.484589099884033e-05, -8.049607276916504e-05, -6.614625453948975e-05, -5.179643630981445e-05, -3.744661808013916e-05, -2.3096799850463867e-05, -8.746981620788574e-06, 5.602836608886719e-06, 1.9952654838562012e-05, 3.4302473068237305e-05, 4.86522912979126e-05, 6.300210952758789e-05, 7.735192775726318e-05, 9.170174598693848e-05, 0.00010605156421661377, 0.00012040138244628906, 0.00013475120067596436, 0.00014910101890563965, 0.00016345083713531494, 0.00017780065536499023, 0.00019215047359466553, 0.00020650029182434082, 0.0002208501100540161, 0.0002351999282836914, 0.0002495497465133667, 0.000263899564743042, 0.0002782493829727173, 0.0002925992012023926, 0.00030694901943206787, 0.00032129883766174316, 0.00033564865589141846, 0.00034999847412109375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 5.0, 6.0, 4.0, 10.0, 9.0, 10.0, 19.0, 29.0, 54.0, 155.0, 502.0, 2332.0, 17791.0, 622138.0, 389977.0, 13032.0, 1811.0, 400.0, 131.0, 52.0, 32.0, 9.0, 16.0, 5.0, 4.0, 6.0, 4.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.3076171875, -1.2666778564453125, -1.225738525390625, -1.1847991943359375, -1.14385986328125, -1.1029205322265625, -1.061981201171875, -1.0210418701171875, -0.9801025390625, -0.9391632080078125, -0.898223876953125, -0.8572845458984375, -0.81634521484375, -0.7754058837890625, -0.734466552734375, -0.6935272216796875, -0.652587890625, -0.6116485595703125, -0.570709228515625, -0.5297698974609375, -0.48883056640625, -0.4478912353515625, -0.406951904296875, -0.3660125732421875, -0.3250732421875, -0.2841339111328125, -0.243194580078125, -0.2022552490234375, -0.16131591796875, -0.1203765869140625, -0.079437255859375, -0.0384979248046875, 0.00244140625, 0.0433807373046875, 0.084320068359375, 0.1252593994140625, 0.16619873046875, 0.2071380615234375, 0.248077392578125, 0.2890167236328125, 0.3299560546875, 0.3708953857421875, 0.411834716796875, 0.4527740478515625, 0.49371337890625, 0.5346527099609375, 0.575592041015625, 0.6165313720703125, 0.657470703125, 0.6984100341796875, 0.739349365234375, 0.7802886962890625, 0.82122802734375, 0.8621673583984375, 0.903106689453125, 0.9440460205078125, 0.9849853515625, 1.0259246826171875, 1.066864013671875, 1.1078033447265625, 1.14874267578125, 1.1896820068359375, 1.230621337890625, 1.2715606689453125, 1.3125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 6.0, 8.0, 16.0, 18.0, 15.0, 19.0, 27.0, 32.0, 36.0, 57.0, 62.0, 79.0, 89.0, 85.0, 68.0, 78.0, 69.0, 45.0, 39.0, 41.0, 22.0, 21.0, 11.0, 13.0, 10.0, 3.0, 1.0, 7.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.09637451171875, -0.09309196472167969, -0.08980941772460938, -0.08652687072753906, -0.08324432373046875, -0.07996177673339844, -0.07667922973632812, -0.07339668273925781, -0.0701141357421875, -0.06683158874511719, -0.06354904174804688, -0.06026649475097656, -0.05698394775390625, -0.05370140075683594, -0.050418853759765625, -0.04713630676269531, -0.043853759765625, -0.04057121276855469, -0.037288665771484375, -0.03400611877441406, -0.03072357177734375, -0.027441024780273438, -0.024158477783203125, -0.020875930786132812, -0.0175933837890625, -0.014310836791992188, -0.011028289794921875, -0.0077457427978515625, -0.00446319580078125, -0.0011806488037109375, 0.002101898193359375, 0.0053844451904296875, 0.0086669921875, 0.011949539184570312, 0.015232086181640625, 0.018514633178710938, 0.02179718017578125, 0.025079727172851562, 0.028362274169921875, 0.03164482116699219, 0.0349273681640625, 0.03820991516113281, 0.041492462158203125, 0.04477500915527344, 0.04805755615234375, 0.05134010314941406, 0.054622650146484375, 0.05790519714355469, 0.061187744140625, 0.06447029113769531, 0.06775283813476562, 0.07103538513183594, 0.07431793212890625, 0.07760047912597656, 0.08088302612304688, 0.08416557312011719, 0.0874481201171875, 0.09073066711425781, 0.09401321411132812, 0.09729576110839844, 0.10057830810546875, 0.10386085510253906, 0.10714340209960938, 0.11042594909667969, 0.11370849609375]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 2.0, 9.0, 2.0, 11.0, 14.0, 22.0, 41.0, 67.0, 87.0, 109.0, 122.0, 127.0, 126.0, 100.0, 56.0, 37.0, 34.0, 16.0, 5.0, 6.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.699546813964844, -4.582073211669922, -4.464600086212158, -4.347126483917236, -4.2296528816223145, -4.112179279327393, -3.994706153869629, -3.877232551574707, -3.759758949279785, -3.6422855854034424, -3.5248119831085205, -3.4073386192321777, -3.289865016937256, -3.172391653060913, -3.0549182891845703, -2.9374446868896484, -2.8199713230133057, -2.702497959136963, -2.585024356842041, -2.4675509929656982, -2.3500773906707764, -2.2326040267944336, -2.1151304244995117, -1.997657060623169, -1.8801835775375366, -1.7627100944519043, -1.645236611366272, -1.5277631282806396, -1.4102897644042969, -1.292816162109375, -1.1753427982330322, -1.0578693151474, -0.9403958320617676, -0.8229223489761353, -0.7054488658905029, -0.5879754424095154, -0.47050195932388306, -0.35302847623825073, -0.23555505275726318, -0.11808156967163086, -0.0006080865859985352, 0.1168653815984726, 0.23433884978294373, 0.35181230306625366, 0.469285786151886, 0.5867592692375183, 0.7042326927185059, 0.8217061758041382, 0.9391796588897705, 1.0566531419754028, 1.1741266250610352, 1.291599988937378, 1.4090735912322998, 1.5265469551086426, 1.644020438194275, 1.7614939212799072, 1.8789674043655396, 1.9964408874511719, 2.1139142513275146, 2.2313878536224365, 2.3488612174987793, 2.466334819793701, 2.583808183670044, 2.7012815475463867, 2.8187551498413086]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 10.0, 6.0, 8.0, 7.0, 13.0, 14.0, 22.0, 23.0, 34.0, 43.0, 41.0, 59.0, 56.0, 63.0, 59.0, 56.0, 45.0, 69.0, 50.0, 57.0, 42.0, 57.0, 42.0, 28.0, 20.0, 18.0, 16.0, 11.0, 10.0, 11.0, 3.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-2.69895076751709, -2.630011558532715, -2.56107234954834, -2.492133140563965, -2.42319393157959, -2.354254722595215, -2.28531551361084, -2.216376304626465, -2.14743709564209, -2.078497886657715, -2.00955867767334, -1.9406194686889648, -1.8716802597045898, -1.8027410507202148, -1.7338018417358398, -1.6648626327514648, -1.5959234237670898, -1.5269842147827148, -1.4580450057983398, -1.3891057968139648, -1.3201665878295898, -1.2512273788452148, -1.1822881698608398, -1.1133489608764648, -1.0444097518920898, -0.9754705429077148, -0.9065313339233398, -0.8375921249389648, -0.7686529159545898, -0.6997137069702148, -0.6307744979858398, -0.5618352890014648, -0.4928959608078003, -0.4239567518234253, -0.3550175428390503, -0.2860783338546753, -0.2171391248703003, -0.1481999158859253, -0.07926070690155029, -0.010321497917175293, 0.05861771106719971, 0.1275569200515747, 0.1964961290359497, 0.2654353380203247, 0.3343745470046997, 0.4033137559890747, 0.4722529649734497, 0.5411921739578247, 0.6101313829421997, 0.6790705919265747, 0.7480098009109497, 0.8169490098953247, 0.8858882188796997, 0.9548274278640747, 1.0237666368484497, 1.0927058458328247, 1.1616450548171997, 1.2305842638015747, 1.2995234727859497, 1.3684626817703247, 1.4374018907546997, 1.5063410997390747, 1.5752803087234497, 1.6442195177078247, 1.7131587266921997]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 4.0, 9.0, 4.0, 16.0, 20.0, 30.0, 33.0, 56.0, 72.0, 136.0, 198.0, 304.0, 425.0, 705.0, 1090.0, 1738.0, 2768.0, 4661.0, 8231.0, 15800.0, 31958.0, 74098.0, 204202.0, 395907.0, 177578.0, 65816.0, 29010.0, 14330.0, 7873.0, 4344.0, 2604.0, 1684.0, 981.0, 625.0, 403.0, 246.0, 195.0, 142.0, 78.0, 57.0, 44.0, 41.0, 15.0, 9.0, 6.0, 8.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.85888671875, -0.8286819458007812, -0.7984771728515625, -0.7682723999023438, -0.738067626953125, -0.7078628540039062, -0.6776580810546875, -0.6474533081054688, -0.61724853515625, -0.5870437622070312, -0.5568389892578125, -0.5266342163085938, -0.496429443359375, -0.46622467041015625, -0.4360198974609375, -0.40581512451171875, -0.3756103515625, -0.34540557861328125, -0.3152008056640625, -0.28499603271484375, -0.254791259765625, -0.22458648681640625, -0.1943817138671875, -0.16417694091796875, -0.13397216796875, -0.10376739501953125, -0.0735626220703125, -0.04335784912109375, -0.013153076171875, 0.01705169677734375, 0.0472564697265625, 0.07746124267578125, 0.107666015625, 0.13787078857421875, 0.1680755615234375, 0.19828033447265625, 0.228485107421875, 0.25868988037109375, 0.2888946533203125, 0.31909942626953125, 0.34930419921875, 0.37950897216796875, 0.4097137451171875, 0.43991851806640625, 0.470123291015625, 0.5003280639648438, 0.5305328369140625, 0.5607376098632812, 0.5909423828125, 0.6211471557617188, 0.6513519287109375, 0.6815567016601562, 0.711761474609375, 0.7419662475585938, 0.7721710205078125, 0.8023757934570312, 0.83258056640625, 0.8627853393554688, 0.8929901123046875, 0.9231948852539062, 0.953399658203125, 0.9836044311523438, 1.0138092041015625, 1.0440139770507812, 1.07421875]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 3.0, 2.0, 6.0, 5.0, 6.0, 7.0, 10.0, 10.0, 10.0, 19.0, 35.0, 27.0, 30.0, 28.0, 49.0, 52.0, 58.0, 56.0, 66.0, 77.0, 47.0, 50.0, 50.0, 51.0, 47.0, 42.0, 32.0, 29.0, 23.0, 18.0, 17.0, 8.0, 12.0, 11.0, 3.0, 2.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.74609375, -6.5657958984375, -6.385498046875, -6.2052001953125, -6.02490234375, -5.8446044921875, -5.664306640625, -5.4840087890625, -5.3037109375, -5.1234130859375, -4.943115234375, -4.7628173828125, -4.58251953125, -4.4022216796875, -4.221923828125, -4.0416259765625, -3.861328125, -3.6810302734375, -3.500732421875, -3.3204345703125, -3.14013671875, -2.9598388671875, -2.779541015625, -2.5992431640625, -2.4189453125, -2.2386474609375, -2.058349609375, -1.8780517578125, -1.69775390625, -1.5174560546875, -1.337158203125, -1.1568603515625, -0.9765625, -0.7962646484375, -0.615966796875, -0.4356689453125, -0.25537109375, -0.0750732421875, 0.105224609375, 0.2855224609375, 0.4658203125, 0.6461181640625, 0.826416015625, 1.0067138671875, 1.18701171875, 1.3673095703125, 1.547607421875, 1.7279052734375, 1.908203125, 2.0885009765625, 2.268798828125, 2.4490966796875, 2.62939453125, 2.8096923828125, 2.989990234375, 3.1702880859375, 3.3505859375, 3.5308837890625, 3.711181640625, 3.8914794921875, 4.07177734375, 4.2520751953125, 4.432373046875, 4.6126708984375, 4.79296875]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 1.0, 7.0, 9.0, 3.0, 8.0, 10.0, 8.0, 20.0, 23.0, 22.0, 28.0, 44.0, 34.0, 48.0, 50.0, 46.0, 66.0, 127.0, 2429.0, 1044335.0, 712.0, 108.0, 59.0, 65.0, 42.0, 37.0, 37.0, 40.0, 33.0, 27.0, 21.0, 18.0, 11.0, 4.0, 8.0, 7.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.203125, -18.591552734375, -17.97998046875, -17.368408203125, -16.7568359375, -16.145263671875, -15.53369140625, -14.922119140625, -14.310546875, -13.698974609375, -13.08740234375, -12.475830078125, -11.8642578125, -11.252685546875, -10.64111328125, -10.029541015625, -9.41796875, -8.806396484375, -8.19482421875, -7.583251953125, -6.9716796875, -6.360107421875, -5.74853515625, -5.136962890625, -4.525390625, -3.913818359375, -3.30224609375, -2.690673828125, -2.0791015625, -1.467529296875, -0.85595703125, -0.244384765625, 0.3671875, 0.978759765625, 1.59033203125, 2.201904296875, 2.8134765625, 3.425048828125, 4.03662109375, 4.648193359375, 5.259765625, 5.871337890625, 6.48291015625, 7.094482421875, 7.7060546875, 8.317626953125, 8.92919921875, 9.540771484375, 10.15234375, 10.763916015625, 11.37548828125, 11.987060546875, 12.5986328125, 13.210205078125, 13.82177734375, 14.433349609375, 15.044921875, 15.656494140625, 16.26806640625, 16.879638671875, 17.4912109375, 18.102783203125, 18.71435546875, 19.325927734375, 19.9375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 7.0, 9.0, 7.0, 7.0, 7.0, 11.0, 19.0, 23.0, 23.0, 31.0, 31.0, 48.0, 34.0, 45.0, 42.0, 39.0, 52.0, 58.0, 55.0, 43.0, 32.0, 53.0, 44.0, 30.0, 35.0, 41.0, 32.0, 37.0, 27.0, 21.0, 16.0, 13.0, 6.0, 7.0, 5.0, 4.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.6875, -5.5069580078125, -5.326416015625, -5.1458740234375, -4.96533203125, -4.7847900390625, -4.604248046875, -4.4237060546875, -4.2431640625, -4.0626220703125, -3.882080078125, -3.7015380859375, -3.52099609375, -3.3404541015625, -3.159912109375, -2.9793701171875, -2.798828125, -2.6182861328125, -2.437744140625, -2.2572021484375, -2.07666015625, -1.8961181640625, -1.715576171875, -1.5350341796875, -1.3544921875, -1.1739501953125, -0.993408203125, -0.8128662109375, -0.63232421875, -0.4517822265625, -0.271240234375, -0.0906982421875, 0.08984375, 0.2703857421875, 0.450927734375, 0.6314697265625, 0.81201171875, 0.9925537109375, 1.173095703125, 1.3536376953125, 1.5341796875, 1.7147216796875, 1.895263671875, 2.0758056640625, 2.25634765625, 2.4368896484375, 2.617431640625, 2.7979736328125, 2.978515625, 3.1590576171875, 3.339599609375, 3.5201416015625, 3.70068359375, 3.8812255859375, 4.061767578125, 4.2423095703125, 4.4228515625, 4.6033935546875, 4.783935546875, 4.9644775390625, 5.14501953125, 5.3255615234375, 5.506103515625, 5.6866455078125, 5.8671875]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 3.0, 7.0, 4.0, 7.0, 7.0, 11.0, 24.0, 33.0, 69.0, 158.0, 526.0, 2701.0, 46343.0, 969893.0, 26035.0, 1975.0, 430.0, 148.0, 60.0, 31.0, 29.0, 12.0, 13.0, 10.0, 4.0, 6.0, 6.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.740234375, -1.67437744140625, -1.6085205078125, -1.54266357421875, -1.476806640625, -1.41094970703125, -1.3450927734375, -1.27923583984375, -1.21337890625, -1.14752197265625, -1.0816650390625, -1.01580810546875, -0.949951171875, -0.88409423828125, -0.8182373046875, -0.75238037109375, -0.6865234375, -0.62066650390625, -0.5548095703125, -0.48895263671875, -0.423095703125, -0.35723876953125, -0.2913818359375, -0.22552490234375, -0.15966796875, -0.09381103515625, -0.0279541015625, 0.03790283203125, 0.103759765625, 0.16961669921875, 0.2354736328125, 0.30133056640625, 0.3671875, 0.43304443359375, 0.4989013671875, 0.56475830078125, 0.630615234375, 0.69647216796875, 0.7623291015625, 0.82818603515625, 0.89404296875, 0.95989990234375, 1.0257568359375, 1.09161376953125, 1.157470703125, 1.22332763671875, 1.2891845703125, 1.35504150390625, 1.4208984375, 1.48675537109375, 1.5526123046875, 1.61846923828125, 1.684326171875, 1.75018310546875, 1.8160400390625, 1.88189697265625, 1.94775390625, 2.01361083984375, 2.0794677734375, 2.14532470703125, 2.211181640625, 2.27703857421875, 2.3428955078125, 2.40875244140625, 2.474609375]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 4.0, 3.0, 5.0, 6.0, 8.0, 9.0, 15.0, 24.0, 45.0, 31.0, 68.0, 114.0, 182.0, 161.0, 107.0, 62.0, 49.0, 31.0, 18.0, 20.0, 10.0, 7.0, 5.0, 7.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0001327991485595703, -0.00012910738587379456, -0.0001254156231880188, -0.00012172386050224304, -0.00011803209781646729, -0.00011434033513069153, -0.00011064857244491577, -0.00010695680975914001, -0.00010326504707336426, -9.95732843875885e-05, -9.588152170181274e-05, -9.218975901603699e-05, -8.849799633026123e-05, -8.480623364448547e-05, -8.111447095870972e-05, -7.742270827293396e-05, -7.37309455871582e-05, -7.003918290138245e-05, -6.634742021560669e-05, -6.265565752983093e-05, -5.8963894844055176e-05, -5.527213215827942e-05, -5.158036947250366e-05, -4.7888606786727905e-05, -4.419684410095215e-05, -4.050508141517639e-05, -3.6813318729400635e-05, -3.312155604362488e-05, -2.942979335784912e-05, -2.5738030672073364e-05, -2.2046267986297607e-05, -1.835450530052185e-05, -1.4662742614746094e-05, -1.0970979928970337e-05, -7.27921724319458e-06, -3.5874545574188232e-06, 1.043081283569336e-07, 3.7960708141326904e-06, 7.487833499908447e-06, 1.1179596185684204e-05, 1.4871358871459961e-05, 1.8563121557235718e-05, 2.2254884243011475e-05, 2.594664692878723e-05, 2.9638409614562988e-05, 3.3330172300338745e-05, 3.70219349861145e-05, 4.071369767189026e-05, 4.4405460357666016e-05, 4.809722304344177e-05, 5.178898572921753e-05, 5.5480748414993286e-05, 5.917251110076904e-05, 6.28642737865448e-05, 6.655603647232056e-05, 7.024779915809631e-05, 7.393956184387207e-05, 7.763132452964783e-05, 8.132308721542358e-05, 8.501484990119934e-05, 8.87066125869751e-05, 9.239837527275085e-05, 9.609013795852661e-05, 9.978190064430237e-05, 0.00010347366333007812]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 5.0, 2.0, 4.0, 1.0, 8.0, 11.0, 17.0, 33.0, 59.0, 115.0, 333.0, 1245.0, 8805.0, 603998.0, 423927.0, 8190.0, 1188.0, 350.0, 130.0, 64.0, 26.0, 17.0, 9.0, 4.0, 9.0, 5.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.41015625, -2.3449859619140625, -2.279815673828125, -2.2146453857421875, -2.14947509765625, -2.0843048095703125, -2.019134521484375, -1.9539642333984375, -1.8887939453125, -1.8236236572265625, -1.758453369140625, -1.6932830810546875, -1.62811279296875, -1.5629425048828125, -1.497772216796875, -1.4326019287109375, -1.367431640625, -1.3022613525390625, -1.237091064453125, -1.1719207763671875, -1.10675048828125, -1.0415802001953125, -0.976409912109375, -0.9112396240234375, -0.8460693359375, -0.7808990478515625, -0.715728759765625, -0.6505584716796875, -0.58538818359375, -0.5202178955078125, -0.455047607421875, -0.3898773193359375, -0.32470703125, -0.2595367431640625, -0.194366455078125, -0.1291961669921875, -0.06402587890625, 0.0011444091796875, 0.066314697265625, 0.1314849853515625, 0.1966552734375, 0.2618255615234375, 0.326995849609375, 0.3921661376953125, 0.45733642578125, 0.5225067138671875, 0.587677001953125, 0.6528472900390625, 0.718017578125, 0.7831878662109375, 0.848358154296875, 0.9135284423828125, 0.97869873046875, 1.0438690185546875, 1.109039306640625, 1.1742095947265625, 1.2393798828125, 1.3045501708984375, 1.369720458984375, 1.4348907470703125, 1.50006103515625, 1.5652313232421875, 1.630401611328125, 1.6955718994140625, 1.7607421875]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 4.0, 6.0, 6.0, 8.0, 12.0, 12.0, 19.0, 27.0, 29.0, 41.0, 48.0, 62.0, 163.0, 173.0, 115.0, 69.0, 47.0, 36.0, 24.0, 20.0, 14.0, 16.0, 12.0, 7.0, 7.0, 6.0, 5.0, 3.0, 0.0, 7.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.275146484375, -0.26502227783203125, -0.2548980712890625, -0.24477386474609375, -0.234649658203125, -0.22452545166015625, -0.2144012451171875, -0.20427703857421875, -0.19415283203125, -0.18402862548828125, -0.1739044189453125, -0.16378021240234375, -0.153656005859375, -0.14353179931640625, -0.1334075927734375, -0.12328338623046875, -0.1131591796875, -0.10303497314453125, -0.0929107666015625, -0.08278656005859375, -0.072662353515625, -0.06253814697265625, -0.0524139404296875, -0.04228973388671875, -0.03216552734375, -0.02204132080078125, -0.0119171142578125, -0.00179290771484375, 0.008331298828125, 0.01845550537109375, 0.0285797119140625, 0.03870391845703125, 0.048828125, 0.05895233154296875, 0.0690765380859375, 0.07920074462890625, 0.089324951171875, 0.09944915771484375, 0.1095733642578125, 0.11969757080078125, 0.12982177734375, 0.13994598388671875, 0.1500701904296875, 0.16019439697265625, 0.170318603515625, 0.18044281005859375, 0.1905670166015625, 0.20069122314453125, 0.2108154296875, 0.22093963623046875, 0.2310638427734375, 0.24118804931640625, 0.251312255859375, 0.26143646240234375, 0.2715606689453125, 0.28168487548828125, 0.29180908203125, 0.30193328857421875, 0.3120574951171875, 0.32218170166015625, 0.332305908203125, 0.34243011474609375, 0.3525543212890625, 0.36267852783203125, 0.372802734375]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 9.0, 37.0, 164.0, 402.0, 297.0, 83.0, 16.0, 5.0, 0.0, 1.0, 1.0], "bins": [-42.62360763549805, -41.87306213378906, -41.12251663208008, -40.371971130371094, -39.62142562866211, -38.870880126953125, -38.12033462524414, -37.369789123535156, -36.61924362182617, -35.86869812011719, -35.1181526184082, -34.36760711669922, -33.617061614990234, -32.86651611328125, -32.115970611572266, -31.36542510986328, -30.614879608154297, -29.864334106445312, -29.113788604736328, -28.363243103027344, -27.61269760131836, -26.862152099609375, -26.11160659790039, -25.361061096191406, -24.610517501831055, -23.85997200012207, -23.109426498413086, -22.3588809967041, -21.608335494995117, -20.857789993286133, -20.10724449157715, -19.356698989868164, -18.606155395507812, -17.855609893798828, -17.105064392089844, -16.35451889038086, -15.603973388671875, -14.85342788696289, -14.102882385253906, -13.352336883544922, -12.601791381835938, -11.851245880126953, -11.100700378417969, -10.350154876708984, -9.599609375, -8.849063873291016, -8.098518371582031, -7.347973346710205, -6.597427845001221, -5.846882343292236, -5.096336841583252, -4.345791816711426, -3.5952460765838623, -2.844700574874878, -2.0941553115844727, -1.3436098098754883, -0.5930643081665039, 0.1574811339378357, 0.9080265760421753, 1.6585719585418701, 2.4091174602508545, 3.159662961959839, 3.910208225250244, 4.6607537269592285, 5.411299228668213]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 7.0, 10.0, 5.0, 12.0, 12.0, 15.0, 16.0, 11.0, 25.0, 30.0, 18.0, 33.0, 38.0, 31.0, 35.0, 38.0, 47.0, 31.0, 42.0, 53.0, 44.0, 42.0, 41.0, 38.0, 34.0, 39.0, 39.0, 37.0, 23.0, 19.0, 34.0, 19.0, 11.0, 16.0, 13.0, 8.0, 6.0, 4.0, 5.0, 2.0, 8.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.370148181915283, -7.139651775360107, -6.909154891967773, -6.678658485412598, -6.448162078857422, -6.217665195465088, -5.987168788909912, -5.756671905517578, -5.526175498962402, -5.295679092407227, -5.065182209014893, -4.834685802459717, -4.604188919067383, -4.373692512512207, -4.143196105957031, -3.9126994609832764, -3.6822028160095215, -3.4517061710357666, -3.2212095260620117, -2.990713119506836, -2.760216474533081, -2.529719829559326, -2.2992234230041504, -2.0687267780303955, -1.8382301330566406, -1.6077334880828857, -1.3772369623184204, -1.146740436553955, -0.9162437915802002, -0.6857471466064453, -0.45525062084198, -0.22475409507751465, 0.005742549896240234, 0.23623913526535034, 0.46673572063446045, 0.6972323060035706, 0.9277288913726807, 1.1582255363464355, 1.3887220621109009, 1.6192185878753662, 1.849715232849121, 2.080211877822876, 2.310708522796631, 2.5412049293518066, 2.7717015743255615, 3.0021982192993164, 3.232694625854492, 3.463191270828247, 3.693687915802002, 3.924184560775757, 4.154681205749512, 4.3851776123046875, 4.615674018859863, 4.846170902252197, 5.076667308807373, 5.307164192199707, 5.537660598754883, 5.768157005310059, 5.998653888702393, 6.229150295257568, 6.459647178649902, 6.690143585205078, 6.920639991760254, 7.15113639831543, 7.381633281707764]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 0.0, 4.0, 6.0, 6.0, 14.0, 11.0, 15.0, 14.0, 32.0, 38.0, 64.0, 113.0, 192.0, 453.0, 1061.0, 2993.0, 11250.0, 78057.0, 2870337.0, 1174529.0, 43264.0, 7780.0, 2324.0, 841.0, 397.0, 183.0, 93.0, 59.0, 42.0, 29.0, 22.0, 14.0, 13.0, 6.0, 10.0, 4.0, 1.0, 5.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.33984375, -6.1527099609375, -5.965576171875, -5.7784423828125, -5.59130859375, -5.4041748046875, -5.217041015625, -5.0299072265625, -4.8427734375, -4.6556396484375, -4.468505859375, -4.2813720703125, -4.09423828125, -3.9071044921875, -3.719970703125, -3.5328369140625, -3.345703125, -3.1585693359375, -2.971435546875, -2.7843017578125, -2.59716796875, -2.4100341796875, -2.222900390625, -2.0357666015625, -1.8486328125, -1.6614990234375, -1.474365234375, -1.2872314453125, -1.10009765625, -0.9129638671875, -0.725830078125, -0.5386962890625, -0.3515625, -0.1644287109375, 0.022705078125, 0.2098388671875, 0.39697265625, 0.5841064453125, 0.771240234375, 0.9583740234375, 1.1455078125, 1.3326416015625, 1.519775390625, 1.7069091796875, 1.89404296875, 2.0811767578125, 2.268310546875, 2.4554443359375, 2.642578125, 2.8297119140625, 3.016845703125, 3.2039794921875, 3.39111328125, 3.5782470703125, 3.765380859375, 3.9525146484375, 4.1396484375, 4.3267822265625, 4.513916015625, 4.7010498046875, 4.88818359375, 5.0753173828125, 5.262451171875, 5.4495849609375, 5.63671875]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 6.0, 3.0, 4.0, 6.0, 4.0, 8.0, 7.0, 16.0, 9.0, 11.0, 22.0, 16.0, 22.0, 35.0, 27.0, 45.0, 38.0, 35.0, 52.0, 46.0, 43.0, 39.0, 46.0, 50.0, 43.0, 49.0, 43.0, 47.0, 38.0, 26.0, 34.0, 23.0, 16.0, 21.0, 22.0, 11.0, 10.0, 7.0, 7.0, 4.0, 6.0, 4.0, 3.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.88671875, -1.8279571533203125, -1.769195556640625, -1.7104339599609375, -1.65167236328125, -1.5929107666015625, -1.534149169921875, -1.4753875732421875, -1.4166259765625, -1.3578643798828125, -1.299102783203125, -1.2403411865234375, -1.18157958984375, -1.1228179931640625, -1.064056396484375, -1.0052947998046875, -0.946533203125, -0.8877716064453125, -0.829010009765625, -0.7702484130859375, -0.71148681640625, -0.6527252197265625, -0.593963623046875, -0.5352020263671875, -0.4764404296875, -0.4176788330078125, -0.358917236328125, -0.3001556396484375, -0.24139404296875, -0.1826324462890625, -0.123870849609375, -0.0651092529296875, -0.00634765625, 0.0524139404296875, 0.111175537109375, 0.1699371337890625, 0.22869873046875, 0.2874603271484375, 0.346221923828125, 0.4049835205078125, 0.4637451171875, 0.5225067138671875, 0.581268310546875, 0.6400299072265625, 0.69879150390625, 0.7575531005859375, 0.816314697265625, 0.8750762939453125, 0.933837890625, 0.9925994873046875, 1.051361083984375, 1.1101226806640625, 1.16888427734375, 1.2276458740234375, 1.286407470703125, 1.3451690673828125, 1.4039306640625, 1.4626922607421875, 1.521453857421875, 1.5802154541015625, 1.63897705078125, 1.6977386474609375, 1.756500244140625, 1.8152618408203125, 1.8740234375]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 10.0, 17.0, 72.0, 216.0, 8216.0, 4184379.0, 1184.0, 124.0, 37.0, 12.0, 8.0, 3.0, 0.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.03125, -26.0048828125, -24.978515625, -23.9521484375, -22.92578125, -21.8994140625, -20.873046875, -19.8466796875, -18.8203125, -17.7939453125, -16.767578125, -15.7412109375, -14.71484375, -13.6884765625, -12.662109375, -11.6357421875, -10.609375, -9.5830078125, -8.556640625, -7.5302734375, -6.50390625, -5.4775390625, -4.451171875, -3.4248046875, -2.3984375, -1.3720703125, -0.345703125, 0.6806640625, 1.70703125, 2.7333984375, 3.759765625, 4.7861328125, 5.8125, 6.8388671875, 7.865234375, 8.8916015625, 9.91796875, 10.9443359375, 11.970703125, 12.9970703125, 14.0234375, 15.0498046875, 16.076171875, 17.1025390625, 18.12890625, 19.1552734375, 20.181640625, 21.2080078125, 22.234375, 23.2607421875, 24.287109375, 25.3134765625, 26.33984375, 27.3662109375, 28.392578125, 29.4189453125, 30.4453125, 31.4716796875, 32.498046875, 33.5244140625, 34.55078125, 35.5771484375, 36.603515625, 37.6298828125, 38.65625]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 4.0, 8.0, 9.0, 11.0, 13.0, 27.0, 36.0, 73.0, 95.0, 128.0, 205.0, 386.0, 613.0, 921.0, 651.0, 329.0, 191.0, 122.0, 75.0, 57.0, 40.0, 33.0, 15.0, 14.0, 10.0, 5.0, 1.0, 4.0, 0.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3203125, -1.2859039306640625, -1.251495361328125, -1.2170867919921875, -1.18267822265625, -1.1482696533203125, -1.113861083984375, -1.0794525146484375, -1.0450439453125, -1.0106353759765625, -0.976226806640625, -0.9418182373046875, -0.90740966796875, -0.8730010986328125, -0.838592529296875, -0.8041839599609375, -0.769775390625, -0.7353668212890625, -0.700958251953125, -0.6665496826171875, -0.63214111328125, -0.5977325439453125, -0.563323974609375, -0.5289154052734375, -0.4945068359375, -0.4600982666015625, -0.425689697265625, -0.3912811279296875, -0.35687255859375, -0.3224639892578125, -0.288055419921875, -0.2536468505859375, -0.21923828125, -0.1848297119140625, -0.150421142578125, -0.1160125732421875, -0.08160400390625, -0.0471954345703125, -0.012786865234375, 0.0216217041015625, 0.0560302734375, 0.0904388427734375, 0.124847412109375, 0.1592559814453125, 0.19366455078125, 0.2280731201171875, 0.262481689453125, 0.2968902587890625, 0.331298828125, 0.3657073974609375, 0.400115966796875, 0.4345245361328125, 0.46893310546875, 0.5033416748046875, 0.537750244140625, 0.5721588134765625, 0.6065673828125, 0.6409759521484375, 0.675384521484375, 0.7097930908203125, 0.74420166015625, 0.7786102294921875, 0.813018798828125, 0.8474273681640625, 0.8818359375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 4.0, 3.0, 7.0, 12.0, 6.0, 21.0, 19.0, 29.0, 39.0, 46.0, 77.0, 77.0, 102.0, 98.0, 86.0, 73.0, 72.0, 56.0, 58.0, 34.0, 20.0, 25.0, 8.0, 8.0, 8.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.74462366104126, -4.627485275268555, -4.510346412658691, -4.393208026885986, -4.276069641113281, -4.158930778503418, -4.041792392730713, -3.9246537685394287, -3.8075151443481445, -3.6903765201568604, -3.5732381343841553, -3.456099510192871, -3.338960886001587, -3.2218222618103027, -3.1046838760375977, -2.9875452518463135, -2.8704068660736084, -2.753268241882324, -2.636129856109619, -2.518991231918335, -2.401852607727051, -2.2847142219543457, -2.1675755977630615, -2.0504369735717773, -1.9332984685897827, -1.816159963607788, -1.699021339416504, -1.5818828344345093, -1.4647443294525146, -1.3476057052612305, -1.2304672002792358, -1.1133286952972412, -0.996190071105957, -0.8790515065193176, -0.7619129419326782, -0.6447744369506836, -0.5276358723640442, -0.4104973077774048, -0.29335880279541016, -0.17622023820877075, -0.05908167362213135, 0.05805687606334686, 0.17519542574882507, 0.2923339605331421, 0.4094725251197815, 0.5266110897064209, 0.6437495946884155, 0.7608881592750549, 0.8780267238616943, 0.9951652884483337, 1.1123038530349731, 1.2294423580169678, 1.346580982208252, 1.4637194871902466, 1.5808579921722412, 1.6979966163635254, 1.81513512134552, 1.9322736263275146, 2.049412250518799, 2.166550636291504, 2.283689260482788, 2.4008278846740723, 2.5179662704467773, 2.6351048946380615, 2.7522435188293457]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 6.0, 2.0, 5.0, 10.0, 10.0, 17.0, 11.0, 17.0, 14.0, 23.0, 18.0, 29.0, 31.0, 33.0, 28.0, 45.0, 29.0, 48.0, 44.0, 39.0, 40.0, 42.0, 39.0, 33.0, 40.0, 43.0, 37.0, 31.0, 28.0, 33.0, 25.0, 32.0, 19.0, 8.0, 11.0, 19.0, 11.0, 12.0, 8.0, 8.0, 5.0, 5.0, 3.0, 4.0, 4.0, 4.0, 0.0, 3.0, 1.0], "bins": [-2.2083804607391357, -2.1468148231506348, -2.085249423980713, -2.023683786392212, -1.96211838722229, -1.900552749633789, -1.8389872312545776, -1.7774217128753662, -1.7158561944961548, -1.6542906761169434, -1.592725157737732, -1.5311596393585205, -1.4695940017700195, -1.4080286026000977, -1.3464629650115967, -1.2848974466323853, -1.2233319282531738, -1.1617664098739624, -1.100200891494751, -1.0386353731155396, -0.9770697951316833, -0.9155042767524719, -0.8539386987686157, -0.7923731803894043, -0.7308076620101929, -0.6692421436309814, -0.60767662525177, -0.5461110472679138, -0.4845455288887024, -0.42298001050949097, -0.36141446232795715, -0.29984891414642334, -0.23828327655792236, -0.17671774327754974, -0.11515220999717712, -0.053586676716804504, 0.007978856563568115, 0.06954437494277954, 0.13110992312431335, 0.19267547130584717, 0.2542409896850586, 0.31580650806427, 0.37737205624580383, 0.43893760442733765, 0.5005031228065491, 0.5620686411857605, 0.6236342191696167, 0.6851997375488281, 0.7467652559280396, 0.808330774307251, 0.8698962926864624, 0.9314618706703186, 0.99302738904953, 1.0545928478240967, 1.1161584854125977, 1.177724003791809, 1.2392895221710205, 1.300855040550232, 1.3624205589294434, 1.4239860773086548, 1.4855515956878662, 1.5471172332763672, 1.6086827516555786, 1.67024827003479, 1.7318137884140015]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 6.0, 8.0, 10.0, 13.0, 28.0, 43.0, 55.0, 110.0, 265.0, 522.0, 1342.0, 3440.0, 10413.0, 38161.0, 175120.0, 526050.0, 225916.0, 47694.0, 12570.0, 4031.0, 1489.0, 624.0, 277.0, 164.0, 91.0, 50.0, 31.0, 10.0, 11.0, 8.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.97900390625, -0.9356460571289062, -0.8922882080078125, -0.8489303588867188, -0.805572509765625, -0.7622146606445312, -0.7188568115234375, -0.6754989624023438, -0.63214111328125, -0.5887832641601562, -0.5454254150390625, -0.5020675659179688, -0.458709716796875, -0.41535186767578125, -0.3719940185546875, -0.32863616943359375, -0.2852783203125, -0.24192047119140625, -0.1985626220703125, -0.15520477294921875, -0.111846923828125, -0.06848907470703125, -0.0251312255859375, 0.01822662353515625, 0.06158447265625, 0.10494232177734375, 0.1483001708984375, 0.19165802001953125, 0.235015869140625, 0.27837371826171875, 0.3217315673828125, 0.36508941650390625, 0.408447265625, 0.45180511474609375, 0.4951629638671875, 0.5385208129882812, 0.581878662109375, 0.6252365112304688, 0.6685943603515625, 0.7119522094726562, 0.75531005859375, 0.7986679077148438, 0.8420257568359375, 0.8853836059570312, 0.928741455078125, 0.9720993041992188, 1.0154571533203125, 1.0588150024414062, 1.1021728515625, 1.1455307006835938, 1.1888885498046875, 1.2322463989257812, 1.275604248046875, 1.3189620971679688, 1.3623199462890625, 1.4056777954101562, 1.44903564453125, 1.4923934936523438, 1.5357513427734375, 1.5791091918945312, 1.622467041015625, 1.6658248901367188, 1.7091827392578125, 1.7525405883789062, 1.7958984375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 4.0, 3.0, 3.0, 3.0, 8.0, 10.0, 9.0, 13.0, 19.0, 17.0, 33.0, 28.0, 39.0, 46.0, 60.0, 67.0, 64.0, 60.0, 64.0, 55.0, 58.0, 60.0, 43.0, 48.0, 37.0, 33.0, 23.0, 29.0, 16.0, 20.0, 6.0, 9.0, 4.0, 9.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6787109375, -1.623504638671875, -1.56829833984375, -1.513092041015625, -1.4578857421875, -1.402679443359375, -1.34747314453125, -1.292266845703125, -1.237060546875, -1.181854248046875, -1.12664794921875, -1.071441650390625, -1.0162353515625, -0.961029052734375, -0.90582275390625, -0.850616455078125, -0.79541015625, -0.740203857421875, -0.68499755859375, -0.629791259765625, -0.5745849609375, -0.519378662109375, -0.46417236328125, -0.408966064453125, -0.353759765625, -0.298553466796875, -0.24334716796875, -0.188140869140625, -0.1329345703125, -0.077728271484375, -0.02252197265625, 0.032684326171875, 0.087890625, 0.143096923828125, 0.19830322265625, 0.253509521484375, 0.3087158203125, 0.363922119140625, 0.41912841796875, 0.474334716796875, 0.529541015625, 0.584747314453125, 0.63995361328125, 0.695159912109375, 0.7503662109375, 0.805572509765625, 0.86077880859375, 0.915985107421875, 0.97119140625, 1.026397705078125, 1.08160400390625, 1.136810302734375, 1.1920166015625, 1.247222900390625, 1.30242919921875, 1.357635498046875, 1.412841796875, 1.468048095703125, 1.52325439453125, 1.578460693359375, 1.6336669921875, 1.688873291015625, 1.74407958984375, 1.799285888671875, 1.8544921875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 10.0, 5.0, 10.0, 9.0, 13.0, 11.0, 25.0, 46.0, 55.0, 66.0, 105.0, 189.0, 308.0, 516.0, 942.0, 2025.0, 4661.0, 12800.0, 42311.0, 171515.0, 493648.0, 236240.0, 56041.0, 16183.0, 5759.0, 2384.0, 1152.0, 595.0, 336.0, 197.0, 120.0, 78.0, 47.0, 31.0, 26.0, 26.0, 22.0, 16.0, 6.0, 8.0, 3.0, 2.0, 5.0, 2.0, 1.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.88818359375, -0.8609466552734375, -0.833709716796875, -0.8064727783203125, -0.77923583984375, -0.7519989013671875, -0.724761962890625, -0.6975250244140625, -0.6702880859375, -0.6430511474609375, -0.615814208984375, -0.5885772705078125, -0.56134033203125, -0.5341033935546875, -0.506866455078125, -0.4796295166015625, -0.452392578125, -0.4251556396484375, -0.397918701171875, -0.3706817626953125, -0.34344482421875, -0.3162078857421875, -0.288970947265625, -0.2617340087890625, -0.2344970703125, -0.2072601318359375, -0.180023193359375, -0.1527862548828125, -0.12554931640625, -0.0983123779296875, -0.071075439453125, -0.0438385009765625, -0.0166015625, 0.0106353759765625, 0.037872314453125, 0.0651092529296875, 0.09234619140625, 0.1195831298828125, 0.146820068359375, 0.1740570068359375, 0.2012939453125, 0.2285308837890625, 0.255767822265625, 0.2830047607421875, 0.31024169921875, 0.3374786376953125, 0.364715576171875, 0.3919525146484375, 0.419189453125, 0.4464263916015625, 0.473663330078125, 0.5009002685546875, 0.52813720703125, 0.5553741455078125, 0.582611083984375, 0.6098480224609375, 0.6370849609375, 0.6643218994140625, 0.691558837890625, 0.7187957763671875, 0.74603271484375, 0.7732696533203125, 0.800506591796875, 0.8277435302734375, 0.85498046875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 6.0, 5.0, 9.0, 12.0, 7.0, 21.0, 17.0, 17.0, 25.0, 29.0, 35.0, 40.0, 34.0, 37.0, 35.0, 49.0, 46.0, 49.0, 67.0, 41.0, 60.0, 33.0, 39.0, 35.0, 40.0, 39.0, 31.0, 21.0, 25.0, 21.0, 20.0, 19.0, 11.0, 9.0, 8.0, 4.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5625, -2.476654052734375, -2.39080810546875, -2.304962158203125, -2.2191162109375, -2.133270263671875, -2.04742431640625, -1.961578369140625, -1.875732421875, -1.789886474609375, -1.70404052734375, -1.618194580078125, -1.5323486328125, -1.446502685546875, -1.36065673828125, -1.274810791015625, -1.18896484375, -1.103118896484375, -1.01727294921875, -0.931427001953125, -0.8455810546875, -0.759735107421875, -0.67388916015625, -0.588043212890625, -0.502197265625, -0.416351318359375, -0.33050537109375, -0.244659423828125, -0.1588134765625, -0.072967529296875, 0.01287841796875, 0.098724365234375, 0.1845703125, 0.270416259765625, 0.35626220703125, 0.442108154296875, 0.5279541015625, 0.613800048828125, 0.69964599609375, 0.785491943359375, 0.871337890625, 0.957183837890625, 1.04302978515625, 1.128875732421875, 1.2147216796875, 1.300567626953125, 1.38641357421875, 1.472259521484375, 1.55810546875, 1.643951416015625, 1.72979736328125, 1.815643310546875, 1.9014892578125, 1.987335205078125, 2.07318115234375, 2.159027099609375, 2.244873046875, 2.330718994140625, 2.41656494140625, 2.502410888671875, 2.5882568359375, 2.674102783203125, 2.75994873046875, 2.845794677734375, 2.931640625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 3.0, 9.0, 14.0, 9.0, 14.0, 20.0, 29.0, 33.0, 68.0, 101.0, 232.0, 363.0, 753.0, 1528.0, 3809.0, 11603.0, 54244.0, 465751.0, 440663.0, 51530.0, 11026.0, 3730.0, 1440.0, 679.0, 380.0, 208.0, 120.0, 60.0, 46.0, 32.0, 11.0, 21.0, 12.0, 4.0, 7.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.529296875, -0.5122146606445312, -0.4951324462890625, -0.47805023193359375, -0.460968017578125, -0.44388580322265625, -0.4268035888671875, -0.40972137451171875, -0.39263916015625, -0.37555694580078125, -0.3584747314453125, -0.34139251708984375, -0.324310302734375, -0.30722808837890625, -0.2901458740234375, -0.27306365966796875, -0.2559814453125, -0.23889923095703125, -0.2218170166015625, -0.20473480224609375, -0.187652587890625, -0.17057037353515625, -0.1534881591796875, -0.13640594482421875, -0.11932373046875, -0.10224151611328125, -0.0851593017578125, -0.06807708740234375, -0.050994873046875, -0.03391265869140625, -0.0168304443359375, 0.00025177001953125, 0.017333984375, 0.03441619873046875, 0.0514984130859375, 0.06858062744140625, 0.085662841796875, 0.10274505615234375, 0.1198272705078125, 0.13690948486328125, 0.15399169921875, 0.17107391357421875, 0.1881561279296875, 0.20523834228515625, 0.222320556640625, 0.23940277099609375, 0.2564849853515625, 0.27356719970703125, 0.2906494140625, 0.30773162841796875, 0.3248138427734375, 0.34189605712890625, 0.358978271484375, 0.37606048583984375, 0.3931427001953125, 0.41022491455078125, 0.42730712890625, 0.44438934326171875, 0.4614715576171875, 0.47855377197265625, 0.495635986328125, 0.5127182006835938, 0.5298004150390625, 0.5468826293945312, 0.56396484375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 5.0, 7.0, 10.0, 13.0, 18.0, 29.0, 45.0, 55.0, 77.0, 95.0, 126.0, 123.0, 123.0, 96.0, 63.0, 38.0, 25.0, 12.0, 11.0, 9.0, 5.0, 4.0, 3.0, 5.0, 5.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003070831298828125, -0.00029693543910980225, -0.000286787748336792, -0.00027664005756378174, -0.0002664923667907715, -0.00025634467601776123, -0.000246196985244751, -0.00023604929447174072, -0.00022590160369873047, -0.00021575391292572021, -0.00020560622215270996, -0.0001954585313796997, -0.00018531084060668945, -0.0001751631498336792, -0.00016501545906066895, -0.0001548677682876587, -0.00014472007751464844, -0.00013457238674163818, -0.00012442469596862793, -0.00011427700519561768, -0.00010412931442260742, -9.398162364959717e-05, -8.383393287658691e-05, -7.368624210357666e-05, -6.35385513305664e-05, -5.339086055755615e-05, -4.32431697845459e-05, -3.3095479011535645e-05, -2.294778823852539e-05, -1.2800097465515137e-05, -2.652406692504883e-06, 7.495284080505371e-06, 1.7642974853515625e-05, 2.779066562652588e-05, 3.793835639953613e-05, 4.808604717254639e-05, 5.823373794555664e-05, 6.83814287185669e-05, 7.852911949157715e-05, 8.86768102645874e-05, 9.882450103759766e-05, 0.00010897219181060791, 0.00011911988258361816, 0.00012926757335662842, 0.00013941526412963867, 0.00014956295490264893, 0.00015971064567565918, 0.00016985833644866943, 0.0001800060272216797, 0.00019015371799468994, 0.0002003014087677002, 0.00021044909954071045, 0.0002205967903137207, 0.00023074448108673096, 0.0002408921718597412, 0.00025103986263275146, 0.0002611875534057617, 0.00027133524417877197, 0.0002814829349517822, 0.0002916306257247925, 0.00030177831649780273, 0.000311926007270813, 0.00032207369804382324, 0.0003322213888168335, 0.00034236907958984375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 5.0, 9.0, 21.0, 26.0, 38.0, 61.0, 94.0, 127.0, 215.0, 363.0, 591.0, 1113.0, 2284.0, 5253.0, 15350.0, 67573.0, 384636.0, 455963.0, 85049.0, 18429.0, 5968.0, 2495.0, 1198.0, 669.0, 407.0, 216.0, 126.0, 105.0, 54.0, 34.0, 24.0, 21.0, 10.0, 8.0, 4.0, 4.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0], "bins": [-0.5791015625, -0.5638885498046875, -0.548675537109375, -0.5334625244140625, -0.51824951171875, -0.5030364990234375, -0.487823486328125, -0.4726104736328125, -0.4573974609375, -0.4421844482421875, -0.426971435546875, -0.4117584228515625, -0.39654541015625, -0.3813323974609375, -0.366119384765625, -0.3509063720703125, -0.335693359375, -0.3204803466796875, -0.305267333984375, -0.2900543212890625, -0.27484130859375, -0.2596282958984375, -0.244415283203125, -0.2292022705078125, -0.2139892578125, -0.1987762451171875, -0.183563232421875, -0.1683502197265625, -0.15313720703125, -0.1379241943359375, -0.122711181640625, -0.1074981689453125, -0.09228515625, -0.0770721435546875, -0.061859130859375, -0.0466461181640625, -0.03143310546875, -0.0162200927734375, -0.001007080078125, 0.0142059326171875, 0.0294189453125, 0.0446319580078125, 0.059844970703125, 0.0750579833984375, 0.09027099609375, 0.1054840087890625, 0.120697021484375, 0.1359100341796875, 0.151123046875, 0.1663360595703125, 0.181549072265625, 0.1967620849609375, 0.21197509765625, 0.2271881103515625, 0.242401123046875, 0.2576141357421875, 0.2728271484375, 0.2880401611328125, 0.303253173828125, 0.3184661865234375, 0.33367919921875, 0.3488922119140625, 0.364105224609375, 0.3793182373046875, 0.39453125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 10.0, 19.0, 25.0, 32.0, 42.0, 46.0, 50.0, 67.0, 84.0, 122.0, 107.0, 92.0, 61.0, 65.0, 44.0, 41.0, 28.0, 15.0, 14.0, 8.0, 7.0, 3.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12225341796875, -0.1186513900756836, -0.11504936218261719, -0.11144733428955078, -0.10784530639648438, -0.10424327850341797, -0.10064125061035156, -0.09703922271728516, -0.09343719482421875, -0.08983516693115234, -0.08623313903808594, -0.08263111114501953, -0.07902908325195312, -0.07542705535888672, -0.07182502746582031, -0.0682229995727539, -0.0646209716796875, -0.061018943786621094, -0.05741691589355469, -0.05381488800048828, -0.050212860107421875, -0.04661083221435547, -0.04300880432128906, -0.039406776428222656, -0.03580474853515625, -0.032202720642089844, -0.028600692749023438, -0.02499866485595703, -0.021396636962890625, -0.01779460906982422, -0.014192581176757812, -0.010590553283691406, -0.006988525390625, -0.0033864974975585938, 0.0002155303955078125, 0.0038175582885742188, 0.007419586181640625, 0.011021614074707031, 0.014623641967773438, 0.018225669860839844, 0.02182769775390625, 0.025429725646972656, 0.029031753540039062, 0.03263378143310547, 0.036235809326171875, 0.03983783721923828, 0.04343986511230469, 0.047041893005371094, 0.0506439208984375, 0.054245948791503906, 0.05784797668457031, 0.06145000457763672, 0.06505203247070312, 0.06865406036376953, 0.07225608825683594, 0.07585811614990234, 0.07946014404296875, 0.08306217193603516, 0.08666419982910156, 0.09026622772216797, 0.09386825561523438, 0.09747028350830078, 0.10107231140136719, 0.1046743392944336, 0.1082763671875]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 1.0, 3.0, 6.0, 11.0, 13.0, 15.0, 21.0, 51.0, 57.0, 73.0, 112.0, 116.0, 111.0, 114.0, 86.0, 58.0, 56.0, 37.0, 18.0, 11.0, 15.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.1737794876098633, -3.090355396270752, -3.0069315433502197, -2.9235074520111084, -2.840083599090576, -2.756659507751465, -2.6732354164123535, -2.589811325073242, -2.50638747215271, -2.4229633808135986, -2.3395395278930664, -2.256115436553955, -2.1726913452148438, -2.0892674922943115, -2.0058434009552, -1.9224194288253784, -1.8389954566955566, -1.7555714845657349, -1.672147512435913, -1.5887234210968018, -1.50529944896698, -1.4218754768371582, -1.3384513854980469, -1.255027413368225, -1.1716034412384033, -1.0881794691085815, -1.0047554969787598, -0.9213314056396484, -0.8379074335098267, -0.7544834613800049, -0.6710594296455383, -0.5876353979110718, -0.5042116641998291, -0.42078766226768494, -0.33736366033554077, -0.2539396584033966, -0.17051565647125244, -0.08709165453910828, -0.0036676526069641113, 0.07975637912750244, 0.16318035125732422, 0.24660435318946838, 0.33002835512161255, 0.4134523570537567, 0.4968763589859009, 0.5803003311157227, 0.6637243628501892, 0.7471483945846558, 0.8305723667144775, 0.9139963388442993, 0.9974203705787659, 1.0808444023132324, 1.1642683744430542, 1.247692346572876, 1.3311164379119873, 1.414540410041809, 1.4979643821716309, 1.5813883543014526, 1.6648123264312744, 1.7482364177703857, 1.8316603899002075, 1.9150843620300293, 1.9985084533691406, 2.081932544708252, 2.165356397628784]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 11.0, 14.0, 15.0, 15.0, 19.0, 25.0, 36.0, 36.0, 56.0, 52.0, 63.0, 60.0, 66.0, 73.0, 55.0, 59.0, 44.0, 54.0, 47.0, 52.0, 26.0, 26.0, 22.0, 20.0, 19.0, 8.0, 9.0, 6.0, 2.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5837723016738892, -1.5298136472702026, -1.4758549928665161, -1.4218963384628296, -1.367937684059143, -1.3139790296554565, -1.2600202560424805, -1.206061601638794, -1.1521029472351074, -1.098144292831421, -1.0441856384277344, -0.9902269840240479, -0.9362683296203613, -0.8823096752166748, -0.8283509612083435, -0.774392306804657, -0.7204337120056152, -0.6664750576019287, -0.6125164031982422, -0.5585577487945557, -0.5045990943908691, -0.45064041018486023, -0.3966817259788513, -0.3427230715751648, -0.28876441717147827, -0.23480576276779175, -0.18084709346294403, -0.1268884241580963, -0.07292976975440979, -0.018971115350723267, 0.034987568855285645, 0.08894622325897217, 0.14290475845336914, 0.19686341285705566, 0.2508220672607422, 0.3047807514667511, 0.3587394058704376, 0.41269806027412415, 0.46665674448013306, 0.5206153988838196, 0.5745740532875061, 0.6285327076911926, 0.6824913620948792, 0.7364500761032104, 0.790408730506897, 0.8443673849105835, 0.89832603931427, 0.9522846937179565, 1.006243348121643, 1.0602020025253296, 1.1141606569290161, 1.1681193113327026, 1.2220779657363892, 1.2760366201400757, 1.3299953937530518, 1.3839540481567383, 1.4379127025604248, 1.4918713569641113, 1.5458300113677979, 1.5997886657714844, 1.653747320175171, 1.7077059745788574, 1.761664628982544, 1.8156232833862305, 1.869581937789917]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 7.0, 7.0, 17.0, 17.0, 25.0, 35.0, 38.0, 64.0, 109.0, 167.0, 255.0, 374.0, 646.0, 1105.0, 1846.0, 3230.0, 6373.0, 12903.0, 29583.0, 83111.0, 320799.0, 417439.0, 104159.0, 35217.0, 14726.0, 7301.0, 3760.0, 2040.0, 1185.0, 722.0, 475.0, 269.0, 193.0, 110.0, 64.0, 59.0, 36.0, 36.0, 11.0, 13.0, 11.0, 6.0, 6.0, 7.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5693359375, -1.52191162109375, -1.4744873046875, -1.42706298828125, -1.379638671875, -1.33221435546875, -1.2847900390625, -1.23736572265625, -1.18994140625, -1.14251708984375, -1.0950927734375, -1.04766845703125, -1.000244140625, -0.95281982421875, -0.9053955078125, -0.85797119140625, -0.810546875, -0.76312255859375, -0.7156982421875, -0.66827392578125, -0.620849609375, -0.57342529296875, -0.5260009765625, -0.47857666015625, -0.43115234375, -0.38372802734375, -0.3363037109375, -0.28887939453125, -0.241455078125, -0.19403076171875, -0.1466064453125, -0.09918212890625, -0.0517578125, -0.00433349609375, 0.0430908203125, 0.09051513671875, 0.137939453125, 0.18536376953125, 0.2327880859375, 0.28021240234375, 0.32763671875, 0.37506103515625, 0.4224853515625, 0.46990966796875, 0.517333984375, 0.56475830078125, 0.6121826171875, 0.65960693359375, 0.70703125, 0.75445556640625, 0.8018798828125, 0.84930419921875, 0.896728515625, 0.94415283203125, 0.9915771484375, 1.03900146484375, 1.08642578125, 1.13385009765625, 1.1812744140625, 1.22869873046875, 1.276123046875, 1.32354736328125, 1.3709716796875, 1.41839599609375, 1.4658203125]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 4.0, 1.0, 2.0, 3.0, 3.0, 10.0, 13.0, 17.0, 17.0, 14.0, 25.0, 33.0, 35.0, 33.0, 47.0, 53.0, 47.0, 58.0, 74.0, 63.0, 62.0, 61.0, 51.0, 43.0, 48.0, 42.0, 29.0, 18.0, 29.0, 21.0, 25.0, 10.0, 3.0, 3.0, 5.0, 1.0, 2.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.779296875, -3.657989501953125, -3.53668212890625, -3.415374755859375, -3.2940673828125, -3.172760009765625, -3.05145263671875, -2.930145263671875, -2.808837890625, -2.687530517578125, -2.56622314453125, -2.444915771484375, -2.3236083984375, -2.202301025390625, -2.08099365234375, -1.959686279296875, -1.83837890625, -1.717071533203125, -1.59576416015625, -1.474456787109375, -1.3531494140625, -1.231842041015625, -1.11053466796875, -0.989227294921875, -0.867919921875, -0.746612548828125, -0.62530517578125, -0.503997802734375, -0.3826904296875, -0.261383056640625, -0.14007568359375, -0.018768310546875, 0.1025390625, 0.223846435546875, 0.34515380859375, 0.466461181640625, 0.5877685546875, 0.709075927734375, 0.83038330078125, 0.951690673828125, 1.072998046875, 1.194305419921875, 1.31561279296875, 1.436920166015625, 1.5582275390625, 1.679534912109375, 1.80084228515625, 1.922149658203125, 2.04345703125, 2.164764404296875, 2.28607177734375, 2.407379150390625, 2.5286865234375, 2.649993896484375, 2.77130126953125, 2.892608642578125, 3.013916015625, 3.135223388671875, 3.25653076171875, 3.377838134765625, 3.4991455078125, 3.620452880859375, 3.74176025390625, 3.863067626953125, 3.984375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 5.0, 6.0, 9.0, 7.0, 17.0, 15.0, 12.0, 22.0, 26.0, 33.0, 33.0, 40.0, 44.0, 48.0, 51.0, 77.0, 813.0, 512893.0, 533189.0, 778.0, 87.0, 51.0, 33.0, 42.0, 36.0, 38.0, 28.0, 28.0, 21.0, 18.0, 18.0, 11.0, 6.0, 7.0, 8.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.40625, -13.011962890625, -12.61767578125, -12.223388671875, -11.8291015625, -11.434814453125, -11.04052734375, -10.646240234375, -10.251953125, -9.857666015625, -9.46337890625, -9.069091796875, -8.6748046875, -8.280517578125, -7.88623046875, -7.491943359375, -7.09765625, -6.703369140625, -6.30908203125, -5.914794921875, -5.5205078125, -5.126220703125, -4.73193359375, -4.337646484375, -3.943359375, -3.549072265625, -3.15478515625, -2.760498046875, -2.3662109375, -1.971923828125, -1.57763671875, -1.183349609375, -0.7890625, -0.394775390625, -0.00048828125, 0.393798828125, 0.7880859375, 1.182373046875, 1.57666015625, 1.970947265625, 2.365234375, 2.759521484375, 3.15380859375, 3.548095703125, 3.9423828125, 4.336669921875, 4.73095703125, 5.125244140625, 5.51953125, 5.913818359375, 6.30810546875, 6.702392578125, 7.0966796875, 7.490966796875, 7.88525390625, 8.279541015625, 8.673828125, 9.068115234375, 9.46240234375, 9.856689453125, 10.2509765625, 10.645263671875, 11.03955078125, 11.433837890625, 11.828125]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 4.0, 8.0, 4.0, 8.0, 10.0, 14.0, 12.0, 23.0, 22.0, 30.0, 44.0, 30.0, 40.0, 36.0, 48.0, 35.0, 43.0, 50.0, 39.0, 48.0, 57.0, 40.0, 52.0, 30.0, 42.0, 31.0, 37.0, 27.0, 32.0, 27.0, 22.0, 17.0, 9.0, 11.0, 9.0, 6.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.8125, -3.7000732421875, -3.587646484375, -3.4752197265625, -3.36279296875, -3.2503662109375, -3.137939453125, -3.0255126953125, -2.9130859375, -2.8006591796875, -2.688232421875, -2.5758056640625, -2.46337890625, -2.3509521484375, -2.238525390625, -2.1260986328125, -2.013671875, -1.9012451171875, -1.788818359375, -1.6763916015625, -1.56396484375, -1.4515380859375, -1.339111328125, -1.2266845703125, -1.1142578125, -1.0018310546875, -0.889404296875, -0.7769775390625, -0.66455078125, -0.5521240234375, -0.439697265625, -0.3272705078125, -0.21484375, -0.1024169921875, 0.010009765625, 0.1224365234375, 0.23486328125, 0.3472900390625, 0.459716796875, 0.5721435546875, 0.6845703125, 0.7969970703125, 0.909423828125, 1.0218505859375, 1.13427734375, 1.2467041015625, 1.359130859375, 1.4715576171875, 1.583984375, 1.6964111328125, 1.808837890625, 1.9212646484375, 2.03369140625, 2.1461181640625, 2.258544921875, 2.3709716796875, 2.4833984375, 2.5958251953125, 2.708251953125, 2.8206787109375, 2.93310546875, 3.0455322265625, 3.157958984375, 3.2703857421875, 3.3828125]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 7.0, 9.0, 14.0, 17.0, 20.0, 27.0, 76.0, 104.0, 211.0, 399.0, 849.0, 2140.0, 5900.0, 21577.0, 119424.0, 703889.0, 156549.0, 26400.0, 6741.0, 2301.0, 908.0, 440.0, 230.0, 107.0, 64.0, 50.0, 26.0, 24.0, 19.0, 7.0, 7.0, 6.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75439453125, -0.7297134399414062, -0.7050323486328125, -0.6803512573242188, -0.655670166015625, -0.6309890747070312, -0.6063079833984375, -0.5816268920898438, -0.55694580078125, -0.5322647094726562, -0.5075836181640625, -0.48290252685546875, -0.458221435546875, -0.43354034423828125, -0.4088592529296875, -0.38417816162109375, -0.3594970703125, -0.33481597900390625, -0.3101348876953125, -0.28545379638671875, -0.260772705078125, -0.23609161376953125, -0.2114105224609375, -0.18672943115234375, -0.16204833984375, -0.13736724853515625, -0.1126861572265625, -0.08800506591796875, -0.063323974609375, -0.03864288330078125, -0.0139617919921875, 0.01071929931640625, 0.035400390625, 0.06008148193359375, 0.0847625732421875, 0.10944366455078125, 0.134124755859375, 0.15880584716796875, 0.1834869384765625, 0.20816802978515625, 0.23284912109375, 0.25753021240234375, 0.2822113037109375, 0.30689239501953125, 0.331573486328125, 0.35625457763671875, 0.3809356689453125, 0.40561676025390625, 0.4302978515625, 0.45497894287109375, 0.4796600341796875, 0.5043411254882812, 0.529022216796875, 0.5537033081054688, 0.5783843994140625, 0.6030654907226562, 0.62774658203125, 0.6524276733398438, 0.6771087646484375, 0.7017898559570312, 0.726470947265625, 0.7511520385742188, 0.7758331298828125, 0.8005142211914062, 0.8251953125]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 8.0, 2.0, 8.0, 9.0, 9.0, 16.0, 17.0, 17.0, 21.0, 28.0, 50.0, 70.0, 84.0, 130.0, 150.0, 95.0, 75.0, 50.0, 36.0, 32.0, 17.0, 16.0, 18.0, 19.0, 7.0, 4.0, 4.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.00012803077697753906, -0.0001247590407729149, -0.00012148730456829071, -0.00011821556836366653, -0.00011494383215904236, -0.00011167209595441818, -0.000108400359749794, -0.00010512862354516983, -0.00010185688734054565, -9.858515113592148e-05, -9.53134149312973e-05, -9.204167872667313e-05, -8.876994252204895e-05, -8.549820631742477e-05, -8.22264701128006e-05, -7.895473390817642e-05, -7.568299770355225e-05, -7.241126149892807e-05, -6.91395252943039e-05, -6.586778908967972e-05, -6.259605288505554e-05, -5.9324316680431366e-05, -5.605258047580719e-05, -5.2780844271183014e-05, -4.950910806655884e-05, -4.623737186193466e-05, -4.2965635657310486e-05, -3.969389945268631e-05, -3.6422163248062134e-05, -3.315042704343796e-05, -2.9878690838813782e-05, -2.6606954634189606e-05, -2.333521842956543e-05, -2.0063482224941254e-05, -1.6791746020317078e-05, -1.3520009815692902e-05, -1.0248273611068726e-05, -6.9765374064445496e-06, -3.7048012018203735e-06, -4.330649971961975e-07, 2.8386712074279785e-06, 6.1104074120521545e-06, 9.38214361667633e-06, 1.2653879821300507e-05, 1.5925616025924683e-05, 1.919735223054886e-05, 2.2469088435173035e-05, 2.574082463979721e-05, 2.9012560844421387e-05, 3.228429704904556e-05, 3.555603325366974e-05, 3.8827769458293915e-05, 4.209950566291809e-05, 4.537124186754227e-05, 4.864297807216644e-05, 5.191471427679062e-05, 5.5186450481414795e-05, 5.845818668603897e-05, 6.172992289066315e-05, 6.500165909528732e-05, 6.82733952999115e-05, 7.154513150453568e-05, 7.481686770915985e-05, 7.808860391378403e-05, 8.13603401184082e-05]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 4.0, 9.0, 8.0, 23.0, 27.0, 25.0, 51.0, 110.0, 145.0, 263.0, 474.0, 766.0, 1431.0, 2529.0, 4924.0, 10326.0, 23714.0, 62373.0, 206741.0, 503891.0, 147339.0, 47291.0, 18441.0, 8387.0, 4202.0, 2182.0, 1157.0, 661.0, 387.0, 268.0, 140.0, 93.0, 67.0, 42.0, 22.0, 10.0, 13.0, 5.0, 6.0, 5.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.3876953125, -0.3744926452636719, -0.36128997802734375, -0.3480873107910156, -0.3348846435546875, -0.3216819763183594, -0.30847930908203125, -0.2952766418457031, -0.282073974609375, -0.2688713073730469, -0.25566864013671875, -0.24246597290039062, -0.2292633056640625, -0.21606063842773438, -0.20285797119140625, -0.18965530395507812, -0.17645263671875, -0.16324996948242188, -0.15004730224609375, -0.13684463500976562, -0.1236419677734375, -0.11043930053710938, -0.09723663330078125, -0.08403396606445312, -0.070831298828125, -0.057628631591796875, -0.04442596435546875, -0.031223297119140625, -0.0180206298828125, -0.004817962646484375, 0.00838470458984375, 0.021587371826171875, 0.0347900390625, 0.047992706298828125, 0.06119537353515625, 0.07439804077148438, 0.0876007080078125, 0.10080337524414062, 0.11400604248046875, 0.12720870971679688, 0.140411376953125, 0.15361404418945312, 0.16681671142578125, 0.18001937866210938, 0.1932220458984375, 0.20642471313476562, 0.21962738037109375, 0.23283004760742188, 0.24603271484375, 0.2592353820800781, 0.27243804931640625, 0.2856407165527344, 0.2988433837890625, 0.3120460510253906, 0.32524871826171875, 0.3384513854980469, 0.351654052734375, 0.3648567199707031, 0.37805938720703125, 0.3912620544433594, 0.4044647216796875, 0.4176673889160156, 0.43087005615234375, 0.4440727233886719, 0.457275390625]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 6.0, 10.0, 9.0, 13.0, 13.0, 24.0, 24.0, 19.0, 36.0, 52.0, 45.0, 50.0, 80.0, 145.0, 100.0, 74.0, 52.0, 45.0, 44.0, 29.0, 26.0, 26.0, 16.0, 9.0, 15.0, 8.0, 10.0, 4.0, 4.0, 5.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.227294921875, -0.2191314697265625, -0.210968017578125, -0.2028045654296875, -0.19464111328125, -0.1864776611328125, -0.178314208984375, -0.1701507568359375, -0.1619873046875, -0.1538238525390625, -0.145660400390625, -0.1374969482421875, -0.12933349609375, -0.1211700439453125, -0.113006591796875, -0.1048431396484375, -0.0966796875, -0.0885162353515625, -0.080352783203125, -0.0721893310546875, -0.06402587890625, -0.0558624267578125, -0.047698974609375, -0.0395355224609375, -0.0313720703125, -0.0232086181640625, -0.015045166015625, -0.0068817138671875, 0.00128173828125, 0.0094451904296875, 0.017608642578125, 0.0257720947265625, 0.033935546875, 0.0420989990234375, 0.050262451171875, 0.0584259033203125, 0.06658935546875, 0.0747528076171875, 0.082916259765625, 0.0910797119140625, 0.0992431640625, 0.1074066162109375, 0.115570068359375, 0.1237335205078125, 0.13189697265625, 0.1400604248046875, 0.148223876953125, 0.1563873291015625, 0.16455078125, 0.1727142333984375, 0.180877685546875, 0.1890411376953125, 0.19720458984375, 0.2053680419921875, 0.213531494140625, 0.2216949462890625, 0.2298583984375, 0.2380218505859375, 0.246185302734375, 0.2543487548828125, 0.26251220703125, 0.2706756591796875, 0.278839111328125, 0.2870025634765625, 0.295166015625]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 7.0, 11.0, 18.0, 52.0, 131.0, 233.0, 238.0, 169.0, 91.0, 37.0, 10.0, 7.0, 2.0, 4.0, 2.0], "bins": [-20.11668586730957, -19.75222396850586, -19.38776206970215, -19.02330207824707, -18.65884017944336, -18.29437828063965, -17.929916381835938, -17.56545639038086, -17.20099449157715, -16.836532592773438, -16.472070693969727, -16.10761070251465, -15.743148803710938, -15.378686904907227, -15.014225959777832, -14.649764060974121, -14.285303115844727, -13.920841217041016, -13.556380271911621, -13.19191837310791, -12.827457427978516, -12.462995529174805, -12.09853458404541, -11.7340726852417, -11.369610786437988, -11.005148887634277, -10.640687942504883, -10.276226043701172, -9.911765098571777, -9.547303199768066, -9.182842254638672, -8.818380355834961, -8.453919410705566, -8.089457511901855, -7.724996566772461, -7.360535144805908, -6.9960737228393555, -6.631612300872803, -6.26715087890625, -5.902688980102539, -5.5382280349731445, -5.173766613006592, -4.809305191040039, -4.444843769073486, -4.080382347106934, -3.715920925140381, -3.351459264755249, -2.9869978427886963, -2.6225364208221436, -2.258074998855591, -1.893613576889038, -1.5291520357131958, -1.164690613746643, -0.8002291917800903, -0.43576765060424805, -0.07130622863769531, 0.2931551933288574, 0.6576166152954102, 1.022078037261963, 1.3865395784378052, 1.751001000404358, 2.115462303161621, 2.479923963546753, 2.8443853855133057, 3.2088468074798584]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 9.0, 2.0, 8.0, 5.0, 3.0, 11.0, 16.0, 19.0, 18.0, 26.0, 22.0, 29.0, 41.0, 41.0, 41.0, 39.0, 48.0, 36.0, 49.0, 50.0, 38.0, 49.0, 45.0, 38.0, 38.0, 30.0, 32.0, 36.0, 27.0, 25.0, 22.0, 21.0, 18.0, 8.0, 12.0, 10.0, 12.0, 11.0, 4.0, 2.0, 3.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.974123001098633, -5.799110412597656, -5.624098300933838, -5.449085712432861, -5.274073600769043, -5.099061012268066, -4.92404842376709, -4.749035835266113, -4.574023723602295, -4.399011135101318, -4.2239990234375, -4.048986434936523, -3.873974084854126, -3.6989617347717285, -3.523949146270752, -3.3489367961883545, -3.173924446105957, -2.9989120960235596, -2.823899745941162, -2.6488871574401855, -2.473874807357788, -2.2988624572753906, -2.123849868774414, -1.9488375186920166, -1.7738251686096191, -1.5988128185272217, -1.4238003492355347, -1.2487878799438477, -1.0737755298614502, -0.898763120174408, -0.7237507104873657, -0.5487382411956787, -0.37372589111328125, -0.198713481426239, -0.023701071739196777, 0.15131133794784546, 0.3263237476348877, 0.5013361573219299, 0.6763485670089722, 0.8513610363006592, 1.0263733863830566, 1.201385736465454, 1.3763982057571411, 1.5514106750488281, 1.7264230251312256, 1.901435375213623, 2.0764479637145996, 2.251460313796997, 2.4264726638793945, 2.601485013961792, 2.7764973640441895, 2.951509952545166, 3.1265223026275635, 3.301534652709961, 3.4765472412109375, 3.651559591293335, 3.8265719413757324, 4.001584529876709, 4.176596641540527, 4.351609230041504, 4.5266218185424805, 4.701633930206299, 4.876646518707275, 5.051658630371094, 5.22667121887207]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 8.0, 3.0, 13.0, 15.0, 21.0, 30.0, 23.0, 32.0, 33.0, 77.0, 93.0, 156.0, 289.0, 636.0, 1873.0, 6349.0, 33666.0, 830210.0, 3217214.0, 87358.0, 11383.0, 2800.0, 1037.0, 374.0, 208.0, 108.0, 65.0, 48.0, 36.0, 35.0, 23.0, 18.0, 10.0, 14.0, 7.0, 7.0, 1.0, 5.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.83203125, -4.65435791015625, -4.4766845703125, -4.29901123046875, -4.121337890625, -3.94366455078125, -3.7659912109375, -3.58831787109375, -3.41064453125, -3.23297119140625, -3.0552978515625, -2.87762451171875, -2.699951171875, -2.52227783203125, -2.3446044921875, -2.16693115234375, -1.9892578125, -1.81158447265625, -1.6339111328125, -1.45623779296875, -1.278564453125, -1.10089111328125, -0.9232177734375, -0.74554443359375, -0.56787109375, -0.39019775390625, -0.2125244140625, -0.03485107421875, 0.142822265625, 0.32049560546875, 0.4981689453125, 0.67584228515625, 0.853515625, 1.03118896484375, 1.2088623046875, 1.38653564453125, 1.564208984375, 1.74188232421875, 1.9195556640625, 2.09722900390625, 2.27490234375, 2.45257568359375, 2.6302490234375, 2.80792236328125, 2.985595703125, 3.16326904296875, 3.3409423828125, 3.51861572265625, 3.6962890625, 3.87396240234375, 4.0516357421875, 4.22930908203125, 4.406982421875, 4.58465576171875, 4.7623291015625, 4.94000244140625, 5.11767578125, 5.29534912109375, 5.4730224609375, 5.65069580078125, 5.828369140625, 6.00604248046875, 6.1837158203125, 6.36138916015625, 6.5390625]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 3.0, 2.0, 6.0, 10.0, 8.0, 8.0, 10.0, 11.0, 11.0, 16.0, 20.0, 26.0, 35.0, 29.0, 50.0, 39.0, 39.0, 41.0, 52.0, 55.0, 45.0, 43.0, 49.0, 45.0, 46.0, 43.0, 37.0, 33.0, 31.0, 19.0, 27.0, 19.0, 23.0, 20.0, 17.0, 13.0, 5.0, 4.0, 2.0, 3.0, 3.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.5927734375, -1.542755126953125, -1.49273681640625, -1.442718505859375, -1.3927001953125, -1.342681884765625, -1.29266357421875, -1.242645263671875, -1.192626953125, -1.142608642578125, -1.09259033203125, -1.042572021484375, -0.9925537109375, -0.942535400390625, -0.89251708984375, -0.842498779296875, -0.79248046875, -0.742462158203125, -0.69244384765625, -0.642425537109375, -0.5924072265625, -0.542388916015625, -0.49237060546875, -0.442352294921875, -0.392333984375, -0.342315673828125, -0.29229736328125, -0.242279052734375, -0.1922607421875, -0.142242431640625, -0.09222412109375, -0.042205810546875, 0.0078125, 0.057830810546875, 0.10784912109375, 0.157867431640625, 0.2078857421875, 0.257904052734375, 0.30792236328125, 0.357940673828125, 0.407958984375, 0.457977294921875, 0.50799560546875, 0.558013916015625, 0.6080322265625, 0.658050537109375, 0.70806884765625, 0.758087158203125, 0.80810546875, 0.858123779296875, 0.90814208984375, 0.958160400390625, 1.0081787109375, 1.058197021484375, 1.10821533203125, 1.158233642578125, 1.208251953125, 1.258270263671875, 1.30828857421875, 1.358306884765625, 1.4083251953125, 1.458343505859375, 1.50836181640625, 1.558380126953125, 1.6083984375]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 4.0, 1.0, 5.0, 4.0, 6.0, 8.0, 10.0, 14.0, 38.0, 33.0, 91.0, 163.0, 369.0, 1361.0, 11417.0, 451291.0, 3688502.0, 36915.0, 2977.0, 603.0, 195.0, 91.0, 61.0, 43.0, 18.0, 18.0, 16.0, 8.0, 6.0, 9.0, 5.0, 2.0, 4.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.97265625, -6.756103515625, -6.53955078125, -6.322998046875, -6.1064453125, -5.889892578125, -5.67333984375, -5.456787109375, -5.240234375, -5.023681640625, -4.80712890625, -4.590576171875, -4.3740234375, -4.157470703125, -3.94091796875, -3.724365234375, -3.5078125, -3.291259765625, -3.07470703125, -2.858154296875, -2.6416015625, -2.425048828125, -2.20849609375, -1.991943359375, -1.775390625, -1.558837890625, -1.34228515625, -1.125732421875, -0.9091796875, -0.692626953125, -0.47607421875, -0.259521484375, -0.04296875, 0.173583984375, 0.39013671875, 0.606689453125, 0.8232421875, 1.039794921875, 1.25634765625, 1.472900390625, 1.689453125, 1.906005859375, 2.12255859375, 2.339111328125, 2.5556640625, 2.772216796875, 2.98876953125, 3.205322265625, 3.421875, 3.638427734375, 3.85498046875, 4.071533203125, 4.2880859375, 4.504638671875, 4.72119140625, 4.937744140625, 5.154296875, 5.370849609375, 5.58740234375, 5.803955078125, 6.0205078125, 6.237060546875, 6.45361328125, 6.670166015625, 6.88671875]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 12.0, 6.0, 7.0, 14.0, 15.0, 20.0, 27.0, 33.0, 51.0, 59.0, 106.0, 119.0, 162.0, 271.0, 448.0, 563.0, 695.0, 504.0, 302.0, 189.0, 131.0, 80.0, 73.0, 46.0, 41.0, 28.0, 19.0, 12.0, 12.0, 8.0, 4.0, 7.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6474609375, -0.6236114501953125, -0.599761962890625, -0.5759124755859375, -0.55206298828125, -0.5282135009765625, -0.504364013671875, -0.4805145263671875, -0.4566650390625, -0.4328155517578125, -0.408966064453125, -0.3851165771484375, -0.36126708984375, -0.3374176025390625, -0.313568115234375, -0.2897186279296875, -0.265869140625, -0.2420196533203125, -0.218170166015625, -0.1943206787109375, -0.17047119140625, -0.1466217041015625, -0.122772216796875, -0.0989227294921875, -0.0750732421875, -0.0512237548828125, -0.027374267578125, -0.0035247802734375, 0.02032470703125, 0.0441741943359375, 0.068023681640625, 0.0918731689453125, 0.11572265625, 0.1395721435546875, 0.163421630859375, 0.1872711181640625, 0.21112060546875, 0.2349700927734375, 0.258819580078125, 0.2826690673828125, 0.3065185546875, 0.3303680419921875, 0.354217529296875, 0.3780670166015625, 0.40191650390625, 0.4257659912109375, 0.449615478515625, 0.4734649658203125, 0.497314453125, 0.5211639404296875, 0.545013427734375, 0.5688629150390625, 0.59271240234375, 0.6165618896484375, 0.640411376953125, 0.6642608642578125, 0.6881103515625, 0.7119598388671875, 0.735809326171875, 0.7596588134765625, 0.78350830078125, 0.8073577880859375, 0.831207275390625, 0.8550567626953125, 0.87890625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 6.0, 4.0, 11.0, 17.0, 19.0, 32.0, 53.0, 69.0, 84.0, 69.0, 91.0, 99.0, 114.0, 91.0, 64.0, 62.0, 35.0, 19.0, 17.0, 11.0, 6.0, 1.0, 5.0, 4.0, 6.0, 7.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.634354829788208, -3.5254557132720947, -3.4165568351745605, -3.3076577186584473, -3.198758602142334, -3.0898594856262207, -2.9809603691101074, -2.8720614910125732, -2.76316237449646, -2.6542632579803467, -2.5453643798828125, -2.436465263366699, -2.327566146850586, -2.2186670303344727, -2.1097679138183594, -2.000869035720825, -1.891969919204712, -1.7830708026885986, -1.674171805381775, -1.5652728080749512, -1.456373691558838, -1.3474745750427246, -1.2385755777359009, -1.1296765804290771, -1.0207774639129639, -0.9118784070014954, -0.8029793500900269, -0.6940802931785583, -0.5851812362670898, -0.47628217935562134, -0.36738312244415283, -0.2584840655326843, -0.14958500862121582, -0.040685951709747314, 0.06821310520172119, 0.1771121621131897, 0.2860112190246582, 0.3949102759361267, 0.5038093328475952, 0.6127083897590637, 0.7216074466705322, 0.8305065035820007, 0.9394055604934692, 1.048304557800293, 1.1572036743164062, 1.2661027908325195, 1.3750017881393433, 1.483900785446167, 1.5927999019622803, 1.7016990184783936, 1.8105980157852173, 1.919497013092041, 2.0283961296081543, 2.1372952461242676, 2.246194362640381, 2.355093240737915, 2.4639923572540283, 2.5728914737701416, 2.681790351867676, 2.790689468383789, 2.8995885848999023, 3.0084877014160156, 3.117386817932129, 3.226285696029663, 3.3351848125457764]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 3.0, 3.0, 2.0, 6.0, 11.0, 9.0, 16.0, 8.0, 14.0, 14.0, 8.0, 21.0, 31.0, 34.0, 26.0, 43.0, 45.0, 45.0, 47.0, 52.0, 42.0, 51.0, 53.0, 42.0, 37.0, 42.0, 45.0, 33.0, 39.0, 29.0, 26.0, 19.0, 17.0, 16.0, 15.0, 12.0, 14.0, 11.0, 9.0, 5.0, 3.0, 0.0, 7.0, 2.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.0938661098480225, -2.0367066860198975, -1.9795475006103516, -1.9223880767822266, -1.8652287721633911, -1.8080694675445557, -1.7509101629257202, -1.6937508583068848, -1.6365914344787598, -1.5794321298599243, -1.5222728252410889, -1.4651134014129639, -1.4079540967941284, -1.350794792175293, -1.2936354875564575, -1.236476182937622, -1.1793168783187866, -1.1221575736999512, -1.0649982690811157, -1.0078389644622803, -0.9506795406341553, -0.8935202360153198, -0.8363609313964844, -0.7792016267776489, -0.7220422625541687, -0.6648829579353333, -0.607723593711853, -0.5505642890930176, -0.49340495467185974, -0.4362456202507019, -0.37908631563186646, -0.3219269812107086, -0.26476752758026123, -0.2076081931591034, -0.15044887363910675, -0.09328955411911011, -0.03613021969795227, 0.021029114723205566, 0.07818841934204102, 0.13534775376319885, 0.1925070881843567, 0.24966642260551453, 0.30682575702667236, 0.3639850616455078, 0.42114439606666565, 0.4783037304878235, 0.5354630351066589, 0.5926223993301392, 0.6497817039489746, 0.7069410085678101, 0.7641003727912903, 0.8212596774101257, 0.878419041633606, 0.9355783462524414, 0.9927376508712769, 1.0498969554901123, 1.1070563793182373, 1.1642156839370728, 1.2213749885559082, 1.2785344123840332, 1.3356937170028687, 1.392853021621704, 1.4500123262405396, 1.507171630859375, 1.5643309354782104]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 6.0, 7.0, 8.0, 9.0, 10.0, 15.0, 22.0, 48.0, 70.0, 105.0, 146.0, 257.0, 413.0, 759.0, 1345.0, 2529.0, 5354.0, 11595.0, 29072.0, 78996.0, 239898.0, 407948.0, 171411.0, 58201.0, 22249.0, 9230.0, 4128.0, 2084.0, 1137.0, 558.0, 332.0, 182.0, 131.0, 87.0, 70.0, 37.0, 28.0, 18.0, 13.0, 13.0, 9.0, 7.0, 7.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.62890625, -0.608184814453125, -0.58746337890625, -0.566741943359375, -0.5460205078125, -0.525299072265625, -0.50457763671875, -0.483856201171875, -0.463134765625, -0.442413330078125, -0.42169189453125, -0.400970458984375, -0.3802490234375, -0.359527587890625, -0.33880615234375, -0.318084716796875, -0.29736328125, -0.276641845703125, -0.25592041015625, -0.235198974609375, -0.2144775390625, -0.193756103515625, -0.17303466796875, -0.152313232421875, -0.131591796875, -0.110870361328125, -0.09014892578125, -0.069427490234375, -0.0487060546875, -0.027984619140625, -0.00726318359375, 0.013458251953125, 0.0341796875, 0.054901123046875, 0.07562255859375, 0.096343994140625, 0.1170654296875, 0.137786865234375, 0.15850830078125, 0.179229736328125, 0.199951171875, 0.220672607421875, 0.24139404296875, 0.262115478515625, 0.2828369140625, 0.303558349609375, 0.32427978515625, 0.345001220703125, 0.36572265625, 0.386444091796875, 0.40716552734375, 0.427886962890625, 0.4486083984375, 0.469329833984375, 0.49005126953125, 0.510772705078125, 0.531494140625, 0.552215576171875, 0.57293701171875, 0.593658447265625, 0.6143798828125, 0.635101318359375, 0.65582275390625, 0.676544189453125, 0.697265625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 6.0, 9.0, 5.0, 9.0, 8.0, 15.0, 13.0, 15.0, 21.0, 25.0, 24.0, 35.0, 43.0, 41.0, 48.0, 51.0, 52.0, 55.0, 54.0, 51.0, 50.0, 47.0, 47.0, 36.0, 28.0, 42.0, 24.0, 31.0, 15.0, 21.0, 8.0, 15.0, 11.0, 9.0, 7.0, 8.0, 4.0, 2.0, 5.0, 3.0, 2.0, 8.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.2412109375, -1.204193115234375, -1.16717529296875, -1.130157470703125, -1.0931396484375, -1.056121826171875, -1.01910400390625, -0.982086181640625, -0.945068359375, -0.908050537109375, -0.87103271484375, -0.834014892578125, -0.7969970703125, -0.759979248046875, -0.72296142578125, -0.685943603515625, -0.64892578125, -0.611907958984375, -0.57489013671875, -0.537872314453125, -0.5008544921875, -0.463836669921875, -0.42681884765625, -0.389801025390625, -0.352783203125, -0.315765380859375, -0.27874755859375, -0.241729736328125, -0.2047119140625, -0.167694091796875, -0.13067626953125, -0.093658447265625, -0.056640625, -0.019622802734375, 0.01739501953125, 0.054412841796875, 0.0914306640625, 0.128448486328125, 0.16546630859375, 0.202484130859375, 0.239501953125, 0.276519775390625, 0.31353759765625, 0.350555419921875, 0.3875732421875, 0.424591064453125, 0.46160888671875, 0.498626708984375, 0.53564453125, 0.572662353515625, 0.60968017578125, 0.646697998046875, 0.6837158203125, 0.720733642578125, 0.75775146484375, 0.794769287109375, 0.831787109375, 0.868804931640625, 0.90582275390625, 0.942840576171875, 0.9798583984375, 1.016876220703125, 1.05389404296875, 1.090911865234375, 1.1279296875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 3.0, 6.0, 9.0, 8.0, 12.0, 18.0, 19.0, 39.0, 82.0, 132.0, 236.0, 411.0, 893.0, 2123.0, 5908.0, 21297.0, 105104.0, 564230.0, 283845.0, 47063.0, 11162.0, 3403.0, 1308.0, 553.0, 275.0, 154.0, 93.0, 58.0, 32.0, 25.0, 17.0, 12.0, 5.0, 3.0, 7.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.79931640625, -0.7733306884765625, -0.747344970703125, -0.7213592529296875, -0.69537353515625, -0.6693878173828125, -0.643402099609375, -0.6174163818359375, -0.5914306640625, -0.5654449462890625, -0.539459228515625, -0.5134735107421875, -0.48748779296875, -0.4615020751953125, -0.435516357421875, -0.4095306396484375, -0.383544921875, -0.3575592041015625, -0.331573486328125, -0.3055877685546875, -0.27960205078125, -0.2536163330078125, -0.227630615234375, -0.2016448974609375, -0.1756591796875, -0.1496734619140625, -0.123687744140625, -0.0977020263671875, -0.07171630859375, -0.0457305908203125, -0.019744873046875, 0.0062408447265625, 0.0322265625, 0.0582122802734375, 0.084197998046875, 0.1101837158203125, 0.13616943359375, 0.1621551513671875, 0.188140869140625, 0.2141265869140625, 0.2401123046875, 0.2660980224609375, 0.292083740234375, 0.3180694580078125, 0.34405517578125, 0.3700408935546875, 0.396026611328125, 0.4220123291015625, 0.447998046875, 0.4739837646484375, 0.499969482421875, 0.5259552001953125, 0.55194091796875, 0.5779266357421875, 0.603912353515625, 0.6298980712890625, 0.6558837890625, 0.6818695068359375, 0.707855224609375, 0.7338409423828125, 0.75982666015625, 0.7858123779296875, 0.811798095703125, 0.8377838134765625, 0.86376953125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 3.0, 1.0, 5.0, 6.0, 7.0, 1.0, 12.0, 13.0, 9.0, 16.0, 14.0, 21.0, 24.0, 19.0, 28.0, 29.0, 28.0, 45.0, 47.0, 42.0, 37.0, 38.0, 32.0, 41.0, 35.0, 37.0, 39.0, 40.0, 40.0, 43.0, 33.0, 31.0, 25.0, 24.0, 25.0, 20.0, 16.0, 9.0, 17.0, 13.0, 10.0, 6.0, 5.0, 4.0, 4.0, 6.0, 6.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.787109375, -1.72772216796875, -1.6683349609375, -1.60894775390625, -1.549560546875, -1.49017333984375, -1.4307861328125, -1.37139892578125, -1.31201171875, -1.25262451171875, -1.1932373046875, -1.13385009765625, -1.074462890625, -1.01507568359375, -0.9556884765625, -0.89630126953125, -0.8369140625, -0.77752685546875, -0.7181396484375, -0.65875244140625, -0.599365234375, -0.53997802734375, -0.4805908203125, -0.42120361328125, -0.36181640625, -0.30242919921875, -0.2430419921875, -0.18365478515625, -0.124267578125, -0.06488037109375, -0.0054931640625, 0.05389404296875, 0.11328125, 0.17266845703125, 0.2320556640625, 0.29144287109375, 0.350830078125, 0.41021728515625, 0.4696044921875, 0.52899169921875, 0.58837890625, 0.64776611328125, 0.7071533203125, 0.76654052734375, 0.825927734375, 0.88531494140625, 0.9447021484375, 1.00408935546875, 1.0634765625, 1.12286376953125, 1.1822509765625, 1.24163818359375, 1.301025390625, 1.36041259765625, 1.4197998046875, 1.47918701171875, 1.53857421875, 1.59796142578125, 1.6573486328125, 1.71673583984375, 1.776123046875, 1.83551025390625, 1.8948974609375, 1.95428466796875, 2.013671875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 5.0, 8.0, 12.0, 19.0, 20.0, 28.0, 28.0, 53.0, 74.0, 103.0, 156.0, 211.0, 355.0, 543.0, 920.0, 1633.0, 3128.0, 6485.0, 16650.0, 59971.0, 341276.0, 489181.0, 89166.0, 22035.0, 8042.0, 3636.0, 1909.0, 1078.0, 649.0, 411.0, 233.0, 151.0, 118.0, 72.0, 51.0, 33.0, 18.0, 24.0, 14.0, 15.0, 10.0, 3.0, 6.0, 4.0, 3.0, 10.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.287109375, -0.27788543701171875, -0.2686614990234375, -0.25943756103515625, -0.250213623046875, -0.24098968505859375, -0.2317657470703125, -0.22254180908203125, -0.21331787109375, -0.20409393310546875, -0.1948699951171875, -0.18564605712890625, -0.176422119140625, -0.16719818115234375, -0.1579742431640625, -0.14875030517578125, -0.1395263671875, -0.13030242919921875, -0.1210784912109375, -0.11185455322265625, -0.102630615234375, -0.09340667724609375, -0.0841827392578125, -0.07495880126953125, -0.06573486328125, -0.05651092529296875, -0.0472869873046875, -0.03806304931640625, -0.028839111328125, -0.01961517333984375, -0.0103912353515625, -0.00116729736328125, 0.008056640625, 0.01728057861328125, 0.0265045166015625, 0.03572845458984375, 0.044952392578125, 0.05417633056640625, 0.0634002685546875, 0.07262420654296875, 0.08184814453125, 0.09107208251953125, 0.1002960205078125, 0.10951995849609375, 0.118743896484375, 0.12796783447265625, 0.1371917724609375, 0.14641571044921875, 0.1556396484375, 0.16486358642578125, 0.1740875244140625, 0.18331146240234375, 0.192535400390625, 0.20175933837890625, 0.2109832763671875, 0.22020721435546875, 0.22943115234375, 0.23865509033203125, 0.2478790283203125, 0.25710296630859375, 0.266326904296875, 0.27555084228515625, 0.2847747802734375, 0.29399871826171875, 0.30322265625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 2.0, 6.0, 3.0, 13.0, 23.0, 33.0, 65.0, 108.0, 141.0, 164.0, 166.0, 108.0, 58.0, 53.0, 17.0, 11.0, 14.0, 6.0, 7.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003566741943359375, -0.0003471672534942627, -0.0003376603126525879, -0.0003281533718109131, -0.0003186464309692383, -0.0003091394901275635, -0.00029963254928588867, -0.00029012560844421387, -0.00028061866760253906, -0.00027111172676086426, -0.00026160478591918945, -0.00025209784507751465, -0.00024259090423583984, -0.00023308396339416504, -0.00022357702255249023, -0.00021407008171081543, -0.00020456314086914062, -0.00019505620002746582, -0.00018554925918579102, -0.0001760423183441162, -0.0001665353775024414, -0.0001570284366607666, -0.0001475214958190918, -0.000138014554977417, -0.0001285076141357422, -0.00011900067329406738, -0.00010949373245239258, -9.998679161071777e-05, -9.047985076904297e-05, -8.097290992736816e-05, -7.146596908569336e-05, -6.195902824401855e-05, -5.245208740234375e-05, -4.2945146560668945e-05, -3.343820571899414e-05, -2.3931264877319336e-05, -1.4424324035644531e-05, -4.9173831939697266e-06, 4.589557647705078e-06, 1.4096498489379883e-05, 2.3603439331054688e-05, 3.311038017272949e-05, 4.26173210144043e-05, 5.21242618560791e-05, 6.16312026977539e-05, 7.113814353942871e-05, 8.064508438110352e-05, 9.015202522277832e-05, 9.965896606445312e-05, 0.00010916590690612793, 0.00011867284774780273, 0.00012817978858947754, 0.00013768672943115234, 0.00014719367027282715, 0.00015670061111450195, 0.00016620755195617676, 0.00017571449279785156, 0.00018522143363952637, 0.00019472837448120117, 0.00020423531532287598, 0.00021374225616455078, 0.00022324919700622559, 0.0002327561378479004, 0.0002422630786895752, 0.00025177001953125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 4.0, 5.0, 5.0, 4.0, 12.0, 16.0, 31.0, 26.0, 67.0, 127.0, 145.0, 256.0, 473.0, 828.0, 1704.0, 3595.0, 9483.0, 35665.0, 238137.0, 614678.0, 110448.0, 20939.0, 6485.0, 2512.0, 1291.0, 655.0, 375.0, 245.0, 132.0, 77.0, 44.0, 31.0, 18.0, 20.0, 8.0, 7.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.425048828125, -0.4126625061035156, -0.40027618408203125, -0.3878898620605469, -0.3755035400390625, -0.3631172180175781, -0.35073089599609375, -0.3383445739746094, -0.325958251953125, -0.3135719299316406, -0.30118560791015625, -0.2887992858886719, -0.2764129638671875, -0.2640266418457031, -0.25164031982421875, -0.23925399780273438, -0.22686767578125, -0.21448135375976562, -0.20209503173828125, -0.18970870971679688, -0.1773223876953125, -0.16493606567382812, -0.15254974365234375, -0.14016342163085938, -0.127777099609375, -0.11539077758789062, -0.10300445556640625, -0.09061813354492188, -0.0782318115234375, -0.06584548950195312, -0.05345916748046875, -0.041072845458984375, -0.0286865234375, -0.016300201416015625, -0.00391387939453125, 0.008472442626953125, 0.0208587646484375, 0.033245086669921875, 0.04563140869140625, 0.058017730712890625, 0.070404052734375, 0.08279037475585938, 0.09517669677734375, 0.10756301879882812, 0.1199493408203125, 0.13233566284179688, 0.14472198486328125, 0.15710830688476562, 0.16949462890625, 0.18188095092773438, 0.19426727294921875, 0.20665359497070312, 0.2190399169921875, 0.23142623901367188, 0.24381256103515625, 0.2561988830566406, 0.268585205078125, 0.2809715270996094, 0.29335784912109375, 0.3057441711425781, 0.3181304931640625, 0.3305168151855469, 0.34290313720703125, 0.3552894592285156, 0.36767578125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 0.0, 5.0, 3.0, 3.0, 4.0, 3.0, 7.0, 2.0, 9.0, 12.0, 23.0, 36.0, 42.0, 51.0, 90.0, 116.0, 118.0, 125.0, 85.0, 88.0, 45.0, 32.0, 37.0, 29.0, 11.0, 12.0, 3.0, 8.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0831298828125, -0.0801401138305664, -0.07715034484863281, -0.07416057586669922, -0.07117080688476562, -0.06818103790283203, -0.06519126892089844, -0.062201499938964844, -0.05921173095703125, -0.056221961975097656, -0.05323219299316406, -0.05024242401123047, -0.047252655029296875, -0.04426288604736328, -0.04127311706542969, -0.038283348083496094, -0.0352935791015625, -0.032303810119628906, -0.029314041137695312, -0.02632427215576172, -0.023334503173828125, -0.02034473419189453, -0.017354965209960938, -0.014365196228027344, -0.01137542724609375, -0.008385658264160156, -0.0053958892822265625, -0.0024061203002929688, 0.000583648681640625, 0.0035734176635742188, 0.0065631866455078125, 0.009552955627441406, 0.012542724609375, 0.015532493591308594, 0.018522262573242188, 0.02151203155517578, 0.024501800537109375, 0.02749156951904297, 0.030481338500976562, 0.033471107482910156, 0.03646087646484375, 0.039450645446777344, 0.04244041442871094, 0.04543018341064453, 0.048419952392578125, 0.05140972137451172, 0.05439949035644531, 0.057389259338378906, 0.0603790283203125, 0.0633687973022461, 0.06635856628417969, 0.06934833526611328, 0.07233810424804688, 0.07532787322998047, 0.07831764221191406, 0.08130741119384766, 0.08429718017578125, 0.08728694915771484, 0.09027671813964844, 0.09326648712158203, 0.09625625610351562, 0.09924602508544922, 0.10223579406738281, 0.1052255630493164, 0.10821533203125]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 3.0, 4.0, 11.0, 7.0, 26.0, 30.0, 49.0, 71.0, 80.0, 111.0, 103.0, 138.0, 114.0, 78.0, 54.0, 38.0, 26.0, 16.0, 10.0, 7.0, 7.0, 5.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2829670906066895, -2.2065343856811523, -2.130101442337036, -2.05366849899292, -1.9772357940673828, -1.9008029699325562, -1.8243701457977295, -1.7479373216629028, -1.6715044975280762, -1.5950716733932495, -1.5186388492584229, -1.4422060251235962, -1.3657732009887695, -1.2893403768539429, -1.2129075527191162, -1.1364747285842896, -1.060041904449463, -0.9836090803146362, -0.9071762561798096, -0.8307434320449829, -0.7543106079101562, -0.6778777837753296, -0.6014449596405029, -0.5250121355056763, -0.4485793113708496, -0.37214648723602295, -0.2957136631011963, -0.21928083896636963, -0.14284801483154297, -0.06641519069671631, 0.010017633438110352, 0.08645045757293701, 0.16288328170776367, 0.23931610584259033, 0.315748929977417, 0.39218175411224365, 0.4686145782470703, 0.545047402381897, 0.6214802265167236, 0.6979130506515503, 0.774345874786377, 0.8507786989212036, 0.9272115230560303, 1.003644347190857, 1.0800771713256836, 1.1565099954605103, 1.232942819595337, 1.3093756437301636, 1.3858084678649902, 1.462241291999817, 1.5386741161346436, 1.6151069402694702, 1.6915397644042969, 1.7679725885391235, 1.8444054126739502, 1.9208382368087769, 1.9972710609436035, 2.0737037658691406, 2.150136709213257, 2.226569652557373, 2.30300235748291, 2.3794350624084473, 2.4558680057525635, 2.5323009490966797, 2.608733654022217]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 5.0, 5.0, 10.0, 13.0, 9.0, 13.0, 12.0, 14.0, 16.0, 24.0, 27.0, 42.0, 35.0, 55.0, 53.0, 51.0, 58.0, 59.0, 54.0, 47.0, 56.0, 44.0, 48.0, 39.0, 32.0, 35.0, 28.0, 22.0, 17.0, 21.0, 13.0, 11.0, 13.0, 5.0, 3.0, 4.0, 2.0, 5.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.4039427042007446, -1.365138292312622, -1.32633376121521, -1.2875292301177979, -1.2487248182296753, -1.2099204063415527, -1.1711158752441406, -1.1323113441467285, -1.093506932258606, -1.0547025203704834, -1.0158979892730713, -0.977093517780304, -0.9382890462875366, -0.8994845747947693, -0.860680103302002, -0.8218756318092346, -0.7830711603164673, -0.7442666888237, -0.7054622173309326, -0.6666577458381653, -0.627853274345398, -0.5890488028526306, -0.5502443313598633, -0.511439859867096, -0.4726353883743286, -0.4338309168815613, -0.39502644538879395, -0.3562219738960266, -0.3174175024032593, -0.27861303091049194, -0.2398085594177246, -0.20100408792495728, -0.1621994972229004, -0.12339502573013306, -0.08459055423736572, -0.04578608274459839, -0.006981611251831055, 0.03182286024093628, 0.07062733173370361, 0.10943180322647095, 0.14823627471923828, 0.18704074621200562, 0.22584521770477295, 0.2646496891975403, 0.3034541606903076, 0.34225863218307495, 0.3810631036758423, 0.4198675751686096, 0.45867204666137695, 0.4974765181541443, 0.5362809896469116, 0.575085461139679, 0.6138899326324463, 0.6526944041252136, 0.691498875617981, 0.7303033471107483, 0.7691078186035156, 0.807912290096283, 0.8467167615890503, 0.8855212330818176, 0.924325704574585, 0.9631301760673523, 1.0019346475601196, 1.0407390594482422, 1.0795435905456543]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 6.0, 8.0, 9.0, 15.0, 18.0, 23.0, 34.0, 54.0, 75.0, 128.0, 176.0, 270.0, 412.0, 626.0, 1001.0, 1667.0, 2914.0, 5332.0, 10825.0, 22905.0, 57349.0, 190466.0, 501934.0, 159417.0, 50488.0, 20651.0, 9645.0, 5056.0, 2803.0, 1566.0, 940.0, 602.0, 371.0, 238.0, 175.0, 101.0, 75.0, 52.0, 35.0, 33.0, 12.0, 10.0, 5.0, 13.0, 8.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.2783203125, -1.234893798828125, -1.19146728515625, -1.148040771484375, -1.1046142578125, -1.061187744140625, -1.01776123046875, -0.974334716796875, -0.930908203125, -0.887481689453125, -0.84405517578125, -0.800628662109375, -0.7572021484375, -0.713775634765625, -0.67034912109375, -0.626922607421875, -0.58349609375, -0.540069580078125, -0.49664306640625, -0.453216552734375, -0.4097900390625, -0.366363525390625, -0.32293701171875, -0.279510498046875, -0.236083984375, -0.192657470703125, -0.14923095703125, -0.105804443359375, -0.0623779296875, -0.018951416015625, 0.02447509765625, 0.067901611328125, 0.111328125, 0.154754638671875, 0.19818115234375, 0.241607666015625, 0.2850341796875, 0.328460693359375, 0.37188720703125, 0.415313720703125, 0.458740234375, 0.502166748046875, 0.54559326171875, 0.589019775390625, 0.6324462890625, 0.675872802734375, 0.71929931640625, 0.762725830078125, 0.80615234375, 0.849578857421875, 0.89300537109375, 0.936431884765625, 0.9798583984375, 1.023284912109375, 1.06671142578125, 1.110137939453125, 1.153564453125, 1.196990966796875, 1.24041748046875, 1.283843994140625, 1.3272705078125, 1.370697021484375, 1.41412353515625, 1.457550048828125, 1.5009765625]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 5.0, 5.0, 4.0, 5.0, 7.0, 7.0, 8.0, 11.0, 23.0, 16.0, 22.0, 21.0, 26.0, 37.0, 39.0, 47.0, 50.0, 54.0, 70.0, 58.0, 54.0, 66.0, 42.0, 41.0, 33.0, 37.0, 34.0, 32.0, 33.0, 28.0, 25.0, 13.0, 13.0, 13.0, 6.0, 4.0, 5.0, 3.0, 2.0, 2.0, 0.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.201171875, -3.1141357421875, -3.027099609375, -2.9400634765625, -2.85302734375, -2.7659912109375, -2.678955078125, -2.5919189453125, -2.5048828125, -2.4178466796875, -2.330810546875, -2.2437744140625, -2.15673828125, -2.0697021484375, -1.982666015625, -1.8956298828125, -1.80859375, -1.7215576171875, -1.634521484375, -1.5474853515625, -1.46044921875, -1.3734130859375, -1.286376953125, -1.1993408203125, -1.1123046875, -1.0252685546875, -0.938232421875, -0.8511962890625, -0.76416015625, -0.6771240234375, -0.590087890625, -0.5030517578125, -0.416015625, -0.3289794921875, -0.241943359375, -0.1549072265625, -0.06787109375, 0.0191650390625, 0.106201171875, 0.1932373046875, 0.2802734375, 0.3673095703125, 0.454345703125, 0.5413818359375, 0.62841796875, 0.7154541015625, 0.802490234375, 0.8895263671875, 0.9765625, 1.0635986328125, 1.150634765625, 1.2376708984375, 1.32470703125, 1.4117431640625, 1.498779296875, 1.5858154296875, 1.6728515625, 1.7598876953125, 1.846923828125, 1.9339599609375, 2.02099609375, 2.1080322265625, 2.195068359375, 2.2821044921875, 2.369140625]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 4.0, 9.0, 2.0, 6.0, 8.0, 7.0, 5.0, 15.0, 14.0, 18.0, 14.0, 16.0, 27.0, 23.0, 32.0, 31.0, 41.0, 43.0, 56.0, 86.0, 332.0, 4166.0, 696155.0, 343676.0, 3087.0, 259.0, 81.0, 53.0, 37.0, 27.0, 30.0, 36.0, 21.0, 28.0, 24.0, 16.0, 13.0, 8.0, 13.0, 9.0, 5.0, 10.0, 8.0, 3.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.23046875, -6.98907470703125, -6.7476806640625, -6.50628662109375, -6.264892578125, -6.02349853515625, -5.7821044921875, -5.54071044921875, -5.29931640625, -5.05792236328125, -4.8165283203125, -4.57513427734375, -4.333740234375, -4.09234619140625, -3.8509521484375, -3.60955810546875, -3.3681640625, -3.12677001953125, -2.8853759765625, -2.64398193359375, -2.402587890625, -2.16119384765625, -1.9197998046875, -1.67840576171875, -1.43701171875, -1.19561767578125, -0.9542236328125, -0.71282958984375, -0.471435546875, -0.23004150390625, 0.0113525390625, 0.25274658203125, 0.494140625, 0.73553466796875, 0.9769287109375, 1.21832275390625, 1.459716796875, 1.70111083984375, 1.9425048828125, 2.18389892578125, 2.42529296875, 2.66668701171875, 2.9080810546875, 3.14947509765625, 3.390869140625, 3.63226318359375, 3.8736572265625, 4.11505126953125, 4.3564453125, 4.59783935546875, 4.8392333984375, 5.08062744140625, 5.322021484375, 5.56341552734375, 5.8048095703125, 6.04620361328125, 6.28759765625, 6.52899169921875, 6.7703857421875, 7.01177978515625, 7.253173828125, 7.49456787109375, 7.7359619140625, 7.97735595703125, 8.21875]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 3.0, 2.0, 8.0, 4.0, 5.0, 9.0, 8.0, 10.0, 20.0, 16.0, 17.0, 15.0, 23.0, 25.0, 34.0, 41.0, 26.0, 40.0, 36.0, 44.0, 42.0, 45.0, 45.0, 40.0, 43.0, 38.0, 39.0, 39.0, 28.0, 33.0, 34.0, 32.0, 29.0, 18.0, 19.0, 23.0, 13.0, 11.0, 9.0, 9.0, 14.0, 5.0, 5.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.353515625, -2.277099609375, -2.20068359375, -2.124267578125, -2.0478515625, -1.971435546875, -1.89501953125, -1.818603515625, -1.7421875, -1.665771484375, -1.58935546875, -1.512939453125, -1.4365234375, -1.360107421875, -1.28369140625, -1.207275390625, -1.130859375, -1.054443359375, -0.97802734375, -0.901611328125, -0.8251953125, -0.748779296875, -0.67236328125, -0.595947265625, -0.51953125, -0.443115234375, -0.36669921875, -0.290283203125, -0.2138671875, -0.137451171875, -0.06103515625, 0.015380859375, 0.091796875, 0.168212890625, 0.24462890625, 0.321044921875, 0.3974609375, 0.473876953125, 0.55029296875, 0.626708984375, 0.703125, 0.779541015625, 0.85595703125, 0.932373046875, 1.0087890625, 1.085205078125, 1.16162109375, 1.238037109375, 1.314453125, 1.390869140625, 1.46728515625, 1.543701171875, 1.6201171875, 1.696533203125, 1.77294921875, 1.849365234375, 1.92578125, 2.002197265625, 2.07861328125, 2.155029296875, 2.2314453125, 2.307861328125, 2.38427734375, 2.460693359375, 2.537109375]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 7.0, 3.0, 9.0, 9.0, 12.0, 16.0, 17.0, 32.0, 43.0, 63.0, 135.0, 210.0, 467.0, 1084.0, 3598.0, 14290.0, 90957.0, 751136.0, 158280.0, 20537.0, 4836.0, 1544.0, 581.0, 272.0, 154.0, 87.0, 39.0, 41.0, 24.0, 20.0, 10.0, 11.0, 12.0, 4.0, 6.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.79248046875, -0.7689056396484375, -0.745330810546875, -0.7217559814453125, -0.69818115234375, -0.6746063232421875, -0.651031494140625, -0.6274566650390625, -0.6038818359375, -0.5803070068359375, -0.556732177734375, -0.5331573486328125, -0.50958251953125, -0.4860076904296875, -0.462432861328125, -0.4388580322265625, -0.415283203125, -0.3917083740234375, -0.368133544921875, -0.3445587158203125, -0.32098388671875, -0.2974090576171875, -0.273834228515625, -0.2502593994140625, -0.2266845703125, -0.2031097412109375, -0.179534912109375, -0.1559600830078125, -0.13238525390625, -0.1088104248046875, -0.085235595703125, -0.0616607666015625, -0.0380859375, -0.0145111083984375, 0.009063720703125, 0.0326385498046875, 0.05621337890625, 0.0797882080078125, 0.103363037109375, 0.1269378662109375, 0.1505126953125, 0.1740875244140625, 0.197662353515625, 0.2212371826171875, 0.24481201171875, 0.2683868408203125, 0.291961669921875, 0.3155364990234375, 0.339111328125, 0.3626861572265625, 0.386260986328125, 0.4098358154296875, 0.43341064453125, 0.4569854736328125, 0.480560302734375, 0.5041351318359375, 0.5277099609375, 0.5512847900390625, 0.574859619140625, 0.5984344482421875, 0.62200927734375, 0.6455841064453125, 0.669158935546875, 0.6927337646484375, 0.71630859375]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 4.0, 4.0, 2.0, 3.0, 4.0, 6.0, 4.0, 6.0, 10.0, 8.0, 15.0, 22.0, 20.0, 30.0, 34.0, 49.0, 79.0, 83.0, 115.0, 137.0, 111.0, 64.0, 48.0, 28.0, 37.0, 21.0, 11.0, 13.0, 8.0, 12.0, 4.0, 3.0, 5.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.20159912109375e-05, -7.952749729156494e-05, -7.703900337219238e-05, -7.455050945281982e-05, -7.206201553344727e-05, -6.957352161407471e-05, -6.708502769470215e-05, -6.459653377532959e-05, -6.210803985595703e-05, -5.961954593658447e-05, -5.7131052017211914e-05, -5.4642558097839355e-05, -5.21540641784668e-05, -4.966557025909424e-05, -4.717707633972168e-05, -4.468858242034912e-05, -4.220008850097656e-05, -3.9711594581604004e-05, -3.7223100662231445e-05, -3.473460674285889e-05, -3.224611282348633e-05, -2.975761890411377e-05, -2.726912498474121e-05, -2.4780631065368652e-05, -2.2292137145996094e-05, -1.9803643226623535e-05, -1.7315149307250977e-05, -1.4826655387878418e-05, -1.233816146850586e-05, -9.8496675491333e-06, -7.361173629760742e-06, -4.872679710388184e-06, -2.384185791015625e-06, 1.043081283569336e-07, 2.592802047729492e-06, 5.081295967102051e-06, 7.569789886474609e-06, 1.0058283805847168e-05, 1.2546777725219727e-05, 1.5035271644592285e-05, 1.7523765563964844e-05, 2.0012259483337402e-05, 2.250075340270996e-05, 2.498924732208252e-05, 2.7477741241455078e-05, 2.9966235160827637e-05, 3.2454729080200195e-05, 3.4943222999572754e-05, 3.743171691894531e-05, 3.992021083831787e-05, 4.240870475769043e-05, 4.489719867706299e-05, 4.738569259643555e-05, 4.9874186515808105e-05, 5.2362680435180664e-05, 5.485117435455322e-05, 5.733966827392578e-05, 5.982816219329834e-05, 6.23166561126709e-05, 6.480515003204346e-05, 6.729364395141602e-05, 6.978213787078857e-05, 7.227063179016113e-05, 7.475912570953369e-05, 7.724761962890625e-05]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 4.0, 8.0, 12.0, 20.0, 31.0, 42.0, 81.0, 142.0, 233.0, 458.0, 922.0, 2112.0, 5695.0, 19321.0, 100238.0, 686144.0, 190675.0, 29466.0, 7784.0, 2735.0, 1148.0, 560.0, 299.0, 153.0, 113.0, 50.0, 36.0, 24.0, 17.0, 12.0, 6.0, 7.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5908203125, -0.570892333984375, -0.55096435546875, -0.531036376953125, -0.5111083984375, -0.491180419921875, -0.47125244140625, -0.451324462890625, -0.431396484375, -0.411468505859375, -0.39154052734375, -0.371612548828125, -0.3516845703125, -0.331756591796875, -0.31182861328125, -0.291900634765625, -0.27197265625, -0.252044677734375, -0.23211669921875, -0.212188720703125, -0.1922607421875, -0.172332763671875, -0.15240478515625, -0.132476806640625, -0.112548828125, -0.092620849609375, -0.07269287109375, -0.052764892578125, -0.0328369140625, -0.012908935546875, 0.00701904296875, 0.026947021484375, 0.046875, 0.066802978515625, 0.08673095703125, 0.106658935546875, 0.1265869140625, 0.146514892578125, 0.16644287109375, 0.186370849609375, 0.206298828125, 0.226226806640625, 0.24615478515625, 0.266082763671875, 0.2860107421875, 0.305938720703125, 0.32586669921875, 0.345794677734375, 0.36572265625, 0.385650634765625, 0.40557861328125, 0.425506591796875, 0.4454345703125, 0.465362548828125, 0.48529052734375, 0.505218505859375, 0.525146484375, 0.545074462890625, 0.56500244140625, 0.584930419921875, 0.6048583984375, 0.624786376953125, 0.64471435546875, 0.664642333984375, 0.6845703125]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 3.0, 3.0, 9.0, 7.0, 12.0, 20.0, 18.0, 36.0, 51.0, 44.0, 70.0, 123.0, 129.0, 145.0, 98.0, 80.0, 37.0, 24.0, 23.0, 15.0, 15.0, 14.0, 7.0, 10.0, 1.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.350830078125, -0.3415546417236328, -0.3322792053222656, -0.32300376892089844, -0.31372833251953125, -0.30445289611816406, -0.2951774597167969, -0.2859020233154297, -0.2766265869140625, -0.2673511505126953, -0.2580757141113281, -0.24880027770996094, -0.23952484130859375, -0.23024940490722656, -0.22097396850585938, -0.2116985321044922, -0.202423095703125, -0.1931476593017578, -0.18387222290039062, -0.17459678649902344, -0.16532135009765625, -0.15604591369628906, -0.14677047729492188, -0.1374950408935547, -0.1282196044921875, -0.11894416809082031, -0.10966873168945312, -0.10039329528808594, -0.09111785888671875, -0.08184242248535156, -0.07256698608398438, -0.06329154968261719, -0.05401611328125, -0.04474067687988281, -0.035465240478515625, -0.026189804077148438, -0.01691436767578125, -0.0076389312744140625, 0.001636505126953125, 0.010911941528320312, 0.0201873779296875, 0.029462814331054688, 0.038738250732421875, 0.04801368713378906, 0.05728912353515625, 0.06656455993652344, 0.07583999633789062, 0.08511543273925781, 0.094390869140625, 0.10366630554199219, 0.11294174194335938, 0.12221717834472656, 0.13149261474609375, 0.14076805114746094, 0.15004348754882812, 0.1593189239501953, 0.1685943603515625, 0.1778697967529297, 0.18714523315429688, 0.19642066955566406, 0.20569610595703125, 0.21497154235839844, 0.22424697875976562, 0.2335224151611328, 0.2427978515625]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 4.0, 6.0, 7.0, 22.0, 32.0, 63.0, 71.0, 120.0, 142.0, 171.0, 129.0, 108.0, 51.0, 23.0, 24.0, 13.0, 9.0, 8.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3423027992248535, -4.138338088989258, -3.934372901916504, -3.730408191680908, -3.5264432430267334, -3.3224782943725586, -3.118513584136963, -2.914548635482788, -2.7105836868286133, -2.5066187381744385, -2.3026537895202637, -2.098689079284668, -1.8947241306304932, -1.6907591819763184, -1.486794352531433, -1.2828295230865479, -1.078864574432373, -0.874899685382843, -0.670934796333313, -0.46696990728378296, -0.26300501823425293, -0.059040069580078125, 0.14492475986480713, 0.3488895893096924, 0.5528545379638672, 0.7568194270133972, 0.9607843160629272, 1.1647491455078125, 1.3687140941619873, 1.572679042816162, 1.7766438722610474, 1.9806087017059326, 2.1845741271972656, 2.3885390758514404, 2.5925040245056152, 2.796468734741211, 3.0004336833953857, 3.2043986320495605, 3.4083633422851562, 3.612328290939331, 3.816293239593506, 4.020257949829102, 4.2242231369018555, 4.428187847137451, 4.632152557373047, 4.836117744445801, 5.0400824546813965, 5.244047164916992, 5.448012351989746, 5.651977062225342, 5.855942249298096, 6.059906959533691, 6.263872146606445, 6.467836856842041, 6.671801567077637, 6.875766754150391, 7.079731464385986, 7.283696174621582, 7.487661361694336, 7.691626071929932, 7.895590782165527, 8.099555969238281, 8.303521156311035, 8.507485389709473, 8.711450576782227]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 2.0, 3.0, 2.0, 10.0, 5.0, 15.0, 12.0, 9.0, 14.0, 12.0, 15.0, 14.0, 31.0, 24.0, 14.0, 39.0, 25.0, 47.0, 42.0, 42.0, 36.0, 35.0, 52.0, 47.0, 44.0, 52.0, 45.0, 35.0, 29.0, 39.0, 26.0, 28.0, 29.0, 22.0, 22.0, 15.0, 20.0, 17.0, 5.0, 8.0, 4.0, 3.0, 2.0, 6.0, 6.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-4.134178638458252, -4.001101970672607, -3.868025541305542, -3.7349491119384766, -3.601872444152832, -3.4687960147857666, -3.335719585418701, -3.2026429176330566, -3.069566249847412, -2.9364898204803467, -2.803413152694702, -2.6703367233276367, -2.537260055541992, -2.4041836261749268, -2.2711071968078613, -2.138030529022217, -2.0049540996551514, -1.8718775510787964, -1.7388010025024414, -1.605724573135376, -1.4726479053497314, -1.339571475982666, -1.206494927406311, -1.073418378829956, -0.9403418302536011, -0.8072652816772461, -0.6741887331008911, -0.5411122441291809, -0.4080356955528259, -0.27495914697647095, -0.14188265800476074, -0.008806109428405762, 0.12427043914794922, 0.2573469877243042, 0.3904235064983368, 0.5235000252723694, 0.6565765738487244, 0.7896531224250793, 0.9227296113967896, 1.0558061599731445, 1.1888827085494995, 1.3219592571258545, 1.4550358057022095, 1.5881123542785645, 1.7211887836456299, 1.8542654514312744, 1.9873418807983398, 2.1204185485839844, 2.25349497795105, 2.3865714073181152, 2.5196480751037598, 2.652724504470825, 2.7858011722564697, 2.918877601623535, 3.0519542694091797, 3.185030698776245, 3.3181071281433105, 3.451183557510376, 3.5842602252960205, 3.717336654663086, 3.8504133224487305, 3.983489751815796, 4.116566181182861, 4.249642848968506, 4.38271951675415]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 5.0, 9.0, 10.0, 18.0, 10.0, 30.0, 43.0, 60.0, 85.0, 150.0, 245.0, 459.0, 803.0, 1553.0, 3337.0, 8341.0, 25663.0, 152915.0, 2730072.0, 1161789.0, 78096.0, 18463.0, 6396.0, 2785.0, 1276.0, 656.0, 390.0, 246.0, 138.0, 78.0, 49.0, 39.0, 31.0, 12.0, 10.0, 6.0, 3.0, 6.0, 3.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.583984375, -3.4840087890625, -3.384033203125, -3.2840576171875, -3.18408203125, -3.0841064453125, -2.984130859375, -2.8841552734375, -2.7841796875, -2.6842041015625, -2.584228515625, -2.4842529296875, -2.38427734375, -2.2843017578125, -2.184326171875, -2.0843505859375, -1.984375, -1.8843994140625, -1.784423828125, -1.6844482421875, -1.58447265625, -1.4844970703125, -1.384521484375, -1.2845458984375, -1.1845703125, -1.0845947265625, -0.984619140625, -0.8846435546875, -0.78466796875, -0.6846923828125, -0.584716796875, -0.4847412109375, -0.384765625, -0.2847900390625, -0.184814453125, -0.0848388671875, 0.01513671875, 0.1151123046875, 0.215087890625, 0.3150634765625, 0.4150390625, 0.5150146484375, 0.614990234375, 0.7149658203125, 0.81494140625, 0.9149169921875, 1.014892578125, 1.1148681640625, 1.21484375, 1.3148193359375, 1.414794921875, 1.5147705078125, 1.61474609375, 1.7147216796875, 1.814697265625, 1.9146728515625, 2.0146484375, 2.1146240234375, 2.214599609375, 2.3145751953125, 2.41455078125, 2.5145263671875, 2.614501953125, 2.7144775390625, 2.814453125]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 3.0, 2.0, 4.0, 13.0, 10.0, 7.0, 24.0, 14.0, 18.0, 26.0, 35.0, 31.0, 45.0, 55.0, 62.0, 52.0, 69.0, 67.0, 54.0, 54.0, 51.0, 59.0, 37.0, 43.0, 34.0, 32.0, 22.0, 21.0, 13.0, 8.0, 9.0, 14.0, 6.0, 4.0, 6.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0], "bins": [-2.142578125, -2.0882415771484375, -2.033905029296875, -1.9795684814453125, -1.92523193359375, -1.8708953857421875, -1.816558837890625, -1.7622222900390625, -1.7078857421875, -1.6535491943359375, -1.599212646484375, -1.5448760986328125, -1.49053955078125, -1.4362030029296875, -1.381866455078125, -1.3275299072265625, -1.273193359375, -1.2188568115234375, -1.164520263671875, -1.1101837158203125, -1.05584716796875, -1.0015106201171875, -0.947174072265625, -0.8928375244140625, -0.8385009765625, -0.7841644287109375, -0.729827880859375, -0.6754913330078125, -0.62115478515625, -0.5668182373046875, -0.512481689453125, -0.4581451416015625, -0.40380859375, -0.3494720458984375, -0.295135498046875, -0.2407989501953125, -0.18646240234375, -0.1321258544921875, -0.077789306640625, -0.0234527587890625, 0.0308837890625, 0.0852203369140625, 0.139556884765625, 0.1938934326171875, 0.24822998046875, 0.3025665283203125, 0.356903076171875, 0.4112396240234375, 0.465576171875, 0.5199127197265625, 0.574249267578125, 0.6285858154296875, 0.68292236328125, 0.7372589111328125, 0.791595458984375, 0.8459320068359375, 0.9002685546875, 0.9546051025390625, 1.008941650390625, 1.0632781982421875, 1.11761474609375, 1.1719512939453125, 1.226287841796875, 1.2806243896484375, 1.3349609375]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 3.0, 10.0, 4.0, 15.0, 16.0, 22.0, 28.0, 35.0, 45.0, 74.0, 116.0, 255.0, 660.0, 2767.0, 27849.0, 3241052.0, 901885.0, 16312.0, 2049.0, 515.0, 218.0, 113.0, 81.0, 40.0, 31.0, 20.0, 11.0, 15.0, 11.0, 7.0, 7.0, 3.0, 8.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.08984375, -4.91375732421875, -4.7376708984375, -4.56158447265625, -4.385498046875, -4.20941162109375, -4.0333251953125, -3.85723876953125, -3.68115234375, -3.50506591796875, -3.3289794921875, -3.15289306640625, -2.976806640625, -2.80072021484375, -2.6246337890625, -2.44854736328125, -2.2724609375, -2.09637451171875, -1.9202880859375, -1.74420166015625, -1.568115234375, -1.39202880859375, -1.2159423828125, -1.03985595703125, -0.86376953125, -0.68768310546875, -0.5115966796875, -0.33551025390625, -0.159423828125, 0.01666259765625, 0.1927490234375, 0.36883544921875, 0.544921875, 0.72100830078125, 0.8970947265625, 1.07318115234375, 1.249267578125, 1.42535400390625, 1.6014404296875, 1.77752685546875, 1.95361328125, 2.12969970703125, 2.3057861328125, 2.48187255859375, 2.657958984375, 2.83404541015625, 3.0101318359375, 3.18621826171875, 3.3623046875, 3.53839111328125, 3.7144775390625, 3.89056396484375, 4.066650390625, 4.24273681640625, 4.4188232421875, 4.59490966796875, 4.77099609375, 4.94708251953125, 5.1231689453125, 5.29925537109375, 5.475341796875, 5.65142822265625, 5.8275146484375, 6.00360107421875, 6.1796875]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 6.0, 3.0, 9.0, 13.0, 7.0, 26.0, 22.0, 29.0, 39.0, 61.0, 76.0, 104.0, 165.0, 247.0, 404.0, 669.0, 709.0, 548.0, 311.0, 166.0, 131.0, 73.0, 66.0, 66.0, 33.0, 29.0, 17.0, 16.0, 5.0, 4.0, 10.0, 4.0, 4.0, 3.0, 6.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.8310546875, -0.8103713989257812, -0.7896881103515625, -0.7690048217773438, -0.748321533203125, -0.7276382446289062, -0.7069549560546875, -0.6862716674804688, -0.66558837890625, -0.6449050903320312, -0.6242218017578125, -0.6035385131835938, -0.582855224609375, -0.5621719360351562, -0.5414886474609375, -0.5208053588867188, -0.5001220703125, -0.47943878173828125, -0.4587554931640625, -0.43807220458984375, -0.417388916015625, -0.39670562744140625, -0.3760223388671875, -0.35533905029296875, -0.33465576171875, -0.31397247314453125, -0.2932891845703125, -0.27260589599609375, -0.251922607421875, -0.23123931884765625, -0.2105560302734375, -0.18987274169921875, -0.169189453125, -0.14850616455078125, -0.1278228759765625, -0.10713958740234375, -0.086456298828125, -0.06577301025390625, -0.0450897216796875, -0.02440643310546875, -0.00372314453125, 0.01696014404296875, 0.0376434326171875, 0.05832672119140625, 0.079010009765625, 0.09969329833984375, 0.1203765869140625, 0.14105987548828125, 0.1617431640625, 0.18242645263671875, 0.2031097412109375, 0.22379302978515625, 0.244476318359375, 0.26515960693359375, 0.2858428955078125, 0.30652618408203125, 0.32720947265625, 0.34789276123046875, 0.3685760498046875, 0.38925933837890625, 0.409942626953125, 0.43062591552734375, 0.4513092041015625, 0.47199249267578125, 0.49267578125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 9.0, 9.0, 13.0, 7.0, 13.0, 28.0, 22.0, 51.0, 51.0, 71.0, 107.0, 102.0, 116.0, 94.0, 76.0, 60.0, 49.0, 35.0, 20.0, 15.0, 19.0, 11.0, 5.0, 6.0, 3.0, 4.0, 4.0, 5.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.5289342403411865, -2.4392733573913574, -2.3496124744415283, -2.259951591491699, -2.170290470123291, -2.080629587173462, -1.9909687042236328, -1.9013078212738037, -1.8116469383239746, -1.7219860553741455, -1.6323251724243164, -1.5426641702651978, -1.4530032873153687, -1.3633424043655396, -1.273681402206421, -1.1840205192565918, -1.0943596363067627, -1.0046987533569336, -0.9150378108024597, -0.8253768682479858, -0.7357159852981567, -0.6460551023483276, -0.5563941597938538, -0.4667332172393799, -0.3770723342895508, -0.2874114215373993, -0.1977505087852478, -0.10808959603309631, -0.018428683280944824, 0.07123222947120667, 0.16089314222335815, 0.25055408477783203, 0.34021472930908203, 0.4298756420612335, 0.519536554813385, 0.6091974973678589, 0.698858380317688, 0.7885192632675171, 0.878180205821991, 0.9678411483764648, 1.057502031326294, 1.147162914276123, 1.2368237972259521, 1.3264847993850708, 1.4161456823349, 1.505806565284729, 1.5954675674438477, 1.6851284503936768, 1.7747893333435059, 1.864450216293335, 1.954111099243164, 2.043771982192993, 2.1334328651428223, 2.2230939865112305, 2.3127548694610596, 2.4024157524108887, 2.4920766353607178, 2.581737518310547, 2.671398401260376, 2.761059284210205, 2.8507204055786133, 2.9403812885284424, 3.0300421714782715, 3.1197030544281006, 3.2093639373779297]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 12.0, 5.0, 5.0, 12.0, 8.0, 15.0, 19.0, 22.0, 25.0, 26.0, 42.0, 29.0, 33.0, 50.0, 61.0, 50.0, 52.0, 64.0, 51.0, 51.0, 54.0, 49.0, 48.0, 33.0, 41.0, 30.0, 31.0, 17.0, 14.0, 19.0, 11.0, 1.0, 8.0, 9.0, 3.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.9839613437652588, -1.9269685745239258, -1.8699758052825928, -1.8129830360412598, -1.7559902667999268, -1.6989974975585938, -1.6420047283172607, -1.5850119590759277, -1.5280191898345947, -1.4710264205932617, -1.4140336513519287, -1.3570408821105957, -1.3000481128692627, -1.2430553436279297, -1.1860625743865967, -1.1290698051452637, -1.0720769166946411, -1.015084147453308, -0.9580913782119751, -0.9010986089706421, -0.8441058397293091, -0.7871130704879761, -0.7301202416419983, -0.6731274724006653, -0.6161347031593323, -0.5591419339179993, -0.5021491646766663, -0.44515636563301086, -0.38816359639167786, -0.33117082715034485, -0.27417802810668945, -0.21718525886535645, -0.160192608833313, -0.10319983214139938, -0.04620705544948578, 0.010785728693008423, 0.06777849793434143, 0.12477126717567444, 0.18176406621932983, 0.23875683546066284, 0.29574960470199585, 0.35274237394332886, 0.40973514318466187, 0.46672794222831726, 0.5237207412719727, 0.5807135105133057, 0.6377062797546387, 0.6946990489959717, 0.7516918182373047, 0.8086845874786377, 0.8656773567199707, 0.9226701259613037, 0.9796628952026367, 1.0366556644439697, 1.0936484336853027, 1.1506412029266357, 1.2076339721679688, 1.2646267414093018, 1.3216195106506348, 1.3786122798919678, 1.4356050491333008, 1.4925978183746338, 1.5495905876159668, 1.6065833568572998, 1.6635762453079224]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 8.0, 4.0, 6.0, 7.0, 13.0, 20.0, 33.0, 39.0, 67.0, 124.0, 173.0, 330.0, 572.0, 1047.0, 2069.0, 4465.0, 10073.0, 23183.0, 57630.0, 157045.0, 392653.0, 249505.0, 88518.0, 34543.0, 14094.0, 6219.0, 2917.0, 1441.0, 680.0, 397.0, 272.0, 146.0, 77.0, 64.0, 42.0, 32.0, 18.0, 10.0, 8.0, 6.0, 5.0, 3.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.418212890625, -0.4041404724121094, -0.39006805419921875, -0.3759956359863281, -0.3619232177734375, -0.3478507995605469, -0.33377838134765625, -0.3197059631347656, -0.305633544921875, -0.2915611267089844, -0.27748870849609375, -0.2634162902832031, -0.2493438720703125, -0.23527145385742188, -0.22119903564453125, -0.20712661743164062, -0.19305419921875, -0.17898178100585938, -0.16490936279296875, -0.15083694458007812, -0.1367645263671875, -0.12269210815429688, -0.10861968994140625, -0.09454727172851562, -0.080474853515625, -0.06640243530273438, -0.05233001708984375, -0.038257598876953125, -0.0241851806640625, -0.010112762451171875, 0.00395965576171875, 0.018032073974609375, 0.0321044921875, 0.046176910400390625, 0.06024932861328125, 0.07432174682617188, 0.0883941650390625, 0.10246658325195312, 0.11653900146484375, 0.13061141967773438, 0.144683837890625, 0.15875625610351562, 0.17282867431640625, 0.18690109252929688, 0.2009735107421875, 0.21504592895507812, 0.22911834716796875, 0.24319076538085938, 0.25726318359375, 0.2713356018066406, 0.28540802001953125, 0.2994804382324219, 0.3135528564453125, 0.3276252746582031, 0.34169769287109375, 0.3557701110839844, 0.369842529296875, 0.3839149475097656, 0.39798736572265625, 0.4120597839355469, 0.4261322021484375, 0.4402046203613281, 0.45427703857421875, 0.4683494567871094, 0.482421875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 5.0, 7.0, 6.0, 15.0, 16.0, 25.0, 21.0, 36.0, 34.0, 43.0, 47.0, 64.0, 66.0, 81.0, 69.0, 64.0, 72.0, 66.0, 53.0, 51.0, 41.0, 30.0, 28.0, 23.0, 16.0, 6.0, 9.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.955078125, -1.90777587890625, -1.8604736328125, -1.81317138671875, -1.765869140625, -1.71856689453125, -1.6712646484375, -1.62396240234375, -1.57666015625, -1.52935791015625, -1.4820556640625, -1.43475341796875, -1.387451171875, -1.34014892578125, -1.2928466796875, -1.24554443359375, -1.1982421875, -1.15093994140625, -1.1036376953125, -1.05633544921875, -1.009033203125, -0.96173095703125, -0.9144287109375, -0.86712646484375, -0.81982421875, -0.77252197265625, -0.7252197265625, -0.67791748046875, -0.630615234375, -0.58331298828125, -0.5360107421875, -0.48870849609375, -0.44140625, -0.39410400390625, -0.3468017578125, -0.29949951171875, -0.252197265625, -0.20489501953125, -0.1575927734375, -0.11029052734375, -0.06298828125, -0.01568603515625, 0.0316162109375, 0.07891845703125, 0.126220703125, 0.17352294921875, 0.2208251953125, 0.26812744140625, 0.3154296875, 0.36273193359375, 0.4100341796875, 0.45733642578125, 0.504638671875, 0.55194091796875, 0.5992431640625, 0.64654541015625, 0.69384765625, 0.74114990234375, 0.7884521484375, 0.83575439453125, 0.883056640625, 0.93035888671875, 0.9776611328125, 1.02496337890625, 1.072265625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 2.0, 3.0, 2.0, 5.0, 5.0, 12.0, 16.0, 22.0, 21.0, 40.0, 37.0, 64.0, 91.0, 142.0, 194.0, 324.0, 567.0, 972.0, 1937.0, 4267.0, 10262.0, 27909.0, 84030.0, 276861.0, 419704.0, 146244.0, 46116.0, 16303.0, 6431.0, 2778.0, 1351.0, 685.0, 416.0, 248.0, 152.0, 101.0, 68.0, 65.0, 35.0, 25.0, 17.0, 5.0, 9.0, 10.0, 5.0, 2.0, 2.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41552734375, -0.4022216796875, -0.388916015625, -0.3756103515625, -0.3623046875, -0.3489990234375, -0.335693359375, -0.3223876953125, -0.30908203125, -0.2957763671875, -0.282470703125, -0.2691650390625, -0.255859375, -0.2425537109375, -0.229248046875, -0.2159423828125, -0.20263671875, -0.1893310546875, -0.176025390625, -0.1627197265625, -0.1494140625, -0.1361083984375, -0.122802734375, -0.1094970703125, -0.09619140625, -0.0828857421875, -0.069580078125, -0.0562744140625, -0.04296875, -0.0296630859375, -0.016357421875, -0.0030517578125, 0.01025390625, 0.0235595703125, 0.036865234375, 0.0501708984375, 0.0634765625, 0.0767822265625, 0.090087890625, 0.1033935546875, 0.11669921875, 0.1300048828125, 0.143310546875, 0.1566162109375, 0.169921875, 0.1832275390625, 0.196533203125, 0.2098388671875, 0.22314453125, 0.2364501953125, 0.249755859375, 0.2630615234375, 0.2763671875, 0.2896728515625, 0.302978515625, 0.3162841796875, 0.32958984375, 0.3428955078125, 0.356201171875, 0.3695068359375, 0.3828125, 0.3961181640625, 0.409423828125, 0.4227294921875, 0.43603515625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 10.0, 1.0, 2.0, 12.0, 8.0, 17.0, 12.0, 13.0, 16.0, 28.0, 18.0, 28.0, 27.0, 30.0, 51.0, 44.0, 30.0, 63.0, 59.0, 54.0, 48.0, 50.0, 42.0, 55.0, 41.0, 38.0, 39.0, 35.0, 29.0, 18.0, 21.0, 14.0, 17.0, 10.0, 9.0, 9.0, 4.0, 1.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.513671875, -2.442840576171875, -2.37200927734375, -2.301177978515625, -2.2303466796875, -2.159515380859375, -2.08868408203125, -2.017852783203125, -1.947021484375, -1.876190185546875, -1.80535888671875, -1.734527587890625, -1.6636962890625, -1.592864990234375, -1.52203369140625, -1.451202392578125, -1.38037109375, -1.309539794921875, -1.23870849609375, -1.167877197265625, -1.0970458984375, -1.026214599609375, -0.95538330078125, -0.884552001953125, -0.813720703125, -0.742889404296875, -0.67205810546875, -0.601226806640625, -0.5303955078125, -0.459564208984375, -0.38873291015625, -0.317901611328125, -0.2470703125, -0.176239013671875, -0.10540771484375, -0.034576416015625, 0.0362548828125, 0.107086181640625, 0.17791748046875, 0.248748779296875, 0.319580078125, 0.390411376953125, 0.46124267578125, 0.532073974609375, 0.6029052734375, 0.673736572265625, 0.74456787109375, 0.815399169921875, 0.88623046875, 0.957061767578125, 1.02789306640625, 1.098724365234375, 1.1695556640625, 1.240386962890625, 1.31121826171875, 1.382049560546875, 1.452880859375, 1.523712158203125, 1.59454345703125, 1.665374755859375, 1.7362060546875, 1.807037353515625, 1.87786865234375, 1.948699951171875, 2.01953125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 7.0, 0.0, 12.0, 12.0, 17.0, 42.0, 45.0, 79.0, 127.0, 221.0, 366.0, 680.0, 1402.0, 3028.0, 7323.0, 21018.0, 79038.0, 408330.0, 412639.0, 79170.0, 21309.0, 7487.0, 3137.0, 1400.0, 698.0, 395.0, 230.0, 125.0, 72.0, 55.0, 30.0, 25.0, 15.0, 17.0, 5.0, 2.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.265380859375, -0.25839805603027344, -0.2514152526855469, -0.2444324493408203, -0.23744964599609375, -0.2304668426513672, -0.22348403930664062, -0.21650123596191406, -0.2095184326171875, -0.20253562927246094, -0.19555282592773438, -0.1885700225830078, -0.18158721923828125, -0.1746044158935547, -0.16762161254882812, -0.16063880920410156, -0.153656005859375, -0.14667320251464844, -0.13969039916992188, -0.1327075958251953, -0.12572479248046875, -0.11874198913574219, -0.11175918579101562, -0.10477638244628906, -0.0977935791015625, -0.09081077575683594, -0.08382797241210938, -0.07684516906738281, -0.06986236572265625, -0.06287956237792969, -0.055896759033203125, -0.04891395568847656, -0.04193115234375, -0.03494834899902344, -0.027965545654296875, -0.020982742309570312, -0.01399993896484375, -0.0070171356201171875, -3.4332275390625e-05, 0.0069484710693359375, 0.0139312744140625, 0.020914077758789062, 0.027896881103515625, 0.03487968444824219, 0.04186248779296875, 0.04884529113769531, 0.055828094482421875, 0.06281089782714844, 0.069793701171875, 0.07677650451660156, 0.08375930786132812, 0.09074211120605469, 0.09772491455078125, 0.10470771789550781, 0.11169052124023438, 0.11867332458496094, 0.1256561279296875, 0.13263893127441406, 0.13962173461914062, 0.1466045379638672, 0.15358734130859375, 0.1605701446533203, 0.16755294799804688, 0.17453575134277344, 0.1815185546875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 5.0, 3.0, 3.0, 4.0, 7.0, 12.0, 2.0, 11.0, 15.0, 21.0, 23.0, 43.0, 34.0, 51.0, 61.0, 72.0, 88.0, 100.0, 88.0, 71.0, 68.0, 48.0, 37.0, 37.0, 18.0, 14.0, 14.0, 8.0, 5.0, 8.0, 5.0, 5.0, 4.0, 1.0, 1.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.00010198354721069336, -9.852088987827301e-05, -9.505823254585266e-05, -9.159557521343231e-05, -8.813291788101196e-05, -8.467026054859161e-05, -8.120760321617126e-05, -7.774494588375092e-05, -7.428228855133057e-05, -7.081963121891022e-05, -6.735697388648987e-05, -6.389431655406952e-05, -6.043165922164917e-05, -5.696900188922882e-05, -5.350634455680847e-05, -5.004368722438812e-05, -4.6581029891967773e-05, -4.3118372559547424e-05, -3.9655715227127075e-05, -3.6193057894706726e-05, -3.273040056228638e-05, -2.9267743229866028e-05, -2.580508589744568e-05, -2.234242856502533e-05, -1.887977123260498e-05, -1.541711390018463e-05, -1.1954456567764282e-05, -8.491799235343933e-06, -5.029141902923584e-06, -1.5664845705032349e-06, 1.8961727619171143e-06, 5.358830094337463e-06, 8.821487426757812e-06, 1.2284144759178162e-05, 1.574680209159851e-05, 1.920945942401886e-05, 2.267211675643921e-05, 2.6134774088859558e-05, 2.9597431421279907e-05, 3.3060088753700256e-05, 3.6522746086120605e-05, 3.9985403418540955e-05, 4.3448060750961304e-05, 4.691071808338165e-05, 5.0373375415802e-05, 5.383603274822235e-05, 5.72986900806427e-05, 6.076134741306305e-05, 6.42240047454834e-05, 6.768666207790375e-05, 7.11493194103241e-05, 7.461197674274445e-05, 7.80746340751648e-05, 8.153729140758514e-05, 8.499994874000549e-05, 8.846260607242584e-05, 9.192526340484619e-05, 9.538792073726654e-05, 9.885057806968689e-05, 0.00010231323540210724, 0.00010577589273452759, 0.00010923855006694794, 0.00011270120739936829, 0.00011616386473178864, 0.00011962652206420898]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 5.0, 4.0, 4.0, 3.0, 6.0, 14.0, 7.0, 14.0, 25.0, 31.0, 55.0, 57.0, 119.0, 228.0, 393.0, 911.0, 1955.0, 5196.0, 15514.0, 53200.0, 210640.0, 511286.0, 180974.0, 46035.0, 13700.0, 4636.0, 1848.0, 787.0, 389.0, 183.0, 113.0, 66.0, 46.0, 26.0, 11.0, 14.0, 13.0, 11.0, 8.0, 6.0, 5.0, 7.0, 2.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.2120361328125, -0.2052936553955078, -0.19855117797851562, -0.19180870056152344, -0.18506622314453125, -0.17832374572753906, -0.17158126831054688, -0.1648387908935547, -0.1580963134765625, -0.1513538360595703, -0.14461135864257812, -0.13786888122558594, -0.13112640380859375, -0.12438392639160156, -0.11764144897460938, -0.11089897155761719, -0.104156494140625, -0.09741401672363281, -0.09067153930664062, -0.08392906188964844, -0.07718658447265625, -0.07044410705566406, -0.06370162963867188, -0.05695915222167969, -0.0502166748046875, -0.04347419738769531, -0.036731719970703125, -0.029989242553710938, -0.02324676513671875, -0.016504287719726562, -0.009761810302734375, -0.0030193328857421875, 0.00372314453125, 0.010465621948242188, 0.017208099365234375, 0.023950576782226562, 0.03069305419921875, 0.03743553161621094, 0.044178009033203125, 0.05092048645019531, 0.0576629638671875, 0.06440544128417969, 0.07114791870117188, 0.07789039611816406, 0.08463287353515625, 0.09137535095214844, 0.09811782836914062, 0.10486030578613281, 0.111602783203125, 0.11834526062011719, 0.12508773803710938, 0.13183021545410156, 0.13857269287109375, 0.14531517028808594, 0.15205764770507812, 0.1588001251220703, 0.1655426025390625, 0.1722850799560547, 0.17902755737304688, 0.18577003479003906, 0.19251251220703125, 0.19925498962402344, 0.20599746704101562, 0.2127399444580078, 0.219482421875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 11.0, 10.0, 15.0, 15.0, 12.0, 16.0, 24.0, 31.0, 30.0, 37.0, 33.0, 48.0, 63.0, 55.0, 65.0, 68.0, 76.0, 64.0, 54.0, 48.0, 39.0, 36.0, 26.0, 25.0, 20.0, 12.0, 9.0, 11.0, 11.0, 7.0, 5.0, 8.0, 3.0, 4.0, 1.0, 0.0, 2.0, 4.0, 1.0, 3.0], "bins": [-0.048431396484375, -0.047203779220581055, -0.04597616195678711, -0.044748544692993164, -0.04352092742919922, -0.04229331016540527, -0.04106569290161133, -0.03983807563781738, -0.03861045837402344, -0.03738284111022949, -0.03615522384643555, -0.0349276065826416, -0.033699989318847656, -0.03247237205505371, -0.031244754791259766, -0.03001713752746582, -0.028789520263671875, -0.02756190299987793, -0.026334285736083984, -0.02510666847229004, -0.023879051208496094, -0.02265143394470215, -0.021423816680908203, -0.020196199417114258, -0.018968582153320312, -0.017740964889526367, -0.016513347625732422, -0.015285730361938477, -0.014058113098144531, -0.012830495834350586, -0.01160287857055664, -0.010375261306762695, -0.00914764404296875, -0.007920026779174805, -0.006692409515380859, -0.005464792251586914, -0.004237174987792969, -0.0030095577239990234, -0.0017819404602050781, -0.0005543231964111328, 0.0006732940673828125, 0.0019009113311767578, 0.003128528594970703, 0.0043561458587646484, 0.005583763122558594, 0.006811380386352539, 0.008038997650146484, 0.00926661491394043, 0.010494232177734375, 0.01172184944152832, 0.012949466705322266, 0.014177083969116211, 0.015404701232910156, 0.0166323184967041, 0.017859935760498047, 0.019087553024291992, 0.020315170288085938, 0.021542787551879883, 0.022770404815673828, 0.023998022079467773, 0.02522563934326172, 0.026453256607055664, 0.02768087387084961, 0.028908491134643555, 0.0301361083984375]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 7.0, 9.0, 9.0, 20.0, 22.0, 32.0, 61.0, 70.0, 102.0, 156.0, 104.0, 130.0, 84.0, 51.0, 42.0, 30.0, 16.0, 16.0, 8.0, 7.0, 4.0, 4.0, 6.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.1160409450531006, -2.0484204292297363, -1.980799913406372, -1.9131795167922974, -1.845559000968933, -1.7779384851455688, -1.7103180885314941, -1.6426975727081299, -1.5750770568847656, -1.5074565410614014, -1.439836025238037, -1.3722156286239624, -1.3045951128005981, -1.2369745969772339, -1.1693542003631592, -1.101733684539795, -1.0341131687164307, -0.9664926528930664, -0.8988721966743469, -0.8312517404556274, -0.7636312246322632, -0.6960107088088989, -0.6283902525901794, -0.56076979637146, -0.4931492805480957, -0.42552879452705383, -0.35790830850601196, -0.2902878224849701, -0.22266733646392822, -0.15504685044288635, -0.08742636442184448, -0.019805878400802612, 0.047814369201660156, 0.11543485522270203, 0.1830553412437439, 0.25067582726478577, 0.31829631328582764, 0.3859167993068695, 0.4535372853279114, 0.5211577415466309, 0.5887782573699951, 0.6563987731933594, 0.7240192294120789, 0.7916396856307983, 0.8592602014541626, 0.9268807172775269, 0.9945011734962463, 1.0621216297149658, 1.12974214553833, 1.1973626613616943, 1.2649831771850586, 1.3326035737991333, 1.4002240896224976, 1.4678446054458618, 1.5354650020599365, 1.6030855178833008, 1.670706033706665, 1.7383265495300293, 1.8059470653533936, 1.8735674619674683, 1.9411879777908325, 2.0088083744049072, 2.0764288902282715, 2.1440494060516357, 2.211669921875]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 10.0, 3.0, 7.0, 8.0, 9.0, 16.0, 18.0, 23.0, 35.0, 31.0, 41.0, 52.0, 38.0, 62.0, 62.0, 67.0, 65.0, 59.0, 58.0, 71.0, 48.0, 34.0, 40.0, 28.0, 37.0, 18.0, 17.0, 15.0, 9.0, 4.0, 11.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.5177342891693115, -1.4779725074768066, -1.4382108449935913, -1.3984490633010864, -1.358687400817871, -1.3189256191253662, -1.2791638374328613, -1.2394020557403564, -1.1996403932571411, -1.1598786115646362, -1.120116949081421, -1.080355167388916, -1.0405933856964111, -1.0008317232131958, -0.9610699415206909, -0.9213082194328308, -0.8815464973449707, -0.8417847752571106, -0.8020230531692505, -0.7622612714767456, -0.7224995493888855, -0.6827378273010254, -0.6429760456085205, -0.6032143235206604, -0.5634526014328003, -0.5236908793449402, -0.4839291274547577, -0.4441673755645752, -0.4044056534767151, -0.364643931388855, -0.3248821794986725, -0.28512042760849, -0.24535858631134033, -0.20559684932231903, -0.16583511233329773, -0.12607337534427643, -0.08631163835525513, -0.046549901366233826, -0.006788164377212524, 0.03297358751296997, 0.07273530960083008, 0.11249704658985138, 0.15225878357887268, 0.19202052056789398, 0.23178225755691528, 0.2715439796447754, 0.3113057315349579, 0.3510674834251404, 0.3908292055130005, 0.4305909276008606, 0.4703526794910431, 0.5101144313812256, 0.5498761534690857, 0.5896378755569458, 0.6293996572494507, 0.6691613793373108, 0.7089231014251709, 0.748684823513031, 0.7884465456008911, 0.828208327293396, 0.8679700493812561, 0.9077317714691162, 0.9474935531616211, 0.9872552752494812, 1.0270169973373413]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 5.0, 8.0, 6.0, 10.0, 13.0, 16.0, 27.0, 41.0, 67.0, 141.0, 350.0, 935.0, 2625.0, 9855.0, 53096.0, 680498.0, 264276.0, 27568.0, 6027.0, 1827.0, 635.0, 237.0, 129.0, 40.0, 31.0, 15.0, 21.0, 6.0, 11.0, 11.0, 3.0, 9.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0], "bins": [-3.94921875, -3.84197998046875, -3.7347412109375, -3.62750244140625, -3.520263671875, -3.41302490234375, -3.3057861328125, -3.19854736328125, -3.09130859375, -2.98406982421875, -2.8768310546875, -2.76959228515625, -2.662353515625, -2.55511474609375, -2.4478759765625, -2.34063720703125, -2.2333984375, -2.12615966796875, -2.0189208984375, -1.91168212890625, -1.804443359375, -1.69720458984375, -1.5899658203125, -1.48272705078125, -1.37548828125, -1.26824951171875, -1.1610107421875, -1.05377197265625, -0.946533203125, -0.83929443359375, -0.7320556640625, -0.62481689453125, -0.517578125, -0.41033935546875, -0.3031005859375, -0.19586181640625, -0.088623046875, 0.01861572265625, 0.1258544921875, 0.23309326171875, 0.34033203125, 0.44757080078125, 0.5548095703125, 0.66204833984375, 0.769287109375, 0.87652587890625, 0.9837646484375, 1.09100341796875, 1.1982421875, 1.30548095703125, 1.4127197265625, 1.51995849609375, 1.627197265625, 1.73443603515625, 1.8416748046875, 1.94891357421875, 2.05615234375, 2.16339111328125, 2.2706298828125, 2.37786865234375, 2.485107421875, 2.59234619140625, 2.6995849609375, 2.80682373046875, 2.9140625]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 2.0, 3.0, 5.0, 9.0, 8.0, 14.0, 16.0, 17.0, 17.0, 32.0, 30.0, 39.0, 45.0, 46.0, 57.0, 48.0, 57.0, 63.0, 54.0, 56.0, 68.0, 59.0, 48.0, 28.0, 40.0, 29.0, 30.0, 18.0, 19.0, 10.0, 11.0, 5.0, 8.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.796875, -2.71844482421875, -2.6400146484375, -2.56158447265625, -2.483154296875, -2.40472412109375, -2.3262939453125, -2.24786376953125, -2.16943359375, -2.09100341796875, -2.0125732421875, -1.93414306640625, -1.855712890625, -1.77728271484375, -1.6988525390625, -1.62042236328125, -1.5419921875, -1.46356201171875, -1.3851318359375, -1.30670166015625, -1.228271484375, -1.14984130859375, -1.0714111328125, -0.99298095703125, -0.91455078125, -0.83612060546875, -0.7576904296875, -0.67926025390625, -0.600830078125, -0.52239990234375, -0.4439697265625, -0.36553955078125, -0.287109375, -0.20867919921875, -0.1302490234375, -0.05181884765625, 0.026611328125, 0.10504150390625, 0.1834716796875, 0.26190185546875, 0.34033203125, 0.41876220703125, 0.4971923828125, 0.57562255859375, 0.654052734375, 0.73248291015625, 0.8109130859375, 0.88934326171875, 0.9677734375, 1.04620361328125, 1.1246337890625, 1.20306396484375, 1.281494140625, 1.35992431640625, 1.4383544921875, 1.51678466796875, 1.59521484375, 1.67364501953125, 1.7520751953125, 1.83050537109375, 1.908935546875, 1.98736572265625, 2.0657958984375, 2.14422607421875, 2.22265625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 2.0, 5.0, 7.0, 5.0, 11.0, 13.0, 15.0, 19.0, 18.0, 23.0, 18.0, 41.0, 38.0, 60.0, 70.0, 90.0, 149.0, 282.0, 585.0, 1554.0, 4873.0, 19120.0, 148198.0, 766035.0, 87323.0, 13788.0, 3786.0, 1154.0, 461.0, 247.0, 150.0, 74.0, 72.0, 56.0, 42.0, 38.0, 21.0, 27.0, 19.0, 12.0, 14.0, 8.0, 8.0, 2.0, 8.0, 6.0, 3.0, 1.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.51171875, -2.4290771484375, -2.346435546875, -2.2637939453125, -2.18115234375, -2.0985107421875, -2.015869140625, -1.9332275390625, -1.8505859375, -1.7679443359375, -1.685302734375, -1.6026611328125, -1.52001953125, -1.4373779296875, -1.354736328125, -1.2720947265625, -1.189453125, -1.1068115234375, -1.024169921875, -0.9415283203125, -0.85888671875, -0.7762451171875, -0.693603515625, -0.6109619140625, -0.5283203125, -0.4456787109375, -0.363037109375, -0.2803955078125, -0.19775390625, -0.1151123046875, -0.032470703125, 0.0501708984375, 0.1328125, 0.2154541015625, 0.298095703125, 0.3807373046875, 0.46337890625, 0.5460205078125, 0.628662109375, 0.7113037109375, 0.7939453125, 0.8765869140625, 0.959228515625, 1.0418701171875, 1.12451171875, 1.2071533203125, 1.289794921875, 1.3724365234375, 1.455078125, 1.5377197265625, 1.620361328125, 1.7030029296875, 1.78564453125, 1.8682861328125, 1.950927734375, 2.0335693359375, 2.1162109375, 2.1988525390625, 2.281494140625, 2.3641357421875, 2.44677734375, 2.5294189453125, 2.612060546875, 2.6947021484375, 2.77734375]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 8.0, 5.0, 4.0, 5.0, 7.0, 11.0, 9.0, 8.0, 23.0, 16.0, 11.0, 17.0, 30.0, 20.0, 23.0, 26.0, 35.0, 33.0, 32.0, 35.0, 39.0, 38.0, 43.0, 39.0, 39.0, 39.0, 34.0, 40.0, 40.0, 35.0, 23.0, 39.0, 19.0, 22.0, 23.0, 21.0, 15.0, 17.0, 11.0, 11.0, 9.0, 8.0, 14.0, 3.0, 0.0, 6.0, 6.0, 3.0, 2.0, 1.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.828125, -1.767852783203125, -1.70758056640625, -1.647308349609375, -1.5870361328125, -1.526763916015625, -1.46649169921875, -1.406219482421875, -1.345947265625, -1.285675048828125, -1.22540283203125, -1.165130615234375, -1.1048583984375, -1.044586181640625, -0.98431396484375, -0.924041748046875, -0.86376953125, -0.803497314453125, -0.74322509765625, -0.682952880859375, -0.6226806640625, -0.562408447265625, -0.50213623046875, -0.441864013671875, -0.381591796875, -0.321319580078125, -0.26104736328125, -0.200775146484375, -0.1405029296875, -0.080230712890625, -0.01995849609375, 0.040313720703125, 0.1005859375, 0.160858154296875, 0.22113037109375, 0.281402587890625, 0.3416748046875, 0.401947021484375, 0.46221923828125, 0.522491455078125, 0.582763671875, 0.643035888671875, 0.70330810546875, 0.763580322265625, 0.8238525390625, 0.884124755859375, 0.94439697265625, 1.004669189453125, 1.06494140625, 1.125213623046875, 1.18548583984375, 1.245758056640625, 1.3060302734375, 1.366302490234375, 1.42657470703125, 1.486846923828125, 1.547119140625, 1.607391357421875, 1.66766357421875, 1.727935791015625, 1.7882080078125, 1.848480224609375, 1.90875244140625, 1.969024658203125, 2.029296875]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 3.0, 9.0, 12.0, 9.0, 12.0, 27.0, 40.0, 58.0, 103.0, 159.0, 283.0, 521.0, 1216.0, 2898.0, 8245.0, 31556.0, 192157.0, 676722.0, 104348.0, 20659.0, 5708.0, 1938.0, 855.0, 417.0, 213.0, 136.0, 92.0, 50.0, 35.0, 17.0, 21.0, 16.0, 4.0, 4.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6708984375, -0.6524429321289062, -0.6339874267578125, -0.6155319213867188, -0.597076416015625, -0.5786209106445312, -0.5601654052734375, -0.5417098999023438, -0.52325439453125, -0.5047988891601562, -0.4863433837890625, -0.46788787841796875, -0.449432373046875, -0.43097686767578125, -0.4125213623046875, -0.39406585693359375, -0.3756103515625, -0.35715484619140625, -0.3386993408203125, -0.32024383544921875, -0.301788330078125, -0.28333282470703125, -0.2648773193359375, -0.24642181396484375, -0.22796630859375, -0.20951080322265625, -0.1910552978515625, -0.17259979248046875, -0.154144287109375, -0.13568878173828125, -0.1172332763671875, -0.09877777099609375, -0.080322265625, -0.06186676025390625, -0.0434112548828125, -0.02495574951171875, -0.006500244140625, 0.01195526123046875, 0.0304107666015625, 0.04886627197265625, 0.06732177734375, 0.08577728271484375, 0.1042327880859375, 0.12268829345703125, 0.141143798828125, 0.15959930419921875, 0.1780548095703125, 0.19651031494140625, 0.2149658203125, 0.23342132568359375, 0.2518768310546875, 0.27033233642578125, 0.288787841796875, 0.30724334716796875, 0.3256988525390625, 0.34415435791015625, 0.36260986328125, 0.38106536865234375, 0.3995208740234375, 0.41797637939453125, 0.436431884765625, 0.45488739013671875, 0.4733428955078125, 0.49179840087890625, 0.51025390625]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 4.0, 8.0, 8.0, 12.0, 11.0, 10.0, 3.0, 20.0, 26.0, 35.0, 56.0, 72.0, 106.0, 114.0, 122.0, 105.0, 54.0, 57.0, 47.0, 24.0, 24.0, 13.0, 12.0, 10.0, 13.0, 5.0, 9.0, 4.0, 2.0, 8.0, 4.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.35385513305664e-05, -6.0910359025001526e-05, -5.8282166719436646e-05, -5.5653974413871765e-05, -5.3025782108306885e-05, -5.0397589802742004e-05, -4.7769397497177124e-05, -4.5141205191612244e-05, -4.251301288604736e-05, -3.988482058048248e-05, -3.72566282749176e-05, -3.462843596935272e-05, -3.200024366378784e-05, -2.937205135822296e-05, -2.674385905265808e-05, -2.41156667470932e-05, -2.148747444152832e-05, -1.885928213596344e-05, -1.623108983039856e-05, -1.360289752483368e-05, -1.0974705219268799e-05, -8.346512913703918e-06, -5.718320608139038e-06, -3.0901283025741577e-06, -4.6193599700927734e-07, 2.166256308555603e-06, 4.794448614120483e-06, 7.422640919685364e-06, 1.0050833225250244e-05, 1.2679025530815125e-05, 1.5307217836380005e-05, 1.7935410141944885e-05, 2.0563602447509766e-05, 2.3191794753074646e-05, 2.5819987058639526e-05, 2.8448179364204407e-05, 3.107637166976929e-05, 3.370456397533417e-05, 3.633275628089905e-05, 3.896094858646393e-05, 4.158914089202881e-05, 4.421733319759369e-05, 4.684552550315857e-05, 4.947371780872345e-05, 5.210191011428833e-05, 5.473010241985321e-05, 5.735829472541809e-05, 5.998648703098297e-05, 6.261467933654785e-05, 6.524287164211273e-05, 6.787106394767761e-05, 7.049925625324249e-05, 7.312744855880737e-05, 7.575564086437225e-05, 7.838383316993713e-05, 8.101202547550201e-05, 8.36402177810669e-05, 8.626841008663177e-05, 8.889660239219666e-05, 9.152479469776154e-05, 9.415298700332642e-05, 9.67811793088913e-05, 9.940937161445618e-05, 0.00010203756392002106, 0.00010466575622558594]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 8.0, 8.0, 5.0, 10.0, 17.0, 21.0, 34.0, 54.0, 70.0, 157.0, 244.0, 407.0, 718.0, 1482.0, 3402.0, 8998.0, 31100.0, 163578.0, 670879.0, 127193.0, 26267.0, 7903.0, 3047.0, 1336.0, 646.0, 407.0, 207.0, 120.0, 78.0, 56.0, 32.0, 25.0, 18.0, 9.0, 7.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53564453125, -0.5174484252929688, -0.4992523193359375, -0.48105621337890625, -0.462860107421875, -0.44466400146484375, -0.4264678955078125, -0.40827178955078125, -0.39007568359375, -0.37187957763671875, -0.3536834716796875, -0.33548736572265625, -0.317291259765625, -0.29909515380859375, -0.2808990478515625, -0.26270294189453125, -0.2445068359375, -0.22631072998046875, -0.2081146240234375, -0.18991851806640625, -0.171722412109375, -0.15352630615234375, -0.1353302001953125, -0.11713409423828125, -0.09893798828125, -0.08074188232421875, -0.0625457763671875, -0.04434967041015625, -0.026153564453125, -0.00795745849609375, 0.0102386474609375, 0.02843475341796875, 0.046630859375, 0.06482696533203125, 0.0830230712890625, 0.10121917724609375, 0.119415283203125, 0.13761138916015625, 0.1558074951171875, 0.17400360107421875, 0.19219970703125, 0.21039581298828125, 0.2285919189453125, 0.24678802490234375, 0.264984130859375, 0.28318023681640625, 0.3013763427734375, 0.31957244873046875, 0.3377685546875, 0.35596466064453125, 0.3741607666015625, 0.39235687255859375, 0.410552978515625, 0.42874908447265625, 0.4469451904296875, 0.46514129638671875, 0.48333740234375, 0.5015335083007812, 0.5197296142578125, 0.5379257202148438, 0.556121826171875, 0.5743179321289062, 0.5925140380859375, 0.6107101440429688, 0.62890625]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 5.0, 8.0, 3.0, 17.0, 11.0, 25.0, 30.0, 47.0, 51.0, 73.0, 105.0, 146.0, 109.0, 99.0, 75.0, 60.0, 30.0, 28.0, 22.0, 16.0, 7.0, 6.0, 7.0, 6.0, 3.0, 6.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26953125, -0.25986480712890625, -0.2501983642578125, -0.24053192138671875, -0.230865478515625, -0.22119903564453125, -0.2115325927734375, -0.20186614990234375, -0.19219970703125, -0.18253326416015625, -0.1728668212890625, -0.16320037841796875, -0.153533935546875, -0.14386749267578125, -0.1342010498046875, -0.12453460693359375, -0.1148681640625, -0.10520172119140625, -0.0955352783203125, -0.08586883544921875, -0.076202392578125, -0.06653594970703125, -0.0568695068359375, -0.04720306396484375, -0.03753662109375, -0.02787017822265625, -0.0182037353515625, -0.00853729248046875, 0.001129150390625, 0.01079559326171875, 0.0204620361328125, 0.03012847900390625, 0.039794921875, 0.04946136474609375, 0.0591278076171875, 0.06879425048828125, 0.078460693359375, 0.08812713623046875, 0.0977935791015625, 0.10746002197265625, 0.11712646484375, 0.12679290771484375, 0.1364593505859375, 0.14612579345703125, 0.155792236328125, 0.16545867919921875, 0.1751251220703125, 0.18479156494140625, 0.1944580078125, 0.20412445068359375, 0.2137908935546875, 0.22345733642578125, 0.233123779296875, 0.24279022216796875, 0.2524566650390625, 0.26212310791015625, 0.27178955078125, 0.28145599365234375, 0.2911224365234375, 0.30078887939453125, 0.310455322265625, 0.32012176513671875, 0.3297882080078125, 0.33945465087890625, 0.34912109375]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 5.0, 7.0, 14.0, 30.0, 33.0, 59.0, 99.0, 127.0, 154.0, 154.0, 102.0, 71.0, 68.0, 29.0, 14.0, 9.0, 8.0, 4.0, 6.0, 3.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.992317199707031, -4.825910568237305, -4.659504413604736, -4.49309778213501, -4.326691150665283, -4.160284996032715, -3.9938783645629883, -3.8274717330932617, -3.6610653400421143, -3.494658946990967, -3.3282523155212402, -3.1618459224700928, -2.9954395294189453, -2.8290328979492188, -2.6626265048980713, -2.496220111846924, -2.3298134803771973, -2.16340708732605, -1.9970004558563232, -1.8305940628051758, -1.6641875505447388, -1.4977810382843018, -1.3313746452331543, -1.1649681329727173, -0.9985616207122803, -0.8321551084518433, -0.665748655796051, -0.4993421733379364, -0.3329356908798218, -0.16652917861938477, -0.0001227259635925293, 0.1662837266921997, 0.3326897621154785, 0.49909624457359314, 0.6655027270317078, 0.8319091796875, 0.998315691947937, 1.164722204208374, 1.3311285972595215, 1.4975351095199585, 1.6639416217803955, 1.8303481340408325, 1.9967546463012695, 2.163161039352417, 2.3295674324035645, 2.495974063873291, 2.6623804569244385, 2.828786849975586, 2.9951934814453125, 3.16159987449646, 3.3280065059661865, 3.494412899017334, 3.6608195304870605, 3.827225923538208, 3.9936323165893555, 4.160038948059082, 4.326445579528809, 4.492852210998535, 4.6592583656311035, 4.82566499710083, 4.992071628570557, 5.158477783203125, 5.324884414672852, 5.491291046142578, 5.6576972007751465]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 3.0, 3.0, 3.0, 1.0, 2.0, 7.0, 6.0, 9.0, 8.0, 4.0, 8.0, 8.0, 15.0, 15.0, 14.0, 12.0, 19.0, 24.0, 23.0, 27.0, 31.0, 33.0, 27.0, 43.0, 45.0, 30.0, 37.0, 38.0, 44.0, 38.0, 52.0, 31.0, 40.0, 40.0, 40.0, 35.0, 24.0, 20.0, 22.0, 19.0, 17.0, 14.0, 20.0, 12.0, 12.0, 11.0, 10.0, 6.0, 4.0, 1.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.448025703430176, -3.3351693153381348, -3.2223126888275146, -3.1094563007354736, -2.9965996742248535, -2.8837432861328125, -2.7708868980407715, -2.6580302715301514, -2.5451738834381104, -2.4323174953460693, -2.319460868835449, -2.206604480743408, -2.093747854232788, -1.980891466140747, -1.8680349588394165, -1.755178451538086, -1.6423219442367554, -1.5294654369354248, -1.4166089296340942, -1.3037524223327637, -1.1908960342407227, -1.078039526939392, -0.9651830196380615, -0.8523265719413757, -0.7394700646400452, -0.6266135573387146, -0.5137571096420288, -0.40090060234069824, -0.28804412484169006, -0.17518764734268188, -0.06233114004135132, 0.05052530765533447, 0.16338181495666504, 0.2762382924556732, 0.3890947699546814, 0.501951277256012, 0.6148077249526978, 0.7276642322540283, 0.8405207395553589, 0.9533771872520447, 1.0662336349487305, 1.179090142250061, 1.2919466495513916, 1.4048030376434326, 1.5176595449447632, 1.6305160522460938, 1.7433725595474243, 1.8562290668487549, 1.9690855741500854, 2.081942081451416, 2.194798469543457, 2.307655096054077, 2.420511484146118, 2.5333681106567383, 2.6462244987487793, 2.7590808868408203, 2.8719375133514404, 2.9847939014434814, 3.0976505279541016, 3.2105069160461426, 3.3233635425567627, 3.4362199306488037, 3.549076557159424, 3.661932945251465, 3.774789333343506]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 8.0, 5.0, 6.0, 8.0, 13.0, 13.0, 20.0, 32.0, 38.0, 72.0, 93.0, 113.0, 187.0, 316.0, 489.0, 797.0, 1490.0, 2698.0, 5403.0, 13272.0, 44129.0, 306929.0, 3006587.0, 702501.0, 75569.0, 18932.0, 7036.0, 3232.0, 1786.0, 874.0, 568.0, 370.0, 225.0, 166.0, 89.0, 65.0, 42.0, 35.0, 18.0, 18.0, 14.0, 9.0, 2.0, 9.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.111328125, -2.040130615234375, -1.96893310546875, -1.897735595703125, -1.8265380859375, -1.755340576171875, -1.68414306640625, -1.612945556640625, -1.541748046875, -1.470550537109375, -1.39935302734375, -1.328155517578125, -1.2569580078125, -1.185760498046875, -1.11456298828125, -1.043365478515625, -0.97216796875, -0.900970458984375, -0.82977294921875, -0.758575439453125, -0.6873779296875, -0.616180419921875, -0.54498291015625, -0.473785400390625, -0.402587890625, -0.331390380859375, -0.26019287109375, -0.188995361328125, -0.1177978515625, -0.046600341796875, 0.02459716796875, 0.095794677734375, 0.1669921875, 0.238189697265625, 0.30938720703125, 0.380584716796875, 0.4517822265625, 0.522979736328125, 0.59417724609375, 0.665374755859375, 0.736572265625, 0.807769775390625, 0.87896728515625, 0.950164794921875, 1.0213623046875, 1.092559814453125, 1.16375732421875, 1.234954833984375, 1.30615234375, 1.377349853515625, 1.44854736328125, 1.519744873046875, 1.5909423828125, 1.662139892578125, 1.73333740234375, 1.804534912109375, 1.875732421875, 1.946929931640625, 2.01812744140625, 2.089324951171875, 2.1605224609375, 2.231719970703125, 2.30291748046875, 2.374114990234375, 2.4453125]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 6.0, 3.0, 5.0, 14.0, 13.0, 12.0, 24.0, 29.0, 31.0, 28.0, 37.0, 36.0, 44.0, 53.0, 42.0, 57.0, 66.0, 64.0, 68.0, 56.0, 40.0, 52.0, 39.0, 32.0, 26.0, 32.0, 22.0, 17.0, 18.0, 3.0, 5.0, 6.0, 3.0, 6.0, 4.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7333984375, -1.686065673828125, -1.63873291015625, -1.591400146484375, -1.5440673828125, -1.496734619140625, -1.44940185546875, -1.402069091796875, -1.354736328125, -1.307403564453125, -1.26007080078125, -1.212738037109375, -1.1654052734375, -1.118072509765625, -1.07073974609375, -1.023406982421875, -0.97607421875, -0.928741455078125, -0.88140869140625, -0.834075927734375, -0.7867431640625, -0.739410400390625, -0.69207763671875, -0.644744873046875, -0.597412109375, -0.550079345703125, -0.50274658203125, -0.455413818359375, -0.4080810546875, -0.360748291015625, -0.31341552734375, -0.266082763671875, -0.21875, -0.171417236328125, -0.12408447265625, -0.076751708984375, -0.0294189453125, 0.017913818359375, 0.06524658203125, 0.112579345703125, 0.159912109375, 0.207244873046875, 0.25457763671875, 0.301910400390625, 0.3492431640625, 0.396575927734375, 0.44390869140625, 0.491241455078125, 0.53857421875, 0.585906982421875, 0.63323974609375, 0.680572509765625, 0.7279052734375, 0.775238037109375, 0.82257080078125, 0.869903564453125, 0.917236328125, 0.964569091796875, 1.01190185546875, 1.059234619140625, 1.1065673828125, 1.153900146484375, 1.20123291015625, 1.248565673828125, 1.2958984375]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 5.0, 1.0, 5.0, 5.0, 12.0, 8.0, 16.0, 28.0, 19.0, 36.0, 78.0, 96.0, 201.0, 624.0, 2502.0, 21670.0, 2115665.0, 2028043.0, 21567.0, 2495.0, 641.0, 213.0, 122.0, 74.0, 43.0, 28.0, 23.0, 17.0, 7.0, 9.0, 5.0, 9.0, 4.0, 6.0, 3.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.2421875, -4.10076904296875, -3.9593505859375, -3.81793212890625, -3.676513671875, -3.53509521484375, -3.3936767578125, -3.25225830078125, -3.11083984375, -2.96942138671875, -2.8280029296875, -2.68658447265625, -2.545166015625, -2.40374755859375, -2.2623291015625, -2.12091064453125, -1.9794921875, -1.83807373046875, -1.6966552734375, -1.55523681640625, -1.413818359375, -1.27239990234375, -1.1309814453125, -0.98956298828125, -0.84814453125, -0.70672607421875, -0.5653076171875, -0.42388916015625, -0.282470703125, -0.14105224609375, 0.0003662109375, 0.14178466796875, 0.283203125, 0.42462158203125, 0.5660400390625, 0.70745849609375, 0.848876953125, 0.99029541015625, 1.1317138671875, 1.27313232421875, 1.41455078125, 1.55596923828125, 1.6973876953125, 1.83880615234375, 1.980224609375, 2.12164306640625, 2.2630615234375, 2.40447998046875, 2.5458984375, 2.68731689453125, 2.8287353515625, 2.97015380859375, 3.111572265625, 3.25299072265625, 3.3944091796875, 3.53582763671875, 3.67724609375, 3.81866455078125, 3.9600830078125, 4.10150146484375, 4.242919921875, 4.38433837890625, 4.5257568359375, 4.66717529296875, 4.80859375]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 3.0, 5.0, 2.0, 8.0, 6.0, 9.0, 13.0, 13.0, 24.0, 25.0, 30.0, 44.0, 69.0, 87.0, 150.0, 194.0, 347.0, 537.0, 722.0, 630.0, 381.0, 251.0, 165.0, 89.0, 74.0, 44.0, 39.0, 39.0, 20.0, 18.0, 10.0, 8.0, 12.0, 3.0, 2.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.58447265625, -0.5676498413085938, -0.5508270263671875, -0.5340042114257812, -0.517181396484375, -0.5003585815429688, -0.4835357666015625, -0.46671295166015625, -0.44989013671875, -0.43306732177734375, -0.4162445068359375, -0.39942169189453125, -0.382598876953125, -0.36577606201171875, -0.3489532470703125, -0.33213043212890625, -0.3153076171875, -0.29848480224609375, -0.2816619873046875, -0.26483917236328125, -0.248016357421875, -0.23119354248046875, -0.2143707275390625, -0.19754791259765625, -0.18072509765625, -0.16390228271484375, -0.1470794677734375, -0.13025665283203125, -0.113433837890625, -0.09661102294921875, -0.0797882080078125, -0.06296539306640625, -0.046142578125, -0.02931976318359375, -0.0124969482421875, 0.00432586669921875, 0.021148681640625, 0.03797149658203125, 0.0547943115234375, 0.07161712646484375, 0.08843994140625, 0.10526275634765625, 0.1220855712890625, 0.13890838623046875, 0.155731201171875, 0.17255401611328125, 0.1893768310546875, 0.20619964599609375, 0.2230224609375, 0.23984527587890625, 0.2566680908203125, 0.27349090576171875, 0.290313720703125, 0.30713653564453125, 0.3239593505859375, 0.34078216552734375, 0.35760498046875, 0.37442779541015625, 0.3912506103515625, 0.40807342529296875, 0.424896240234375, 0.44171905517578125, 0.4585418701171875, 0.47536468505859375, 0.4921875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 1.0, 6.0, 5.0, 15.0, 10.0, 19.0, 33.0, 36.0, 55.0, 75.0, 102.0, 106.0, 108.0, 108.0, 88.0, 70.0, 35.0, 44.0, 17.0, 18.0, 15.0, 8.0, 8.0, 1.0, 6.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.254340410232544, -2.169137716293335, -2.083934783935547, -1.998732089996338, -1.9135292768478394, -1.8283264636993408, -1.7431236505508423, -1.6579208374023438, -1.5727181434631348, -1.4875153303146362, -1.4023125171661377, -1.3171098232269287, -1.2319070100784302, -1.1467041969299316, -1.061501383781433, -0.9762986302375793, -0.891095757484436, -0.8058929443359375, -0.7206901907920837, -0.6354873776435852, -0.5502846240997314, -0.4650818109512329, -0.3798789978027344, -0.2946762442588806, -0.20947343111038208, -0.12427064031362534, -0.03906784951686859, 0.04613494873046875, 0.1313377320766449, 0.21654051542282104, 0.3017433285713196, 0.38694608211517334, 0.4721488952636719, 0.5573517084121704, 0.6425544619560242, 0.7277572751045227, 0.8129600286483765, 0.898162841796875, 0.9833656549453735, 1.068568468093872, 1.153771162033081, 1.2389739751815796, 1.3241767883300781, 1.409379482269287, 1.4945822954177856, 1.5797851085662842, 1.6649879217147827, 1.7501907348632812, 1.8353935480117798, 1.9205963611602783, 2.0057990550994873, 2.0910019874572754, 2.1762046813964844, 2.2614073753356934, 2.3466103076934814, 2.4318130016326904, 2.5170159339904785, 2.6022186279296875, 2.6874215602874756, 2.7726242542266846, 2.8578271865844727, 2.9430298805236816, 3.0282325744628906, 3.1134355068206787, 3.1986382007598877]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 5.0, 4.0, 11.0, 15.0, 16.0, 20.0, 26.0, 21.0, 35.0, 34.0, 33.0, 46.0, 51.0, 60.0, 60.0, 58.0, 56.0, 53.0, 50.0, 52.0, 40.0, 44.0, 37.0, 39.0, 24.0, 22.0, 27.0, 19.0, 12.0, 9.0, 4.0, 2.0, 5.0, 1.0, 4.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.9941903352737427, -1.9397519826889038, -1.885313630104065, -1.8308751583099365, -1.7764368057250977, -1.7219984531402588, -1.66756010055542, -1.613121747970581, -1.5586833953857422, -1.5042450428009033, -1.4498066902160645, -1.3953683376312256, -1.3409298658370972, -1.2864915132522583, -1.2320531606674194, -1.1776148080825806, -1.1231763362884521, -1.0687379837036133, -1.0142996311187744, -0.9598612189292908, -0.9054228663444519, -0.8509844541549683, -0.7965461015701294, -0.7421077489852905, -0.6876693964004517, -0.6332310438156128, -0.5787926316261292, -0.5243542790412903, -0.4699159264564514, -0.41547754406929016, -0.3610391616821289, -0.30660080909729004, -0.25216245651245117, -0.1977240890264511, -0.14328572154045105, -0.0888473391532898, -0.034408971667289734, 0.020029395818710327, 0.07446777820587158, 0.12890613079071045, 0.1833445131778717, 0.23778288066387177, 0.2922212481498718, 0.3466596305370331, 0.40109801292419434, 0.4555363655090332, 0.5099747180938721, 0.5644130706787109, 0.6188514828681946, 0.6732898354530334, 0.7277282476425171, 0.782166600227356, 0.8366049528121948, 0.8910433053970337, 0.9454817175865173, 0.9999200701713562, 1.0543584823608398, 1.1087968349456787, 1.1632351875305176, 1.2176735401153564, 1.2721120119094849, 1.3265503644943237, 1.3809887170791626, 1.4354270696640015, 1.4898654222488403]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 7.0, 5.0, 10.0, 9.0, 14.0, 19.0, 38.0, 55.0, 84.0, 120.0, 281.0, 468.0, 847.0, 1574.0, 3019.0, 6235.0, 13926.0, 37853.0, 160916.0, 587361.0, 169520.0, 38757.0, 14261.0, 6430.0, 3089.0, 1648.0, 856.0, 496.0, 243.0, 155.0, 92.0, 49.0, 32.0, 33.0, 13.0, 16.0, 10.0, 8.0, 6.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.525390625, -0.5092315673828125, -0.493072509765625, -0.4769134521484375, -0.46075439453125, -0.4445953369140625, -0.428436279296875, -0.4122772216796875, -0.3961181640625, -0.3799591064453125, -0.363800048828125, -0.3476409912109375, -0.33148193359375, -0.3153228759765625, -0.299163818359375, -0.2830047607421875, -0.266845703125, -0.2506866455078125, -0.234527587890625, -0.2183685302734375, -0.20220947265625, -0.1860504150390625, -0.169891357421875, -0.1537322998046875, -0.1375732421875, -0.1214141845703125, -0.105255126953125, -0.0890960693359375, -0.07293701171875, -0.0567779541015625, -0.040618896484375, -0.0244598388671875, -0.00830078125, 0.0078582763671875, 0.024017333984375, 0.0401763916015625, 0.05633544921875, 0.0724945068359375, 0.088653564453125, 0.1048126220703125, 0.1209716796875, 0.1371307373046875, 0.153289794921875, 0.1694488525390625, 0.18560791015625, 0.2017669677734375, 0.217926025390625, 0.2340850830078125, 0.250244140625, 0.2664031982421875, 0.282562255859375, 0.2987213134765625, 0.31488037109375, 0.3310394287109375, 0.347198486328125, 0.3633575439453125, 0.3795166015625, 0.3956756591796875, 0.411834716796875, 0.4279937744140625, 0.44415283203125, 0.4603118896484375, 0.476470947265625, 0.4926300048828125, 0.5087890625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 2.0, 10.0, 12.0, 12.0, 25.0, 32.0, 37.0, 32.0, 53.0, 59.0, 83.0, 77.0, 75.0, 91.0, 70.0, 61.0, 58.0, 38.0, 48.0, 35.0, 24.0, 19.0, 15.0, 11.0, 4.0, 9.0, 3.0, 6.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.818359375, -1.7690277099609375, -1.719696044921875, -1.6703643798828125, -1.62103271484375, -1.5717010498046875, -1.522369384765625, -1.4730377197265625, -1.4237060546875, -1.3743743896484375, -1.325042724609375, -1.2757110595703125, -1.22637939453125, -1.1770477294921875, -1.127716064453125, -1.0783843994140625, -1.029052734375, -0.9797210693359375, -0.930389404296875, -0.8810577392578125, -0.83172607421875, -0.7823944091796875, -0.733062744140625, -0.6837310791015625, -0.6343994140625, -0.5850677490234375, -0.535736083984375, -0.4864044189453125, -0.43707275390625, -0.3877410888671875, -0.338409423828125, -0.2890777587890625, -0.23974609375, -0.1904144287109375, -0.141082763671875, -0.0917510986328125, -0.04241943359375, 0.0069122314453125, 0.056243896484375, 0.1055755615234375, 0.1549072265625, 0.2042388916015625, 0.253570556640625, 0.3029022216796875, 0.35223388671875, 0.4015655517578125, 0.450897216796875, 0.5002288818359375, 0.549560546875, 0.5988922119140625, 0.648223876953125, 0.6975555419921875, 0.74688720703125, 0.7962188720703125, 0.845550537109375, 0.8948822021484375, 0.9442138671875, 0.9935455322265625, 1.042877197265625, 1.0922088623046875, 1.14154052734375, 1.1908721923828125, 1.240203857421875, 1.2895355224609375, 1.3388671875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 1.0, 5.0, 3.0, 7.0, 9.0, 12.0, 10.0, 20.0, 27.0, 23.0, 50.0, 71.0, 114.0, 185.0, 323.0, 599.0, 1121.0, 2497.0, 5757.0, 15588.0, 61113.0, 465838.0, 415868.0, 54522.0, 14582.0, 5460.0, 2334.0, 1092.0, 500.0, 312.0, 168.0, 107.0, 59.0, 51.0, 28.0, 24.0, 21.0, 15.0, 6.0, 9.0, 3.0, 6.0, 5.0, 4.0, 4.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0], "bins": [-0.5625, -0.5464134216308594, -0.5303268432617188, -0.5142402648925781, -0.4981536865234375, -0.4820671081542969, -0.46598052978515625, -0.4498939514160156, -0.433807373046875, -0.4177207946777344, -0.40163421630859375, -0.3855476379394531, -0.3694610595703125, -0.3533744812011719, -0.33728790283203125, -0.3212013244628906, -0.30511474609375, -0.2890281677246094, -0.27294158935546875, -0.2568550109863281, -0.2407684326171875, -0.22468185424804688, -0.20859527587890625, -0.19250869750976562, -0.176422119140625, -0.16033554077148438, -0.14424896240234375, -0.12816238403320312, -0.1120758056640625, -0.09598922729492188, -0.07990264892578125, -0.06381607055664062, -0.0477294921875, -0.031642913818359375, -0.01555633544921875, 0.000530242919921875, 0.0166168212890625, 0.032703399658203125, 0.04878997802734375, 0.06487655639648438, 0.080963134765625, 0.09704971313476562, 0.11313629150390625, 0.12922286987304688, 0.1453094482421875, 0.16139602661132812, 0.17748260498046875, 0.19356918334960938, 0.20965576171875, 0.22574234008789062, 0.24182891845703125, 0.2579154968261719, 0.2740020751953125, 0.2900886535644531, 0.30617523193359375, 0.3222618103027344, 0.338348388671875, 0.3544349670410156, 0.37052154541015625, 0.3866081237792969, 0.4026947021484375, 0.4187812805175781, 0.43486785888671875, 0.4509544372558594, 0.467041015625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 8.0, 3.0, 11.0, 11.0, 9.0, 11.0, 16.0, 12.0, 33.0, 23.0, 27.0, 29.0, 39.0, 40.0, 37.0, 44.0, 44.0, 56.0, 49.0, 45.0, 46.0, 43.0, 40.0, 52.0, 33.0, 41.0, 26.0, 30.0, 26.0, 22.0, 12.0, 11.0, 15.0, 12.0, 15.0, 9.0, 6.0, 1.0, 3.0, 3.0, 0.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-2.126953125, -2.0626678466796875, -1.998382568359375, -1.9340972900390625, -1.86981201171875, -1.8055267333984375, -1.741241455078125, -1.6769561767578125, -1.6126708984375, -1.5483856201171875, -1.484100341796875, -1.4198150634765625, -1.35552978515625, -1.2912445068359375, -1.226959228515625, -1.1626739501953125, -1.098388671875, -1.0341033935546875, -0.969818115234375, -0.9055328369140625, -0.84124755859375, -0.7769622802734375, -0.712677001953125, -0.6483917236328125, -0.5841064453125, -0.5198211669921875, -0.455535888671875, -0.3912506103515625, -0.32696533203125, -0.2626800537109375, -0.198394775390625, -0.1341094970703125, -0.06982421875, -0.0055389404296875, 0.058746337890625, 0.1230316162109375, 0.18731689453125, 0.2516021728515625, 0.315887451171875, 0.3801727294921875, 0.4444580078125, 0.5087432861328125, 0.573028564453125, 0.6373138427734375, 0.70159912109375, 0.7658843994140625, 0.830169677734375, 0.8944549560546875, 0.958740234375, 1.0230255126953125, 1.087310791015625, 1.1515960693359375, 1.21588134765625, 1.2801666259765625, 1.344451904296875, 1.4087371826171875, 1.4730224609375, 1.5373077392578125, 1.601593017578125, 1.6658782958984375, 1.73016357421875, 1.7944488525390625, 1.858734130859375, 1.9230194091796875, 1.9873046875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 6.0, 6.0, 7.0, 9.0, 19.0, 17.0, 30.0, 75.0, 75.0, 145.0, 268.0, 525.0, 1024.0, 2514.0, 7387.0, 31655.0, 317021.0, 616600.0, 54429.0, 10699.0, 3343.0, 1305.0, 598.0, 336.0, 177.0, 112.0, 56.0, 39.0, 31.0, 22.0, 10.0, 12.0, 4.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.273193359375, -0.2646942138671875, -0.256195068359375, -0.2476959228515625, -0.23919677734375, -0.2306976318359375, -0.222198486328125, -0.2136993408203125, -0.2052001953125, -0.1967010498046875, -0.188201904296875, -0.1797027587890625, -0.17120361328125, -0.1627044677734375, -0.154205322265625, -0.1457061767578125, -0.13720703125, -0.1287078857421875, -0.120208740234375, -0.1117095947265625, -0.10321044921875, -0.0947113037109375, -0.086212158203125, -0.0777130126953125, -0.0692138671875, -0.0607147216796875, -0.052215576171875, -0.0437164306640625, -0.03521728515625, -0.0267181396484375, -0.018218994140625, -0.0097198486328125, -0.001220703125, 0.0072784423828125, 0.015777587890625, 0.0242767333984375, 0.03277587890625, 0.0412750244140625, 0.049774169921875, 0.0582733154296875, 0.0667724609375, 0.0752716064453125, 0.083770751953125, 0.0922698974609375, 0.10076904296875, 0.1092681884765625, 0.117767333984375, 0.1262664794921875, 0.134765625, 0.1432647705078125, 0.151763916015625, 0.1602630615234375, 0.16876220703125, 0.1772613525390625, 0.185760498046875, 0.1942596435546875, 0.2027587890625, 0.2112579345703125, 0.219757080078125, 0.2282562255859375, 0.23675537109375, 0.2452545166015625, 0.253753662109375, 0.2622528076171875, 0.270751953125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 1.0, 4.0, 8.0, 7.0, 22.0, 26.0, 48.0, 76.0, 96.0, 161.0, 175.0, 149.0, 75.0, 70.0, 27.0, 21.0, 12.0, 12.0, 4.0, 6.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00023651123046875, -0.00023077800869941711, -0.00022504478693008423, -0.00021931156516075134, -0.00021357834339141846, -0.00020784512162208557, -0.00020211189985275269, -0.0001963786780834198, -0.00019064545631408691, -0.00018491223454475403, -0.00017917901277542114, -0.00017344579100608826, -0.00016771256923675537, -0.00016197934746742249, -0.0001562461256980896, -0.00015051290392875671, -0.00014477968215942383, -0.00013904646039009094, -0.00013331323862075806, -0.00012758001685142517, -0.00012184679508209229, -0.0001161135733127594, -0.00011038035154342651, -0.00010464712977409363, -9.891390800476074e-05, -9.318068623542786e-05, -8.744746446609497e-05, -8.171424269676208e-05, -7.59810209274292e-05, -7.024779915809631e-05, -6.451457738876343e-05, -5.878135561943054e-05, -5.3048133850097656e-05, -4.731491208076477e-05, -4.1581690311431885e-05, -3.5848468542099e-05, -3.0115246772766113e-05, -2.4382025003433228e-05, -1.8648803234100342e-05, -1.2915581464767456e-05, -7.18235969543457e-06, -1.4491379261016846e-06, 4.284083843231201e-06, 1.0017305612564087e-05, 1.5750527381896973e-05, 2.148374915122986e-05, 2.7216970920562744e-05, 3.295019268989563e-05, 3.8683414459228516e-05, 4.44166362285614e-05, 5.014985799789429e-05, 5.588307976722717e-05, 6.161630153656006e-05, 6.734952330589294e-05, 7.308274507522583e-05, 7.881596684455872e-05, 8.45491886138916e-05, 9.028241038322449e-05, 9.601563215255737e-05, 0.00010174885392189026, 0.00010748207569122314, 0.00011321529746055603, 0.00011894851922988892, 0.0001246817409992218, 0.0001304149627685547]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 4.0, 1.0, 3.0, 1.0, 3.0, 7.0, 3.0, 11.0, 10.0, 11.0, 15.0, 13.0, 27.0, 31.0, 53.0, 80.0, 152.0, 275.0, 495.0, 989.0, 2027.0, 4582.0, 13093.0, 51474.0, 317157.0, 540033.0, 87305.0, 19319.0, 6364.0, 2506.0, 1186.0, 545.0, 287.0, 167.0, 115.0, 74.0, 45.0, 33.0, 16.0, 9.0, 14.0, 6.0, 8.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.1888427734375, -0.18213653564453125, -0.1754302978515625, -0.16872406005859375, -0.162017822265625, -0.15531158447265625, -0.1486053466796875, -0.14189910888671875, -0.13519287109375, -0.12848663330078125, -0.1217803955078125, -0.11507415771484375, -0.108367919921875, -0.10166168212890625, -0.0949554443359375, -0.08824920654296875, -0.08154296875, -0.07483673095703125, -0.0681304931640625, -0.06142425537109375, -0.054718017578125, -0.04801177978515625, -0.0413055419921875, -0.03459930419921875, -0.02789306640625, -0.02118682861328125, -0.0144805908203125, -0.00777435302734375, -0.001068115234375, 0.00563812255859375, 0.0123443603515625, 0.01905059814453125, 0.0257568359375, 0.03246307373046875, 0.0391693115234375, 0.04587554931640625, 0.052581787109375, 0.05928802490234375, 0.0659942626953125, 0.07270050048828125, 0.07940673828125, 0.08611297607421875, 0.0928192138671875, 0.09952545166015625, 0.106231689453125, 0.11293792724609375, 0.1196441650390625, 0.12635040283203125, 0.133056640625, 0.13976287841796875, 0.1464691162109375, 0.15317535400390625, 0.159881591796875, 0.16658782958984375, 0.1732940673828125, 0.18000030517578125, 0.18670654296875, 0.19341278076171875, 0.2001190185546875, 0.20682525634765625, 0.213531494140625, 0.22023773193359375, 0.2269439697265625, 0.23365020751953125, 0.2403564453125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 2.0, 5.0, 5.0, 4.0, 7.0, 6.0, 12.0, 16.0, 25.0, 25.0, 40.0, 57.0, 59.0, 92.0, 113.0, 114.0, 102.0, 70.0, 56.0, 42.0, 38.0, 23.0, 22.0, 12.0, 9.0, 5.0, 4.0, 4.0, 2.0, 2.0, 4.0, 1.0, 4.0, 2.0, 1.0, 3.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.050262451171875, -0.04883289337158203, -0.04740333557128906, -0.045973777770996094, -0.044544219970703125, -0.043114662170410156, -0.04168510437011719, -0.04025554656982422, -0.03882598876953125, -0.03739643096923828, -0.03596687316894531, -0.034537315368652344, -0.033107757568359375, -0.031678199768066406, -0.030248641967773438, -0.02881908416748047, -0.0273895263671875, -0.02595996856689453, -0.024530410766601562, -0.023100852966308594, -0.021671295166015625, -0.020241737365722656, -0.018812179565429688, -0.01738262176513672, -0.01595306396484375, -0.014523506164550781, -0.013093948364257812, -0.011664390563964844, -0.010234832763671875, -0.008805274963378906, -0.0073757171630859375, -0.005946159362792969, -0.0045166015625, -0.0030870437622070312, -0.0016574859619140625, -0.00022792816162109375, 0.001201629638671875, 0.0026311874389648438, 0.0040607452392578125, 0.005490303039550781, 0.00691986083984375, 0.008349418640136719, 0.009778976440429688, 0.011208534240722656, 0.012638092041015625, 0.014067649841308594, 0.015497207641601562, 0.01692676544189453, 0.0183563232421875, 0.01978588104248047, 0.021215438842773438, 0.022644996643066406, 0.024074554443359375, 0.025504112243652344, 0.026933670043945312, 0.02836322784423828, 0.02979278564453125, 0.03122234344482422, 0.03265190124511719, 0.034081459045410156, 0.035511016845703125, 0.036940574645996094, 0.03837013244628906, 0.03979969024658203, 0.041229248046875]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 2.0, 4.0, 4.0, 3.0, 5.0, 9.0, 15.0, 25.0, 43.0, 64.0, 100.0, 145.0, 161.0, 140.0, 95.0, 78.0, 32.0, 27.0, 20.0, 9.0, 12.0, 4.0, 4.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8391799926757812, -1.7646205425262451, -1.690061092376709, -1.6155016422271729, -1.5409420728683472, -1.466382622718811, -1.391823172569275, -1.3172636032104492, -1.242704153060913, -1.168144702911377, -1.0935852527618408, -1.0190258026123047, -0.944466233253479, -0.8699067831039429, -0.7953473329544067, -0.7207878232002258, -0.6462284326553345, -0.5716689825057983, -0.49710947275161743, -0.4225500226020813, -0.3479905426502228, -0.27343106269836426, -0.19887161254882812, -0.12431210279464722, -0.049752652645111084, 0.02480681985616684, 0.09936629235744476, 0.1739257574081421, 0.2484852373600006, 0.32304471731185913, 0.39760416746139526, 0.47216367721557617, 0.5467231273651123, 0.6212825775146484, 0.6958420872688293, 0.7704015374183655, 0.8449610471725464, 0.9195204973220825, 0.9940799474716187, 1.0686395168304443, 1.1431989669799805, 1.2177584171295166, 1.2923178672790527, 1.3668773174285889, 1.4414368867874146, 1.5159963369369507, 1.5905557870864868, 1.6651153564453125, 1.739674687385559, 1.8142341375350952, 1.8887935876846313, 1.963353157043457, 2.037912607192993, 2.1124720573425293, 2.1870315074920654, 2.2615909576416016, 2.3361504077911377, 2.410709857940674, 2.48526930809021, 2.559828758239746, 2.6343882083892822, 2.7089476585388184, 2.7835073471069336, 2.8580667972564697, 2.932626247406006]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 2.0, 4.0, 7.0, 4.0, 12.0, 14.0, 31.0, 34.0, 40.0, 34.0, 64.0, 66.0, 74.0, 83.0, 84.0, 78.0, 71.0, 49.0, 59.0, 50.0, 41.0, 37.0, 24.0, 16.0, 9.0, 6.0, 2.0, 6.0, 2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.502951979637146, -1.4553520679473877, -1.407752275466919, -1.3601523637771606, -1.3125524520874023, -1.2649526596069336, -1.2173527479171753, -1.169752836227417, -1.1221530437469482, -1.07455313205719, -1.0269533395767212, -0.9793534278869629, -0.9317535758018494, -0.8841537237167358, -0.8365538120269775, -0.788953959941864, -0.7413540482521057, -0.6937541961669922, -0.6461542844772339, -0.5985544323921204, -0.5509545803070068, -0.5033546686172485, -0.455754816532135, -0.4081549644470215, -0.36055508255958557, -0.31295520067214966, -0.26535534858703613, -0.21775546669960022, -0.1701555997133255, -0.12255573272705078, -0.07495585083961487, -0.027355998754501343, 0.02024388313293457, 0.06784375011920929, 0.1154436245560646, 0.16304349899291992, 0.21064336597919464, 0.25824323296546936, 0.3058431148529053, 0.3534429669380188, 0.4010428488254547, 0.4486427307128906, 0.49624258279800415, 0.5438424348831177, 0.591442346572876, 0.6390421986579895, 0.686642050743103, 0.7342419624328613, 0.7818418145179749, 0.8294416666030884, 0.8770415782928467, 0.9246414303779602, 0.9722412824630737, 1.019841194152832, 1.0674409866333008, 1.115040898323059, 1.1626408100128174, 1.2102407217025757, 1.2578405141830444, 1.3054404258728027, 1.353040337562561, 1.4006401300430298, 1.448240041732788, 1.4958398342132568, 1.5434397459030151]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 0.0, 0.0, 0.0, 2.0, 6.0, 0.0, 6.0, 2.0, 5.0, 5.0, 15.0, 10.0, 18.0, 32.0, 79.0, 204.0, 708.0, 2458.0, 12271.0, 108913.0, 858027.0, 55153.0, 7930.0, 1904.0, 469.0, 171.0, 76.0, 23.0, 16.0, 9.0, 11.0, 10.0, 7.0, 5.0, 3.0, 5.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.359375, -3.248779296875, -3.13818359375, -3.027587890625, -2.9169921875, -2.806396484375, -2.69580078125, -2.585205078125, -2.474609375, -2.364013671875, -2.25341796875, -2.142822265625, -2.0322265625, -1.921630859375, -1.81103515625, -1.700439453125, -1.58984375, -1.479248046875, -1.36865234375, -1.258056640625, -1.1474609375, -1.036865234375, -0.92626953125, -0.815673828125, -0.705078125, -0.594482421875, -0.48388671875, -0.373291015625, -0.2626953125, -0.152099609375, -0.04150390625, 0.069091796875, 0.1796875, 0.290283203125, 0.40087890625, 0.511474609375, 0.6220703125, 0.732666015625, 0.84326171875, 0.953857421875, 1.064453125, 1.175048828125, 1.28564453125, 1.396240234375, 1.5068359375, 1.617431640625, 1.72802734375, 1.838623046875, 1.94921875, 2.059814453125, 2.17041015625, 2.281005859375, 2.3916015625, 2.502197265625, 2.61279296875, 2.723388671875, 2.833984375, 2.944580078125, 3.05517578125, 3.165771484375, 3.2763671875, 3.386962890625, 3.49755859375, 3.608154296875, 3.71875]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 2.0, 9.0, 10.0, 27.0, 41.0, 80.0, 107.0, 135.0, 172.0, 133.0, 123.0, 80.0, 52.0, 23.0, 12.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.041015625, -2.831756591796875, -2.62249755859375, -2.413238525390625, -2.2039794921875, -1.994720458984375, -1.78546142578125, -1.576202392578125, -1.366943359375, -1.157684326171875, -0.94842529296875, -0.739166259765625, -0.5299072265625, -0.320648193359375, -0.11138916015625, 0.097869873046875, 0.30712890625, 0.516387939453125, 0.72564697265625, 0.934906005859375, 1.1441650390625, 1.353424072265625, 1.56268310546875, 1.771942138671875, 1.981201171875, 2.190460205078125, 2.39971923828125, 2.608978271484375, 2.8182373046875, 3.027496337890625, 3.23675537109375, 3.446014404296875, 3.6552734375, 3.864532470703125, 4.07379150390625, 4.283050537109375, 4.4923095703125, 4.701568603515625, 4.91082763671875, 5.120086669921875, 5.329345703125, 5.538604736328125, 5.74786376953125, 5.957122802734375, 6.1663818359375, 6.375640869140625, 6.58489990234375, 6.794158935546875, 7.00341796875, 7.212677001953125, 7.42193603515625, 7.631195068359375, 7.8404541015625, 8.049713134765625, 8.25897216796875, 8.468231201171875, 8.677490234375, 8.886749267578125, 9.09600830078125, 9.305267333984375, 9.5145263671875, 9.723785400390625, 9.93304443359375, 10.142303466796875, 10.3515625]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 6.0, 7.0, 11.0, 13.0, 12.0, 19.0, 21.0, 34.0, 62.0, 67.0, 111.0, 156.0, 244.0, 464.0, 827.0, 1588.0, 3406.0, 8146.0, 22220.0, 83818.0, 555608.0, 294922.0, 49963.0, 15171.0, 6073.0, 2632.0, 1212.0, 705.0, 360.0, 209.0, 141.0, 108.0, 66.0, 47.0, 33.0, 18.0, 20.0, 14.0, 10.0, 6.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0810546875, -1.042205810546875, -1.00335693359375, -0.964508056640625, -0.9256591796875, -0.886810302734375, -0.84796142578125, -0.809112548828125, -0.770263671875, -0.731414794921875, -0.69256591796875, -0.653717041015625, -0.6148681640625, -0.576019287109375, -0.53717041015625, -0.498321533203125, -0.45947265625, -0.420623779296875, -0.38177490234375, -0.342926025390625, -0.3040771484375, -0.265228271484375, -0.22637939453125, -0.187530517578125, -0.148681640625, -0.109832763671875, -0.07098388671875, -0.032135009765625, 0.0067138671875, 0.045562744140625, 0.08441162109375, 0.123260498046875, 0.162109375, 0.200958251953125, 0.23980712890625, 0.278656005859375, 0.3175048828125, 0.356353759765625, 0.39520263671875, 0.434051513671875, 0.472900390625, 0.511749267578125, 0.55059814453125, 0.589447021484375, 0.6282958984375, 0.667144775390625, 0.70599365234375, 0.744842529296875, 0.78369140625, 0.822540283203125, 0.86138916015625, 0.900238037109375, 0.9390869140625, 0.977935791015625, 1.01678466796875, 1.055633544921875, 1.094482421875, 1.133331298828125, 1.17218017578125, 1.211029052734375, 1.2498779296875, 1.288726806640625, 1.32757568359375, 1.366424560546875, 1.4052734375]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0, 4.0, 3.0, 2.0, 2.0, 6.0, 5.0, 7.0, 9.0, 15.0, 8.0, 17.0, 24.0, 23.0, 20.0, 35.0, 30.0, 29.0, 33.0, 29.0, 40.0, 41.0, 36.0, 52.0, 38.0, 28.0, 40.0, 59.0, 36.0, 34.0, 29.0, 29.0, 35.0, 20.0, 27.0, 21.0, 18.0, 24.0, 24.0, 17.0, 17.0, 10.0, 3.0, 6.0, 3.0, 4.0, 7.0, 3.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0], "bins": [-2.642578125, -2.566986083984375, -2.49139404296875, -2.415802001953125, -2.3402099609375, -2.264617919921875, -2.18902587890625, -2.113433837890625, -2.037841796875, -1.962249755859375, -1.88665771484375, -1.811065673828125, -1.7354736328125, -1.659881591796875, -1.58428955078125, -1.508697509765625, -1.43310546875, -1.357513427734375, -1.28192138671875, -1.206329345703125, -1.1307373046875, -1.055145263671875, -0.97955322265625, -0.903961181640625, -0.828369140625, -0.752777099609375, -0.67718505859375, -0.601593017578125, -0.5260009765625, -0.450408935546875, -0.37481689453125, -0.299224853515625, -0.2236328125, -0.148040771484375, -0.07244873046875, 0.003143310546875, 0.0787353515625, 0.154327392578125, 0.22991943359375, 0.305511474609375, 0.381103515625, 0.456695556640625, 0.53228759765625, 0.607879638671875, 0.6834716796875, 0.759063720703125, 0.83465576171875, 0.910247802734375, 0.98583984375, 1.061431884765625, 1.13702392578125, 1.212615966796875, 1.2882080078125, 1.363800048828125, 1.43939208984375, 1.514984130859375, 1.590576171875, 1.666168212890625, 1.74176025390625, 1.817352294921875, 1.8929443359375, 1.968536376953125, 2.04412841796875, 2.119720458984375, 2.1953125]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 5.0, 2.0, 7.0, 18.0, 19.0, 45.0, 62.0, 98.0, 176.0, 285.0, 620.0, 1157.0, 2718.0, 6601.0, 19659.0, 77507.0, 488822.0, 360397.0, 62382.0, 16922.0, 6135.0, 2532.0, 1124.0, 575.0, 291.0, 170.0, 83.0, 48.0, 30.0, 24.0, 12.0, 13.0, 8.0, 1.0, 6.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.439453125, -0.42687225341796875, -0.4142913818359375, -0.40171051025390625, -0.389129638671875, -0.37654876708984375, -0.3639678955078125, -0.35138702392578125, -0.33880615234375, -0.32622528076171875, -0.3136444091796875, -0.30106353759765625, -0.288482666015625, -0.27590179443359375, -0.2633209228515625, -0.25074005126953125, -0.2381591796875, -0.22557830810546875, -0.2129974365234375, -0.20041656494140625, -0.187835693359375, -0.17525482177734375, -0.1626739501953125, -0.15009307861328125, -0.13751220703125, -0.12493133544921875, -0.1123504638671875, -0.09976959228515625, -0.087188720703125, -0.07460784912109375, -0.0620269775390625, -0.04944610595703125, -0.036865234375, -0.02428436279296875, -0.0117034912109375, 0.00087738037109375, 0.013458251953125, 0.02603912353515625, 0.0386199951171875, 0.05120086669921875, 0.06378173828125, 0.07636260986328125, 0.0889434814453125, 0.10152435302734375, 0.114105224609375, 0.12668609619140625, 0.1392669677734375, 0.15184783935546875, 0.1644287109375, 0.17700958251953125, 0.1895904541015625, 0.20217132568359375, 0.214752197265625, 0.22733306884765625, 0.2399139404296875, 0.25249481201171875, 0.26507568359375, 0.27765655517578125, 0.2902374267578125, 0.30281829833984375, 0.315399169921875, 0.32798004150390625, 0.3405609130859375, 0.35314178466796875, 0.36572265625]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 7.0, 4.0, 9.0, 10.0, 5.0, 11.0, 14.0, 19.0, 20.0, 25.0, 31.0, 48.0, 51.0, 62.0, 73.0, 111.0, 101.0, 69.0, 70.0, 44.0, 44.0, 28.0, 21.0, 35.0, 19.0, 13.0, 15.0, 5.0, 9.0, 7.0, 5.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.65648078918457e-05, -5.47775998711586e-05, -5.2990391850471497e-05, -5.120318382978439e-05, -4.941597580909729e-05, -4.762876778841019e-05, -4.5841559767723083e-05, -4.405435174703598e-05, -4.226714372634888e-05, -4.0479935705661774e-05, -3.869272768497467e-05, -3.690551966428757e-05, -3.5118311643600464e-05, -3.333110362291336e-05, -3.154389560222626e-05, -2.9756687581539154e-05, -2.796947956085205e-05, -2.6182271540164948e-05, -2.4395063519477844e-05, -2.260785549879074e-05, -2.0820647478103638e-05, -1.9033439457416534e-05, -1.724623143672943e-05, -1.5459023416042328e-05, -1.3671815395355225e-05, -1.1884607374668121e-05, -1.0097399353981018e-05, -8.310191333293915e-06, -6.5229833126068115e-06, -4.735775291919708e-06, -2.948567271232605e-06, -1.1613592505455017e-06, 6.258487701416016e-07, 2.413056790828705e-06, 4.200264811515808e-06, 5.987472832202911e-06, 7.774680852890015e-06, 9.561888873577118e-06, 1.1349096894264221e-05, 1.3136304914951324e-05, 1.4923512935638428e-05, 1.671072095632553e-05, 1.8497928977012634e-05, 2.0285136997699738e-05, 2.207234501838684e-05, 2.3859553039073944e-05, 2.5646761059761047e-05, 2.743396908044815e-05, 2.9221177101135254e-05, 3.100838512182236e-05, 3.279559314250946e-05, 3.4582801163196564e-05, 3.637000918388367e-05, 3.815721720457077e-05, 3.9944425225257874e-05, 4.173163324594498e-05, 4.351884126663208e-05, 4.530604928731918e-05, 4.709325730800629e-05, 4.888046532869339e-05, 5.066767334938049e-05, 5.2454881370067596e-05, 5.42420893907547e-05, 5.60292974114418e-05, 5.7816505432128906e-05]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 9.0, 2.0, 5.0, 6.0, 9.0, 14.0, 6.0, 20.0, 38.0, 47.0, 74.0, 113.0, 156.0, 269.0, 453.0, 856.0, 1611.0, 3320.0, 7530.0, 20338.0, 67971.0, 339945.0, 478451.0, 86259.0, 24739.0, 8637.0, 3718.0, 1726.0, 938.0, 513.0, 290.0, 170.0, 88.0, 81.0, 42.0, 22.0, 24.0, 32.0, 12.0, 9.0, 8.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3935546875, -0.38166046142578125, -0.3697662353515625, -0.35787200927734375, -0.345977783203125, -0.33408355712890625, -0.3221893310546875, -0.31029510498046875, -0.29840087890625, -0.28650665283203125, -0.2746124267578125, -0.26271820068359375, -0.250823974609375, -0.23892974853515625, -0.2270355224609375, -0.21514129638671875, -0.2032470703125, -0.19135284423828125, -0.1794586181640625, -0.16756439208984375, -0.155670166015625, -0.14377593994140625, -0.1318817138671875, -0.11998748779296875, -0.10809326171875, -0.09619903564453125, -0.0843048095703125, -0.07241058349609375, -0.060516357421875, -0.04862213134765625, -0.0367279052734375, -0.02483367919921875, -0.012939453125, -0.00104522705078125, 0.0108489990234375, 0.02274322509765625, 0.034637451171875, 0.04653167724609375, 0.0584259033203125, 0.07032012939453125, 0.08221435546875, 0.09410858154296875, 0.1060028076171875, 0.11789703369140625, 0.129791259765625, 0.14168548583984375, 0.1535797119140625, 0.16547393798828125, 0.1773681640625, 0.18926239013671875, 0.2011566162109375, 0.21305084228515625, 0.224945068359375, 0.23683929443359375, 0.2487335205078125, 0.26062774658203125, 0.27252197265625, 0.28441619873046875, 0.2963104248046875, 0.30820465087890625, 0.320098876953125, 0.33199310302734375, 0.3438873291015625, 0.35578155517578125, 0.36767578125]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 5.0, 3.0, 2.0, 3.0, 8.0, 12.0, 7.0, 7.0, 10.0, 19.0, 16.0, 19.0, 20.0, 28.0, 30.0, 37.0, 50.0, 49.0, 67.0, 98.0, 83.0, 88.0, 55.0, 59.0, 53.0, 21.0, 33.0, 16.0, 22.0, 14.0, 17.0, 12.0, 8.0, 8.0, 7.0, 4.0, 3.0, 8.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.198486328125, -0.19329071044921875, -0.1880950927734375, -0.18289947509765625, -0.177703857421875, -0.17250823974609375, -0.1673126220703125, -0.16211700439453125, -0.15692138671875, -0.15172576904296875, -0.1465301513671875, -0.14133453369140625, -0.136138916015625, -0.13094329833984375, -0.1257476806640625, -0.12055206298828125, -0.1153564453125, -0.11016082763671875, -0.1049652099609375, -0.09976959228515625, -0.094573974609375, -0.08937835693359375, -0.0841827392578125, -0.07898712158203125, -0.07379150390625, -0.06859588623046875, -0.0634002685546875, -0.05820465087890625, -0.053009033203125, -0.04781341552734375, -0.0426177978515625, -0.03742218017578125, -0.0322265625, -0.02703094482421875, -0.0218353271484375, -0.01663970947265625, -0.011444091796875, -0.00624847412109375, -0.0010528564453125, 0.00414276123046875, 0.00933837890625, 0.01453399658203125, 0.0197296142578125, 0.02492523193359375, 0.030120849609375, 0.03531646728515625, 0.0405120849609375, 0.04570770263671875, 0.0509033203125, 0.05609893798828125, 0.0612945556640625, 0.06649017333984375, 0.071685791015625, 0.07688140869140625, 0.0820770263671875, 0.08727264404296875, 0.09246826171875, 0.09766387939453125, 0.1028594970703125, 0.10805511474609375, 0.113250732421875, 0.11844635009765625, 0.1236419677734375, 0.12883758544921875, 0.134033203125]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 4.0, 15.0, 31.0, 54.0, 119.0, 247.0, 237.0, 158.0, 76.0, 35.0, 11.0, 7.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.497779130935669, -3.2514922618865967, -3.0052051544189453, -2.758918285369873, -2.5126311779022217, -2.2663443088531494, -2.020057201385498, -1.7737703323364258, -1.527483344078064, -1.2811963558197021, -1.0349093675613403, -0.7886224389076233, -0.5423354506492615, -0.29604852199554443, -0.04976153373718262, 0.1965254545211792, 0.442812442779541, 0.6890994310379028, 0.9353864192962646, 1.181673288345337, 1.4279603958129883, 1.6742472648620605, 1.9205342531204224, 2.166821241378784, 2.4131083488464355, 2.659395217895508, 2.905682325363159, 3.1519691944122314, 3.398256301879883, 3.644543170928955, 3.8908300399780273, 4.137117385864258, 4.38340425491333, 4.629691123962402, 4.875977993011475, 5.122265338897705, 5.368552207946777, 5.61483907699585, 5.861125946044922, 6.107413291931152, 6.353700160980225, 6.599987030029297, 6.846273899078369, 7.0925612449646, 7.338848114013672, 7.585134983062744, 7.831421852111816, 8.077709197998047, 8.323995590209961, 8.570282936096191, 8.816569328308105, 9.062856674194336, 9.30914306640625, 9.55543041229248, 9.801717758178711, 10.048004150390625, 10.294291496276855, 10.540578842163086, 10.786865234375, 11.03315258026123, 11.279438972473145, 11.525726318359375, 11.772013664245605, 12.01830005645752, 12.26458740234375]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 5.0, 6.0, 6.0, 8.0, 11.0, 17.0, 17.0, 27.0, 21.0, 34.0, 32.0, 36.0, 62.0, 49.0, 59.0, 56.0, 60.0, 65.0, 53.0, 56.0, 47.0, 44.0, 47.0, 39.0, 44.0, 21.0, 26.0, 20.0, 9.0, 7.0, 9.0, 8.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8459830284118652, -3.653721809387207, -3.4614603519439697, -3.2691988945007324, -3.076937675476074, -2.884676456451416, -2.6924149990081787, -2.5001535415649414, -2.307892322540283, -2.115631103515625, -1.9233696460723877, -1.73110830783844, -1.5388469696044922, -1.3465856313705444, -1.1543242931365967, -0.9620629549026489, -0.7698016166687012, -0.5775402784347534, -0.38527894020080566, -0.1930176019668579, -0.0007562637329101562, 0.1915050745010376, 0.38376641273498535, 0.5760277509689331, 0.7682890892028809, 0.9605504274368286, 1.1528117656707764, 1.3450731039047241, 1.5373344421386719, 1.7295957803726196, 1.9218571186065674, 2.1141185760498047, 2.306380271911621, 2.4986414909362793, 2.6909029483795166, 2.883164405822754, 3.075425624847412, 3.2676868438720703, 3.4599483013153076, 3.652209758758545, 3.844470977783203, 4.036732196807861, 4.2289934158325195, 4.421255111694336, 4.613516330718994, 4.805777549743652, 4.998039245605469, 5.190300464630127, 5.382561683654785, 5.574822902679443, 5.767084121704102, 5.959345817565918, 6.151607036590576, 6.343868255615234, 6.536129951477051, 6.728391170501709, 6.920652389526367, 7.112913608551025, 7.305174827575684, 7.4974365234375, 7.689697742462158, 7.881958961486816, 8.074220657348633, 8.266481399536133, 8.45874309539795]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 8.0, 12.0, 11.0, 17.0, 36.0, 39.0, 69.0, 118.0, 181.0, 352.0, 756.0, 1607.0, 4206.0, 14582.0, 103196.0, 3074763.0, 935093.0, 44889.0, 9003.0, 2891.0, 1174.0, 575.0, 288.0, 153.0, 94.0, 52.0, 41.0, 18.0, 17.0, 12.0, 8.0, 5.0, 5.0, 3.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0], "bins": [-3.611328125, -3.5206298828125, -3.429931640625, -3.3392333984375, -3.24853515625, -3.1578369140625, -3.067138671875, -2.9764404296875, -2.8857421875, -2.7950439453125, -2.704345703125, -2.6136474609375, -2.52294921875, -2.4322509765625, -2.341552734375, -2.2508544921875, -2.16015625, -2.0694580078125, -1.978759765625, -1.8880615234375, -1.79736328125, -1.7066650390625, -1.615966796875, -1.5252685546875, -1.4345703125, -1.3438720703125, -1.253173828125, -1.1624755859375, -1.07177734375, -0.9810791015625, -0.890380859375, -0.7996826171875, -0.708984375, -0.6182861328125, -0.527587890625, -0.4368896484375, -0.34619140625, -0.2554931640625, -0.164794921875, -0.0740966796875, 0.0166015625, 0.1072998046875, 0.197998046875, 0.2886962890625, 0.37939453125, 0.4700927734375, 0.560791015625, 0.6514892578125, 0.7421875, 0.8328857421875, 0.923583984375, 1.0142822265625, 1.10498046875, 1.1956787109375, 1.286376953125, 1.3770751953125, 1.4677734375, 1.5584716796875, 1.649169921875, 1.7398681640625, 1.83056640625, 1.9212646484375, 2.011962890625, 2.1026611328125, 2.193359375]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 5.0, 5.0, 7.0, 12.0, 6.0, 20.0, 20.0, 31.0, 27.0, 39.0, 50.0, 53.0, 44.0, 63.0, 75.0, 69.0, 59.0, 73.0, 65.0, 39.0, 45.0, 43.0, 37.0, 18.0, 20.0, 20.0, 18.0, 14.0, 10.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6484375, -1.60113525390625, -1.5538330078125, -1.50653076171875, -1.459228515625, -1.41192626953125, -1.3646240234375, -1.31732177734375, -1.27001953125, -1.22271728515625, -1.1754150390625, -1.12811279296875, -1.080810546875, -1.03350830078125, -0.9862060546875, -0.93890380859375, -0.8916015625, -0.84429931640625, -0.7969970703125, -0.74969482421875, -0.702392578125, -0.65509033203125, -0.6077880859375, -0.56048583984375, -0.51318359375, -0.46588134765625, -0.4185791015625, -0.37127685546875, -0.323974609375, -0.27667236328125, -0.2293701171875, -0.18206787109375, -0.134765625, -0.08746337890625, -0.0401611328125, 0.00714111328125, 0.054443359375, 0.10174560546875, 0.1490478515625, 0.19635009765625, 0.24365234375, 0.29095458984375, 0.3382568359375, 0.38555908203125, 0.432861328125, 0.48016357421875, 0.5274658203125, 0.57476806640625, 0.6220703125, 0.66937255859375, 0.7166748046875, 0.76397705078125, 0.811279296875, 0.85858154296875, 0.9058837890625, 0.95318603515625, 1.00048828125, 1.04779052734375, 1.0950927734375, 1.14239501953125, 1.189697265625, 1.23699951171875, 1.2843017578125, 1.33160400390625, 1.37890625]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 2.0, 0.0, 3.0, 2.0, 5.0, 2.0, 12.0, 14.0, 23.0, 32.0, 36.0, 57.0, 123.0, 207.0, 447.0, 1093.0, 3234.0, 13862.0, 114244.0, 3648474.0, 377380.0, 27069.0, 5233.0, 1580.0, 552.0, 239.0, 122.0, 75.0, 47.0, 36.0, 28.0, 15.0, 10.0, 10.0, 5.0, 5.0, 5.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.36328125, -2.283660888671875, -2.20404052734375, -2.124420166015625, -2.0447998046875, -1.965179443359375, -1.88555908203125, -1.805938720703125, -1.726318359375, -1.646697998046875, -1.56707763671875, -1.487457275390625, -1.4078369140625, -1.328216552734375, -1.24859619140625, -1.168975830078125, -1.08935546875, -1.009735107421875, -0.93011474609375, -0.850494384765625, -0.7708740234375, -0.691253662109375, -0.61163330078125, -0.532012939453125, -0.452392578125, -0.372772216796875, -0.29315185546875, -0.213531494140625, -0.1339111328125, -0.054290771484375, 0.02532958984375, 0.104949951171875, 0.1845703125, 0.264190673828125, 0.34381103515625, 0.423431396484375, 0.5030517578125, 0.582672119140625, 0.66229248046875, 0.741912841796875, 0.821533203125, 0.901153564453125, 0.98077392578125, 1.060394287109375, 1.1400146484375, 1.219635009765625, 1.29925537109375, 1.378875732421875, 1.45849609375, 1.538116455078125, 1.61773681640625, 1.697357177734375, 1.7769775390625, 1.856597900390625, 1.93621826171875, 2.015838623046875, 2.095458984375, 2.175079345703125, 2.25469970703125, 2.334320068359375, 2.4139404296875, 2.493560791015625, 2.57318115234375, 2.652801513671875, 2.732421875]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 4.0, 3.0, 4.0, 11.0, 8.0, 13.0, 15.0, 22.0, 28.0, 25.0, 50.0, 42.0, 86.0, 145.0, 240.0, 388.0, 523.0, 725.0, 571.0, 387.0, 250.0, 151.0, 103.0, 80.0, 49.0, 37.0, 32.0, 22.0, 11.0, 6.0, 9.0, 8.0, 7.0, 8.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.443115234375, -0.4290924072265625, -0.415069580078125, -0.4010467529296875, -0.38702392578125, -0.3730010986328125, -0.358978271484375, -0.3449554443359375, -0.3309326171875, -0.3169097900390625, -0.302886962890625, -0.2888641357421875, -0.27484130859375, -0.2608184814453125, -0.246795654296875, -0.2327728271484375, -0.21875, -0.2047271728515625, -0.190704345703125, -0.1766815185546875, -0.16265869140625, -0.1486358642578125, -0.134613037109375, -0.1205902099609375, -0.1065673828125, -0.0925445556640625, -0.078521728515625, -0.0644989013671875, -0.05047607421875, -0.0364532470703125, -0.022430419921875, -0.0084075927734375, 0.005615234375, 0.0196380615234375, 0.033660888671875, 0.0476837158203125, 0.06170654296875, 0.0757293701171875, 0.089752197265625, 0.1037750244140625, 0.1177978515625, 0.1318206787109375, 0.145843505859375, 0.1598663330078125, 0.17388916015625, 0.1879119873046875, 0.201934814453125, 0.2159576416015625, 0.22998046875, 0.2440032958984375, 0.258026123046875, 0.2720489501953125, 0.28607177734375, 0.3000946044921875, 0.314117431640625, 0.3281402587890625, 0.3421630859375, 0.3561859130859375, 0.370208740234375, 0.3842315673828125, 0.39825439453125, 0.4122772216796875, 0.426300048828125, 0.4403228759765625, 0.454345703125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 3.0, 4.0, 6.0, 9.0, 14.0, 16.0, 21.0, 41.0, 52.0, 101.0, 115.0, 136.0, 134.0, 104.0, 87.0, 55.0, 39.0, 24.0, 9.0, 10.0, 4.0, 14.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1852829456329346, -2.0978095531463623, -2.01033616065979, -1.9228627681732178, -1.8353893756866455, -1.7479159832000732, -1.660442590713501, -1.5729691982269287, -1.4854958057403564, -1.3980224132537842, -1.310549020767212, -1.2230756282806396, -1.1356022357940674, -1.0481288433074951, -0.9606554508209229, -0.8731820583343506, -0.7857086658477783, -0.698235273361206, -0.6107618808746338, -0.5232884883880615, -0.43581509590148926, -0.348341703414917, -0.2608683109283447, -0.17339491844177246, -0.0859215259552002, 0.0015518665313720703, 0.08902525901794434, 0.1764986515045166, 0.26397204399108887, 0.35144543647766113, 0.4389188289642334, 0.5263922214508057, 0.613865852355957, 0.7013392448425293, 0.7888126373291016, 0.8762860298156738, 0.9637594223022461, 1.0512328147888184, 1.1387062072753906, 1.226179599761963, 1.3136529922485352, 1.4011263847351074, 1.4885997772216797, 1.576073169708252, 1.6635465621948242, 1.7510199546813965, 1.8384933471679688, 1.925966739654541, 2.0134401321411133, 2.1009135246276855, 2.188386917114258, 2.27586030960083, 2.3633337020874023, 2.4508070945739746, 2.538280487060547, 2.625753879547119, 2.7132272720336914, 2.8007006645202637, 2.888174057006836, 2.975647449493408, 3.0631208419799805, 3.1505942344665527, 3.238067626953125, 3.3255410194396973, 3.4130144119262695]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 5.0, 3.0, 11.0, 7.0, 8.0, 18.0, 10.0, 26.0, 24.0, 29.0, 36.0, 38.0, 24.0, 43.0, 56.0, 57.0, 46.0, 59.0, 40.0, 48.0, 48.0, 41.0, 37.0, 44.0, 37.0, 26.0, 29.0, 24.0, 27.0, 16.0, 17.0, 14.0, 15.0, 15.0, 3.0, 4.0, 8.0, 2.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.3523730039596558, -1.3117446899414062, -1.2711163759231567, -1.2304879426956177, -1.1898596286773682, -1.1492313146591187, -1.1086030006408691, -1.0679746866226196, -1.0273463726043701, -0.9867180585861206, -0.9460896849632263, -0.9054613709449768, -0.8648329973220825, -0.824204683303833, -0.7835763692855835, -0.742948055267334, -0.7023196220397949, -0.6616913080215454, -0.6210629343986511, -0.5804346203804016, -0.5398062467575073, -0.4991779327392578, -0.4585496187210083, -0.4179212749004364, -0.3772929310798645, -0.3366645872592926, -0.2960362434387207, -0.2554079294204712, -0.2147795855998993, -0.1741512417793274, -0.1335229128599167, -0.09289458394050598, -0.05226635932922363, -0.01163802295923233, 0.028990313410758972, 0.06961864978075027, 0.11024698615074158, 0.15087532997131348, 0.19150365889072418, 0.2321319878101349, 0.2727603316307068, 0.3133886754512787, 0.3540170192718506, 0.3946453332901001, 0.435273677110672, 0.4759020209312439, 0.5165303349494934, 0.5571587085723877, 0.5977870225906372, 0.6384153366088867, 0.679043710231781, 0.7196720242500305, 0.7603003978729248, 0.8009287118911743, 0.8415570259094238, 0.8821853399276733, 0.9228137135505676, 0.9634420275688171, 1.0040704011917114, 1.044698715209961, 1.0853270292282104, 1.12595534324646, 1.166583776473999, 1.2072120904922485, 1.247840404510498]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 6.0, 8.0, 8.0, 13.0, 27.0, 21.0, 35.0, 63.0, 84.0, 115.0, 199.0, 310.0, 516.0, 844.0, 1541.0, 3024.0, 5860.0, 13115.0, 32608.0, 95155.0, 319319.0, 383681.0, 121927.0, 39583.0, 15771.0, 7062.0, 3401.0, 1795.0, 928.0, 552.0, 350.0, 195.0, 161.0, 102.0, 57.0, 33.0, 29.0, 20.0, 8.0, 7.0, 6.0, 9.0, 5.0, 5.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2489013671875, -0.2411479949951172, -0.23339462280273438, -0.22564125061035156, -0.21788787841796875, -0.21013450622558594, -0.20238113403320312, -0.1946277618408203, -0.1868743896484375, -0.1791210174560547, -0.17136764526367188, -0.16361427307128906, -0.15586090087890625, -0.14810752868652344, -0.14035415649414062, -0.1326007843017578, -0.124847412109375, -0.11709403991699219, -0.10934066772460938, -0.10158729553222656, -0.09383392333984375, -0.08608055114746094, -0.07832717895507812, -0.07057380676269531, -0.0628204345703125, -0.05506706237792969, -0.047313690185546875, -0.03956031799316406, -0.03180694580078125, -0.024053573608398438, -0.016300201416015625, -0.008546829223632812, -0.00079345703125, 0.0069599151611328125, 0.014713287353515625, 0.022466659545898438, 0.03022003173828125, 0.03797340393066406, 0.045726776123046875, 0.05348014831542969, 0.0612335205078125, 0.06898689270019531, 0.07674026489257812, 0.08449363708496094, 0.09224700927734375, 0.10000038146972656, 0.10775375366210938, 0.11550712585449219, 0.123260498046875, 0.1310138702392578, 0.13876724243164062, 0.14652061462402344, 0.15427398681640625, 0.16202735900878906, 0.16978073120117188, 0.1775341033935547, 0.1852874755859375, 0.1930408477783203, 0.20079421997070312, 0.20854759216308594, 0.21630096435546875, 0.22405433654785156, 0.23180770874023438, 0.2395610809326172, 0.247314453125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 4.0, 5.0, 3.0, 6.0, 8.0, 11.0, 20.0, 26.0, 23.0, 39.0, 44.0, 42.0, 55.0, 59.0, 56.0, 63.0, 79.0, 67.0, 67.0, 48.0, 49.0, 35.0, 36.0, 29.0, 23.0, 28.0, 20.0, 14.0, 8.0, 6.0, 12.0, 9.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.1728515625, -1.139801025390625, -1.10675048828125, -1.073699951171875, -1.0406494140625, -1.007598876953125, -0.97454833984375, -0.941497802734375, -0.908447265625, -0.875396728515625, -0.84234619140625, -0.809295654296875, -0.7762451171875, -0.743194580078125, -0.71014404296875, -0.677093505859375, -0.64404296875, -0.610992431640625, -0.57794189453125, -0.544891357421875, -0.5118408203125, -0.478790283203125, -0.44573974609375, -0.412689208984375, -0.379638671875, -0.346588134765625, -0.31353759765625, -0.280487060546875, -0.2474365234375, -0.214385986328125, -0.18133544921875, -0.148284912109375, -0.115234375, -0.082183837890625, -0.04913330078125, -0.016082763671875, 0.0169677734375, 0.050018310546875, 0.08306884765625, 0.116119384765625, 0.149169921875, 0.182220458984375, 0.21527099609375, 0.248321533203125, 0.2813720703125, 0.314422607421875, 0.34747314453125, 0.380523681640625, 0.41357421875, 0.446624755859375, 0.47967529296875, 0.512725830078125, 0.5457763671875, 0.578826904296875, 0.61187744140625, 0.644927978515625, 0.677978515625, 0.711029052734375, 0.74407958984375, 0.777130126953125, 0.8101806640625, 0.843231201171875, 0.87628173828125, 0.909332275390625, 0.9423828125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 5.0, 4.0, 9.0, 14.0, 15.0, 20.0, 21.0, 30.0, 54.0, 90.0, 149.0, 262.0, 488.0, 1104.0, 2958.0, 8916.0, 37795.0, 247705.0, 602685.0, 116012.0, 20780.0, 5643.0, 2047.0, 827.0, 385.0, 221.0, 103.0, 74.0, 46.0, 24.0, 17.0, 18.0, 16.0, 6.0, 3.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29296875, -0.2818336486816406, -0.27069854736328125, -0.2595634460449219, -0.2484283447265625, -0.23729324340820312, -0.22615814208984375, -0.21502304077148438, -0.203887939453125, -0.19275283813476562, -0.18161773681640625, -0.17048263549804688, -0.1593475341796875, -0.14821243286132812, -0.13707733154296875, -0.12594223022460938, -0.11480712890625, -0.10367202758789062, -0.09253692626953125, -0.08140182495117188, -0.0702667236328125, -0.059131622314453125, -0.04799652099609375, -0.036861419677734375, -0.025726318359375, -0.014591217041015625, -0.00345611572265625, 0.007678985595703125, 0.0188140869140625, 0.029949188232421875, 0.04108428955078125, 0.052219390869140625, 0.0633544921875, 0.07448959350585938, 0.08562469482421875, 0.09675979614257812, 0.1078948974609375, 0.11902999877929688, 0.13016510009765625, 0.14130020141601562, 0.152435302734375, 0.16357040405273438, 0.17470550537109375, 0.18584060668945312, 0.1969757080078125, 0.20811080932617188, 0.21924591064453125, 0.23038101196289062, 0.24151611328125, 0.2526512145996094, 0.26378631591796875, 0.2749214172363281, 0.2860565185546875, 0.2971916198730469, 0.30832672119140625, 0.3194618225097656, 0.330596923828125, 0.3417320251464844, 0.35286712646484375, 0.3640022277832031, 0.3751373291015625, 0.3862724304199219, 0.39740753173828125, 0.4085426330566406, 0.419677734375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 1.0, 0.0, 4.0, 2.0, 5.0, 4.0, 14.0, 13.0, 11.0, 12.0, 19.0, 22.0, 21.0, 21.0, 20.0, 27.0, 28.0, 27.0, 39.0, 45.0, 46.0, 42.0, 40.0, 43.0, 55.0, 47.0, 49.0, 38.0, 25.0, 40.0, 29.0, 37.0, 23.0, 24.0, 21.0, 14.0, 16.0, 16.0, 15.0, 13.0, 7.0, 7.0, 6.0, 2.0, 6.0, 2.0, 1.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.458984375, -1.4101104736328125, -1.361236572265625, -1.3123626708984375, -1.26348876953125, -1.2146148681640625, -1.165740966796875, -1.1168670654296875, -1.0679931640625, -1.0191192626953125, -0.970245361328125, -0.9213714599609375, -0.87249755859375, -0.8236236572265625, -0.774749755859375, -0.7258758544921875, -0.677001953125, -0.6281280517578125, -0.579254150390625, -0.5303802490234375, -0.48150634765625, -0.4326324462890625, -0.383758544921875, -0.3348846435546875, -0.2860107421875, -0.2371368408203125, -0.188262939453125, -0.1393890380859375, -0.09051513671875, -0.0416412353515625, 0.007232666015625, 0.0561065673828125, 0.10498046875, 0.1538543701171875, 0.202728271484375, 0.2516021728515625, 0.30047607421875, 0.3493499755859375, 0.398223876953125, 0.4470977783203125, 0.4959716796875, 0.5448455810546875, 0.593719482421875, 0.6425933837890625, 0.69146728515625, 0.7403411865234375, 0.789215087890625, 0.8380889892578125, 0.886962890625, 0.9358367919921875, 0.984710693359375, 1.0335845947265625, 1.08245849609375, 1.1313323974609375, 1.180206298828125, 1.2290802001953125, 1.2779541015625, 1.3268280029296875, 1.375701904296875, 1.4245758056640625, 1.47344970703125, 1.5223236083984375, 1.571197509765625, 1.6200714111328125, 1.6689453125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 1.0, 9.0, 7.0, 16.0, 11.0, 16.0, 21.0, 46.0, 60.0, 79.0, 148.0, 234.0, 394.0, 789.0, 1757.0, 4109.0, 11055.0, 37419.0, 201121.0, 628308.0, 121364.0, 26817.0, 8552.0, 3251.0, 1370.0, 616.0, 348.0, 223.0, 157.0, 77.0, 53.0, 41.0, 24.0, 17.0, 14.0, 5.0, 14.0, 4.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.1529541015625, -0.14886093139648438, -0.14476776123046875, -0.14067459106445312, -0.1365814208984375, -0.13248825073242188, -0.12839508056640625, -0.12430191040039062, -0.120208740234375, -0.11611557006835938, -0.11202239990234375, -0.10792922973632812, -0.1038360595703125, -0.09974288940429688, -0.09564971923828125, -0.09155654907226562, -0.08746337890625, -0.08337020874023438, -0.07927703857421875, -0.07518386840820312, -0.0710906982421875, -0.06699752807617188, -0.06290435791015625, -0.058811187744140625, -0.054718017578125, -0.050624847412109375, -0.04653167724609375, -0.042438507080078125, -0.0383453369140625, -0.034252166748046875, -0.03015899658203125, -0.026065826416015625, -0.02197265625, -0.017879486083984375, -0.01378631591796875, -0.009693145751953125, -0.0055999755859375, -0.001506805419921875, 0.00258636474609375, 0.006679534912109375, 0.010772705078125, 0.014865875244140625, 0.01895904541015625, 0.023052215576171875, 0.0271453857421875, 0.031238555908203125, 0.03533172607421875, 0.039424896240234375, 0.04351806640625, 0.047611236572265625, 0.05170440673828125, 0.055797576904296875, 0.0598907470703125, 0.06398391723632812, 0.06807708740234375, 0.07217025756835938, 0.076263427734375, 0.08035659790039062, 0.08444976806640625, 0.08854293823242188, 0.0926361083984375, 0.09672927856445312, 0.10082244873046875, 0.10491561889648438, 0.1090087890625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 6.0, 8.0, 11.0, 9.0, 8.0, 17.0, 23.0, 38.0, 38.0, 67.0, 64.0, 85.0, 92.0, 86.0, 93.0, 75.0, 55.0, 36.0, 51.0, 26.0, 18.0, 15.0, 9.0, 12.0, 12.0, 10.0, 2.0, 9.0, 3.0, 6.0, 2.0, 2.0, 3.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.181001663208008e-05, -6.0074031352996826e-05, -5.8338046073913574e-05, -5.660206079483032e-05, -5.486607551574707e-05, -5.313009023666382e-05, -5.1394104957580566e-05, -4.9658119678497314e-05, -4.792213439941406e-05, -4.618614912033081e-05, -4.445016384124756e-05, -4.271417856216431e-05, -4.0978193283081055e-05, -3.92422080039978e-05, -3.750622272491455e-05, -3.57702374458313e-05, -3.403425216674805e-05, -3.2298266887664795e-05, -3.056228160858154e-05, -2.882629632949829e-05, -2.709031105041504e-05, -2.5354325771331787e-05, -2.3618340492248535e-05, -2.1882355213165283e-05, -2.014636993408203e-05, -1.841038465499878e-05, -1.6674399375915527e-05, -1.4938414096832275e-05, -1.3202428817749023e-05, -1.1466443538665771e-05, -9.73045825958252e-06, -7.994472980499268e-06, -6.258487701416016e-06, -4.522502422332764e-06, -2.7865171432495117e-06, -1.0505318641662598e-06, 6.854534149169922e-07, 2.421438694000244e-06, 4.157423973083496e-06, 5.893409252166748e-06, 7.62939453125e-06, 9.365379810333252e-06, 1.1101365089416504e-05, 1.2837350368499756e-05, 1.4573335647583008e-05, 1.630932092666626e-05, 1.8045306205749512e-05, 1.9781291484832764e-05, 2.1517276763916016e-05, 2.3253262042999268e-05, 2.498924732208252e-05, 2.672523260116577e-05, 2.8461217880249023e-05, 3.0197203159332275e-05, 3.193318843841553e-05, 3.366917371749878e-05, 3.540515899658203e-05, 3.714114427566528e-05, 3.8877129554748535e-05, 4.061311483383179e-05, 4.234910011291504e-05, 4.408508539199829e-05, 4.582107067108154e-05, 4.7557055950164795e-05, 4.929304122924805e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 3.0, 4.0, 3.0, 6.0, 5.0, 8.0, 9.0, 20.0, 16.0, 17.0, 43.0, 62.0, 85.0, 153.0, 261.0, 410.0, 832.0, 1737.0, 3916.0, 10194.0, 29664.0, 108700.0, 481778.0, 309306.0, 68145.0, 20133.0, 7144.0, 3019.0, 1309.0, 644.0, 328.0, 197.0, 134.0, 84.0, 43.0, 43.0, 28.0, 19.0, 17.0, 9.0, 13.0, 8.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.11602783203125, -0.11238288879394531, -0.10873794555664062, -0.10509300231933594, -0.10144805908203125, -0.09780311584472656, -0.09415817260742188, -0.09051322937011719, -0.0868682861328125, -0.08322334289550781, -0.07957839965820312, -0.07593345642089844, -0.07228851318359375, -0.06864356994628906, -0.06499862670898438, -0.06135368347167969, -0.057708740234375, -0.05406379699707031, -0.050418853759765625, -0.04677391052246094, -0.04312896728515625, -0.03948402404785156, -0.035839080810546875, -0.03219413757324219, -0.0285491943359375, -0.024904251098632812, -0.021259307861328125, -0.017614364624023438, -0.01396942138671875, -0.010324478149414062, -0.006679534912109375, -0.0030345916748046875, 0.0006103515625, 0.0042552947998046875, 0.007900238037109375, 0.011545181274414062, 0.01519012451171875, 0.018835067749023438, 0.022480010986328125, 0.026124954223632812, 0.0297698974609375, 0.03341484069824219, 0.037059783935546875, 0.04070472717285156, 0.04434967041015625, 0.04799461364746094, 0.051639556884765625, 0.05528450012207031, 0.058929443359375, 0.06257438659667969, 0.06621932983398438, 0.06986427307128906, 0.07350921630859375, 0.07715415954589844, 0.08079910278320312, 0.08444404602050781, 0.0880889892578125, 0.09173393249511719, 0.09537887573242188, 0.09902381896972656, 0.10266876220703125, 0.10631370544433594, 0.10995864868164062, 0.11360359191894531, 0.11724853515625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 1.0, 1.0, 2.0, 5.0, 5.0, 7.0, 6.0, 6.0, 10.0, 6.0, 13.0, 18.0, 19.0, 31.0, 19.0, 38.0, 46.0, 60.0, 83.0, 86.0, 80.0, 83.0, 75.0, 70.0, 43.0, 39.0, 33.0, 24.0, 24.0, 11.0, 12.0, 14.0, 10.0, 7.0, 9.0, 3.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.024871826171875, -0.02405571937561035, -0.023239612579345703, -0.022423505783081055, -0.021607398986816406, -0.020791292190551758, -0.01997518539428711, -0.01915907859802246, -0.018342971801757812, -0.017526865005493164, -0.016710758209228516, -0.015894651412963867, -0.015078544616699219, -0.01426243782043457, -0.013446331024169922, -0.012630224227905273, -0.011814117431640625, -0.010998010635375977, -0.010181903839111328, -0.00936579704284668, -0.008549690246582031, -0.007733583450317383, -0.006917476654052734, -0.006101369857788086, -0.0052852630615234375, -0.004469156265258789, -0.0036530494689941406, -0.002836942672729492, -0.0020208358764648438, -0.0012047290802001953, -0.0003886222839355469, 0.00042748451232910156, 0.00124359130859375, 0.0020596981048583984, 0.002875804901123047, 0.0036919116973876953, 0.004508018493652344, 0.005324125289916992, 0.006140232086181641, 0.006956338882446289, 0.0077724456787109375, 0.008588552474975586, 0.009404659271240234, 0.010220766067504883, 0.011036872863769531, 0.01185297966003418, 0.012669086456298828, 0.013485193252563477, 0.014301300048828125, 0.015117406845092773, 0.015933513641357422, 0.01674962043762207, 0.01756572723388672, 0.018381834030151367, 0.019197940826416016, 0.020014047622680664, 0.020830154418945312, 0.02164626121520996, 0.02246236801147461, 0.023278474807739258, 0.024094581604003906, 0.024910688400268555, 0.025726795196533203, 0.02654290199279785, 0.0273590087890625]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 1.0, 5.0, 8.0, 9.0, 10.0, 26.0, 41.0, 83.0, 141.0, 187.0, 186.0, 121.0, 77.0, 44.0, 25.0, 9.0, 12.0, 12.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5356738567352295, -1.4625478982925415, -1.3894219398498535, -1.3162959814071655, -1.2431700229644775, -1.1700440645217896, -1.0969181060791016, -1.0237921476364136, -0.9506661891937256, -0.8775402307510376, -0.8044142723083496, -0.7312883138656616, -0.6581623554229736, -0.5850363969802856, -0.5119104385375977, -0.43878448009490967, -0.3656585216522217, -0.2925325632095337, -0.2194066047668457, -0.14628064632415771, -0.07315468788146973, -2.872943878173828e-05, 0.07309722900390625, 0.14622318744659424, 0.21934914588928223, 0.2924751043319702, 0.3656010627746582, 0.4387270212173462, 0.5118529796600342, 0.5849789381027222, 0.6581048965454102, 0.7312308549880981, 0.8043568134307861, 0.8774827718734741, 0.9506087303161621, 1.02373468875885, 1.096860647201538, 1.169986605644226, 1.243112564086914, 1.316238522529602, 1.38936448097229, 1.462490439414978, 1.535616397857666, 1.608742356300354, 1.681868314743042, 1.75499427318573, 1.828120231628418, 1.901246190071106, 1.974372148513794, 2.0474982261657715, 2.12062406539917, 2.1937499046325684, 2.266875982284546, 2.3400020599365234, 2.413127899169922, 2.4862537384033203, 2.559379816055298, 2.6325058937072754, 2.705631732940674, 2.7787575721740723, 2.85188364982605, 2.9250097274780273, 2.998135566711426, 3.071261405944824, 3.1443874835968018]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 5.0, 9.0, 5.0, 8.0, 12.0, 23.0, 25.0, 35.0, 40.0, 48.0, 39.0, 74.0, 60.0, 57.0, 70.0, 54.0, 60.0, 59.0, 57.0, 54.0, 38.0, 31.0, 21.0, 30.0, 20.0, 13.0, 16.0, 11.0, 10.0, 4.0, 4.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.024644374847412, -0.9926322102546692, -0.9606200456619263, -0.9286079406738281, -0.8965957760810852, -0.8645836114883423, -0.8325715065002441, -0.8005593419075012, -0.7685471773147583, -0.7365350127220154, -0.7045228481292725, -0.6725107431411743, -0.6404985785484314, -0.6084864139556885, -0.5764743089675903, -0.5444621443748474, -0.5124499797821045, -0.4804378151893616, -0.44842568039894104, -0.4164135456085205, -0.3844013810157776, -0.35238921642303467, -0.32037708163261414, -0.2883649468421936, -0.2563527822494507, -0.22434063255786896, -0.19232848286628723, -0.1603163331747055, -0.12830418348312378, -0.09629203379154205, -0.06427988409996033, -0.0322677344083786, -0.0002557039260864258, 0.0317564457654953, 0.06376859545707703, 0.09578074514865875, 0.12779289484024048, 0.1598050445318222, 0.19181719422340393, 0.22382934391498566, 0.2558414936065674, 0.2878536581993103, 0.31986579298973083, 0.35187792778015137, 0.3838900923728943, 0.4159022569656372, 0.44791439175605774, 0.47992652654647827, 0.5119386911392212, 0.5439508557319641, 0.575963020324707, 0.6079751253128052, 0.6399872899055481, 0.671999454498291, 0.7040115594863892, 0.7360237240791321, 0.768035888671875, 0.8000480532646179, 0.8320602178573608, 0.864072322845459, 0.8960844874382019, 0.9280966520309448, 0.960108757019043, 0.9921209216117859, 1.0241330862045288]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 1.0, 2.0, 7.0, 13.0, 17.0, 19.0, 36.0, 46.0, 85.0, 136.0, 272.0, 434.0, 786.0, 1714.0, 3623.0, 8689.0, 23676.0, 86117.0, 513110.0, 321308.0, 58050.0, 17598.0, 6868.0, 2927.0, 1404.0, 727.0, 370.0, 195.0, 128.0, 83.0, 40.0, 29.0, 17.0, 10.0, 6.0, 6.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.1025390625, -1.0709152221679688, -1.0392913818359375, -1.0076675415039062, -0.976043701171875, -0.9444198608398438, -0.9127960205078125, -0.8811721801757812, -0.84954833984375, -0.8179244995117188, -0.7863006591796875, -0.7546768188476562, -0.723052978515625, -0.6914291381835938, -0.6598052978515625, -0.6281814575195312, -0.5965576171875, -0.5649337768554688, -0.5333099365234375, -0.5016860961914062, -0.470062255859375, -0.43843841552734375, -0.4068145751953125, -0.37519073486328125, -0.34356689453125, -0.31194305419921875, -0.2803192138671875, -0.24869537353515625, -0.217071533203125, -0.18544769287109375, -0.1538238525390625, -0.12220001220703125, -0.090576171875, -0.05895233154296875, -0.0273284912109375, 0.00429534912109375, 0.035919189453125, 0.06754302978515625, 0.0991668701171875, 0.13079071044921875, 0.16241455078125, 0.19403839111328125, 0.2256622314453125, 0.25728607177734375, 0.288909912109375, 0.32053375244140625, 0.3521575927734375, 0.38378143310546875, 0.4154052734375, 0.44702911376953125, 0.4786529541015625, 0.5102767944335938, 0.541900634765625, 0.5735244750976562, 0.6051483154296875, 0.6367721557617188, 0.66839599609375, 0.7000198364257812, 0.7316436767578125, 0.7632675170898438, 0.794891357421875, 0.8265151977539062, 0.8581390380859375, 0.8897628784179688, 0.92138671875]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 6.0, 1.0, 5.0, 2.0, 4.0, 9.0, 7.0, 9.0, 14.0, 24.0, 26.0, 28.0, 44.0, 48.0, 51.0, 64.0, 60.0, 55.0, 76.0, 59.0, 66.0, 61.0, 52.0, 33.0, 41.0, 28.0, 28.0, 30.0, 14.0, 12.0, 10.0, 12.0, 9.0, 5.0, 3.0, 5.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.73046875, -2.6517333984375, -2.572998046875, -2.4942626953125, -2.41552734375, -2.3367919921875, -2.258056640625, -2.1793212890625, -2.1005859375, -2.0218505859375, -1.943115234375, -1.8643798828125, -1.78564453125, -1.7069091796875, -1.628173828125, -1.5494384765625, -1.470703125, -1.3919677734375, -1.313232421875, -1.2344970703125, -1.15576171875, -1.0770263671875, -0.998291015625, -0.9195556640625, -0.8408203125, -0.7620849609375, -0.683349609375, -0.6046142578125, -0.52587890625, -0.4471435546875, -0.368408203125, -0.2896728515625, -0.2109375, -0.1322021484375, -0.053466796875, 0.0252685546875, 0.10400390625, 0.1827392578125, 0.261474609375, 0.3402099609375, 0.4189453125, 0.4976806640625, 0.576416015625, 0.6551513671875, 0.73388671875, 0.8126220703125, 0.891357421875, 0.9700927734375, 1.048828125, 1.1275634765625, 1.206298828125, 1.2850341796875, 1.36376953125, 1.4425048828125, 1.521240234375, 1.5999755859375, 1.6787109375, 1.7574462890625, 1.836181640625, 1.9149169921875, 1.99365234375, 2.0723876953125, 2.151123046875, 2.2298583984375, 2.30859375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 11.0, 2.0, 12.0, 11.0, 19.0, 25.0, 29.0, 51.0, 41.0, 64.0, 115.0, 138.0, 197.0, 343.0, 609.0, 1165.0, 2873.0, 8387.0, 32756.0, 187994.0, 650182.0, 127617.0, 24215.0, 6823.0, 2364.0, 970.0, 549.0, 309.0, 195.0, 116.0, 97.0, 79.0, 48.0, 35.0, 24.0, 15.0, 17.0, 18.0, 19.0, 12.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.88671875, -0.8584823608398438, -0.8302459716796875, -0.8020095825195312, -0.773773193359375, -0.7455368041992188, -0.7173004150390625, -0.6890640258789062, -0.66082763671875, -0.6325912475585938, -0.6043548583984375, -0.5761184692382812, -0.547882080078125, -0.5196456909179688, -0.4914093017578125, -0.46317291259765625, -0.4349365234375, -0.40670013427734375, -0.3784637451171875, -0.35022735595703125, -0.321990966796875, -0.29375457763671875, -0.2655181884765625, -0.23728179931640625, -0.20904541015625, -0.18080902099609375, -0.1525726318359375, -0.12433624267578125, -0.096099853515625, -0.06786346435546875, -0.0396270751953125, -0.01139068603515625, 0.016845703125, 0.04508209228515625, 0.0733184814453125, 0.10155487060546875, 0.129791259765625, 0.15802764892578125, 0.1862640380859375, 0.21450042724609375, 0.24273681640625, 0.27097320556640625, 0.2992095947265625, 0.32744598388671875, 0.355682373046875, 0.38391876220703125, 0.4121551513671875, 0.44039154052734375, 0.4686279296875, 0.49686431884765625, 0.5251007080078125, 0.5533370971679688, 0.581573486328125, 0.6098098754882812, 0.6380462646484375, 0.6662826538085938, 0.69451904296875, 0.7227554321289062, 0.7509918212890625, 0.7792282104492188, 0.807464599609375, 0.8357009887695312, 0.8639373779296875, 0.8921737670898438, 0.92041015625]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 1.0, 3.0, 4.0, 4.0, 4.0, 9.0, 9.0, 14.0, 13.0, 23.0, 29.0, 22.0, 24.0, 22.0, 51.0, 42.0, 41.0, 51.0, 47.0, 63.0, 51.0, 45.0, 67.0, 53.0, 34.0, 27.0, 46.0, 40.0, 31.0, 28.0, 20.0, 24.0, 9.0, 10.0, 11.0, 11.0, 10.0, 7.0, 2.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.951171875, -2.863128662109375, -2.77508544921875, -2.687042236328125, -2.5989990234375, -2.510955810546875, -2.42291259765625, -2.334869384765625, -2.246826171875, -2.158782958984375, -2.07073974609375, -1.982696533203125, -1.8946533203125, -1.806610107421875, -1.71856689453125, -1.630523681640625, -1.54248046875, -1.454437255859375, -1.36639404296875, -1.278350830078125, -1.1903076171875, -1.102264404296875, -1.01422119140625, -0.926177978515625, -0.838134765625, -0.750091552734375, -0.66204833984375, -0.574005126953125, -0.4859619140625, -0.397918701171875, -0.30987548828125, -0.221832275390625, -0.1337890625, -0.045745849609375, 0.04229736328125, 0.130340576171875, 0.2183837890625, 0.306427001953125, 0.39447021484375, 0.482513427734375, 0.570556640625, 0.658599853515625, 0.74664306640625, 0.834686279296875, 0.9227294921875, 1.010772705078125, 1.09881591796875, 1.186859130859375, 1.27490234375, 1.362945556640625, 1.45098876953125, 1.539031982421875, 1.6270751953125, 1.715118408203125, 1.80316162109375, 1.891204833984375, 1.979248046875, 2.067291259765625, 2.15533447265625, 2.243377685546875, 2.3314208984375, 2.419464111328125, 2.50750732421875, 2.595550537109375, 2.68359375]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 3.0, 4.0, 6.0, 9.0, 11.0, 15.0, 22.0, 44.0, 36.0, 62.0, 87.0, 127.0, 221.0, 374.0, 794.0, 1682.0, 4446.0, 14266.0, 69921.0, 603732.0, 297400.0, 39634.0, 9612.0, 3182.0, 1295.0, 641.0, 329.0, 187.0, 139.0, 86.0, 68.0, 32.0, 25.0, 23.0, 9.0, 6.0, 10.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.320068359375, -0.3093414306640625, -0.298614501953125, -0.2878875732421875, -0.27716064453125, -0.2664337158203125, -0.255706787109375, -0.2449798583984375, -0.2342529296875, -0.2235260009765625, -0.212799072265625, -0.2020721435546875, -0.19134521484375, -0.1806182861328125, -0.169891357421875, -0.1591644287109375, -0.1484375, -0.1377105712890625, -0.126983642578125, -0.1162567138671875, -0.10552978515625, -0.0948028564453125, -0.084075927734375, -0.0733489990234375, -0.0626220703125, -0.0518951416015625, -0.041168212890625, -0.0304412841796875, -0.01971435546875, -0.0089874267578125, 0.001739501953125, 0.0124664306640625, 0.023193359375, 0.0339202880859375, 0.044647216796875, 0.0553741455078125, 0.06610107421875, 0.0768280029296875, 0.087554931640625, 0.0982818603515625, 0.1090087890625, 0.1197357177734375, 0.130462646484375, 0.1411895751953125, 0.15191650390625, 0.1626434326171875, 0.173370361328125, 0.1840972900390625, 0.19482421875, 0.2055511474609375, 0.216278076171875, 0.2270050048828125, 0.23773193359375, 0.2484588623046875, 0.259185791015625, 0.2699127197265625, 0.2806396484375, 0.2913665771484375, 0.302093505859375, 0.3128204345703125, 0.32354736328125, 0.3342742919921875, 0.345001220703125, 0.3557281494140625, 0.366455078125]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 1.0, 7.0, 6.0, 5.0, 7.0, 12.0, 14.0, 11.0, 20.0, 31.0, 27.0, 45.0, 48.0, 78.0, 92.0, 117.0, 115.0, 68.0, 68.0, 57.0, 26.0, 31.0, 21.0, 19.0, 14.0, 12.0, 7.0, 5.0, 5.0, 7.0, 6.0, 3.0, 5.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.476308822631836e-05, -4.339776933193207e-05, -4.2032450437545776e-05, -4.0667131543159485e-05, -3.930181264877319e-05, -3.79364937543869e-05, -3.657117486000061e-05, -3.520585596561432e-05, -3.384053707122803e-05, -3.2475218176841736e-05, -3.1109899282455444e-05, -2.9744580388069153e-05, -2.837926149368286e-05, -2.701394259929657e-05, -2.564862370491028e-05, -2.4283304810523987e-05, -2.2917985916137695e-05, -2.1552667021751404e-05, -2.0187348127365112e-05, -1.882202923297882e-05, -1.745671033859253e-05, -1.6091391444206238e-05, -1.4726072549819946e-05, -1.3360753655433655e-05, -1.1995434761047363e-05, -1.0630115866661072e-05, -9.26479697227478e-06, -7.899478077888489e-06, -6.534159183502197e-06, -5.168840289115906e-06, -3.8035213947296143e-06, -2.4382025003433228e-06, -1.0728836059570312e-06, 2.9243528842926025e-07, 1.6577541828155518e-06, 3.0230730772018433e-06, 4.388391971588135e-06, 5.753710865974426e-06, 7.119029760360718e-06, 8.48434865474701e-06, 9.8496675491333e-06, 1.1214986443519592e-05, 1.2580305337905884e-05, 1.3945624232292175e-05, 1.5310943126678467e-05, 1.6676262021064758e-05, 1.804158091545105e-05, 1.940689980983734e-05, 2.0772218704223633e-05, 2.2137537598609924e-05, 2.3502856492996216e-05, 2.4868175387382507e-05, 2.62334942817688e-05, 2.759881317615509e-05, 2.8964132070541382e-05, 3.0329450964927673e-05, 3.1694769859313965e-05, 3.3060088753700256e-05, 3.442540764808655e-05, 3.579072654247284e-05, 3.715604543685913e-05, 3.852136433124542e-05, 3.9886683225631714e-05, 4.1252002120018005e-05, 4.26173210144043e-05]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 8.0, 7.0, 10.0, 13.0, 21.0, 25.0, 48.0, 42.0, 62.0, 66.0, 143.0, 210.0, 308.0, 551.0, 979.0, 1663.0, 3424.0, 7991.0, 21553.0, 76930.0, 477262.0, 361681.0, 62852.0, 18676.0, 7098.0, 3133.0, 1500.0, 846.0, 512.0, 288.0, 180.0, 133.0, 86.0, 73.0, 48.0, 29.0, 26.0, 24.0, 10.0, 12.0, 9.0, 6.0, 5.0, 4.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2451171875, -0.23664474487304688, -0.22817230224609375, -0.21969985961914062, -0.2112274169921875, -0.20275497436523438, -0.19428253173828125, -0.18581008911132812, -0.177337646484375, -0.16886520385742188, -0.16039276123046875, -0.15192031860351562, -0.1434478759765625, -0.13497543334960938, -0.12650299072265625, -0.11803054809570312, -0.10955810546875, -0.10108566284179688, -0.09261322021484375, -0.08414077758789062, -0.0756683349609375, -0.06719589233398438, -0.05872344970703125, -0.050251007080078125, -0.041778564453125, -0.033306121826171875, -0.02483367919921875, -0.016361236572265625, -0.0078887939453125, 0.000583648681640625, 0.00905609130859375, 0.017528533935546875, 0.0260009765625, 0.034473419189453125, 0.04294586181640625, 0.051418304443359375, 0.0598907470703125, 0.06836318969726562, 0.07683563232421875, 0.08530807495117188, 0.093780517578125, 0.10225296020507812, 0.11072540283203125, 0.11919784545898438, 0.1276702880859375, 0.13614273071289062, 0.14461517333984375, 0.15308761596679688, 0.16156005859375, 0.17003250122070312, 0.17850494384765625, 0.18697738647460938, 0.1954498291015625, 0.20392227172851562, 0.21239471435546875, 0.22086715698242188, 0.229339599609375, 0.23781204223632812, 0.24628448486328125, 0.2547569274902344, 0.2632293701171875, 0.2717018127441406, 0.28017425537109375, 0.2886466979980469, 0.297119140625]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 3.0, 6.0, 9.0, 5.0, 6.0, 11.0, 10.0, 21.0, 23.0, 25.0, 36.0, 50.0, 62.0, 78.0, 75.0, 109.0, 102.0, 86.0, 69.0, 47.0, 38.0, 31.0, 22.0, 15.0, 15.0, 14.0, 5.0, 8.0, 6.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.218505859375, -0.21299362182617188, -0.20748138427734375, -0.20196914672851562, -0.1964569091796875, -0.19094467163085938, -0.18543243408203125, -0.17992019653320312, -0.174407958984375, -0.16889572143554688, -0.16338348388671875, -0.15787124633789062, -0.1523590087890625, -0.14684677124023438, -0.14133453369140625, -0.13582229614257812, -0.13031005859375, -0.12479782104492188, -0.11928558349609375, -0.11377334594726562, -0.1082611083984375, -0.10274887084960938, -0.09723663330078125, -0.09172439575195312, -0.086212158203125, -0.08069992065429688, -0.07518768310546875, -0.06967544555664062, -0.0641632080078125, -0.058650970458984375, -0.05313873291015625, -0.047626495361328125, -0.0421142578125, -0.036602020263671875, -0.03108978271484375, -0.025577545166015625, -0.0200653076171875, -0.014553070068359375, -0.00904083251953125, -0.003528594970703125, 0.001983642578125, 0.007495880126953125, 0.01300811767578125, 0.018520355224609375, 0.0240325927734375, 0.029544830322265625, 0.03505706787109375, 0.040569305419921875, 0.04608154296875, 0.051593780517578125, 0.05710601806640625, 0.06261825561523438, 0.0681304931640625, 0.07364273071289062, 0.07915496826171875, 0.08466720581054688, 0.090179443359375, 0.09569168090820312, 0.10120391845703125, 0.10671615600585938, 0.1122283935546875, 0.11774063110351562, 0.12325286865234375, 0.12876510620117188, 0.13427734375]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 4.0, 11.0, 19.0, 78.0, 292.0, 361.0, 178.0, 46.0, 13.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.203277826309204, -2.858440637588501, -2.5136032104492188, -2.1687660217285156, -1.8239288330078125, -1.4790916442871094, -1.1342542171478271, -0.789417028427124, -0.4445798397064209, -0.099742591381073, 0.2450946569442749, 0.5899319648742676, 0.9347691535949707, 1.2796063423156738, 1.624443769454956, 1.9692809581756592, 2.3141181468963623, 2.6589553356170654, 3.0037927627563477, 3.348629951477051, 3.693467140197754, 4.038304328918457, 4.38314151763916, 4.727978706359863, 5.072815895080566, 5.4176530838012695, 5.762490272521973, 6.107327461242676, 6.452164649963379, 6.797001838684082, 7.141839504241943, 7.4866766929626465, 7.831514358520508, 8.176351547241211, 8.521188735961914, 8.866025924682617, 9.21086311340332, 9.555700302124023, 9.900537490844727, 10.24537467956543, 10.590211868286133, 10.935049057006836, 11.279886245727539, 11.624723434448242, 11.969560623168945, 12.314397811889648, 12.659235000610352, 13.004072189331055, 13.348910331726074, 13.693747520446777, 14.03858470916748, 14.383421897888184, 14.728259086608887, 15.07309627532959, 15.41793441772461, 15.762771606445312, 16.107608795166016, 16.45244598388672, 16.797283172607422, 17.142120361328125, 17.486957550048828, 17.83179473876953, 18.176631927490234, 18.521469116210938, 18.86630630493164]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 4.0, 5.0, 0.0, 2.0, 4.0, 3.0, 6.0, 8.0, 11.0, 11.0, 9.0, 15.0, 18.0, 15.0, 20.0, 18.0, 32.0, 23.0, 35.0, 35.0, 41.0, 34.0, 38.0, 41.0, 27.0, 35.0, 44.0, 35.0, 47.0, 30.0, 37.0, 41.0, 38.0, 38.0, 27.0, 19.0, 29.0, 23.0, 13.0, 22.0, 10.0, 13.0, 18.0, 6.0, 10.0, 4.0, 6.0, 6.0, 1.0, 3.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7992794513702393, -3.670844554901123, -3.542409658432007, -3.4139747619628906, -3.2855398654937744, -3.157104969024658, -3.028670310974121, -2.900235176086426, -2.7718005180358887, -2.6433656215667725, -2.5149307250976562, -2.38649582862854, -2.258060932159424, -2.1296260356903076, -2.0011911392211914, -1.8727563619613647, -1.744321346282959, -1.6158864498138428, -1.4874515533447266, -1.3590166568756104, -1.2305817604064941, -1.102146863937378, -0.9737120866775513, -0.8452771902084351, -0.7168422937393188, -0.5884073972702026, -0.4599725306034088, -0.331537663936615, -0.20310276746749878, -0.07466787099838257, 0.05376696586608887, 0.18220186233520508, 0.3106369972229004, 0.4390718936920166, 0.5675067901611328, 0.6959416270256042, 0.8243765234947205, 0.9528114199638367, 1.081246256828308, 1.2096811532974243, 1.3381160497665405, 1.4665509462356567, 1.594985842704773, 1.7234206199645996, 1.8518555164337158, 1.980290412902832, 2.1087253093719482, 2.2371602058410645, 2.3655951023101807, 2.494029998779297, 2.622464895248413, 2.7508997917175293, 2.8793346881866455, 3.0077695846557617, 3.136204242706299, 3.264639377593994, 3.3930740356445312, 3.5215089321136475, 3.6499438285827637, 3.77837872505188, 3.906813621520996, 4.035248279571533, 4.1636834144592285, 4.292118072509766, 4.420553207397461]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 6.0, 1.0, 7.0, 5.0, 7.0, 6.0, 12.0, 24.0, 21.0, 43.0, 65.0, 120.0, 181.0, 294.0, 520.0, 974.0, 1835.0, 3584.0, 8522.0, 25047.0, 131773.0, 2426948.0, 1467389.0, 91783.0, 21043.0, 7312.0, 3144.0, 1518.0, 821.0, 477.0, 285.0, 175.0, 109.0, 65.0, 49.0, 39.0, 28.0, 17.0, 16.0, 5.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.916015625, -1.859527587890625, -1.80303955078125, -1.746551513671875, -1.6900634765625, -1.633575439453125, -1.57708740234375, -1.520599365234375, -1.464111328125, -1.407623291015625, -1.35113525390625, -1.294647216796875, -1.2381591796875, -1.181671142578125, -1.12518310546875, -1.068695068359375, -1.01220703125, -0.955718994140625, -0.89923095703125, -0.842742919921875, -0.7862548828125, -0.729766845703125, -0.67327880859375, -0.616790771484375, -0.560302734375, -0.503814697265625, -0.44732666015625, -0.390838623046875, -0.3343505859375, -0.277862548828125, -0.22137451171875, -0.164886474609375, -0.1083984375, -0.051910400390625, 0.00457763671875, 0.061065673828125, 0.1175537109375, 0.174041748046875, 0.23052978515625, 0.287017822265625, 0.343505859375, 0.399993896484375, 0.45648193359375, 0.512969970703125, 0.5694580078125, 0.625946044921875, 0.68243408203125, 0.738922119140625, 0.79541015625, 0.851898193359375, 0.90838623046875, 0.964874267578125, 1.0213623046875, 1.077850341796875, 1.13433837890625, 1.190826416015625, 1.247314453125, 1.303802490234375, 1.36029052734375, 1.416778564453125, 1.4732666015625, 1.529754638671875, 1.58624267578125, 1.642730712890625, 1.69921875]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 0.0, 2.0, 3.0, 4.0, 2.0, 8.0, 14.0, 18.0, 25.0, 24.0, 38.0, 42.0, 58.0, 82.0, 85.0, 67.0, 77.0, 73.0, 72.0, 62.0, 49.0, 51.0, 37.0, 25.0, 20.0, 22.0, 12.0, 9.0, 10.0, 1.0, 4.0, 4.0, 4.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.44921875, -1.403106689453125, -1.35699462890625, -1.310882568359375, -1.2647705078125, -1.218658447265625, -1.17254638671875, -1.126434326171875, -1.080322265625, -1.034210205078125, -0.98809814453125, -0.941986083984375, -0.8958740234375, -0.849761962890625, -0.80364990234375, -0.757537841796875, -0.71142578125, -0.665313720703125, -0.61920166015625, -0.573089599609375, -0.5269775390625, -0.480865478515625, -0.43475341796875, -0.388641357421875, -0.342529296875, -0.296417236328125, -0.25030517578125, -0.204193115234375, -0.1580810546875, -0.111968994140625, -0.06585693359375, -0.019744873046875, 0.0263671875, 0.072479248046875, 0.11859130859375, 0.164703369140625, 0.2108154296875, 0.256927490234375, 0.30303955078125, 0.349151611328125, 0.395263671875, 0.441375732421875, 0.48748779296875, 0.533599853515625, 0.5797119140625, 0.625823974609375, 0.67193603515625, 0.718048095703125, 0.76416015625, 0.810272216796875, 0.85638427734375, 0.902496337890625, 0.9486083984375, 0.994720458984375, 1.04083251953125, 1.086944580078125, 1.133056640625, 1.179168701171875, 1.22528076171875, 1.271392822265625, 1.3175048828125, 1.363616943359375, 1.40972900390625, 1.455841064453125, 1.501953125]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 6.0, 10.0, 7.0, 20.0, 15.0, 32.0, 53.0, 75.0, 144.0, 266.0, 897.0, 3259.0, 18775.0, 294567.0, 3772590.0, 91048.0, 9459.0, 1929.0, 625.0, 226.0, 117.0, 61.0, 33.0, 24.0, 19.0, 10.0, 6.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0078125, -2.925018310546875, -2.84222412109375, -2.759429931640625, -2.6766357421875, -2.593841552734375, -2.51104736328125, -2.428253173828125, -2.345458984375, -2.262664794921875, -2.17987060546875, -2.097076416015625, -2.0142822265625, -1.931488037109375, -1.84869384765625, -1.765899658203125, -1.68310546875, -1.600311279296875, -1.51751708984375, -1.434722900390625, -1.3519287109375, -1.269134521484375, -1.18634033203125, -1.103546142578125, -1.020751953125, -0.937957763671875, -0.85516357421875, -0.772369384765625, -0.6895751953125, -0.606781005859375, -0.52398681640625, -0.441192626953125, -0.3583984375, -0.275604248046875, -0.19281005859375, -0.110015869140625, -0.0272216796875, 0.055572509765625, 0.13836669921875, 0.221160888671875, 0.303955078125, 0.386749267578125, 0.46954345703125, 0.552337646484375, 0.6351318359375, 0.717926025390625, 0.80072021484375, 0.883514404296875, 0.96630859375, 1.049102783203125, 1.13189697265625, 1.214691162109375, 1.2974853515625, 1.380279541015625, 1.46307373046875, 1.545867919921875, 1.628662109375, 1.711456298828125, 1.79425048828125, 1.877044677734375, 1.9598388671875, 2.042633056640625, 2.12542724609375, 2.208221435546875, 2.291015625]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 3.0, 5.0, 6.0, 4.0, 2.0, 2.0, 5.0, 4.0, 15.0, 22.0, 16.0, 37.0, 37.0, 48.0, 53.0, 102.0, 148.0, 216.0, 423.0, 630.0, 770.0, 575.0, 314.0, 181.0, 133.0, 90.0, 59.0, 34.0, 25.0, 29.0, 27.0, 17.0, 11.0, 13.0, 11.0, 9.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.30810546875, -0.29543304443359375, -0.2827606201171875, -0.27008819580078125, -0.257415771484375, -0.24474334716796875, -0.2320709228515625, -0.21939849853515625, -0.20672607421875, -0.19405364990234375, -0.1813812255859375, -0.16870880126953125, -0.156036376953125, -0.14336395263671875, -0.1306915283203125, -0.11801910400390625, -0.1053466796875, -0.09267425537109375, -0.0800018310546875, -0.06732940673828125, -0.054656982421875, -0.04198455810546875, -0.0293121337890625, -0.01663970947265625, -0.00396728515625, 0.00870513916015625, 0.0213775634765625, 0.03404998779296875, 0.046722412109375, 0.05939483642578125, 0.0720672607421875, 0.08473968505859375, 0.097412109375, 0.11008453369140625, 0.1227569580078125, 0.13542938232421875, 0.148101806640625, 0.16077423095703125, 0.1734466552734375, 0.18611907958984375, 0.19879150390625, 0.21146392822265625, 0.2241363525390625, 0.23680877685546875, 0.249481201171875, 0.26215362548828125, 0.2748260498046875, 0.28749847412109375, 0.3001708984375, 0.31284332275390625, 0.3255157470703125, 0.33818817138671875, 0.350860595703125, 0.36353302001953125, 0.3762054443359375, 0.38887786865234375, 0.40155029296875, 0.41422271728515625, 0.4268951416015625, 0.43956756591796875, 0.452239990234375, 0.46491241455078125, 0.4775848388671875, 0.49025726318359375, 0.5029296875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 3.0, 5.0, 12.0, 8.0, 16.0, 26.0, 27.0, 45.0, 59.0, 91.0, 98.0, 135.0, 121.0, 91.0, 81.0, 51.0, 36.0, 22.0, 12.0, 13.0, 14.0, 8.0, 4.0, 5.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6753681898117065, -1.6107511520385742, -1.546134114265442, -1.4815170764923096, -1.4169001579284668, -1.3522831201553345, -1.2876660823822021, -1.2230490446090698, -1.1584320068359375, -1.0938149690628052, -1.0291979312896729, -0.9645809531211853, -0.8999639749526978, -0.8353469371795654, -0.7707298994064331, -0.7061128616333008, -0.641495943069458, -0.5768789052963257, -0.5122619271278381, -0.4476448893547058, -0.3830278813838959, -0.31841087341308594, -0.2537938356399536, -0.18917682766914368, -0.12455981969833374, -0.05994280427694321, 0.004674211144447327, 0.06929123401641846, 0.1339082419872284, 0.19852524995803833, 0.26314228773117065, 0.3277592957019806, 0.392376184463501, 0.4569931924343109, 0.5216102004051208, 0.5862272381782532, 0.6508442163467407, 0.715461254119873, 0.7800782918930054, 0.8446953296661377, 0.9093123078346252, 0.9739293456077576, 1.0385463237762451, 1.1031633615493774, 1.1677803993225098, 1.2323973178863525, 1.2970144748687744, 1.3616313934326172, 1.4262484312057495, 1.4908654689788818, 1.5554825067520142, 1.6200995445251465, 1.6847164630889893, 1.7493335008621216, 1.813950538635254, 1.8785675764083862, 1.9431846141815186, 2.0078015327453613, 2.072418689727783, 2.137035608291626, 2.201652765274048, 2.2662696838378906, 2.3308868408203125, 2.3955037593841553, 2.460120677947998]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 8.0, 3.0, 3.0, 8.0, 5.0, 10.0, 12.0, 9.0, 16.0, 17.0, 30.0, 28.0, 48.0, 39.0, 59.0, 52.0, 37.0, 55.0, 41.0, 55.0, 51.0, 42.0, 45.0, 46.0, 41.0, 27.0, 41.0, 31.0, 25.0, 22.0, 23.0, 16.0, 9.0, 10.0, 15.0, 5.0, 5.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.2554036378860474, -1.2193665504455566, -1.183329463005066, -1.1472923755645752, -1.111255168914795, -1.0752180814743042, -1.0391809940338135, -1.0031439065933228, -0.967106819152832, -0.9310697317123413, -0.8950326442718506, -0.8589954972267151, -0.8229584097862244, -0.7869213223457336, -0.7508841753005981, -0.7148470878601074, -0.6788100004196167, -0.642772912979126, -0.6067358255386353, -0.5706986784934998, -0.534661591053009, -0.4986245036125183, -0.4625873863697052, -0.4265502691268921, -0.39051318168640137, -0.35447609424591064, -0.31843897700309753, -0.2824018597602844, -0.2463647723197937, -0.21032766997814178, -0.17429056763648987, -0.13825345039367676, -0.10221648216247559, -0.06617937982082367, -0.030142277479171753, 0.005894824862480164, 0.04193192720413208, 0.077969029545784, 0.11400613188743591, 0.15004324913024902, 0.18608033657073975, 0.22211743891239166, 0.2581545412540436, 0.2941916584968567, 0.3302287459373474, 0.36626583337783813, 0.40230295062065125, 0.43834006786346436, 0.4743771553039551, 0.5104142427444458, 0.5464513301849365, 0.582488477230072, 0.6185255646705627, 0.6545626521110535, 0.690599799156189, 0.7266368865966797, 0.7626739740371704, 0.7987110614776611, 0.8347481489181519, 0.8707852959632874, 0.9068223834037781, 0.9428594708442688, 0.9788966178894043, 1.014933705329895, 1.0509707927703857]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 3.0, 3.0, 7.0, 5.0, 8.0, 12.0, 13.0, 18.0, 36.0, 40.0, 46.0, 77.0, 121.0, 140.0, 252.0, 392.0, 700.0, 1196.0, 2265.0, 4239.0, 8356.0, 18217.0, 46738.0, 148659.0, 405106.0, 276051.0, 81986.0, 28770.0, 12164.0, 5860.0, 2987.0, 1619.0, 885.0, 570.0, 345.0, 215.0, 133.0, 86.0, 57.0, 57.0, 31.0, 19.0, 15.0, 8.0, 14.0, 4.0, 6.0, 5.0, 7.0, 5.0, 0.0, 4.0, 2.0, 0.0, 3.0, 1.0, 3.0], "bins": [-0.1981201171875, -0.1918811798095703, -0.18564224243164062, -0.17940330505371094, -0.17316436767578125, -0.16692543029785156, -0.16068649291992188, -0.1544475555419922, -0.1482086181640625, -0.1419696807861328, -0.13573074340820312, -0.12949180603027344, -0.12325286865234375, -0.11701393127441406, -0.11077499389648438, -0.10453605651855469, -0.098297119140625, -0.09205818176269531, -0.08581924438476562, -0.07958030700683594, -0.07334136962890625, -0.06710243225097656, -0.060863494873046875, -0.05462455749511719, -0.0483856201171875, -0.04214668273925781, -0.035907745361328125, -0.029668807983398438, -0.02342987060546875, -0.017190933227539062, -0.010951995849609375, -0.0047130584716796875, 0.00152587890625, 0.0077648162841796875, 0.014003753662109375, 0.020242691040039062, 0.02648162841796875, 0.03272056579589844, 0.038959503173828125, 0.04519844055175781, 0.0514373779296875, 0.05767631530761719, 0.06391525268554688, 0.07015419006347656, 0.07639312744140625, 0.08263206481933594, 0.08887100219726562, 0.09510993957519531, 0.101348876953125, 0.10758781433105469, 0.11382675170898438, 0.12006568908691406, 0.12630462646484375, 0.13254356384277344, 0.13878250122070312, 0.1450214385986328, 0.1512603759765625, 0.1574993133544922, 0.16373825073242188, 0.16997718811035156, 0.17621612548828125, 0.18245506286621094, 0.18869400024414062, 0.1949329376220703, 0.201171875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 3.0, 5.0, 2.0, 12.0, 10.0, 3.0, 9.0, 10.0, 25.0, 32.0, 28.0, 52.0, 39.0, 52.0, 62.0, 63.0, 55.0, 63.0, 56.0, 60.0, 46.0, 49.0, 46.0, 40.0, 35.0, 36.0, 28.0, 19.0, 9.0, 7.0, 11.0, 11.0, 11.0, 4.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.9775390625, -0.9476776123046875, -0.917816162109375, -0.8879547119140625, -0.85809326171875, -0.8282318115234375, -0.798370361328125, -0.7685089111328125, -0.7386474609375, -0.7087860107421875, -0.678924560546875, -0.6490631103515625, -0.61920166015625, -0.5893402099609375, -0.559478759765625, -0.5296173095703125, -0.499755859375, -0.4698944091796875, -0.440032958984375, -0.4101715087890625, -0.38031005859375, -0.3504486083984375, -0.320587158203125, -0.2907257080078125, -0.2608642578125, -0.2310028076171875, -0.201141357421875, -0.1712799072265625, -0.14141845703125, -0.1115570068359375, -0.081695556640625, -0.0518341064453125, -0.02197265625, 0.0078887939453125, 0.037750244140625, 0.0676116943359375, 0.09747314453125, 0.1273345947265625, 0.157196044921875, 0.1870574951171875, 0.2169189453125, 0.2467803955078125, 0.276641845703125, 0.3065032958984375, 0.33636474609375, 0.3662261962890625, 0.396087646484375, 0.4259490966796875, 0.455810546875, 0.4856719970703125, 0.515533447265625, 0.5453948974609375, 0.57525634765625, 0.6051177978515625, 0.634979248046875, 0.6648406982421875, 0.6947021484375, 0.7245635986328125, 0.754425048828125, 0.7842864990234375, 0.81414794921875, 0.8440093994140625, 0.873870849609375, 0.9037322998046875, 0.93359375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 2.0, 12.0, 10.0, 18.0, 18.0, 22.0, 36.0, 63.0, 79.0, 124.0, 164.0, 220.0, 400.0, 634.0, 1290.0, 2343.0, 4851.0, 10933.0, 30657.0, 112330.0, 410909.0, 343509.0, 86673.0, 24752.0, 9460.0, 4156.0, 2045.0, 1123.0, 643.0, 385.0, 225.0, 128.0, 92.0, 63.0, 57.0, 39.0, 31.0, 19.0, 8.0, 11.0, 9.0, 1.0, 2.0, 4.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.171630859375, -0.1652507781982422, -0.15887069702148438, -0.15249061584472656, -0.14611053466796875, -0.13973045349121094, -0.13335037231445312, -0.1269702911376953, -0.1205902099609375, -0.11421012878417969, -0.10783004760742188, -0.10144996643066406, -0.09506988525390625, -0.08868980407714844, -0.08230972290039062, -0.07592964172363281, -0.069549560546875, -0.06316947937011719, -0.056789398193359375, -0.05040931701660156, -0.04402923583984375, -0.03764915466308594, -0.031269073486328125, -0.024888992309570312, -0.0185089111328125, -0.012128829956054688, -0.005748748779296875, 0.0006313323974609375, 0.00701141357421875, 0.013391494750976562, 0.019771575927734375, 0.026151657104492188, 0.03253173828125, 0.03891181945800781, 0.045291900634765625, 0.05167198181152344, 0.05805206298828125, 0.06443214416503906, 0.07081222534179688, 0.07719230651855469, 0.0835723876953125, 0.08995246887207031, 0.09633255004882812, 0.10271263122558594, 0.10909271240234375, 0.11547279357910156, 0.12185287475585938, 0.1282329559326172, 0.134613037109375, 0.1409931182861328, 0.14737319946289062, 0.15375328063964844, 0.16013336181640625, 0.16651344299316406, 0.17289352416992188, 0.1792736053466797, 0.1856536865234375, 0.1920337677001953, 0.19841384887695312, 0.20479393005371094, 0.21117401123046875, 0.21755409240722656, 0.22393417358398438, 0.2303142547607422, 0.2366943359375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 3.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 8.0, 8.0, 10.0, 10.0, 14.0, 18.0, 14.0, 20.0, 13.0, 22.0, 26.0, 26.0, 30.0, 31.0, 22.0, 44.0, 31.0, 34.0, 38.0, 54.0, 35.0, 47.0, 26.0, 30.0, 36.0, 34.0, 41.0, 28.0, 19.0, 29.0, 25.0, 32.0, 21.0, 18.0, 12.0, 17.0, 15.0, 12.0, 6.0, 4.0, 5.0, 6.0, 4.0, 2.0, 3.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-1.298828125, -1.2568511962890625, -1.214874267578125, -1.1728973388671875, -1.13092041015625, -1.0889434814453125, -1.046966552734375, -1.0049896240234375, -0.9630126953125, -0.9210357666015625, -0.879058837890625, -0.8370819091796875, -0.79510498046875, -0.7531280517578125, -0.711151123046875, -0.6691741943359375, -0.627197265625, -0.5852203369140625, -0.543243408203125, -0.5012664794921875, -0.45928955078125, -0.4173126220703125, -0.375335693359375, -0.3333587646484375, -0.2913818359375, -0.2494049072265625, -0.207427978515625, -0.1654510498046875, -0.12347412109375, -0.0814971923828125, -0.039520263671875, 0.0024566650390625, 0.04443359375, 0.0864105224609375, 0.128387451171875, 0.1703643798828125, 0.21234130859375, 0.2543182373046875, 0.296295166015625, 0.3382720947265625, 0.3802490234375, 0.4222259521484375, 0.464202880859375, 0.5061798095703125, 0.54815673828125, 0.5901336669921875, 0.632110595703125, 0.6740875244140625, 0.716064453125, 0.7580413818359375, 0.800018310546875, 0.8419952392578125, 0.88397216796875, 0.9259490966796875, 0.967926025390625, 1.0099029541015625, 1.0518798828125, 1.0938568115234375, 1.135833740234375, 1.1778106689453125, 1.21978759765625, 1.2617645263671875, 1.303741455078125, 1.3457183837890625, 1.3876953125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 7.0, 1.0, 5.0, 9.0, 19.0, 37.0, 55.0, 159.0, 403.0, 1797.0, 16290.0, 915115.0, 109090.0, 4344.0, 766.0, 245.0, 97.0, 47.0, 26.0, 19.0, 8.0, 12.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.423583984375, -0.41205596923828125, -0.4005279541015625, -0.38899993896484375, -0.377471923828125, -0.36594390869140625, -0.3544158935546875, -0.34288787841796875, -0.33135986328125, -0.31983184814453125, -0.3083038330078125, -0.29677581787109375, -0.285247802734375, -0.27371978759765625, -0.2621917724609375, -0.25066375732421875, -0.2391357421875, -0.22760772705078125, -0.2160797119140625, -0.20455169677734375, -0.193023681640625, -0.18149566650390625, -0.1699676513671875, -0.15843963623046875, -0.14691162109375, -0.13538360595703125, -0.1238555908203125, -0.11232757568359375, -0.100799560546875, -0.08927154541015625, -0.0777435302734375, -0.06621551513671875, -0.0546875, -0.04315948486328125, -0.0316314697265625, -0.02010345458984375, -0.008575439453125, 0.00295257568359375, 0.0144805908203125, 0.02600860595703125, 0.03753662109375, 0.04906463623046875, 0.0605926513671875, 0.07212066650390625, 0.083648681640625, 0.09517669677734375, 0.1067047119140625, 0.11823272705078125, 0.1297607421875, 0.14128875732421875, 0.1528167724609375, 0.16434478759765625, 0.175872802734375, 0.18740081787109375, 0.1989288330078125, 0.21045684814453125, 0.22198486328125, 0.23351287841796875, 0.2450408935546875, 0.25656890869140625, 0.268096923828125, 0.27962493896484375, 0.2911529541015625, 0.30268096923828125, 0.314208984375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 7.0, 2.0, 3.0, 10.0, 18.0, 14.0, 24.0, 36.0, 39.0, 72.0, 89.0, 110.0, 135.0, 131.0, 100.0, 60.0, 44.0, 23.0, 25.0, 19.0, 10.0, 8.0, 8.0, 9.0, 5.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.511543273925781e-05, -8.263718336820602e-05, -8.015893399715424e-05, -7.768068462610245e-05, -7.520243525505066e-05, -7.272418588399887e-05, -7.024593651294708e-05, -6.77676871418953e-05, -6.52894377708435e-05, -6.281118839979172e-05, -6.033293902873993e-05, -5.785468965768814e-05, -5.537644028663635e-05, -5.2898190915584564e-05, -5.0419941544532776e-05, -4.794169217348099e-05, -4.54634428024292e-05, -4.298519343137741e-05, -4.050694406032562e-05, -3.8028694689273834e-05, -3.5550445318222046e-05, -3.307219594717026e-05, -3.059394657611847e-05, -2.811569720506668e-05, -2.5637447834014893e-05, -2.3159198462963104e-05, -2.0680949091911316e-05, -1.8202699720859528e-05, -1.572445034980774e-05, -1.3246200978755951e-05, -1.0767951607704163e-05, -8.289702236652374e-06, -5.811452865600586e-06, -3.3332034945487976e-06, -8.549541234970093e-07, 1.623295247554779e-06, 4.101544618606567e-06, 6.579793989658356e-06, 9.058043360710144e-06, 1.1536292731761932e-05, 1.401454210281372e-05, 1.649279147386551e-05, 1.8971040844917297e-05, 2.1449290215969086e-05, 2.3927539587020874e-05, 2.6405788958072662e-05, 2.888403832912445e-05, 3.136228770017624e-05, 3.384053707122803e-05, 3.6318786442279816e-05, 3.8797035813331604e-05, 4.127528518438339e-05, 4.375353455543518e-05, 4.623178392648697e-05, 4.871003329753876e-05, 5.1188282668590546e-05, 5.3666532039642334e-05, 5.614478141069412e-05, 5.862303078174591e-05, 6.11012801527977e-05, 6.357952952384949e-05, 6.605777889490128e-05, 6.853602826595306e-05, 7.101427763700485e-05, 7.349252700805664e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 8.0, 16.0, 11.0, 17.0, 16.0, 33.0, 34.0, 60.0, 110.0, 152.0, 294.0, 544.0, 1209.0, 3819.0, 21784.0, 530139.0, 464335.0, 19839.0, 3686.0, 1151.0, 531.0, 298.0, 146.0, 110.0, 64.0, 47.0, 39.0, 25.0, 10.0, 7.0, 5.0, 7.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1951904296875, -0.18767738342285156, -0.18016433715820312, -0.1726512908935547, -0.16513824462890625, -0.1576251983642578, -0.15011215209960938, -0.14259910583496094, -0.1350860595703125, -0.12757301330566406, -0.12005996704101562, -0.11254692077636719, -0.10503387451171875, -0.09752082824707031, -0.09000778198242188, -0.08249473571777344, -0.074981689453125, -0.06746864318847656, -0.059955596923828125, -0.05244255065917969, -0.04492950439453125, -0.03741645812988281, -0.029903411865234375, -0.022390365600585938, -0.0148773193359375, -0.0073642730712890625, 0.000148773193359375, 0.0076618194580078125, 0.01517486572265625, 0.022687911987304688, 0.030200958251953125, 0.03771400451660156, 0.04522705078125, 0.05274009704589844, 0.060253143310546875, 0.06776618957519531, 0.07527923583984375, 0.08279228210449219, 0.09030532836914062, 0.09781837463378906, 0.1053314208984375, 0.11284446716308594, 0.12035751342773438, 0.1278705596923828, 0.13538360595703125, 0.1428966522216797, 0.15040969848632812, 0.15792274475097656, 0.165435791015625, 0.17294883728027344, 0.18046188354492188, 0.1879749298095703, 0.19548797607421875, 0.2030010223388672, 0.21051406860351562, 0.21802711486816406, 0.2255401611328125, 0.23305320739746094, 0.24056625366210938, 0.2480792999267578, 0.25559234619140625, 0.2631053924560547, 0.2706184387207031, 0.27813148498535156, 0.28564453125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 8.0, 6.0, 5.0, 7.0, 18.0, 28.0, 50.0, 59.0, 107.0, 165.0, 198.0, 123.0, 94.0, 50.0, 32.0, 19.0, 11.0, 10.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.05474853515625, -0.0532841682434082, -0.051819801330566406, -0.05035543441772461, -0.04889106750488281, -0.047426700592041016, -0.04596233367919922, -0.04449796676635742, -0.043033599853515625, -0.04156923294067383, -0.04010486602783203, -0.038640499114990234, -0.03717613220214844, -0.03571176528930664, -0.034247398376464844, -0.03278303146362305, -0.03131866455078125, -0.029854297637939453, -0.028389930725097656, -0.02692556381225586, -0.025461196899414062, -0.023996829986572266, -0.02253246307373047, -0.021068096160888672, -0.019603729248046875, -0.018139362335205078, -0.01667499542236328, -0.015210628509521484, -0.013746261596679688, -0.01228189468383789, -0.010817527770996094, -0.009353160858154297, -0.0078887939453125, -0.006424427032470703, -0.004960060119628906, -0.0034956932067871094, -0.0020313262939453125, -0.0005669593811035156, 0.0008974075317382812, 0.002361774444580078, 0.003826141357421875, 0.005290508270263672, 0.006754875183105469, 0.008219242095947266, 0.009683609008789062, 0.01114797592163086, 0.012612342834472656, 0.014076709747314453, 0.01554107666015625, 0.017005443572998047, 0.018469810485839844, 0.01993417739868164, 0.021398544311523438, 0.022862911224365234, 0.02432727813720703, 0.025791645050048828, 0.027256011962890625, 0.028720378875732422, 0.03018474578857422, 0.031649112701416016, 0.03311347961425781, 0.03457784652709961, 0.036042213439941406, 0.0375065803527832, 0.038970947265625]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 2.0, 4.0, 9.0, 4.0, 4.0, 9.0, 21.0, 25.0, 38.0, 62.0, 88.0, 139.0, 164.0, 135.0, 111.0, 66.0, 37.0, 23.0, 22.0, 12.0, 9.0, 4.0, 5.0, 6.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.327288031578064, -1.2735381126403809, -1.2197883129119873, -1.1660385131835938, -1.1122885942459106, -1.0585386753082275, -1.004788875579834, -0.9510390162467957, -0.8972891569137573, -0.843539297580719, -0.7897894382476807, -0.7360395789146423, -0.682289719581604, -0.6285398602485657, -0.5747900009155273, -0.521040141582489, -0.4672902822494507, -0.41354042291641235, -0.359790563583374, -0.3060407042503357, -0.25229084491729736, -0.19854098558425903, -0.1447911262512207, -0.09104126691818237, -0.03729140758514404, 0.016458451747894287, 0.07020831108093262, 0.12395817041397095, 0.17770802974700928, 0.2314578890800476, 0.28520774841308594, 0.33895760774612427, 0.39270734786987305, 0.4464572072029114, 0.5002070665359497, 0.553956925868988, 0.6077067852020264, 0.6614566445350647, 0.715206503868103, 0.7689563632011414, 0.8227062225341797, 0.876456081867218, 0.9302059412002563, 0.9839558005332947, 1.037705659866333, 1.0914554595947266, 1.1452053785324097, 1.1989552974700928, 1.2527050971984863, 1.3064548969268799, 1.360204815864563, 1.413954734802246, 1.4677045345306396, 1.5214543342590332, 1.5752042531967163, 1.6289541721343994, 1.682703971862793, 1.7364537715911865, 1.7902036905288696, 1.8439536094665527, 1.8977034091949463, 1.9514532089233398, 2.0052032470703125, 2.058953046798706, 2.1127028465270996]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 1.0, 3.0, 8.0, 8.0, 12.0, 7.0, 16.0, 21.0, 28.0, 41.0, 46.0, 66.0, 68.0, 57.0, 57.0, 53.0, 76.0, 47.0, 59.0, 49.0, 48.0, 53.0, 34.0, 34.0, 22.0, 21.0, 10.0, 9.0, 16.0, 6.0, 5.0, 7.0, 1.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.0548725128173828, -1.0247845649719238, -0.9946966171264648, -0.9646086692810059, -0.9345207214355469, -0.9044327735900879, -0.8743448257446289, -0.8442568778991699, -0.8141689300537109, -0.784080982208252, -0.753993034362793, -0.723905086517334, -0.693817138671875, -0.663729190826416, -0.633641242980957, -0.603553295135498, -0.5734653472900391, -0.5433773994445801, -0.5132894515991211, -0.4832015037536621, -0.4531135559082031, -0.42302560806274414, -0.39293766021728516, -0.36284971237182617, -0.3327617645263672, -0.3026738166809082, -0.2725858688354492, -0.24249792098999023, -0.21240997314453125, -0.18232202529907227, -0.15223407745361328, -0.1221461296081543, -0.09205824136734009, -0.061970293521881104, -0.03188234567642212, -0.0017943978309631348, 0.02829355001449585, 0.058381497859954834, 0.08846944570541382, 0.1185573935508728, 0.1486453413963318, 0.17873328924179077, 0.20882123708724976, 0.23890918493270874, 0.2689971327781677, 0.2990850806236267, 0.3291730284690857, 0.3592609763145447, 0.38934892416000366, 0.41943687200546265, 0.44952481985092163, 0.4796127676963806, 0.5097007155418396, 0.5397886633872986, 0.5698766112327576, 0.5999645590782166, 0.6300525069236755, 0.6601404547691345, 0.6902284026145935, 0.7203163504600525, 0.7504042983055115, 0.7804922461509705, 0.8105801939964294, 0.8406681418418884, 0.8707560896873474]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 6.0, 6.0, 4.0, 8.0, 11.0, 16.0, 18.0, 31.0, 55.0, 63.0, 90.0, 137.0, 191.0, 337.0, 496.0, 838.0, 1498.0, 2998.0, 7223.0, 21487.0, 108613.0, 738442.0, 127609.0, 23683.0, 7444.0, 3236.0, 1596.0, 901.0, 522.0, 324.0, 201.0, 143.0, 106.0, 64.0, 41.0, 38.0, 19.0, 23.0, 15.0, 10.0, 5.0, 5.0, 1.0, 3.0, 2.0, 4.0, 2.0, 0.0, 2.0], "bins": [-1.3251953125, -1.2889251708984375, -1.252655029296875, -1.2163848876953125, -1.18011474609375, -1.1438446044921875, -1.107574462890625, -1.0713043212890625, -1.0350341796875, -0.9987640380859375, -0.962493896484375, -0.9262237548828125, -0.88995361328125, -0.8536834716796875, -0.817413330078125, -0.7811431884765625, -0.744873046875, -0.7086029052734375, -0.672332763671875, -0.6360626220703125, -0.59979248046875, -0.5635223388671875, -0.527252197265625, -0.4909820556640625, -0.4547119140625, -0.4184417724609375, -0.382171630859375, -0.3459014892578125, -0.30963134765625, -0.2733612060546875, -0.237091064453125, -0.2008209228515625, -0.16455078125, -0.1282806396484375, -0.092010498046875, -0.0557403564453125, -0.01947021484375, 0.0167999267578125, 0.053070068359375, 0.0893402099609375, 0.1256103515625, 0.1618804931640625, 0.198150634765625, 0.2344207763671875, 0.27069091796875, 0.3069610595703125, 0.343231201171875, 0.3795013427734375, 0.415771484375, 0.4520416259765625, 0.488311767578125, 0.5245819091796875, 0.56085205078125, 0.5971221923828125, 0.633392333984375, 0.6696624755859375, 0.7059326171875, 0.7422027587890625, 0.778472900390625, 0.8147430419921875, 0.85101318359375, 0.8872833251953125, 0.923553466796875, 0.9598236083984375, 0.99609375]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 6.0, 4.0, 9.0, 12.0, 14.0, 14.0, 19.0, 33.0, 42.0, 62.0, 69.0, 69.0, 78.0, 64.0, 61.0, 75.0, 61.0, 59.0, 43.0, 51.0, 33.0, 31.0, 20.0, 16.0, 13.0, 4.0, 9.0, 11.0, 7.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.7109375, -2.638031005859375, -2.56512451171875, -2.492218017578125, -2.4193115234375, -2.346405029296875, -2.27349853515625, -2.200592041015625, -2.127685546875, -2.054779052734375, -1.98187255859375, -1.908966064453125, -1.8360595703125, -1.763153076171875, -1.69024658203125, -1.617340087890625, -1.54443359375, -1.471527099609375, -1.39862060546875, -1.325714111328125, -1.2528076171875, -1.179901123046875, -1.10699462890625, -1.034088134765625, -0.961181640625, -0.888275146484375, -0.81536865234375, -0.742462158203125, -0.6695556640625, -0.596649169921875, -0.52374267578125, -0.450836181640625, -0.3779296875, -0.305023193359375, -0.23211669921875, -0.159210205078125, -0.0863037109375, -0.013397216796875, 0.05950927734375, 0.132415771484375, 0.205322265625, 0.278228759765625, 0.35113525390625, 0.424041748046875, 0.4969482421875, 0.569854736328125, 0.64276123046875, 0.715667724609375, 0.78857421875, 0.861480712890625, 0.93438720703125, 1.007293701171875, 1.0802001953125, 1.153106689453125, 1.22601318359375, 1.298919677734375, 1.371826171875, 1.444732666015625, 1.51763916015625, 1.590545654296875, 1.6634521484375, 1.736358642578125, 1.80926513671875, 1.882171630859375, 1.955078125]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 6.0, 1.0, 4.0, 11.0, 11.0, 13.0, 19.0, 28.0, 33.0, 79.0, 104.0, 157.0, 299.0, 571.0, 1326.0, 3629.0, 13248.0, 88321.0, 797149.0, 120275.0, 16043.0, 4167.0, 1564.0, 694.0, 331.0, 173.0, 106.0, 59.0, 47.0, 26.0, 19.0, 17.0, 6.0, 5.0, 3.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.1962890625, -1.1595458984375, -1.122802734375, -1.0860595703125, -1.04931640625, -1.0125732421875, -0.975830078125, -0.9390869140625, -0.90234375, -0.8656005859375, -0.828857421875, -0.7921142578125, -0.75537109375, -0.7186279296875, -0.681884765625, -0.6451416015625, -0.6083984375, -0.5716552734375, -0.534912109375, -0.4981689453125, -0.46142578125, -0.4246826171875, -0.387939453125, -0.3511962890625, -0.314453125, -0.2777099609375, -0.240966796875, -0.2042236328125, -0.16748046875, -0.1307373046875, -0.093994140625, -0.0572509765625, -0.0205078125, 0.0162353515625, 0.052978515625, 0.0897216796875, 0.12646484375, 0.1632080078125, 0.199951171875, 0.2366943359375, 0.2734375, 0.3101806640625, 0.346923828125, 0.3836669921875, 0.42041015625, 0.4571533203125, 0.493896484375, 0.5306396484375, 0.5673828125, 0.6041259765625, 0.640869140625, 0.6776123046875, 0.71435546875, 0.7510986328125, 0.787841796875, 0.8245849609375, 0.861328125, 0.8980712890625, 0.934814453125, 0.9715576171875, 1.00830078125, 1.0450439453125, 1.081787109375, 1.1185302734375, 1.1552734375]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 8.0, 7.0, 15.0, 14.0, 18.0, 14.0, 22.0, 19.0, 27.0, 33.0, 35.0, 36.0, 46.0, 36.0, 42.0, 37.0, 57.0, 47.0, 38.0, 44.0, 47.0, 49.0, 42.0, 39.0, 40.0, 35.0, 27.0, 25.0, 15.0, 23.0, 14.0, 8.0, 5.0, 10.0, 5.0, 4.0, 4.0, 3.0, 7.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9296875, -1.8651123046875, -1.800537109375, -1.7359619140625, -1.67138671875, -1.6068115234375, -1.542236328125, -1.4776611328125, -1.4130859375, -1.3485107421875, -1.283935546875, -1.2193603515625, -1.15478515625, -1.0902099609375, -1.025634765625, -0.9610595703125, -0.896484375, -0.8319091796875, -0.767333984375, -0.7027587890625, -0.63818359375, -0.5736083984375, -0.509033203125, -0.4444580078125, -0.3798828125, -0.3153076171875, -0.250732421875, -0.1861572265625, -0.12158203125, -0.0570068359375, 0.007568359375, 0.0721435546875, 0.13671875, 0.2012939453125, 0.265869140625, 0.3304443359375, 0.39501953125, 0.4595947265625, 0.524169921875, 0.5887451171875, 0.6533203125, 0.7178955078125, 0.782470703125, 0.8470458984375, 0.91162109375, 0.9761962890625, 1.040771484375, 1.1053466796875, 1.169921875, 1.2344970703125, 1.299072265625, 1.3636474609375, 1.42822265625, 1.4927978515625, 1.557373046875, 1.6219482421875, 1.6865234375, 1.7510986328125, 1.815673828125, 1.8802490234375, 1.94482421875, 2.0093994140625, 2.073974609375, 2.1385498046875, 2.203125]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 5.0, 4.0, 2.0, 6.0, 6.0, 6.0, 20.0, 20.0, 20.0, 49.0, 71.0, 120.0, 206.0, 457.0, 1058.0, 3094.0, 11274.0, 61202.0, 672140.0, 257431.0, 31114.0, 6634.0, 2099.0, 765.0, 340.0, 163.0, 81.0, 50.0, 37.0, 26.0, 18.0, 12.0, 7.0, 8.0, 7.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.38134765625, -0.36936187744140625, -0.3573760986328125, -0.34539031982421875, -0.333404541015625, -0.32141876220703125, -0.3094329833984375, -0.29744720458984375, -0.28546142578125, -0.27347564697265625, -0.2614898681640625, -0.24950408935546875, -0.237518310546875, -0.22553253173828125, -0.2135467529296875, -0.20156097412109375, -0.1895751953125, -0.17758941650390625, -0.1656036376953125, -0.15361785888671875, -0.141632080078125, -0.12964630126953125, -0.1176605224609375, -0.10567474365234375, -0.09368896484375, -0.08170318603515625, -0.0697174072265625, -0.05773162841796875, -0.045745849609375, -0.03376007080078125, -0.0217742919921875, -0.00978851318359375, 0.002197265625, 0.01418304443359375, 0.0261688232421875, 0.03815460205078125, 0.050140380859375, 0.06212615966796875, 0.0741119384765625, 0.08609771728515625, 0.09808349609375, 0.11006927490234375, 0.1220550537109375, 0.13404083251953125, 0.146026611328125, 0.15801239013671875, 0.1699981689453125, 0.18198394775390625, 0.1939697265625, 0.20595550537109375, 0.2179412841796875, 0.22992706298828125, 0.241912841796875, 0.25389862060546875, 0.2658843994140625, 0.27787017822265625, 0.28985595703125, 0.30184173583984375, 0.3138275146484375, 0.32581329345703125, 0.337799072265625, 0.34978485107421875, 0.3617706298828125, 0.37375640869140625, 0.3857421875]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 6.0, 6.0, 3.0, 3.0, 12.0, 14.0, 21.0, 25.0, 26.0, 40.0, 50.0, 84.0, 219.0, 165.0, 103.0, 56.0, 39.0, 37.0, 19.0, 24.0, 23.0, 4.0, 7.0, 3.0, 1.0, 1.0, 7.0, 5.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.9485435485839844e-05, -5.75091689825058e-05, -5.553290247917175e-05, -5.355663597583771e-05, -5.158036947250366e-05, -4.960410296916962e-05, -4.762783646583557e-05, -4.5651569962501526e-05, -4.367530345916748e-05, -4.1699036955833435e-05, -3.972277045249939e-05, -3.7746503949165344e-05, -3.57702374458313e-05, -3.3793970942497253e-05, -3.181770443916321e-05, -2.9841437935829163e-05, -2.7865171432495117e-05, -2.5888904929161072e-05, -2.3912638425827026e-05, -2.193637192249298e-05, -1.9960105419158936e-05, -1.798383891582489e-05, -1.6007572412490845e-05, -1.40313059091568e-05, -1.2055039405822754e-05, -1.0078772902488708e-05, -8.102506399154663e-06, -6.126239895820618e-06, -4.149973392486572e-06, -2.173706889152527e-06, -1.9744038581848145e-07, 1.778826117515564e-06, 3.7550926208496094e-06, 5.731359124183655e-06, 7.7076256275177e-06, 9.683892130851746e-06, 1.1660158634185791e-05, 1.3636425137519836e-05, 1.5612691640853882e-05, 1.7588958144187927e-05, 1.9565224647521973e-05, 2.1541491150856018e-05, 2.3517757654190063e-05, 2.549402415752411e-05, 2.7470290660858154e-05, 2.94465571641922e-05, 3.1422823667526245e-05, 3.339909017086029e-05, 3.5375356674194336e-05, 3.735162317752838e-05, 3.932788968086243e-05, 4.130415618419647e-05, 4.328042268753052e-05, 4.525668919086456e-05, 4.723295569419861e-05, 4.9209222197532654e-05, 5.11854887008667e-05, 5.3161755204200745e-05, 5.513802170753479e-05, 5.7114288210868835e-05, 5.909055471420288e-05, 6.106682121753693e-05, 6.304308772087097e-05, 6.501935422420502e-05, 6.699562072753906e-05]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 7.0, 5.0, 9.0, 9.0, 11.0, 24.0, 25.0, 61.0, 78.0, 144.0, 274.0, 527.0, 1086.0, 2480.0, 6777.0, 21568.0, 99485.0, 687964.0, 179279.0, 33402.0, 9230.0, 3356.0, 1389.0, 612.0, 298.0, 163.0, 95.0, 88.0, 34.0, 21.0, 16.0, 13.0, 9.0, 11.0, 5.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.421142578125, -0.4105224609375, -0.39990234375, -0.3892822265625, -0.378662109375, -0.3680419921875, -0.357421875, -0.3468017578125, -0.336181640625, -0.3255615234375, -0.31494140625, -0.3043212890625, -0.293701171875, -0.2830810546875, -0.2724609375, -0.2618408203125, -0.251220703125, -0.2406005859375, -0.22998046875, -0.2193603515625, -0.208740234375, -0.1981201171875, -0.1875, -0.1768798828125, -0.166259765625, -0.1556396484375, -0.14501953125, -0.1343994140625, -0.123779296875, -0.1131591796875, -0.1025390625, -0.0919189453125, -0.081298828125, -0.0706787109375, -0.06005859375, -0.0494384765625, -0.038818359375, -0.0281982421875, -0.017578125, -0.0069580078125, 0.003662109375, 0.0142822265625, 0.02490234375, 0.0355224609375, 0.046142578125, 0.0567626953125, 0.0673828125, 0.0780029296875, 0.088623046875, 0.0992431640625, 0.10986328125, 0.1204833984375, 0.131103515625, 0.1417236328125, 0.15234375, 0.1629638671875, 0.173583984375, 0.1842041015625, 0.19482421875, 0.2054443359375, 0.216064453125, 0.2266845703125, 0.2373046875, 0.2479248046875, 0.258544921875]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 0.0, 5.0, 3.0, 5.0, 5.0, 9.0, 5.0, 11.0, 21.0, 14.0, 17.0, 20.0, 17.0, 32.0, 42.0, 37.0, 49.0, 60.0, 88.0, 144.0, 72.0, 53.0, 47.0, 46.0, 40.0, 28.0, 29.0, 13.0, 13.0, 8.0, 11.0, 10.0, 6.0, 8.0, 5.0, 4.0, 2.0, 4.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.09735107421875, -0.09414386749267578, -0.09093666076660156, -0.08772945404052734, -0.08452224731445312, -0.0813150405883789, -0.07810783386230469, -0.07490062713623047, -0.07169342041015625, -0.06848621368408203, -0.06527900695800781, -0.062071800231933594, -0.058864593505859375, -0.055657386779785156, -0.05245018005371094, -0.04924297332763672, -0.0460357666015625, -0.04282855987548828, -0.03962135314941406, -0.036414146423339844, -0.033206939697265625, -0.029999732971191406, -0.026792526245117188, -0.02358531951904297, -0.02037811279296875, -0.01717090606689453, -0.013963699340820312, -0.010756492614746094, -0.007549285888671875, -0.004342079162597656, -0.0011348724365234375, 0.0020723342895507812, 0.005279541015625, 0.008486747741699219, 0.011693954467773438, 0.014901161193847656, 0.018108367919921875, 0.021315574645996094, 0.024522781372070312, 0.02772998809814453, 0.03093719482421875, 0.03414440155029297, 0.03735160827636719, 0.040558815002441406, 0.043766021728515625, 0.046973228454589844, 0.05018043518066406, 0.05338764190673828, 0.0565948486328125, 0.05980205535888672, 0.06300926208496094, 0.06621646881103516, 0.06942367553710938, 0.0726308822631836, 0.07583808898925781, 0.07904529571533203, 0.08225250244140625, 0.08545970916748047, 0.08866691589355469, 0.0918741226196289, 0.09508132934570312, 0.09828853607177734, 0.10149574279785156, 0.10470294952392578, 0.10791015625]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 7.0, 3.0, 11.0, 10.0, 17.0, 40.0, 76.0, 147.0, 200.0, 209.0, 110.0, 72.0, 44.0, 26.0, 9.0, 7.0, 5.0, 4.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.891600608825684, -6.738542556762695, -6.585484504699707, -6.4324259757995605, -6.279367923736572, -6.126309871673584, -5.973251819610596, -5.820193290710449, -5.667135238647461, -5.514077186584473, -5.361019134521484, -5.207960605621338, -5.05490255355835, -4.901844501495361, -4.748786449432373, -4.595727920532227, -4.442669868469238, -4.28961181640625, -4.136553764343262, -3.9834954738616943, -3.830437183380127, -3.6773791313171387, -3.5243210792541504, -3.371262788772583, -3.218204975128174, -3.0651469230651855, -2.912088632583618, -2.75903058052063, -2.6059722900390625, -2.452914237976074, -2.299856185913086, -2.1467978954315186, -1.993739366531372, -1.8406811952590942, -1.6876230239868164, -1.5345649719238281, -1.3815066814422607, -1.2284486293792725, -1.0753904581069946, -0.9223322868347168, -0.769274115562439, -0.6162159442901611, -0.4631578028202057, -0.31009966135025024, -0.1570414900779724, -0.00398331880569458, 0.14907479286193848, 0.3021329641342163, 0.45519113540649414, 0.608249306678772, 0.7613074779510498, 0.9143655896186829, 1.0674238204956055, 1.2204818725585938, 1.3735400438308716, 1.5265982151031494, 1.6796563863754272, 1.832714557647705, 1.985772728919983, 2.1388309001922607, 2.291888952255249, 2.4449472427368164, 2.5980052947998047, 2.751063346862793, 2.9041216373443604]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 5.0, 12.0, 9.0, 14.0, 6.0, 15.0, 8.0, 23.0, 15.0, 27.0, 28.0, 25.0, 22.0, 38.0, 24.0, 42.0, 50.0, 36.0, 48.0, 40.0, 37.0, 28.0, 43.0, 39.0, 27.0, 31.0, 33.0, 28.0, 32.0, 26.0, 41.0, 23.0, 22.0, 13.0, 16.0, 19.0, 8.0, 7.0, 9.0, 6.0, 5.0, 4.0, 9.0, 4.0, 3.0, 3.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.975710391998291, -2.8761162757873535, -2.776522159576416, -2.6769280433654785, -2.57733416557312, -2.4777400493621826, -2.378145933151245, -2.2785518169403076, -2.178957939147949, -2.0793638229370117, -1.9797698259353638, -1.8801757097244263, -1.7805817127227783, -1.6809875965118408, -1.5813934803009033, -1.4817993640899658, -1.3822052478790283, -1.2826111316680908, -1.1830171346664429, -1.0834230184555054, -0.9838289618492126, -0.8842349052429199, -0.7846407890319824, -0.6850467324256897, -0.585452675819397, -0.48585861921310425, -0.38626453280448914, -0.286670446395874, -0.1870763897895813, -0.08748233318328857, 0.012111783027648926, 0.11170583963394165, 0.21129965782165527, 0.310893714427948, 0.4104878008365631, 0.5100818872451782, 0.609675943851471, 0.7092700004577637, 0.8088641166687012, 0.9084581732749939, 1.0080522298812866, 1.1076463460922241, 1.207240343093872, 1.3068344593048096, 1.406428575515747, 1.506022572517395, 1.6056166887283325, 1.7052106857299805, 1.804804801940918, 1.9043989181518555, 2.003993034362793, 2.1035871505737305, 2.203181028366089, 2.3027751445770264, 2.402369260787964, 2.5019633769989014, 2.6015572547912598, 2.7011513710021973, 2.8007454872131348, 2.9003396034240723, 2.9999334812164307, 3.099527597427368, 3.1991217136383057, 3.298715829849243, 3.3983099460601807]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 4.0, 6.0, 6.0, 16.0, 10.0, 20.0, 43.0, 57.0, 75.0, 121.0, 200.0, 337.0, 571.0, 1002.0, 1858.0, 4039.0, 11407.0, 47108.0, 665739.0, 3288974.0, 138788.0, 21137.0, 6699.0, 2774.0, 1327.0, 794.0, 412.0, 237.0, 165.0, 112.0, 68.0, 55.0, 38.0, 31.0, 14.0, 6.0, 13.0, 4.0, 6.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.10546875, -2.04400634765625, -1.9825439453125, -1.92108154296875, -1.859619140625, -1.79815673828125, -1.7366943359375, -1.67523193359375, -1.61376953125, -1.55230712890625, -1.4908447265625, -1.42938232421875, -1.367919921875, -1.30645751953125, -1.2449951171875, -1.18353271484375, -1.1220703125, -1.06060791015625, -0.9991455078125, -0.93768310546875, -0.876220703125, -0.81475830078125, -0.7532958984375, -0.69183349609375, -0.63037109375, -0.56890869140625, -0.5074462890625, -0.44598388671875, -0.384521484375, -0.32305908203125, -0.2615966796875, -0.20013427734375, -0.138671875, -0.07720947265625, -0.0157470703125, 0.04571533203125, 0.107177734375, 0.16864013671875, 0.2301025390625, 0.29156494140625, 0.35302734375, 0.41448974609375, 0.4759521484375, 0.53741455078125, 0.598876953125, 0.66033935546875, 0.7218017578125, 0.78326416015625, 0.8447265625, 0.90618896484375, 0.9676513671875, 1.02911376953125, 1.090576171875, 1.15203857421875, 1.2135009765625, 1.27496337890625, 1.33642578125, 1.39788818359375, 1.4593505859375, 1.52081298828125, 1.582275390625, 1.64373779296875, 1.7052001953125, 1.76666259765625, 1.828125]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 4.0, 3.0, 5.0, 3.0, 9.0, 8.0, 10.0, 19.0, 7.0, 29.0, 40.0, 42.0, 35.0, 42.0, 56.0, 58.0, 64.0, 61.0, 56.0, 61.0, 58.0, 54.0, 60.0, 45.0, 26.0, 26.0, 23.0, 16.0, 17.0, 14.0, 5.0, 18.0, 7.0, 4.0, 3.0, 5.0, 3.0, 6.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.0556640625, -1.02392578125, -0.9921875, -0.96044921875, -0.9287109375, -0.89697265625, -0.865234375, -0.83349609375, -0.8017578125, -0.77001953125, -0.73828125, -0.70654296875, -0.6748046875, -0.64306640625, -0.611328125, -0.57958984375, -0.5478515625, -0.51611328125, -0.484375, -0.45263671875, -0.4208984375, -0.38916015625, -0.357421875, -0.32568359375, -0.2939453125, -0.26220703125, -0.23046875, -0.19873046875, -0.1669921875, -0.13525390625, -0.103515625, -0.07177734375, -0.0400390625, -0.00830078125, 0.0234375, 0.05517578125, 0.0869140625, 0.11865234375, 0.150390625, 0.18212890625, 0.2138671875, 0.24560546875, 0.27734375, 0.30908203125, 0.3408203125, 0.37255859375, 0.404296875, 0.43603515625, 0.4677734375, 0.49951171875, 0.53125, 0.56298828125, 0.5947265625, 0.62646484375, 0.658203125, 0.68994140625, 0.7216796875, 0.75341796875, 0.78515625, 0.81689453125, 0.8486328125, 0.88037109375, 0.912109375, 0.94384765625, 0.9755859375]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 9.0, 1.0, 3.0, 10.0, 11.0, 27.0, 34.0, 43.0, 81.0, 139.0, 343.0, 776.0, 2872.0, 16572.0, 253535.0, 3823007.0, 85028.0, 8862.0, 1863.0, 548.0, 237.0, 95.0, 58.0, 29.0, 25.0, 16.0, 17.0, 11.0, 5.0, 3.0, 4.0, 8.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.349609375, -2.26953125, -2.189453125, -2.109375, -2.029296875, -1.94921875, -1.869140625, -1.7890625, -1.708984375, -1.62890625, -1.548828125, -1.46875, -1.388671875, -1.30859375, -1.228515625, -1.1484375, -1.068359375, -0.98828125, -0.908203125, -0.828125, -0.748046875, -0.66796875, -0.587890625, -0.5078125, -0.427734375, -0.34765625, -0.267578125, -0.1875, -0.107421875, -0.02734375, 0.052734375, 0.1328125, 0.212890625, 0.29296875, 0.373046875, 0.453125, 0.533203125, 0.61328125, 0.693359375, 0.7734375, 0.853515625, 0.93359375, 1.013671875, 1.09375, 1.173828125, 1.25390625, 1.333984375, 1.4140625, 1.494140625, 1.57421875, 1.654296875, 1.734375, 1.814453125, 1.89453125, 1.974609375, 2.0546875, 2.134765625, 2.21484375, 2.294921875, 2.375, 2.455078125, 2.53515625, 2.615234375, 2.6953125, 2.775390625]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 12.0, 2.0, 5.0, 8.0, 11.0, 21.0, 19.0, 21.0, 35.0, 54.0, 64.0, 73.0, 108.0, 204.0, 295.0, 506.0, 693.0, 682.0, 414.0, 239.0, 155.0, 107.0, 81.0, 71.0, 43.0, 35.0, 16.0, 25.0, 22.0, 11.0, 13.0, 5.0, 6.0, 1.0, 4.0, 2.0, 2.0, 2.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.37158203125, -0.36061859130859375, -0.3496551513671875, -0.33869171142578125, -0.327728271484375, -0.31676483154296875, -0.3058013916015625, -0.29483795166015625, -0.28387451171875, -0.27291107177734375, -0.2619476318359375, -0.25098419189453125, -0.240020751953125, -0.22905731201171875, -0.2180938720703125, -0.20713043212890625, -0.1961669921875, -0.18520355224609375, -0.1742401123046875, -0.16327667236328125, -0.152313232421875, -0.14134979248046875, -0.1303863525390625, -0.11942291259765625, -0.10845947265625, -0.09749603271484375, -0.0865325927734375, -0.07556915283203125, -0.064605712890625, -0.05364227294921875, -0.0426788330078125, -0.03171539306640625, -0.020751953125, -0.00978851318359375, 0.0011749267578125, 0.01213836669921875, 0.023101806640625, 0.03406524658203125, 0.0450286865234375, 0.05599212646484375, 0.06695556640625, 0.07791900634765625, 0.0888824462890625, 0.09984588623046875, 0.110809326171875, 0.12177276611328125, 0.1327362060546875, 0.14369964599609375, 0.1546630859375, 0.16562652587890625, 0.1765899658203125, 0.18755340576171875, 0.198516845703125, 0.20948028564453125, 0.2204437255859375, 0.23140716552734375, 0.24237060546875, 0.25333404541015625, 0.2642974853515625, 0.27526092529296875, 0.286224365234375, 0.29718780517578125, 0.3081512451171875, 0.31911468505859375, 0.330078125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 5.0, 10.0, 10.0, 18.0, 15.0, 21.0, 21.0, 47.0, 67.0, 73.0, 96.0, 102.0, 102.0, 111.0, 81.0, 60.0, 43.0, 28.0, 19.0, 19.0, 19.0, 11.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2212915420532227, -1.1661452054977417, -1.1109989881515503, -1.0558526515960693, -1.000706434249878, -0.945560097694397, -0.8904138207435608, -0.8352675437927246, -0.7801212668418884, -0.7249749898910522, -0.6698287129402161, -0.6146824359893799, -0.5595360994338989, -0.5043898820877075, -0.44924354553222656, -0.3940972685813904, -0.3389509916305542, -0.283804714679718, -0.22865842282772064, -0.17351213097572327, -0.11836585402488708, -0.0632195770740509, -0.008073270320892334, 0.04707300662994385, 0.10221928358078003, 0.1573655605316162, 0.2125118523836136, 0.26765814423561096, 0.32280442118644714, 0.3779506981372833, 0.4330970048904419, 0.4882432818412781, 0.5433895587921143, 0.5985358357429504, 0.6536821126937866, 0.7088284492492676, 0.763974666595459, 0.8191210031509399, 0.8742672801017761, 0.9294135570526123, 0.9845598340034485, 1.0397061109542847, 1.0948524475097656, 1.149998664855957, 1.205145001411438, 1.2602912187576294, 1.3154375553131104, 1.3705837726593018, 1.4257301092147827, 1.4808764457702637, 1.536022663116455, 1.591168999671936, 1.6463152170181274, 1.7014615535736084, 1.7566077709197998, 1.8117541074752808, 1.8669004440307617, 1.9220467805862427, 1.977192997932434, 2.032339334487915, 2.0874855518341064, 2.142631769180298, 2.1977782249450684, 2.2529244422912598, 2.308070659637451]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 4.0, 6.0, 7.0, 9.0, 12.0, 12.0, 18.0, 16.0, 30.0, 28.0, 31.0, 44.0, 41.0, 39.0, 48.0, 56.0, 49.0, 57.0, 40.0, 41.0, 57.0, 48.0, 40.0, 44.0, 41.0, 32.0, 27.0, 23.0, 18.0, 19.0, 11.0, 7.0, 13.0, 11.0, 7.0, 5.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.1321346759796143, -1.0990865230560303, -1.0660383701324463, -1.0329902172088623, -0.9999420046806335, -0.9668938517570496, -0.9338456988334656, -0.9007975459098816, -0.8677493333816528, -0.8347011804580688, -0.8016530275344849, -0.7686048746109009, -0.7355566620826721, -0.7025085091590881, -0.6694603562355042, -0.6364122033119202, -0.6033640503883362, -0.5703158974647522, -0.5372677445411682, -0.5042195320129395, -0.47117137908935547, -0.4381232261657715, -0.4050750732421875, -0.3720269203186035, -0.33897873759269714, -0.30593058466911316, -0.2728824019432068, -0.2398342490196228, -0.20678608119487762, -0.17373791337013245, -0.14068976044654846, -0.10764159262180328, -0.07459348440170288, -0.041545320302248, -0.008497156202793121, 0.02455100417137146, 0.05759917199611664, 0.09064733982086182, 0.1236954927444458, 0.15674366056919098, 0.18979182839393616, 0.22283999621868134, 0.2558881640434265, 0.2889363169670105, 0.3219844698905945, 0.35503265261650085, 0.38808080554008484, 0.4211289882659912, 0.4541771411895752, 0.4872252941131592, 0.5202734470367432, 0.5533215999603271, 0.5863698124885559, 0.6194179654121399, 0.6524661183357239, 0.6855142712593079, 0.7185624837875366, 0.7516106367111206, 0.7846587896347046, 0.8177069425582886, 0.8507551550865173, 0.8838033080101013, 0.9168514609336853, 0.9498996138572693, 0.9829477667808533]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 6.0, 3.0, 7.0, 6.0, 20.0, 15.0, 30.0, 49.0, 63.0, 91.0, 141.0, 222.0, 413.0, 746.0, 1392.0, 2851.0, 6455.0, 17152.0, 63936.0, 327870.0, 479472.0, 106063.0, 25231.0, 8663.0, 3690.0, 1819.0, 885.0, 508.0, 286.0, 164.0, 102.0, 64.0, 48.0, 32.0, 24.0, 15.0, 8.0, 6.0, 4.0, 3.0, 5.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.306884765625, -0.2979011535644531, -0.28891754150390625, -0.2799339294433594, -0.2709503173828125, -0.2619667053222656, -0.25298309326171875, -0.24399948120117188, -0.235015869140625, -0.22603225708007812, -0.21704864501953125, -0.20806503295898438, -0.1990814208984375, -0.19009780883789062, -0.18111419677734375, -0.17213058471679688, -0.16314697265625, -0.15416336059570312, -0.14517974853515625, -0.13619613647460938, -0.1272125244140625, -0.11822891235351562, -0.10924530029296875, -0.10026168823242188, -0.091278076171875, -0.08229446411132812, -0.07331085205078125, -0.06432723999023438, -0.0553436279296875, -0.046360015869140625, -0.03737640380859375, -0.028392791748046875, -0.0194091796875, -0.010425567626953125, -0.00144195556640625, 0.007541656494140625, 0.0165252685546875, 0.025508880615234375, 0.03449249267578125, 0.043476104736328125, 0.052459716796875, 0.061443328857421875, 0.07042694091796875, 0.07941055297851562, 0.0883941650390625, 0.09737777709960938, 0.10636138916015625, 0.11534500122070312, 0.12432861328125, 0.13331222534179688, 0.14229583740234375, 0.15127944946289062, 0.1602630615234375, 0.16924667358398438, 0.17823028564453125, 0.18721389770507812, 0.196197509765625, 0.20518112182617188, 0.21416473388671875, 0.22314834594726562, 0.2321319580078125, 0.24111557006835938, 0.25009918212890625, 0.2590827941894531, 0.26806640625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 7.0, 3.0, 6.0, 10.0, 9.0, 9.0, 14.0, 17.0, 13.0, 31.0, 41.0, 39.0, 34.0, 43.0, 51.0, 46.0, 65.0, 49.0, 66.0, 62.0, 49.0, 52.0, 42.0, 47.0, 50.0, 32.0, 22.0, 16.0, 18.0, 9.0, 4.0, 13.0, 11.0, 7.0, 6.0, 5.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.91552734375, -0.8913116455078125, -0.867095947265625, -0.8428802490234375, -0.81866455078125, -0.7944488525390625, -0.770233154296875, -0.7460174560546875, -0.7218017578125, -0.6975860595703125, -0.673370361328125, -0.6491546630859375, -0.62493896484375, -0.6007232666015625, -0.576507568359375, -0.5522918701171875, -0.528076171875, -0.5038604736328125, -0.479644775390625, -0.4554290771484375, -0.43121337890625, -0.4069976806640625, -0.382781982421875, -0.3585662841796875, -0.3343505859375, -0.3101348876953125, -0.285919189453125, -0.2617034912109375, -0.23748779296875, -0.2132720947265625, -0.189056396484375, -0.1648406982421875, -0.140625, -0.1164093017578125, -0.092193603515625, -0.0679779052734375, -0.04376220703125, -0.0195465087890625, 0.004669189453125, 0.0288848876953125, 0.0531005859375, 0.0773162841796875, 0.101531982421875, 0.1257476806640625, 0.14996337890625, 0.1741790771484375, 0.198394775390625, 0.2226104736328125, 0.246826171875, 0.2710418701171875, 0.295257568359375, 0.3194732666015625, 0.34368896484375, 0.3679046630859375, 0.392120361328125, 0.4163360595703125, 0.4405517578125, 0.4647674560546875, 0.488983154296875, 0.5131988525390625, 0.53741455078125, 0.5616302490234375, 0.585845947265625, 0.6100616455078125, 0.63427734375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 7.0, 11.0, 18.0, 29.0, 54.0, 87.0, 172.0, 389.0, 987.0, 3346.0, 14774.0, 185781.0, 767864.0, 63755.0, 7988.0, 1984.0, 707.0, 290.0, 142.0, 65.0, 37.0, 19.0, 13.0, 8.0, 6.0, 10.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.419921875, -0.40607452392578125, -0.3922271728515625, -0.37837982177734375, -0.364532470703125, -0.35068511962890625, -0.3368377685546875, -0.32299041748046875, -0.30914306640625, -0.29529571533203125, -0.2814483642578125, -0.26760101318359375, -0.253753662109375, -0.23990631103515625, -0.2260589599609375, -0.21221160888671875, -0.1983642578125, -0.18451690673828125, -0.1706695556640625, -0.15682220458984375, -0.142974853515625, -0.12912750244140625, -0.1152801513671875, -0.10143280029296875, -0.08758544921875, -0.07373809814453125, -0.0598907470703125, -0.04604339599609375, -0.032196044921875, -0.01834869384765625, -0.0045013427734375, 0.00934600830078125, 0.023193359375, 0.03704071044921875, 0.0508880615234375, 0.06473541259765625, 0.078582763671875, 0.09243011474609375, 0.1062774658203125, 0.12012481689453125, 0.13397216796875, 0.14781951904296875, 0.1616668701171875, 0.17551422119140625, 0.189361572265625, 0.20320892333984375, 0.2170562744140625, 0.23090362548828125, 0.2447509765625, 0.25859832763671875, 0.2724456787109375, 0.28629302978515625, 0.300140380859375, 0.31398773193359375, 0.3278350830078125, 0.34168243408203125, 0.35552978515625, 0.36937713623046875, 0.3832244873046875, 0.39707183837890625, 0.410919189453125, 0.42476654052734375, 0.4386138916015625, 0.45246124267578125, 0.46630859375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 2.0, 8.0, 7.0, 10.0, 12.0, 10.0, 18.0, 24.0, 17.0, 27.0, 36.0, 36.0, 33.0, 32.0, 51.0, 45.0, 53.0, 58.0, 52.0, 59.0, 49.0, 43.0, 36.0, 37.0, 33.0, 34.0, 30.0, 29.0, 30.0, 11.0, 14.0, 15.0, 12.0, 8.0, 7.0, 7.0, 3.0, 2.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4501953125, -1.4057769775390625, -1.361358642578125, -1.3169403076171875, -1.27252197265625, -1.2281036376953125, -1.183685302734375, -1.1392669677734375, -1.0948486328125, -1.0504302978515625, -1.006011962890625, -0.9615936279296875, -0.91717529296875, -0.8727569580078125, -0.828338623046875, -0.7839202880859375, -0.739501953125, -0.6950836181640625, -0.650665283203125, -0.6062469482421875, -0.56182861328125, -0.5174102783203125, -0.472991943359375, -0.4285736083984375, -0.3841552734375, -0.3397369384765625, -0.295318603515625, -0.2509002685546875, -0.20648193359375, -0.1620635986328125, -0.117645263671875, -0.0732269287109375, -0.02880859375, 0.0156097412109375, 0.060028076171875, 0.1044464111328125, 0.14886474609375, 0.1932830810546875, 0.237701416015625, 0.2821197509765625, 0.3265380859375, 0.3709564208984375, 0.415374755859375, 0.4597930908203125, 0.50421142578125, 0.5486297607421875, 0.593048095703125, 0.6374664306640625, 0.681884765625, 0.7263031005859375, 0.770721435546875, 0.8151397705078125, 0.85955810546875, 0.9039764404296875, 0.948394775390625, 0.9928131103515625, 1.0372314453125, 1.0816497802734375, 1.126068115234375, 1.1704864501953125, 1.21490478515625, 1.2593231201171875, 1.303741455078125, 1.3481597900390625, 1.392578125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 5.0, 9.0, 9.0, 16.0, 20.0, 32.0, 33.0, 75.0, 97.0, 164.0, 358.0, 645.0, 1331.0, 3456.0, 11481.0, 64340.0, 647327.0, 278728.0, 29001.0, 7014.0, 2301.0, 976.0, 477.0, 285.0, 146.0, 92.0, 49.0, 33.0, 16.0, 16.0, 4.0, 7.0, 2.0, 5.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1302490234375, -0.1255626678466797, -0.12087631225585938, -0.11618995666503906, -0.11150360107421875, -0.10681724548339844, -0.10213088989257812, -0.09744453430175781, -0.0927581787109375, -0.08807182312011719, -0.08338546752929688, -0.07869911193847656, -0.07401275634765625, -0.06932640075683594, -0.06464004516601562, -0.05995368957519531, -0.055267333984375, -0.05058097839355469, -0.045894622802734375, -0.04120826721191406, -0.03652191162109375, -0.03183555603027344, -0.027149200439453125, -0.022462844848632812, -0.0177764892578125, -0.013090133666992188, -0.008403778076171875, -0.0037174224853515625, 0.00096893310546875, 0.0056552886962890625, 0.010341644287109375, 0.015027999877929688, 0.01971435546875, 0.024400711059570312, 0.029087066650390625, 0.03377342224121094, 0.03845977783203125, 0.04314613342285156, 0.047832489013671875, 0.05251884460449219, 0.0572052001953125, 0.06189155578613281, 0.06657791137695312, 0.07126426696777344, 0.07595062255859375, 0.08063697814941406, 0.08532333374023438, 0.09000968933105469, 0.094696044921875, 0.09938240051269531, 0.10406875610351562, 0.10875511169433594, 0.11344146728515625, 0.11812782287597656, 0.12281417846679688, 0.1275005340576172, 0.1321868896484375, 0.1368732452392578, 0.14155960083007812, 0.14624595642089844, 0.15093231201171875, 0.15561866760253906, 0.16030502319335938, 0.1649913787841797, 0.169677734375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 4.0, 4.0, 13.0, 7.0, 22.0, 23.0, 37.0, 54.0, 61.0, 84.0, 133.0, 125.0, 126.0, 75.0, 54.0, 61.0, 37.0, 26.0, 14.0, 11.0, 10.0, 6.0, 7.0, 0.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.693601608276367e-05, -6.479769945144653e-05, -6.26593828201294e-05, -6.0521066188812256e-05, -5.838274955749512e-05, -5.624443292617798e-05, -5.410611629486084e-05, -5.19677996635437e-05, -4.982948303222656e-05, -4.7691166400909424e-05, -4.5552849769592285e-05, -4.3414533138275146e-05, -4.127621650695801e-05, -3.913789987564087e-05, -3.699958324432373e-05, -3.486126661300659e-05, -3.272294998168945e-05, -3.0584633350372314e-05, -2.8446316719055176e-05, -2.6308000087738037e-05, -2.41696834564209e-05, -2.203136682510376e-05, -1.989305019378662e-05, -1.7754733562469482e-05, -1.5616416931152344e-05, -1.3478100299835205e-05, -1.1339783668518066e-05, -9.201467037200928e-06, -7.063150405883789e-06, -4.92483377456665e-06, -2.7865171432495117e-06, -6.48200511932373e-07, 1.4901161193847656e-06, 3.6284327507019043e-06, 5.766749382019043e-06, 7.905066013336182e-06, 1.004338264465332e-05, 1.2181699275970459e-05, 1.4320015907287598e-05, 1.6458332538604736e-05, 1.8596649169921875e-05, 2.0734965801239014e-05, 2.2873282432556152e-05, 2.501159906387329e-05, 2.714991569519043e-05, 2.928823232650757e-05, 3.142654895782471e-05, 3.3564865589141846e-05, 3.5703182220458984e-05, 3.784149885177612e-05, 3.997981548309326e-05, 4.21181321144104e-05, 4.425644874572754e-05, 4.639476537704468e-05, 4.8533082008361816e-05, 5.0671398639678955e-05, 5.2809715270996094e-05, 5.494803190231323e-05, 5.708634853363037e-05, 5.922466516494751e-05, 6.136298179626465e-05, 6.350129842758179e-05, 6.563961505889893e-05, 6.777793169021606e-05, 6.99162483215332e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 4.0, 9.0, 7.0, 18.0, 21.0, 28.0, 48.0, 95.0, 187.0, 260.0, 509.0, 869.0, 1836.0, 4094.0, 11278.0, 40574.0, 209933.0, 574915.0, 155738.0, 31891.0, 9171.0, 3510.0, 1648.0, 845.0, 470.0, 256.0, 115.0, 88.0, 39.0, 30.0, 22.0, 10.0, 13.0, 4.0, 5.0, 6.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.128173828125, -0.12455463409423828, -0.12093544006347656, -0.11731624603271484, -0.11369705200195312, -0.1100778579711914, -0.10645866394042969, -0.10283946990966797, -0.09922027587890625, -0.09560108184814453, -0.09198188781738281, -0.0883626937866211, -0.08474349975585938, -0.08112430572509766, -0.07750511169433594, -0.07388591766357422, -0.0702667236328125, -0.06664752960205078, -0.06302833557128906, -0.059409141540527344, -0.055789947509765625, -0.052170753479003906, -0.04855155944824219, -0.04493236541748047, -0.04131317138671875, -0.03769397735595703, -0.03407478332519531, -0.030455589294433594, -0.026836395263671875, -0.023217201232910156, -0.019598007202148438, -0.01597881317138672, -0.012359619140625, -0.008740425109863281, -0.0051212310791015625, -0.0015020370483398438, 0.002117156982421875, 0.005736351013183594, 0.009355545043945312, 0.012974739074707031, 0.01659393310546875, 0.02021312713623047, 0.023832321166992188, 0.027451515197753906, 0.031070709228515625, 0.034689903259277344, 0.03830909729003906, 0.04192829132080078, 0.0455474853515625, 0.04916667938232422, 0.05278587341308594, 0.056405067443847656, 0.060024261474609375, 0.0636434555053711, 0.06726264953613281, 0.07088184356689453, 0.07450103759765625, 0.07812023162841797, 0.08173942565917969, 0.0853586196899414, 0.08897781372070312, 0.09259700775146484, 0.09621620178222656, 0.09983539581298828, 0.10345458984375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 5.0, 2.0, 11.0, 9.0, 7.0, 9.0, 14.0, 18.0, 25.0, 20.0, 29.0, 40.0, 43.0, 55.0, 70.0, 93.0, 84.0, 74.0, 56.0, 55.0, 56.0, 50.0, 34.0, 21.0, 25.0, 19.0, 12.0, 17.0, 9.0, 4.0, 7.0, 5.0, 4.0, 2.0, 5.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.022705078125, -0.02191162109375, -0.0211181640625, -0.02032470703125, -0.01953125, -0.01873779296875, -0.0179443359375, -0.01715087890625, -0.016357421875, -0.01556396484375, -0.0147705078125, -0.01397705078125, -0.01318359375, -0.01239013671875, -0.0115966796875, -0.01080322265625, -0.010009765625, -0.00921630859375, -0.0084228515625, -0.00762939453125, -0.0068359375, -0.00604248046875, -0.0052490234375, -0.00445556640625, -0.003662109375, -0.00286865234375, -0.0020751953125, -0.00128173828125, -0.00048828125, 0.00030517578125, 0.0010986328125, 0.00189208984375, 0.002685546875, 0.00347900390625, 0.0042724609375, 0.00506591796875, 0.005859375, 0.00665283203125, 0.0074462890625, 0.00823974609375, 0.009033203125, 0.00982666015625, 0.0106201171875, 0.01141357421875, 0.01220703125, 0.01300048828125, 0.0137939453125, 0.01458740234375, 0.015380859375, 0.01617431640625, 0.0169677734375, 0.01776123046875, 0.0185546875, 0.01934814453125, 0.0201416015625, 0.02093505859375, 0.021728515625, 0.02252197265625, 0.0233154296875, 0.02410888671875, 0.02490234375, 0.02569580078125, 0.0264892578125, 0.02728271484375, 0.028076171875]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 2.0, 4.0, 6.0, 3.0, 13.0, 12.0, 9.0, 24.0, 30.0, 38.0, 57.0, 68.0, 95.0, 110.0, 116.0, 104.0, 83.0, 54.0, 49.0, 33.0, 24.0, 21.0, 8.0, 13.0, 8.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.8218085765838623, -0.7864886522293091, -0.7511687278747559, -0.7158488035202026, -0.6805288791656494, -0.6452089548110962, -0.6098890900611877, -0.5745691657066345, -0.5392492413520813, -0.5039293169975281, -0.46860939264297485, -0.433289498090744, -0.3979695737361908, -0.3626496493816376, -0.32732975482940674, -0.2920098304748535, -0.2566899061203003, -0.22136998176574707, -0.18605007231235504, -0.150730162858963, -0.11541023850440979, -0.08009031414985657, -0.04477040469646454, -0.00945049524307251, 0.025869429111480713, 0.06118934601545334, 0.09650926291942596, 0.131829172372818, 0.16714909672737122, 0.20246902108192444, 0.23778893053531647, 0.2731088399887085, 0.30842864513397217, 0.3437485694885254, 0.3790684938430786, 0.41438838839530945, 0.44970831274986267, 0.4850282371044159, 0.5203481316566467, 0.5556680560112, 0.5909879803657532, 0.6263079047203064, 0.6616278290748596, 0.6969477534294128, 0.7322676181793213, 0.7675875425338745, 0.8029074668884277, 0.838227391242981, 0.8735473155975342, 0.9088672399520874, 0.9441871643066406, 0.9795070886611938, 1.014827013015747, 1.0501469373703003, 1.0854668617248535, 1.1207866668701172, 1.15610671043396, 1.1914266347885132, 1.2267465591430664, 1.2620664834976196, 1.2973864078521729, 1.332706332206726, 1.3680262565612793, 1.403346061706543, 1.4386659860610962]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 0.0, 2.0, 3.0, 5.0, 8.0, 13.0, 11.0, 18.0, 16.0, 26.0, 35.0, 39.0, 49.0, 59.0, 60.0, 71.0, 59.0, 73.0, 58.0, 55.0, 65.0, 54.0, 53.0, 38.0, 33.0, 16.0, 16.0, 17.0, 16.0, 9.0, 10.0, 5.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.905998706817627, -0.8788833022117615, -0.8517679572105408, -0.8246525526046753, -0.7975372076034546, -0.7704218029975891, -0.7433063983917236, -0.7161910533905029, -0.6890757083892822, -0.6619603037834167, -0.634844958782196, -0.6077295541763306, -0.5806142091751099, -0.5534988045692444, -0.5263833999633789, -0.4992680549621582, -0.4721526503562927, -0.44503727555274963, -0.41792190074920654, -0.39080649614334106, -0.36369115114212036, -0.3365757465362549, -0.3094603717327118, -0.2823449969291687, -0.2552296221256256, -0.22811424732208252, -0.20099887251853943, -0.17388348281383514, -0.14676810801029205, -0.11965273320674896, -0.09253734350204468, -0.06542196869850159, -0.038306593894958496, -0.011191215366125107, 0.015924163162708282, 0.04303954541683197, 0.07015492022037506, 0.09727029502391815, 0.12438568472862244, 0.15150105953216553, 0.17861643433570862, 0.2057318091392517, 0.2328471839427948, 0.2599625587463379, 0.28707796335220337, 0.3141933083534241, 0.34130871295928955, 0.36842408776283264, 0.39553946256637573, 0.4226548373699188, 0.4497702121734619, 0.4768856167793274, 0.5040009617805481, 0.5311163663864136, 0.5582317113876343, 0.5853471159934998, 0.6124625205993652, 0.6395779252052307, 0.6666932702064514, 0.6938086748123169, 0.7209240198135376, 0.7480394244194031, 0.7751548290252686, 0.8022701740264893, 0.82938551902771]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 3.0, 7.0, 3.0, 6.0, 8.0, 16.0, 19.0, 37.0, 44.0, 71.0, 102.0, 164.0, 250.0, 397.0, 748.0, 1330.0, 2534.0, 5069.0, 10936.0, 32342.0, 449288.0, 489771.0, 33113.0, 11356.0, 5098.0, 2554.0, 1353.0, 709.0, 457.0, 245.0, 167.0, 122.0, 75.0, 46.0, 38.0, 21.0, 23.0, 12.0, 10.0, 11.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0], "bins": [-1.0546875, -1.0269393920898438, -0.9991912841796875, -0.9714431762695312, -0.943695068359375, -0.9159469604492188, -0.8881988525390625, -0.8604507446289062, -0.83270263671875, -0.8049545288085938, -0.7772064208984375, -0.7494583129882812, -0.721710205078125, -0.6939620971679688, -0.6662139892578125, -0.6384658813476562, -0.6107177734375, -0.5829696655273438, -0.5552215576171875, -0.5274734497070312, -0.499725341796875, -0.47197723388671875, -0.4442291259765625, -0.41648101806640625, -0.38873291015625, -0.36098480224609375, -0.3332366943359375, -0.30548858642578125, -0.277740478515625, -0.24999237060546875, -0.2222442626953125, -0.19449615478515625, -0.166748046875, -0.13899993896484375, -0.1112518310546875, -0.08350372314453125, -0.055755615234375, -0.02800750732421875, -0.0002593994140625, 0.02748870849609375, 0.05523681640625, 0.08298492431640625, 0.1107330322265625, 0.13848114013671875, 0.166229248046875, 0.19397735595703125, 0.2217254638671875, 0.24947357177734375, 0.2772216796875, 0.30496978759765625, 0.3327178955078125, 0.36046600341796875, 0.388214111328125, 0.41596221923828125, 0.4437103271484375, 0.47145843505859375, 0.49920654296875, 0.5269546508789062, 0.5547027587890625, 0.5824508666992188, 0.610198974609375, 0.6379470825195312, 0.6656951904296875, 0.6934432983398438, 0.72119140625]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 6.0, 2.0, 6.0, 5.0, 11.0, 7.0, 15.0, 20.0, 21.0, 22.0, 36.0, 40.0, 47.0, 62.0, 65.0, 59.0, 59.0, 76.0, 47.0, 61.0, 53.0, 63.0, 42.0, 32.0, 28.0, 23.0, 19.0, 16.0, 17.0, 10.0, 10.0, 8.0, 5.0, 7.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.98046875, -1.92718505859375, -1.8739013671875, -1.82061767578125, -1.767333984375, -1.71405029296875, -1.6607666015625, -1.60748291015625, -1.55419921875, -1.50091552734375, -1.4476318359375, -1.39434814453125, -1.341064453125, -1.28778076171875, -1.2344970703125, -1.18121337890625, -1.1279296875, -1.07464599609375, -1.0213623046875, -0.96807861328125, -0.914794921875, -0.86151123046875, -0.8082275390625, -0.75494384765625, -0.70166015625, -0.64837646484375, -0.5950927734375, -0.54180908203125, -0.488525390625, -0.43524169921875, -0.3819580078125, -0.32867431640625, -0.275390625, -0.22210693359375, -0.1688232421875, -0.11553955078125, -0.062255859375, -0.00897216796875, 0.0443115234375, 0.09759521484375, 0.15087890625, 0.20416259765625, 0.2574462890625, 0.31072998046875, 0.364013671875, 0.41729736328125, 0.4705810546875, 0.52386474609375, 0.5771484375, 0.63043212890625, 0.6837158203125, 0.73699951171875, 0.790283203125, 0.84356689453125, 0.8968505859375, 0.95013427734375, 1.00341796875, 1.05670166015625, 1.1099853515625, 1.16326904296875, 1.216552734375, 1.26983642578125, 1.3231201171875, 1.37640380859375, 1.4296875]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 1.0, 9.0, 6.0, 11.0, 7.0, 11.0, 14.0, 19.0, 24.0, 35.0, 37.0, 53.0, 89.0, 182.0, 672.0, 4554.0, 73163.0, 953092.0, 14239.0, 1645.0, 301.0, 115.0, 61.0, 43.0, 35.0, 32.0, 22.0, 23.0, 14.0, 9.0, 12.0, 8.0, 5.0, 3.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.416015625, -2.345458984375, -2.27490234375, -2.204345703125, -2.1337890625, -2.063232421875, -1.99267578125, -1.922119140625, -1.8515625, -1.781005859375, -1.71044921875, -1.639892578125, -1.5693359375, -1.498779296875, -1.42822265625, -1.357666015625, -1.287109375, -1.216552734375, -1.14599609375, -1.075439453125, -1.0048828125, -0.934326171875, -0.86376953125, -0.793212890625, -0.72265625, -0.652099609375, -0.58154296875, -0.510986328125, -0.4404296875, -0.369873046875, -0.29931640625, -0.228759765625, -0.158203125, -0.087646484375, -0.01708984375, 0.053466796875, 0.1240234375, 0.194580078125, 0.26513671875, 0.335693359375, 0.40625, 0.476806640625, 0.54736328125, 0.617919921875, 0.6884765625, 0.759033203125, 0.82958984375, 0.900146484375, 0.970703125, 1.041259765625, 1.11181640625, 1.182373046875, 1.2529296875, 1.323486328125, 1.39404296875, 1.464599609375, 1.53515625, 1.605712890625, 1.67626953125, 1.746826171875, 1.8173828125, 1.887939453125, 1.95849609375, 2.029052734375, 2.099609375]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 7.0, 4.0, 8.0, 11.0, 14.0, 13.0, 17.0, 21.0, 31.0, 31.0, 28.0, 30.0, 59.0, 51.0, 66.0, 54.0, 61.0, 62.0, 67.0, 55.0, 56.0, 37.0, 45.0, 31.0, 25.0, 24.0, 21.0, 17.0, 19.0, 9.0, 12.0, 5.0, 5.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2421875, -2.17352294921875, -2.1048583984375, -2.03619384765625, -1.967529296875, -1.89886474609375, -1.8302001953125, -1.76153564453125, -1.69287109375, -1.62420654296875, -1.5555419921875, -1.48687744140625, -1.418212890625, -1.34954833984375, -1.2808837890625, -1.21221923828125, -1.1435546875, -1.07489013671875, -1.0062255859375, -0.93756103515625, -0.868896484375, -0.80023193359375, -0.7315673828125, -0.66290283203125, -0.59423828125, -0.52557373046875, -0.4569091796875, -0.38824462890625, -0.319580078125, -0.25091552734375, -0.1822509765625, -0.11358642578125, -0.044921875, 0.02374267578125, 0.0924072265625, 0.16107177734375, 0.229736328125, 0.29840087890625, 0.3670654296875, 0.43572998046875, 0.50439453125, 0.57305908203125, 0.6417236328125, 0.71038818359375, 0.779052734375, 0.84771728515625, 0.9163818359375, 0.98504638671875, 1.0537109375, 1.12237548828125, 1.1910400390625, 1.25970458984375, 1.328369140625, 1.39703369140625, 1.4656982421875, 1.53436279296875, 1.60302734375, 1.67169189453125, 1.7403564453125, 1.80902099609375, 1.877685546875, 1.94635009765625, 2.0150146484375, 2.08367919921875, 2.15234375]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 7.0, 12.0, 12.0, 23.0, 41.0, 59.0, 114.0, 282.0, 696.0, 2193.0, 9182.0, 54986.0, 865182.0, 97721.0, 13381.0, 3128.0, 872.0, 333.0, 150.0, 73.0, 37.0, 30.0, 12.0, 10.0, 7.0, 7.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.388427734375, -0.3768730163574219, -0.36531829833984375, -0.3537635803222656, -0.3422088623046875, -0.3306541442871094, -0.31909942626953125, -0.3075447082519531, -0.295989990234375, -0.2844352722167969, -0.27288055419921875, -0.2613258361816406, -0.2497711181640625, -0.23821640014648438, -0.22666168212890625, -0.21510696411132812, -0.20355224609375, -0.19199752807617188, -0.18044281005859375, -0.16888809204101562, -0.1573333740234375, -0.14577865600585938, -0.13422393798828125, -0.12266921997070312, -0.111114501953125, -0.09955978393554688, -0.08800506591796875, -0.07645034790039062, -0.0648956298828125, -0.053340911865234375, -0.04178619384765625, -0.030231475830078125, -0.0186767578125, -0.007122039794921875, 0.00443267822265625, 0.015987396240234375, 0.0275421142578125, 0.039096832275390625, 0.05065155029296875, 0.062206268310546875, 0.073760986328125, 0.08531570434570312, 0.09687042236328125, 0.10842514038085938, 0.1199798583984375, 0.13153457641601562, 0.14308929443359375, 0.15464401245117188, 0.16619873046875, 0.17775344848632812, 0.18930816650390625, 0.20086288452148438, 0.2124176025390625, 0.22397232055664062, 0.23552703857421875, 0.24708175659179688, 0.258636474609375, 0.2701911926269531, 0.28174591064453125, 0.2933006286621094, 0.3048553466796875, 0.3164100646972656, 0.32796478271484375, 0.3395195007324219, 0.35107421875]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 6.0, 3.0, 13.0, 8.0, 13.0, 16.0, 17.0, 25.0, 33.0, 46.0, 69.0, 89.0, 173.0, 145.0, 95.0, 50.0, 36.0, 29.0, 26.0, 21.0, 20.0, 10.0, 6.0, 9.0, 5.0, 5.0, 5.0, 1.0, 3.0, 1.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.676248550415039e-05, -2.5949440896511078e-05, -2.5136396288871765e-05, -2.4323351681232452e-05, -2.351030707359314e-05, -2.2697262465953827e-05, -2.1884217858314514e-05, -2.10711732506752e-05, -2.025812864303589e-05, -1.9445084035396576e-05, -1.8632039427757263e-05, -1.781899482011795e-05, -1.7005950212478638e-05, -1.6192905604839325e-05, -1.5379860997200012e-05, -1.45668163895607e-05, -1.3753771781921387e-05, -1.2940727174282074e-05, -1.2127682566642761e-05, -1.1314637959003448e-05, -1.0501593351364136e-05, -9.688548743724823e-06, -8.87550413608551e-06, -8.062459528446198e-06, -7.249414920806885e-06, -6.436370313167572e-06, -5.623325705528259e-06, -4.8102810978889465e-06, -3.997236490249634e-06, -3.184191882610321e-06, -2.3711472749710083e-06, -1.5581026673316956e-06, -7.450580596923828e-07, 6.798654794692993e-08, 8.810311555862427e-07, 1.6940757632255554e-06, 2.507120370864868e-06, 3.320164978504181e-06, 4.133209586143494e-06, 4.946254193782806e-06, 5.759298801422119e-06, 6.572343409061432e-06, 7.385388016700745e-06, 8.198432624340057e-06, 9.01147723197937e-06, 9.824521839618683e-06, 1.0637566447257996e-05, 1.1450611054897308e-05, 1.2263655662536621e-05, 1.3076700270175934e-05, 1.3889744877815247e-05, 1.470278948545456e-05, 1.5515834093093872e-05, 1.6328878700733185e-05, 1.7141923308372498e-05, 1.795496791601181e-05, 1.8768012523651123e-05, 1.9581057131290436e-05, 2.039410173892975e-05, 2.120714634656906e-05, 2.2020190954208374e-05, 2.2833235561847687e-05, 2.3646280169487e-05, 2.4459324777126312e-05, 2.5272369384765625e-05]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 3.0, 6.0, 9.0, 16.0, 24.0, 39.0, 65.0, 107.0, 225.0, 437.0, 869.0, 1869.0, 5020.0, 15766.0, 83905.0, 831071.0, 84693.0, 15924.0, 4922.0, 1865.0, 806.0, 382.0, 202.0, 128.0, 80.0, 43.0, 26.0, 14.0, 14.0, 9.0, 4.0, 4.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.287353515625, -0.2772712707519531, -0.26718902587890625, -0.2571067810058594, -0.2470245361328125, -0.23694229125976562, -0.22686004638671875, -0.21677780151367188, -0.206695556640625, -0.19661331176757812, -0.18653106689453125, -0.17644882202148438, -0.1663665771484375, -0.15628433227539062, -0.14620208740234375, -0.13611984252929688, -0.12603759765625, -0.11595535278320312, -0.10587310791015625, -0.09579086303710938, -0.0857086181640625, -0.07562637329101562, -0.06554412841796875, -0.055461883544921875, -0.045379638671875, -0.035297393798828125, -0.02521514892578125, -0.015132904052734375, -0.0050506591796875, 0.005031585693359375, 0.01511383056640625, 0.025196075439453125, 0.0352783203125, 0.045360565185546875, 0.05544281005859375, 0.06552505493164062, 0.0756072998046875, 0.08568954467773438, 0.09577178955078125, 0.10585403442382812, 0.115936279296875, 0.12601852416992188, 0.13610076904296875, 0.14618301391601562, 0.1562652587890625, 0.16634750366210938, 0.17642974853515625, 0.18651199340820312, 0.19659423828125, 0.20667648315429688, 0.21675872802734375, 0.22684097290039062, 0.2369232177734375, 0.24700546264648438, 0.25708770751953125, 0.2671699523925781, 0.277252197265625, 0.2873344421386719, 0.29741668701171875, 0.3074989318847656, 0.3175811767578125, 0.3276634216308594, 0.33774566650390625, 0.3478279113769531, 0.35791015625]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 5.0, 4.0, 9.0, 8.0, 7.0, 13.0, 24.0, 28.0, 42.0, 70.0, 124.0, 280.0, 118.0, 62.0, 53.0, 46.0, 24.0, 20.0, 14.0, 7.0, 8.0, 9.0, 6.0, 6.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1495361328125, -0.1454477310180664, -0.1413593292236328, -0.13727092742919922, -0.13318252563476562, -0.12909412384033203, -0.12500572204589844, -0.12091732025146484, -0.11682891845703125, -0.11274051666259766, -0.10865211486816406, -0.10456371307373047, -0.10047531127929688, -0.09638690948486328, -0.09229850769042969, -0.0882101058959961, -0.0841217041015625, -0.0800333023071289, -0.07594490051269531, -0.07185649871826172, -0.06776809692382812, -0.06367969512939453, -0.05959129333496094, -0.055502891540527344, -0.05141448974609375, -0.047326087951660156, -0.04323768615722656, -0.03914928436279297, -0.035060882568359375, -0.03097248077392578, -0.026884078979492188, -0.022795677185058594, -0.018707275390625, -0.014618873596191406, -0.010530471801757812, -0.006442070007324219, -0.002353668212890625, 0.0017347335815429688, 0.0058231353759765625, 0.009911537170410156, 0.01399993896484375, 0.018088340759277344, 0.022176742553710938, 0.02626514434814453, 0.030353546142578125, 0.03444194793701172, 0.03853034973144531, 0.042618751525878906, 0.0467071533203125, 0.050795555114746094, 0.05488395690917969, 0.05897235870361328, 0.06306076049804688, 0.06714916229248047, 0.07123756408691406, 0.07532596588134766, 0.07941436767578125, 0.08350276947021484, 0.08759117126464844, 0.09167957305908203, 0.09576797485351562, 0.09985637664794922, 0.10394477844238281, 0.1080331802368164, 0.11212158203125]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 9.0, 12.0, 15.0, 24.0, 35.0, 50.0, 75.0, 109.0, 122.0, 134.0, 116.0, 97.0, 64.0, 50.0, 28.0, 20.0, 14.0, 13.0, 4.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.550902843475342, -3.458193778991699, -3.3654849529266357, -3.272775888442993, -3.1800670623779297, -3.087357997894287, -2.9946489334106445, -2.901939868927002, -2.8092310428619385, -2.716521978378296, -2.6238131523132324, -2.53110408782959, -2.4383950233459473, -2.345686197280884, -2.252977132797241, -2.1602683067321777, -2.067559242248535, -1.9748502969741821, -1.882141351699829, -1.7894322872161865, -1.6967233419418335, -1.6040143966674805, -1.511305332183838, -1.4185963869094849, -1.3258874416351318, -1.2331784963607788, -1.1404695510864258, -1.0477604866027832, -0.9550515413284302, -0.8623425960540771, -0.7696335911750793, -0.6769245862960815, -0.5842158794403076, -0.4915069043636322, -0.3987979292869568, -0.30608895421028137, -0.21337997913360596, -0.12067100405693054, -0.027962028980255127, 0.06474697589874268, 0.1574559211730957, 0.2501648962497711, 0.34287387132644653, 0.43558284640312195, 0.5282918214797974, 0.6210007667541504, 0.7137097716331482, 0.806418776512146, 0.899127721786499, 0.991836667060852, 1.084545612335205, 1.1772546768188477, 1.2699636220932007, 1.3626725673675537, 1.4553816318511963, 1.5480905771255493, 1.6407995223999023, 1.7335084676742554, 1.8262174129486084, 1.918926477432251, 2.0116353034973145, 2.104344367980957, 2.1970534324645996, 2.289762496948242, 2.3824713230133057]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 5.0, 4.0, 4.0, 5.0, 11.0, 4.0, 14.0, 18.0, 18.0, 19.0, 24.0, 31.0, 27.0, 37.0, 28.0, 33.0, 26.0, 36.0, 55.0, 38.0, 56.0, 39.0, 41.0, 47.0, 27.0, 54.0, 44.0, 33.0, 25.0, 28.0, 29.0, 28.0, 20.0, 23.0, 11.0, 9.0, 14.0, 10.0, 8.0, 2.0, 6.0, 4.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.0867416858673096, -2.9973676204681396, -2.9079935550689697, -2.8186194896698, -2.72924542427063, -2.639871597290039, -2.550497531890869, -2.461123466491699, -2.3717494010925293, -2.2823753356933594, -2.1930012702941895, -2.1036272048950195, -2.0142531394958496, -1.9248791933059692, -1.8355051279067993, -1.746131181716919, -1.6567569971084595, -1.5673829317092896, -1.4780088663101196, -1.3886349201202393, -1.2992608547210693, -1.2098867893218994, -1.1205127239227295, -1.0311386585235596, -0.9417646527290344, -0.8523905873298645, -0.7630165815353394, -0.6736425161361694, -0.5842684507369995, -0.49489444494247437, -0.40552037954330444, -0.3161463737487793, -0.22677230834960938, -0.13739827275276184, -0.04802422225475311, 0.041349828243255615, 0.13072386384010315, 0.22009789943695068, 0.3094719648361206, 0.39884597063064575, 0.4882200360298157, 0.5775941014289856, 0.6669681072235107, 0.7563421726226807, 0.8457162380218506, 0.9350902438163757, 1.0244643688201904, 1.1138383150100708, 1.2032123804092407, 1.2925864458084106, 1.3819605112075806, 1.471334457397461, 1.5607085227966309, 1.6500825881958008, 1.7394566535949707, 1.8288307189941406, 1.9182047843933105, 2.0075788497924805, 2.0969529151916504, 2.1863269805908203, 2.2757010459899902, 2.36507511138916, 2.45444917678833, 2.543823003768921, 2.633197069168091]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 6.0, 5.0, 8.0, 5.0, 5.0, 4.0, 12.0, 13.0, 20.0, 30.0, 34.0, 30.0, 61.0, 64.0, 97.0, 136.0, 237.0, 298.0, 541.0, 1068.0, 2160.0, 4891.0, 13094.0, 53144.0, 791164.0, 3163954.0, 126438.0, 23078.0, 7429.0, 2938.0, 1374.0, 706.0, 447.0, 248.0, 145.0, 97.0, 71.0, 60.0, 38.0, 39.0, 24.0, 19.0, 13.0, 12.0, 9.0, 4.0, 7.0, 7.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.4365234375, -1.3856048583984375, -1.334686279296875, -1.2837677001953125, -1.23284912109375, -1.1819305419921875, -1.131011962890625, -1.0800933837890625, -1.0291748046875, -0.9782562255859375, -0.927337646484375, -0.8764190673828125, -0.82550048828125, -0.7745819091796875, -0.723663330078125, -0.6727447509765625, -0.621826171875, -0.5709075927734375, -0.519989013671875, -0.4690704345703125, -0.41815185546875, -0.3672332763671875, -0.316314697265625, -0.2653961181640625, -0.2144775390625, -0.1635589599609375, -0.112640380859375, -0.0617218017578125, -0.01080322265625, 0.0401153564453125, 0.091033935546875, 0.1419525146484375, 0.19287109375, 0.2437896728515625, 0.294708251953125, 0.3456268310546875, 0.39654541015625, 0.4474639892578125, 0.498382568359375, 0.5493011474609375, 0.6002197265625, 0.6511383056640625, 0.702056884765625, 0.7529754638671875, 0.80389404296875, 0.8548126220703125, 0.905731201171875, 0.9566497802734375, 1.007568359375, 1.0584869384765625, 1.109405517578125, 1.1603240966796875, 1.21124267578125, 1.2621612548828125, 1.313079833984375, 1.3639984130859375, 1.4149169921875, 1.4658355712890625, 1.516754150390625, 1.5676727294921875, 1.61859130859375, 1.6695098876953125, 1.720428466796875, 1.7713470458984375, 1.822265625]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 4.0, 6.0, 5.0, 11.0, 13.0, 13.0, 18.0, 28.0, 34.0, 32.0, 48.0, 75.0, 86.0, 83.0, 70.0, 79.0, 68.0, 70.0, 52.0, 43.0, 39.0, 29.0, 26.0, 12.0, 18.0, 9.0, 8.0, 6.0, 5.0, 3.0, 4.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.3056640625, -1.27276611328125, -1.2398681640625, -1.20697021484375, -1.174072265625, -1.14117431640625, -1.1082763671875, -1.07537841796875, -1.04248046875, -1.00958251953125, -0.9766845703125, -0.94378662109375, -0.910888671875, -0.87799072265625, -0.8450927734375, -0.81219482421875, -0.779296875, -0.74639892578125, -0.7135009765625, -0.68060302734375, -0.647705078125, -0.61480712890625, -0.5819091796875, -0.54901123046875, -0.51611328125, -0.48321533203125, -0.4503173828125, -0.41741943359375, -0.384521484375, -0.35162353515625, -0.3187255859375, -0.28582763671875, -0.2529296875, -0.22003173828125, -0.1871337890625, -0.15423583984375, -0.121337890625, -0.08843994140625, -0.0555419921875, -0.02264404296875, 0.01025390625, 0.04315185546875, 0.0760498046875, 0.10894775390625, 0.141845703125, 0.17474365234375, 0.2076416015625, 0.24053955078125, 0.2734375, 0.30633544921875, 0.3392333984375, 0.37213134765625, 0.405029296875, 0.43792724609375, 0.4708251953125, 0.50372314453125, 0.53662109375, 0.56951904296875, 0.6024169921875, 0.63531494140625, 0.668212890625, 0.70111083984375, 0.7340087890625, 0.76690673828125, 0.7998046875]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 8.0, 8.0, 16.0, 12.0, 14.0, 25.0, 37.0, 74.0, 129.0, 334.0, 973.0, 4671.0, 44594.0, 3721165.0, 403785.0, 15034.0, 2306.0, 614.0, 206.0, 98.0, 55.0, 36.0, 31.0, 13.0, 13.0, 5.0, 7.0, 4.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.681640625, -2.59161376953125, -2.5015869140625, -2.41156005859375, -2.321533203125, -2.23150634765625, -2.1414794921875, -2.05145263671875, -1.96142578125, -1.87139892578125, -1.7813720703125, -1.69134521484375, -1.601318359375, -1.51129150390625, -1.4212646484375, -1.33123779296875, -1.2412109375, -1.15118408203125, -1.0611572265625, -0.97113037109375, -0.881103515625, -0.79107666015625, -0.7010498046875, -0.61102294921875, -0.52099609375, -0.43096923828125, -0.3409423828125, -0.25091552734375, -0.160888671875, -0.07086181640625, 0.0191650390625, 0.10919189453125, 0.19921875, 0.28924560546875, 0.3792724609375, 0.46929931640625, 0.559326171875, 0.64935302734375, 0.7393798828125, 0.82940673828125, 0.91943359375, 1.00946044921875, 1.0994873046875, 1.18951416015625, 1.279541015625, 1.36956787109375, 1.4595947265625, 1.54962158203125, 1.6396484375, 1.72967529296875, 1.8197021484375, 1.90972900390625, 1.999755859375, 2.08978271484375, 2.1798095703125, 2.26983642578125, 2.35986328125, 2.44989013671875, 2.5399169921875, 2.62994384765625, 2.719970703125, 2.80999755859375, 2.9000244140625, 2.99005126953125, 3.080078125]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 3.0, 6.0, 0.0, 4.0, 8.0, 15.0, 12.0, 16.0, 19.0, 36.0, 44.0, 48.0, 88.0, 131.0, 189.0, 344.0, 608.0, 913.0, 601.0, 362.0, 215.0, 124.0, 76.0, 55.0, 40.0, 26.0, 19.0, 20.0, 16.0, 11.0, 4.0, 8.0, 4.0, 2.0, 4.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.377197265625, -0.3648490905761719, -0.35250091552734375, -0.3401527404785156, -0.3278045654296875, -0.3154563903808594, -0.30310821533203125, -0.2907600402832031, -0.278411865234375, -0.2660636901855469, -0.25371551513671875, -0.24136734008789062, -0.2290191650390625, -0.21667098999023438, -0.20432281494140625, -0.19197463989257812, -0.17962646484375, -0.16727828979492188, -0.15493011474609375, -0.14258193969726562, -0.1302337646484375, -0.11788558959960938, -0.10553741455078125, -0.09318923950195312, -0.080841064453125, -0.06849288940429688, -0.05614471435546875, -0.043796539306640625, -0.0314483642578125, -0.019100189208984375, -0.00675201416015625, 0.005596160888671875, 0.0179443359375, 0.030292510986328125, 0.04264068603515625, 0.054988861083984375, 0.0673370361328125, 0.07968521118164062, 0.09203338623046875, 0.10438156127929688, 0.116729736328125, 0.12907791137695312, 0.14142608642578125, 0.15377426147460938, 0.1661224365234375, 0.17847061157226562, 0.19081878662109375, 0.20316696166992188, 0.21551513671875, 0.22786331176757812, 0.24021148681640625, 0.2525596618652344, 0.2649078369140625, 0.2772560119628906, 0.28960418701171875, 0.3019523620605469, 0.314300537109375, 0.3266487121582031, 0.33899688720703125, 0.3513450622558594, 0.3636932373046875, 0.3760414123535156, 0.38838958740234375, 0.4007377624511719, 0.4130859375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 2.0, 7.0, 7.0, 11.0, 15.0, 25.0, 18.0, 28.0, 26.0, 38.0, 50.0, 59.0, 78.0, 92.0, 78.0, 89.0, 70.0, 82.0, 45.0, 45.0, 32.0, 31.0, 17.0, 19.0, 8.0, 5.0, 5.0, 4.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1661241054534912, -1.1265599727630615, -1.0869957208633423, -1.0474315881729126, -1.007867455482483, -0.9683032631874084, -0.928739070892334, -0.8891749382019043, -0.8496107459068298, -0.8100465536117554, -0.7704824209213257, -0.7309182286262512, -0.6913540363311768, -0.6517899036407471, -0.6122257113456726, -0.5726615190505981, -0.5330973863601685, -0.4935332238674164, -0.4539690613746643, -0.41440486907958984, -0.37484070658683777, -0.3352765440940857, -0.29571235179901123, -0.25614818930625916, -0.21658402681350708, -0.177019864320755, -0.13745568692684174, -0.09789151698350906, -0.05832734704017639, -0.018763184547424316, 0.020800992846488953, 0.06036517024040222, 0.09992945194244385, 0.13949361443519592, 0.1790577918291092, 0.21862196922302246, 0.25818613171577454, 0.2977502942085266, 0.3373144865036011, 0.37687864899635315, 0.4164428114891052, 0.4560069739818573, 0.4955711364746094, 0.5351353287696838, 0.5746995210647583, 0.614263653755188, 0.6538278460502625, 0.6933920383453369, 0.7329561710357666, 0.7725203633308411, 0.8120844960212708, 0.8516486883163452, 0.8912128210067749, 0.9307770133018494, 0.9703412055969238, 1.0099053382873535, 1.0494694709777832, 1.089033603668213, 1.1285978555679321, 1.1681619882583618, 1.2077261209487915, 1.2472903728485107, 1.2868545055389404, 1.3264186382293701, 1.3659828901290894]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 8.0, 2.0, 8.0, 12.0, 6.0, 8.0, 14.0, 16.0, 19.0, 27.0, 21.0, 25.0, 35.0, 33.0, 56.0, 47.0, 48.0, 53.0, 47.0, 44.0, 50.0, 60.0, 40.0, 33.0, 39.0, 44.0, 28.0, 30.0, 20.0, 26.0, 19.0, 21.0, 11.0, 10.0, 10.0, 6.0, 11.0, 7.0, 3.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.0714930295944214, -1.0423909425735474, -1.0132887363433838, -0.984186589717865, -0.9550844430923462, -0.9259823560714722, -0.8968801498413086, -0.8677780628204346, -0.8386759161949158, -0.809573769569397, -0.7804716229438782, -0.7513694763183594, -0.7222673296928406, -0.6931651830673218, -0.6640630960464478, -0.634960949420929, -0.6058588027954102, -0.5767566561698914, -0.5476545095443726, -0.5185523629188538, -0.48945024609565735, -0.46034809947013855, -0.43124595284461975, -0.40214383602142334, -0.37304162979125977, -0.34393948316574097, -0.31483733654022217, -0.28573518991470337, -0.25663307309150696, -0.22753092646598816, -0.19842877984046936, -0.16932664811611176, -0.14022451639175415, -0.11112237721681595, -0.08202023804187775, -0.05291809141635895, -0.023815952241420746, 0.005286186933517456, 0.034388333559036255, 0.06349046528339386, 0.09259261190891266, 0.12169475108385086, 0.15079689025878906, 0.17989903688430786, 0.20900118350982666, 0.23810331523418427, 0.26720547676086426, 0.29630759358406067, 0.32540974020957947, 0.35451188683509827, 0.38361403346061707, 0.4127161502838135, 0.4418182969093323, 0.4709204435348511, 0.5000225901603699, 0.5291247367858887, 0.5582268834114075, 0.5873290300369263, 0.6164311766624451, 0.6455333232879639, 0.6746354699134827, 0.7037376165390015, 0.7328397035598755, 0.7619418501853943, 0.7910439968109131]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 2.0, 1.0, 5.0, 9.0, 14.0, 13.0, 20.0, 30.0, 40.0, 69.0, 74.0, 120.0, 177.0, 266.0, 482.0, 681.0, 1240.0, 2138.0, 4224.0, 8477.0, 20666.0, 61130.0, 238566.0, 486453.0, 151514.0, 42344.0, 15155.0, 6780.0, 3316.0, 1831.0, 1006.0, 606.0, 369.0, 229.0, 152.0, 108.0, 69.0, 44.0, 37.0, 25.0, 23.0, 15.0, 14.0, 4.0, 7.0, 7.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.284912109375, -0.2758216857910156, -0.26673126220703125, -0.2576408386230469, -0.2485504150390625, -0.23945999145507812, -0.23036956787109375, -0.22127914428710938, -0.212188720703125, -0.20309829711914062, -0.19400787353515625, -0.18491744995117188, -0.1758270263671875, -0.16673660278320312, -0.15764617919921875, -0.14855575561523438, -0.13946533203125, -0.13037490844726562, -0.12128448486328125, -0.11219406127929688, -0.1031036376953125, -0.09401321411132812, -0.08492279052734375, -0.07583236694335938, -0.066741943359375, -0.057651519775390625, -0.04856109619140625, -0.039470672607421875, -0.0303802490234375, -0.021289825439453125, -0.01219940185546875, -0.003108978271484375, 0.0059814453125, 0.015071868896484375, 0.02416229248046875, 0.033252716064453125, 0.0423431396484375, 0.051433563232421875, 0.06052398681640625, 0.06961441040039062, 0.078704833984375, 0.08779525756835938, 0.09688568115234375, 0.10597610473632812, 0.1150665283203125, 0.12415695190429688, 0.13324737548828125, 0.14233779907226562, 0.15142822265625, 0.16051864624023438, 0.16960906982421875, 0.17869949340820312, 0.1877899169921875, 0.19688034057617188, 0.20597076416015625, 0.21506118774414062, 0.224151611328125, 0.23324203491210938, 0.24233245849609375, 0.2514228820800781, 0.2605133056640625, 0.2696037292480469, 0.27869415283203125, 0.2877845764160156, 0.296875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 5.0, 11.0, 13.0, 13.0, 10.0, 12.0, 25.0, 24.0, 25.0, 26.0, 32.0, 37.0, 46.0, 52.0, 56.0, 53.0, 31.0, 54.0, 53.0, 57.0, 42.0, 40.0, 35.0, 33.0, 36.0, 34.0, 25.0, 17.0, 23.0, 13.0, 13.0, 12.0, 10.0, 5.0, 3.0, 5.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.63623046875, -0.6144027709960938, -0.5925750732421875, -0.5707473754882812, -0.548919677734375, -0.5270919799804688, -0.5052642822265625, -0.48343658447265625, -0.46160888671875, -0.43978118896484375, -0.4179534912109375, -0.39612579345703125, -0.374298095703125, -0.35247039794921875, -0.3306427001953125, -0.30881500244140625, -0.2869873046875, -0.26515960693359375, -0.2433319091796875, -0.22150421142578125, -0.199676513671875, -0.17784881591796875, -0.1560211181640625, -0.13419342041015625, -0.11236572265625, -0.09053802490234375, -0.0687103271484375, -0.04688262939453125, -0.025054931640625, -0.00322723388671875, 0.0186004638671875, 0.04042816162109375, 0.062255859375, 0.08408355712890625, 0.1059112548828125, 0.12773895263671875, 0.149566650390625, 0.17139434814453125, 0.1932220458984375, 0.21504974365234375, 0.23687744140625, 0.25870513916015625, 0.2805328369140625, 0.30236053466796875, 0.324188232421875, 0.34601593017578125, 0.3678436279296875, 0.38967132568359375, 0.4114990234375, 0.43332672119140625, 0.4551544189453125, 0.47698211669921875, 0.498809814453125, 0.5206375122070312, 0.5424652099609375, 0.5642929077148438, 0.58612060546875, 0.6079483032226562, 0.6297760009765625, 0.6516036987304688, 0.673431396484375, 0.6952590942382812, 0.7170867919921875, 0.7389144897460938, 0.7607421875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 3.0, 6.0, 3.0, 5.0, 4.0, 11.0, 16.0, 16.0, 35.0, 51.0, 86.0, 210.0, 427.0, 1005.0, 3095.0, 12405.0, 89641.0, 752683.0, 164122.0, 18307.0, 4110.0, 1275.0, 494.0, 245.0, 130.0, 43.0, 41.0, 24.0, 18.0, 10.0, 9.0, 7.0, 12.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.438232421875, -0.4234352111816406, -0.40863800048828125, -0.3938407897949219, -0.3790435791015625, -0.3642463684082031, -0.34944915771484375, -0.3346519470214844, -0.319854736328125, -0.3050575256347656, -0.29026031494140625, -0.2754631042480469, -0.2606658935546875, -0.24586868286132812, -0.23107147216796875, -0.21627426147460938, -0.20147705078125, -0.18667984008789062, -0.17188262939453125, -0.15708541870117188, -0.1422882080078125, -0.12749099731445312, -0.11269378662109375, -0.09789657592773438, -0.083099365234375, -0.06830215454101562, -0.05350494384765625, -0.038707733154296875, -0.0239105224609375, -0.009113311767578125, 0.00568389892578125, 0.020481109619140625, 0.0352783203125, 0.050075531005859375, 0.06487274169921875, 0.07966995239257812, 0.0944671630859375, 0.10926437377929688, 0.12406158447265625, 0.13885879516601562, 0.153656005859375, 0.16845321655273438, 0.18325042724609375, 0.19804763793945312, 0.2128448486328125, 0.22764205932617188, 0.24243927001953125, 0.2572364807128906, 0.27203369140625, 0.2868309020996094, 0.30162811279296875, 0.3164253234863281, 0.3312225341796875, 0.3460197448730469, 0.36081695556640625, 0.3756141662597656, 0.390411376953125, 0.4052085876464844, 0.42000579833984375, 0.4348030090332031, 0.4496002197265625, 0.4643974304199219, 0.47919464111328125, 0.4939918518066406, 0.5087890625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 5.0, 8.0, 5.0, 4.0, 3.0, 9.0, 12.0, 14.0, 14.0, 15.0, 25.0, 18.0, 30.0, 30.0, 27.0, 33.0, 36.0, 39.0, 47.0, 43.0, 51.0, 46.0, 41.0, 40.0, 54.0, 36.0, 43.0, 36.0, 41.0, 26.0, 26.0, 19.0, 15.0, 22.0, 16.0, 10.0, 14.0, 7.0, 10.0, 11.0, 9.0, 7.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.474609375, -1.4295654296875, -1.384521484375, -1.3394775390625, -1.29443359375, -1.2493896484375, -1.204345703125, -1.1593017578125, -1.1142578125, -1.0692138671875, -1.024169921875, -0.9791259765625, -0.93408203125, -0.8890380859375, -0.843994140625, -0.7989501953125, -0.75390625, -0.7088623046875, -0.663818359375, -0.6187744140625, -0.57373046875, -0.5286865234375, -0.483642578125, -0.4385986328125, -0.3935546875, -0.3485107421875, -0.303466796875, -0.2584228515625, -0.21337890625, -0.1683349609375, -0.123291015625, -0.0782470703125, -0.033203125, 0.0118408203125, 0.056884765625, 0.1019287109375, 0.14697265625, 0.1920166015625, 0.237060546875, 0.2821044921875, 0.3271484375, 0.3721923828125, 0.417236328125, 0.4622802734375, 0.50732421875, 0.5523681640625, 0.597412109375, 0.6424560546875, 0.6875, 0.7325439453125, 0.777587890625, 0.8226318359375, 0.86767578125, 0.9127197265625, 0.957763671875, 1.0028076171875, 1.0478515625, 1.0928955078125, 1.137939453125, 1.1829833984375, 1.22802734375, 1.2730712890625, 1.318115234375, 1.3631591796875, 1.408203125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 6.0, 4.0, 8.0, 7.0, 14.0, 22.0, 37.0, 69.0, 103.0, 190.0, 392.0, 820.0, 2049.0, 6042.0, 26543.0, 348865.0, 611826.0, 39493.0, 7636.0, 2460.0, 985.0, 438.0, 230.0, 143.0, 65.0, 39.0, 30.0, 19.0, 10.0, 4.0, 5.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1593017578125, -0.1531982421875, -0.1470947265625, -0.1409912109375, -0.1348876953125, -0.1287841796875, -0.1226806640625, -0.1165771484375, -0.1104736328125, -0.1043701171875, -0.0982666015625, -0.0921630859375, -0.0860595703125, -0.0799560546875, -0.0738525390625, -0.0677490234375, -0.0616455078125, -0.0555419921875, -0.0494384765625, -0.0433349609375, -0.0372314453125, -0.0311279296875, -0.0250244140625, -0.0189208984375, -0.0128173828125, -0.0067138671875, -0.0006103515625, 0.0054931640625, 0.0115966796875, 0.0177001953125, 0.0238037109375, 0.0299072265625, 0.0360107421875, 0.0421142578125, 0.0482177734375, 0.0543212890625, 0.0604248046875, 0.0665283203125, 0.0726318359375, 0.0787353515625, 0.0848388671875, 0.0909423828125, 0.0970458984375, 0.1031494140625, 0.1092529296875, 0.1153564453125, 0.1214599609375, 0.1275634765625, 0.1336669921875, 0.1397705078125, 0.1458740234375, 0.1519775390625, 0.1580810546875, 0.1641845703125, 0.1702880859375, 0.1763916015625, 0.1824951171875, 0.1885986328125, 0.1947021484375, 0.2008056640625, 0.2069091796875, 0.2130126953125, 0.2191162109375, 0.2252197265625, 0.2313232421875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 4.0, 6.0, 7.0, 8.0, 11.0, 15.0, 16.0, 33.0, 53.0, 58.0, 89.0, 97.0, 119.0, 114.0, 91.0, 67.0, 58.0, 38.0, 30.0, 27.0, 12.0, 12.0, 9.0, 4.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.300210952758789e-05, -6.08125701546669e-05, -5.862303078174591e-05, -5.643349140882492e-05, -5.424395203590393e-05, -5.205441266298294e-05, -4.986487329006195e-05, -4.767533391714096e-05, -4.548579454421997e-05, -4.329625517129898e-05, -4.110671579837799e-05, -3.8917176425457e-05, -3.672763705253601e-05, -3.453809767961502e-05, -3.234855830669403e-05, -3.015901893377304e-05, -2.796947956085205e-05, -2.577994018793106e-05, -2.359040081501007e-05, -2.140086144208908e-05, -1.921132206916809e-05, -1.70217826962471e-05, -1.483224332332611e-05, -1.2642703950405121e-05, -1.0453164577484131e-05, -8.263625204563141e-06, -6.074085831642151e-06, -3.884546458721161e-06, -1.695007085800171e-06, 4.945322871208191e-07, 2.684071660041809e-06, 4.873611032962799e-06, 7.063150405883789e-06, 9.252689778804779e-06, 1.1442229151725769e-05, 1.3631768524646759e-05, 1.582130789756775e-05, 1.801084727048874e-05, 2.020038664340973e-05, 2.238992601633072e-05, 2.457946538925171e-05, 2.67690047621727e-05, 2.895854413509369e-05, 3.114808350801468e-05, 3.333762288093567e-05, 3.552716225385666e-05, 3.771670162677765e-05, 3.990624099969864e-05, 4.209578037261963e-05, 4.428531974554062e-05, 4.647485911846161e-05, 4.86643984913826e-05, 5.085393786430359e-05, 5.304347723722458e-05, 5.523301661014557e-05, 5.742255598306656e-05, 5.961209535598755e-05, 6.180163472890854e-05, 6.399117410182953e-05, 6.618071347475052e-05, 6.837025284767151e-05, 7.05597922205925e-05, 7.274933159351349e-05, 7.493887096643448e-05, 7.712841033935547e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 5.0, 2.0, 4.0, 9.0, 10.0, 17.0, 22.0, 39.0, 34.0, 73.0, 114.0, 236.0, 479.0, 969.0, 2028.0, 5032.0, 15955.0, 97573.0, 737051.0, 156503.0, 21527.0, 6179.0, 2456.0, 1094.0, 491.0, 268.0, 150.0, 83.0, 52.0, 29.0, 14.0, 15.0, 13.0, 7.0, 4.0, 5.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.197265625, -0.1910228729248047, -0.18478012084960938, -0.17853736877441406, -0.17229461669921875, -0.16605186462402344, -0.15980911254882812, -0.1535663604736328, -0.1473236083984375, -0.1410808563232422, -0.13483810424804688, -0.12859535217285156, -0.12235260009765625, -0.11610984802246094, -0.10986709594726562, -0.10362434387207031, -0.097381591796875, -0.09113883972167969, -0.08489608764648438, -0.07865333557128906, -0.07241058349609375, -0.06616783142089844, -0.059925079345703125, -0.05368232727050781, -0.0474395751953125, -0.04119682312011719, -0.034954071044921875, -0.028711318969726562, -0.02246856689453125, -0.016225814819335938, -0.009983062744140625, -0.0037403106689453125, 0.00250244140625, 0.008745193481445312, 0.014987945556640625, 0.021230697631835938, 0.02747344970703125, 0.03371620178222656, 0.039958953857421875, 0.04620170593261719, 0.0524444580078125, 0.05868721008300781, 0.06492996215820312, 0.07117271423339844, 0.07741546630859375, 0.08365821838378906, 0.08990097045898438, 0.09614372253417969, 0.102386474609375, 0.10862922668457031, 0.11487197875976562, 0.12111473083496094, 0.12735748291015625, 0.13360023498535156, 0.13984298706054688, 0.1460857391357422, 0.1523284912109375, 0.1585712432861328, 0.16481399536132812, 0.17105674743652344, 0.17729949951171875, 0.18354225158691406, 0.18978500366210938, 0.1960277557373047, 0.2022705078125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 5.0, 5.0, 9.0, 12.0, 16.0, 31.0, 38.0, 84.0, 132.0, 158.0, 167.0, 110.0, 76.0, 37.0, 36.0, 25.0, 14.0, 17.0, 5.0, 3.0, 2.0, 4.0, 3.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.07159423828125, -0.06975317001342773, -0.06791210174560547, -0.0660710334777832, -0.06422996520996094, -0.06238889694213867, -0.060547828674316406, -0.05870676040649414, -0.056865692138671875, -0.05502462387084961, -0.053183555603027344, -0.05134248733520508, -0.04950141906738281, -0.04766035079956055, -0.04581928253173828, -0.043978214263916016, -0.04213714599609375, -0.040296077728271484, -0.03845500946044922, -0.03661394119262695, -0.03477287292480469, -0.03293180465698242, -0.031090736389160156, -0.02924966812133789, -0.027408599853515625, -0.02556753158569336, -0.023726463317871094, -0.021885395050048828, -0.020044326782226562, -0.018203258514404297, -0.01636219024658203, -0.014521121978759766, -0.0126800537109375, -0.010838985443115234, -0.008997917175292969, -0.007156848907470703, -0.0053157806396484375, -0.003474712371826172, -0.0016336441040039062, 0.00020742416381835938, 0.002048492431640625, 0.0038895606994628906, 0.005730628967285156, 0.007571697235107422, 0.009412765502929688, 0.011253833770751953, 0.013094902038574219, 0.014935970306396484, 0.01677703857421875, 0.018618106842041016, 0.02045917510986328, 0.022300243377685547, 0.024141311645507812, 0.025982379913330078, 0.027823448181152344, 0.02966451644897461, 0.031505584716796875, 0.03334665298461914, 0.035187721252441406, 0.03702878952026367, 0.03886985778808594, 0.0407109260559082, 0.04255199432373047, 0.044393062591552734, 0.046234130859375]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 4.0, 4.0, 9.0, 6.0, 12.0, 13.0, 19.0, 18.0, 25.0, 39.0, 39.0, 60.0, 80.0, 80.0, 87.0, 90.0, 87.0, 72.0, 61.0, 54.0, 31.0, 35.0, 31.0, 10.0, 10.0, 6.0, 9.0, 3.0, 5.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9139941334724426, -0.8844901323318481, -0.8549860715866089, -0.8254820704460144, -0.7959780693054199, -0.7664740681648254, -0.736970067024231, -0.7074660062789917, -0.6779620051383972, -0.6484580039978027, -0.6189539432525635, -0.589449942111969, -0.5599459409713745, -0.53044193983078, -0.5009379386901855, -0.4714338779449463, -0.4419298768043518, -0.4124258756637573, -0.38292184472084045, -0.3534178137779236, -0.3239138126373291, -0.2944098114967346, -0.26490578055381775, -0.23540176451206207, -0.2058977484703064, -0.17639373242855072, -0.14688971638679504, -0.11738570034503937, -0.08788168430328369, -0.058377668261528015, -0.02887365221977234, 0.0006303638219833374, 0.030134379863739014, 0.05963839590549469, 0.08914241194725037, 0.11864642798900604, 0.14815044403076172, 0.1776544600725174, 0.20715847611427307, 0.23666249215602875, 0.2661665081977844, 0.2956705093383789, 0.3251745402812958, 0.35467857122421265, 0.38418257236480713, 0.4136865735054016, 0.4431906044483185, 0.47269463539123535, 0.5021986365318298, 0.5317026376724243, 0.5612066984176636, 0.5907106995582581, 0.6202147006988525, 0.649718701839447, 0.6792227029800415, 0.7087267637252808, 0.7382307648658752, 0.7677347660064697, 0.797238826751709, 0.8267428278923035, 0.856246829032898, 0.8857508301734924, 0.9152548313140869, 0.9447588920593262, 0.9742628931999207]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 0.0, 1.0, 3.0, 1.0, 7.0, 5.0, 10.0, 11.0, 12.0, 9.0, 26.0, 19.0, 24.0, 25.0, 34.0, 46.0, 46.0, 49.0, 54.0, 70.0, 41.0, 47.0, 57.0, 61.0, 36.0, 58.0, 28.0, 32.0, 37.0, 31.0, 17.0, 22.0, 19.0, 17.0, 12.0, 12.0, 6.0, 6.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7585477232933044, -0.7357789278030396, -0.7130101323127747, -0.690241277217865, -0.6674724817276001, -0.6447036862373352, -0.6219348907470703, -0.5991660356521606, -0.5763972401618958, -0.5536284446716309, -0.530859649181366, -0.5080907940864563, -0.4853219985961914, -0.4625532031059265, -0.4397844076156616, -0.41701558232307434, -0.39424678683280945, -0.37147799134254456, -0.3487091660499573, -0.3259403705596924, -0.3031715452671051, -0.2804027497768402, -0.25763392448425293, -0.23486512899398804, -0.21209631860256195, -0.18932750821113586, -0.16655869781970978, -0.1437898874282837, -0.1210210844874382, -0.09825227409601212, -0.07548347115516663, -0.05271466076374054, -0.029945850372314453, -0.007177041843533516, 0.015591766685247421, 0.03836057335138321, 0.061129383742809296, 0.08389819413423538, 0.10666699707508087, 0.12943580746650696, 0.15220461785793304, 0.17497342824935913, 0.19774223864078522, 0.2205110490322113, 0.2432798445224762, 0.2660486698150635, 0.28881746530532837, 0.31158626079559326, 0.33435508608818054, 0.35712388157844543, 0.3798927068710327, 0.4026615023612976, 0.4254303276538849, 0.4481991231441498, 0.47096794843673706, 0.49373674392700195, 0.5165055394172668, 0.5392743349075317, 0.5620431303977966, 0.5848119854927063, 0.6075807809829712, 0.6303495764732361, 0.653118371963501, 0.6758872270584106, 0.6986560225486755]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 4.0, 8.0, 9.0, 8.0, 20.0, 29.0, 27.0, 45.0, 59.0, 82.0, 100.0, 146.0, 216.0, 277.0, 415.0, 602.0, 939.0, 1512.0, 2463.0, 4287.0, 7585.0, 16350.0, 47424.0, 269482.0, 568972.0, 81015.0, 23097.0, 9850.0, 5239.0, 2995.0, 1813.0, 1121.0, 705.0, 482.0, 322.0, 250.0, 162.0, 128.0, 83.0, 74.0, 43.0, 28.0, 27.0, 25.0, 8.0, 9.0, 7.0, 3.0, 2.0, 4.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.673828125, -0.6522216796875, -0.630615234375, -0.6090087890625, -0.58740234375, -0.5657958984375, -0.544189453125, -0.5225830078125, -0.5009765625, -0.4793701171875, -0.457763671875, -0.4361572265625, -0.41455078125, -0.3929443359375, -0.371337890625, -0.3497314453125, -0.328125, -0.3065185546875, -0.284912109375, -0.2633056640625, -0.24169921875, -0.2200927734375, -0.198486328125, -0.1768798828125, -0.1552734375, -0.1336669921875, -0.112060546875, -0.0904541015625, -0.06884765625, -0.0472412109375, -0.025634765625, -0.0040283203125, 0.017578125, 0.0391845703125, 0.060791015625, 0.0823974609375, 0.10400390625, 0.1256103515625, 0.147216796875, 0.1688232421875, 0.1904296875, 0.2120361328125, 0.233642578125, 0.2552490234375, 0.27685546875, 0.2984619140625, 0.320068359375, 0.3416748046875, 0.36328125, 0.3848876953125, 0.406494140625, 0.4281005859375, 0.44970703125, 0.4713134765625, 0.492919921875, 0.5145263671875, 0.5361328125, 0.5577392578125, 0.579345703125, 0.6009521484375, 0.62255859375, 0.6441650390625, 0.665771484375, 0.6873779296875, 0.708984375]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 6.0, 7.0, 7.0, 3.0, 8.0, 10.0, 16.0, 20.0, 22.0, 31.0, 40.0, 25.0, 32.0, 60.0, 47.0, 56.0, 54.0, 51.0, 68.0, 48.0, 39.0, 47.0, 46.0, 43.0, 33.0, 28.0, 26.0, 27.0, 26.0, 12.0, 13.0, 10.0, 5.0, 12.0, 6.0, 1.0, 3.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-1.52734375, -1.483489990234375, -1.43963623046875, -1.395782470703125, -1.3519287109375, -1.308074951171875, -1.26422119140625, -1.220367431640625, -1.176513671875, -1.132659912109375, -1.08880615234375, -1.044952392578125, -1.0010986328125, -0.957244873046875, -0.91339111328125, -0.869537353515625, -0.82568359375, -0.781829833984375, -0.73797607421875, -0.694122314453125, -0.6502685546875, -0.606414794921875, -0.56256103515625, -0.518707275390625, -0.474853515625, -0.430999755859375, -0.38714599609375, -0.343292236328125, -0.2994384765625, -0.255584716796875, -0.21173095703125, -0.167877197265625, -0.1240234375, -0.080169677734375, -0.03631591796875, 0.007537841796875, 0.0513916015625, 0.095245361328125, 0.13909912109375, 0.182952880859375, 0.226806640625, 0.270660400390625, 0.31451416015625, 0.358367919921875, 0.4022216796875, 0.446075439453125, 0.48992919921875, 0.533782958984375, 0.57763671875, 0.621490478515625, 0.66534423828125, 0.709197998046875, 0.7530517578125, 0.796905517578125, 0.84075927734375, 0.884613037109375, 0.928466796875, 0.972320556640625, 1.01617431640625, 1.060028076171875, 1.1038818359375, 1.147735595703125, 1.19158935546875, 1.235443115234375, 1.279296875]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 9.0, 2.0, 5.0, 4.0, 13.0, 9.0, 14.0, 16.0, 18.0, 23.0, 31.0, 33.0, 61.0, 104.0, 157.0, 460.0, 1695.0, 22111.0, 999488.0, 21785.0, 1605.0, 393.0, 174.0, 110.0, 49.0, 46.0, 33.0, 30.0, 25.0, 10.0, 14.0, 6.0, 8.0, 3.0, 4.0, 1.0, 6.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.078125, -2.9661865234375, -2.854248046875, -2.7423095703125, -2.63037109375, -2.5184326171875, -2.406494140625, -2.2945556640625, -2.1826171875, -2.0706787109375, -1.958740234375, -1.8468017578125, -1.73486328125, -1.6229248046875, -1.510986328125, -1.3990478515625, -1.287109375, -1.1751708984375, -1.063232421875, -0.9512939453125, -0.83935546875, -0.7274169921875, -0.615478515625, -0.5035400390625, -0.3916015625, -0.2796630859375, -0.167724609375, -0.0557861328125, 0.05615234375, 0.1680908203125, 0.280029296875, 0.3919677734375, 0.50390625, 0.6158447265625, 0.727783203125, 0.8397216796875, 0.95166015625, 1.0635986328125, 1.175537109375, 1.2874755859375, 1.3994140625, 1.5113525390625, 1.623291015625, 1.7352294921875, 1.84716796875, 1.9591064453125, 2.071044921875, 2.1829833984375, 2.294921875, 2.4068603515625, 2.518798828125, 2.6307373046875, 2.74267578125, 2.8546142578125, 2.966552734375, 3.0784912109375, 3.1904296875, 3.3023681640625, 3.414306640625, 3.5262451171875, 3.63818359375, 3.7501220703125, 3.862060546875, 3.9739990234375, 4.0859375]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 3.0, 3.0, 6.0, 8.0, 5.0, 11.0, 18.0, 17.0, 15.0, 21.0, 20.0, 23.0, 45.0, 43.0, 41.0, 51.0, 48.0, 57.0, 56.0, 56.0, 48.0, 50.0, 42.0, 52.0, 49.0, 35.0, 29.0, 29.0, 31.0, 20.0, 19.0, 10.0, 9.0, 8.0, 6.0, 3.0, 4.0, 7.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.921875, -1.858734130859375, -1.79559326171875, -1.732452392578125, -1.6693115234375, -1.606170654296875, -1.54302978515625, -1.479888916015625, -1.416748046875, -1.353607177734375, -1.29046630859375, -1.227325439453125, -1.1641845703125, -1.101043701171875, -1.03790283203125, -0.974761962890625, -0.91162109375, -0.848480224609375, -0.78533935546875, -0.722198486328125, -0.6590576171875, -0.595916748046875, -0.53277587890625, -0.469635009765625, -0.406494140625, -0.343353271484375, -0.28021240234375, -0.217071533203125, -0.1539306640625, -0.090789794921875, -0.02764892578125, 0.035491943359375, 0.0986328125, 0.161773681640625, 0.22491455078125, 0.288055419921875, 0.3511962890625, 0.414337158203125, 0.47747802734375, 0.540618896484375, 0.603759765625, 0.666900634765625, 0.73004150390625, 0.793182373046875, 0.8563232421875, 0.919464111328125, 0.98260498046875, 1.045745849609375, 1.10888671875, 1.172027587890625, 1.23516845703125, 1.298309326171875, 1.3614501953125, 1.424591064453125, 1.48773193359375, 1.550872802734375, 1.614013671875, 1.677154541015625, 1.74029541015625, 1.803436279296875, 1.8665771484375, 1.929718017578125, 1.99285888671875, 2.055999755859375, 2.119140625]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 6.0, 8.0, 7.0, 9.0, 14.0, 20.0, 28.0, 47.0, 59.0, 122.0, 239.0, 529.0, 1322.0, 4417.0, 20148.0, 159939.0, 758668.0, 84835.0, 13180.0, 3101.0, 988.0, 393.0, 201.0, 95.0, 69.0, 29.0, 25.0, 11.0, 11.0, 8.0, 8.0, 1.0, 3.0, 5.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27685546875, -0.26773834228515625, -0.2586212158203125, -0.24950408935546875, -0.240386962890625, -0.23126983642578125, -0.2221527099609375, -0.21303558349609375, -0.20391845703125, -0.19480133056640625, -0.1856842041015625, -0.17656707763671875, -0.167449951171875, -0.15833282470703125, -0.1492156982421875, -0.14009857177734375, -0.1309814453125, -0.12186431884765625, -0.1127471923828125, -0.10363006591796875, -0.094512939453125, -0.08539581298828125, -0.0762786865234375, -0.06716156005859375, -0.05804443359375, -0.04892730712890625, -0.0398101806640625, -0.03069305419921875, -0.021575927734375, -0.01245880126953125, -0.0033416748046875, 0.00577545166015625, 0.014892578125, 0.02400970458984375, 0.0331268310546875, 0.04224395751953125, 0.051361083984375, 0.06047821044921875, 0.0695953369140625, 0.07871246337890625, 0.08782958984375, 0.09694671630859375, 0.1060638427734375, 0.11518096923828125, 0.124298095703125, 0.13341522216796875, 0.1425323486328125, 0.15164947509765625, 0.1607666015625, 0.16988372802734375, 0.1790008544921875, 0.18811798095703125, 0.197235107421875, 0.20635223388671875, 0.2154693603515625, 0.22458648681640625, 0.23370361328125, 0.24282073974609375, 0.2519378662109375, 0.26105499267578125, 0.270172119140625, 0.27928924560546875, 0.2884063720703125, 0.29752349853515625, 0.306640625]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 6.0, 2.0, 9.0, 14.0, 9.0, 21.0, 24.0, 31.0, 60.0, 71.0, 120.0, 183.0, 153.0, 88.0, 61.0, 32.0, 29.0, 24.0, 18.0, 15.0, 4.0, 10.0, 2.0, 3.0, 4.0, 2.0, 0.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.935264587402344e-05, -4.8012472689151764e-05, -4.667229950428009e-05, -4.533212631940842e-05, -4.399195313453674e-05, -4.265177994966507e-05, -4.1311606764793396e-05, -3.997143357992172e-05, -3.863126039505005e-05, -3.7291087210178375e-05, -3.59509140253067e-05, -3.461074084043503e-05, -3.3270567655563354e-05, -3.193039447069168e-05, -3.059022128582001e-05, -2.9250048100948334e-05, -2.790987491607666e-05, -2.6569701731204987e-05, -2.5229528546333313e-05, -2.388935536146164e-05, -2.2549182176589966e-05, -2.1209008991718292e-05, -1.986883580684662e-05, -1.8528662621974945e-05, -1.718848943710327e-05, -1.5848316252231598e-05, -1.4508143067359924e-05, -1.316796988248825e-05, -1.1827796697616577e-05, -1.0487623512744904e-05, -9.14745032787323e-06, -7.807277143001556e-06, -6.467103958129883e-06, -5.126930773258209e-06, -3.7867575883865356e-06, -2.446584403514862e-06, -1.1064112186431885e-06, 2.337619662284851e-07, 1.5739351511001587e-06, 2.9141083359718323e-06, 4.254281520843506e-06, 5.5944547057151794e-06, 6.934627890586853e-06, 8.274801075458527e-06, 9.6149742603302e-06, 1.0955147445201874e-05, 1.2295320630073547e-05, 1.3635493814945221e-05, 1.4975666999816895e-05, 1.6315840184688568e-05, 1.7656013369560242e-05, 1.8996186554431915e-05, 2.033635973930359e-05, 2.1676532924175262e-05, 2.3016706109046936e-05, 2.435687929391861e-05, 2.5697052478790283e-05, 2.7037225663661957e-05, 2.837739884853363e-05, 2.9717572033405304e-05, 3.105774521827698e-05, 3.239791840314865e-05, 3.3738091588020325e-05, 3.5078264772892e-05, 3.641843795776367e-05]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 3.0, 7.0, 3.0, 7.0, 12.0, 20.0, 29.0, 49.0, 66.0, 95.0, 171.0, 317.0, 720.0, 1851.0, 5648.0, 24639.0, 242006.0, 704967.0, 53469.0, 9649.0, 2794.0, 1015.0, 457.0, 238.0, 118.0, 65.0, 44.0, 23.0, 23.0, 10.0, 14.0, 10.0, 12.0, 4.0, 4.0, 2.0, 0.0, 3.0, 2.0], "bins": [-0.4326171875, -0.4223651885986328, -0.4121131896972656, -0.40186119079589844, -0.39160919189453125, -0.38135719299316406, -0.3711051940917969, -0.3608531951904297, -0.3506011962890625, -0.3403491973876953, -0.3300971984863281, -0.31984519958496094, -0.30959320068359375, -0.29934120178222656, -0.2890892028808594, -0.2788372039794922, -0.268585205078125, -0.2583332061767578, -0.24808120727539062, -0.23782920837402344, -0.22757720947265625, -0.21732521057128906, -0.20707321166992188, -0.1968212127685547, -0.1865692138671875, -0.1763172149658203, -0.16606521606445312, -0.15581321716308594, -0.14556121826171875, -0.13530921936035156, -0.12505722045898438, -0.11480522155761719, -0.10455322265625, -0.09430122375488281, -0.08404922485351562, -0.07379722595214844, -0.06354522705078125, -0.05329322814941406, -0.043041229248046875, -0.03278923034667969, -0.0225372314453125, -0.012285232543945312, -0.002033233642578125, 0.008218765258789062, 0.01847076416015625, 0.028722763061523438, 0.038974761962890625, 0.04922676086425781, 0.059478759765625, 0.06973075866699219, 0.07998275756835938, 0.09023475646972656, 0.10048675537109375, 0.11073875427246094, 0.12099075317382812, 0.1312427520751953, 0.1414947509765625, 0.1517467498779297, 0.16199874877929688, 0.17225074768066406, 0.18250274658203125, 0.19275474548339844, 0.20300674438476562, 0.2132587432861328, 0.2235107421875]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 2.0, 3.0, 4.0, 3.0, 6.0, 8.0, 11.0, 14.0, 18.0, 25.0, 31.0, 36.0, 39.0, 63.0, 64.0, 101.0, 156.0, 86.0, 76.0, 61.0, 39.0, 30.0, 24.0, 9.0, 22.0, 4.0, 13.0, 7.0, 10.0, 8.0, 10.0, 7.0, 1.0, 3.0, 3.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09588623046875, -0.0929107666015625, -0.089935302734375, -0.0869598388671875, -0.083984375, -0.0810089111328125, -0.078033447265625, -0.0750579833984375, -0.07208251953125, -0.0691070556640625, -0.066131591796875, -0.0631561279296875, -0.0601806640625, -0.0572052001953125, -0.054229736328125, -0.0512542724609375, -0.04827880859375, -0.0453033447265625, -0.042327880859375, -0.0393524169921875, -0.036376953125, -0.0334014892578125, -0.030426025390625, -0.0274505615234375, -0.02447509765625, -0.0214996337890625, -0.018524169921875, -0.0155487060546875, -0.0125732421875, -0.0095977783203125, -0.006622314453125, -0.0036468505859375, -0.00067138671875, 0.0023040771484375, 0.005279541015625, 0.0082550048828125, 0.01123046875, 0.0142059326171875, 0.017181396484375, 0.0201568603515625, 0.02313232421875, 0.0261077880859375, 0.029083251953125, 0.0320587158203125, 0.0350341796875, 0.0380096435546875, 0.040985107421875, 0.0439605712890625, 0.04693603515625, 0.0499114990234375, 0.052886962890625, 0.0558624267578125, 0.058837890625, 0.0618133544921875, 0.064788818359375, 0.0677642822265625, 0.07073974609375, 0.0737152099609375, 0.076690673828125, 0.0796661376953125, 0.0826416015625, 0.0856170654296875, 0.088592529296875, 0.0915679931640625, 0.09454345703125]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 5.0, 7.0, 8.0, 13.0, 17.0, 29.0, 33.0, 40.0, 81.0, 105.0, 123.0, 127.0, 118.0, 91.0, 82.0, 46.0, 32.0, 19.0, 19.0, 4.0, 7.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.864041805267334, -3.7787461280822754, -3.693450450897217, -3.608154773712158, -3.5228588581085205, -3.437563180923462, -3.3522675037384033, -3.2669718265533447, -3.181675910949707, -3.0963802337646484, -3.01108455657959, -2.9257888793945312, -2.8404929637908936, -2.755197286605835, -2.6699016094207764, -2.5846059322357178, -2.499310255050659, -2.4140145778656006, -2.328718900680542, -2.2434229850769043, -2.1581273078918457, -2.072831630706787, -1.9875359535217285, -1.90224027633667, -1.8169444799423218, -1.7316488027572632, -1.646353006362915, -1.5610573291778564, -1.4757616519927979, -1.3904658555984497, -1.3051701784133911, -1.219874382019043, -1.1345789432525635, -1.0492832660675049, -0.9639874696731567, -0.8786917924880981, -0.7933960556983948, -0.7081003189086914, -0.6228046417236328, -0.5375089049339294, -0.4522131681442261, -0.3669174313545227, -0.2816217243671417, -0.19632601737976074, -0.11103028059005737, -0.025734543800354004, 0.05956113338470459, 0.14485687017440796, 0.23015260696411133, 0.3154483437538147, 0.4007440507411957, 0.48603975772857666, 0.57133549451828, 0.6566312313079834, 0.741926908493042, 0.8272226452827454, 0.9125183820724487, 0.9978141188621521, 1.0831098556518555, 1.168405532836914, 1.2537012100219727, 1.3389970064163208, 1.4242926836013794, 1.5095884799957275, 1.5948841571807861]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 3.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 3.0, 6.0, 5.0, 12.0, 12.0, 13.0, 11.0, 17.0, 28.0, 22.0, 29.0, 25.0, 33.0, 34.0, 34.0, 35.0, 46.0, 55.0, 39.0, 51.0, 48.0, 51.0, 40.0, 55.0, 45.0, 37.0, 31.0, 24.0, 31.0, 23.0, 11.0, 21.0, 11.0, 20.0, 10.0, 6.0, 11.0, 4.0, 6.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0], "bins": [-3.2957420349121094, -3.209303855895996, -3.1228654384613037, -3.0364272594451904, -2.949989080429077, -2.8635506629943848, -2.7771124839782715, -2.690674304962158, -2.604235887527466, -2.5177977085113525, -2.43135929107666, -2.344921112060547, -2.2584829330444336, -2.172044515609741, -2.085606336593628, -1.999168038368225, -1.9127298593521118, -1.826291561126709, -1.7398533821105957, -1.6534150838851929, -1.56697678565979, -1.4805386066436768, -1.394100308418274, -1.307662010192871, -1.2212238311767578, -1.134785532951355, -1.0483473539352417, -0.9619090557098389, -0.875470757484436, -0.789032518863678, -0.7025942802429199, -0.6161559820175171, -0.5297176837921143, -0.4432794153690338, -0.35684114694595337, -0.2704029083251953, -0.18396463990211487, -0.09752637147903442, -0.011088132858276367, 0.07535016536712646, 0.16178840398788452, 0.24822667241096497, 0.3346649408340454, 0.42110317945480347, 0.5075414180755615, 0.5939797163009644, 0.6804179549217224, 0.7668562531471252, 0.8532944917678833, 0.9397327303886414, 1.0261709690093994, 1.1126092672348022, 1.199047565460205, 1.2854857444763184, 1.3719240427017212, 1.458362340927124, 1.5448005199432373, 1.6312388181686401, 1.7176769971847534, 1.8041152954101562, 1.890553593635559, 1.976991891860962, 2.063430070877075, 2.1498684883117676, 2.236306667327881]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 4.0, 2.0, 12.0, 10.0, 11.0, 17.0, 29.0, 37.0, 47.0, 67.0, 92.0, 135.0, 221.0, 304.0, 478.0, 781.0, 1571.0, 3294.0, 7606.0, 23446.0, 125533.0, 2709414.0, 1216663.0, 74974.0, 17583.0, 6105.0, 2625.0, 1290.0, 718.0, 389.0, 241.0, 178.0, 115.0, 79.0, 56.0, 39.0, 32.0, 23.0, 17.0, 21.0, 8.0, 8.0, 5.0, 3.0, 1.0, 3.0, 2.0], "bins": [-1.6630859375, -1.62030029296875, -1.5775146484375, -1.53472900390625, -1.491943359375, -1.44915771484375, -1.4063720703125, -1.36358642578125, -1.32080078125, -1.27801513671875, -1.2352294921875, -1.19244384765625, -1.149658203125, -1.10687255859375, -1.0640869140625, -1.02130126953125, -0.978515625, -0.93572998046875, -0.8929443359375, -0.85015869140625, -0.807373046875, -0.76458740234375, -0.7218017578125, -0.67901611328125, -0.63623046875, -0.59344482421875, -0.5506591796875, -0.50787353515625, -0.465087890625, -0.42230224609375, -0.3795166015625, -0.33673095703125, -0.2939453125, -0.25115966796875, -0.2083740234375, -0.16558837890625, -0.122802734375, -0.08001708984375, -0.0372314453125, 0.00555419921875, 0.04833984375, 0.09112548828125, 0.1339111328125, 0.17669677734375, 0.219482421875, 0.26226806640625, 0.3050537109375, 0.34783935546875, 0.390625, 0.43341064453125, 0.4761962890625, 0.51898193359375, 0.561767578125, 0.60455322265625, 0.6473388671875, 0.69012451171875, 0.73291015625, 0.77569580078125, 0.8184814453125, 0.86126708984375, 0.904052734375, 0.94683837890625, 0.9896240234375, 1.03240966796875, 1.0751953125]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 9.0, 7.0, 9.0, 5.0, 20.0, 15.0, 19.0, 29.0, 33.0, 40.0, 37.0, 48.0, 49.0, 48.0, 65.0, 69.0, 61.0, 58.0, 47.0, 42.0, 59.0, 48.0, 29.0, 28.0, 21.0, 16.0, 20.0, 20.0, 6.0, 6.0, 5.0, 11.0, 7.0, 4.0, 2.0, 0.0, 4.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7919921875, -0.7693328857421875, -0.746673583984375, -0.7240142822265625, -0.70135498046875, -0.6786956787109375, -0.656036376953125, -0.6333770751953125, -0.6107177734375, -0.5880584716796875, -0.565399169921875, -0.5427398681640625, -0.52008056640625, -0.4974212646484375, -0.474761962890625, -0.4521026611328125, -0.429443359375, -0.4067840576171875, -0.384124755859375, -0.3614654541015625, -0.33880615234375, -0.3161468505859375, -0.293487548828125, -0.2708282470703125, -0.2481689453125, -0.2255096435546875, -0.202850341796875, -0.1801910400390625, -0.15753173828125, -0.1348724365234375, -0.112213134765625, -0.0895538330078125, -0.06689453125, -0.0442352294921875, -0.021575927734375, 0.0010833740234375, 0.02374267578125, 0.0464019775390625, 0.069061279296875, 0.0917205810546875, 0.1143798828125, 0.1370391845703125, 0.159698486328125, 0.1823577880859375, 0.20501708984375, 0.2276763916015625, 0.250335693359375, 0.2729949951171875, 0.295654296875, 0.3183135986328125, 0.340972900390625, 0.3636322021484375, 0.38629150390625, 0.4089508056640625, 0.431610107421875, 0.4542694091796875, 0.4769287109375, 0.4995880126953125, 0.522247314453125, 0.5449066162109375, 0.56756591796875, 0.5902252197265625, 0.612884521484375, 0.6355438232421875, 0.658203125]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 6.0, 9.0, 10.0, 13.0, 16.0, 20.0, 40.0, 67.0, 119.0, 235.0, 573.0, 2898.0, 38526.0, 3899427.0, 242605.0, 7932.0, 1073.0, 338.0, 142.0, 67.0, 59.0, 30.0, 27.0, 11.0, 17.0, 6.0, 9.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-4.2734375, -4.165863037109375, -4.05828857421875, -3.950714111328125, -3.8431396484375, -3.735565185546875, -3.62799072265625, -3.520416259765625, -3.412841796875, -3.305267333984375, -3.19769287109375, -3.090118408203125, -2.9825439453125, -2.874969482421875, -2.76739501953125, -2.659820556640625, -2.55224609375, -2.444671630859375, -2.33709716796875, -2.229522705078125, -2.1219482421875, -2.014373779296875, -1.90679931640625, -1.799224853515625, -1.691650390625, -1.584075927734375, -1.47650146484375, -1.368927001953125, -1.2613525390625, -1.153778076171875, -1.04620361328125, -0.938629150390625, -0.8310546875, -0.723480224609375, -0.61590576171875, -0.508331298828125, -0.4007568359375, -0.293182373046875, -0.18560791015625, -0.078033447265625, 0.029541015625, 0.137115478515625, 0.24468994140625, 0.352264404296875, 0.4598388671875, 0.567413330078125, 0.67498779296875, 0.782562255859375, 0.89013671875, 0.997711181640625, 1.10528564453125, 1.212860107421875, 1.3204345703125, 1.428009033203125, 1.53558349609375, 1.643157958984375, 1.750732421875, 1.858306884765625, 1.96588134765625, 2.073455810546875, 2.1810302734375, 2.288604736328125, 2.39617919921875, 2.503753662109375, 2.611328125]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 6.0, 3.0, 7.0, 14.0, 30.0, 20.0, 40.0, 42.0, 86.0, 126.0, 203.0, 382.0, 764.0, 1011.0, 609.0, 302.0, 149.0, 94.0, 62.0, 50.0, 27.0, 9.0, 8.0, 7.0, 11.0, 6.0, 8.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.318603515625, -0.3028755187988281, -0.28714752197265625, -0.2714195251464844, -0.2556915283203125, -0.23996353149414062, -0.22423553466796875, -0.20850753784179688, -0.192779541015625, -0.17705154418945312, -0.16132354736328125, -0.14559555053710938, -0.1298675537109375, -0.11413955688476562, -0.09841156005859375, -0.08268356323242188, -0.06695556640625, -0.051227569580078125, -0.03549957275390625, -0.019771575927734375, -0.0040435791015625, 0.011684417724609375, 0.02741241455078125, 0.043140411376953125, 0.058868408203125, 0.07459640502929688, 0.09032440185546875, 0.10605239868164062, 0.1217803955078125, 0.13750839233398438, 0.15323638916015625, 0.16896438598632812, 0.1846923828125, 0.20042037963867188, 0.21614837646484375, 0.23187637329101562, 0.2476043701171875, 0.2633323669433594, 0.27906036376953125, 0.2947883605957031, 0.310516357421875, 0.3262443542480469, 0.34197235107421875, 0.3577003479003906, 0.3734283447265625, 0.3891563415527344, 0.40488433837890625, 0.4206123352050781, 0.43634033203125, 0.4520683288574219, 0.46779632568359375, 0.4835243225097656, 0.4992523193359375, 0.5149803161621094, 0.5307083129882812, 0.5464363098144531, 0.562164306640625, 0.5778923034667969, 0.5936203002929688, 0.6093482971191406, 0.6250762939453125, 0.6408042907714844, 0.6565322875976562, 0.6722602844238281, 0.68798828125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 6.0, 2.0, 1.0, 9.0, 4.0, 4.0, 7.0, 12.0, 21.0, 18.0, 28.0, 32.0, 39.0, 47.0, 51.0, 63.0, 68.0, 67.0, 69.0, 51.0, 67.0, 59.0, 65.0, 42.0, 32.0, 31.0, 38.0, 16.0, 20.0, 7.0, 4.0, 8.0, 7.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8065317869186401, -0.7748379707336426, -0.743144154548645, -0.7114503383636475, -0.6797565221786499, -0.6480627059936523, -0.61636883020401, -0.5846750140190125, -0.5529811978340149, -0.5212873816490173, -0.4895935654640198, -0.45789971947669983, -0.42620590329170227, -0.3945120871067047, -0.36281824111938477, -0.3311244249343872, -0.29943060874938965, -0.2677367925643921, -0.23604296147823334, -0.20434913039207458, -0.17265531420707703, -0.14096149802207947, -0.10926766693592072, -0.07757383584976196, -0.045880019664764404, -0.014186196029186249, 0.017507627606391907, 0.04920145124197006, 0.08089527487754822, 0.11258909106254578, 0.14428292214870453, 0.17597675323486328, 0.20767056941986084, 0.2393643856048584, 0.27105820178985596, 0.3027520477771759, 0.33444586396217346, 0.366139680147171, 0.39783352613449097, 0.4295273423194885, 0.4612211585044861, 0.49291497468948364, 0.5246087908744812, 0.5563026070594788, 0.5879964828491211, 0.6196902990341187, 0.6513841152191162, 0.6830779314041138, 0.7147717475891113, 0.7464655637741089, 0.7781593799591064, 0.809853196144104, 0.8415470123291016, 0.8732408285140991, 0.9049347043037415, 0.936628520488739, 0.9683223366737366, 1.000016212463379, 1.0317100286483765, 1.063403844833374, 1.0950976610183716, 1.1267914772033691, 1.1584852933883667, 1.1901791095733643, 1.2218729257583618]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 4.0, 6.0, 7.0, 5.0, 14.0, 9.0, 10.0, 13.0, 11.0, 13.0, 22.0, 20.0, 25.0, 25.0, 28.0, 36.0, 37.0, 48.0, 48.0, 38.0, 34.0, 44.0, 47.0, 38.0, 41.0, 41.0, 46.0, 52.0, 29.0, 23.0, 29.0, 25.0, 24.0, 11.0, 13.0, 18.0, 15.0, 6.0, 6.0, 8.0, 7.0, 6.0, 2.0, 6.0, 4.0, 4.0, 6.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.7598395347595215, -0.7360734343528748, -0.7123072743415833, -0.6885411739349365, -0.664775013923645, -0.6410089135169983, -0.6172428131103516, -0.5934766530990601, -0.5697104930877686, -0.5459443926811218, -0.5221782326698303, -0.4984121322631836, -0.4746459722518921, -0.45087987184524536, -0.42711374163627625, -0.40334761142730713, -0.3795815110206604, -0.3558153808116913, -0.33204925060272217, -0.30828315019607544, -0.28451699018478394, -0.2607508897781372, -0.2369847595691681, -0.21321862936019897, -0.18945249915122986, -0.16568636894226074, -0.14192023873329163, -0.1181541234254837, -0.09438799321651459, -0.07062186300754547, -0.04685574769973755, -0.023089617490768433, 0.0006765127182006836, 0.0244426392018795, 0.04820876568555832, 0.07197488844394684, 0.09574101865291595, 0.11950714886188507, 0.143273264169693, 0.1670393943786621, 0.19080552458763123, 0.21457165479660034, 0.23833778500556946, 0.2621039152145386, 0.2858700156211853, 0.3096361756324768, 0.33340227603912354, 0.35716840624809265, 0.38093453645706177, 0.4047006666660309, 0.428466796875, 0.45223289728164673, 0.47599905729293823, 0.49976515769958496, 0.5235313177108765, 0.5472974181175232, 0.5710635185241699, 0.5948296189308167, 0.6185957789421082, 0.6423618793487549, 0.6661280393600464, 0.6898941397666931, 0.7136602401733398, 0.7374264001846313, 0.7611925601959229]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 5.0, 5.0, 15.0, 24.0, 20.0, 25.0, 42.0, 50.0, 63.0, 102.0, 161.0, 248.0, 340.0, 513.0, 836.0, 1299.0, 2158.0, 3742.0, 6773.0, 13273.0, 28158.0, 66306.0, 170819.0, 347969.0, 237079.0, 93135.0, 37866.0, 17180.0, 8676.0, 4718.0, 2604.0, 1505.0, 959.0, 628.0, 382.0, 280.0, 182.0, 116.0, 81.0, 60.0, 49.0, 26.0, 21.0, 20.0, 13.0, 8.0, 7.0, 6.0, 4.0, 4.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.195556640625, -0.18975067138671875, -0.1839447021484375, -0.17813873291015625, -0.172332763671875, -0.16652679443359375, -0.1607208251953125, -0.15491485595703125, -0.14910888671875, -0.14330291748046875, -0.1374969482421875, -0.13169097900390625, -0.125885009765625, -0.12007904052734375, -0.1142730712890625, -0.10846710205078125, -0.1026611328125, -0.09685516357421875, -0.0910491943359375, -0.08524322509765625, -0.079437255859375, -0.07363128662109375, -0.0678253173828125, -0.06201934814453125, -0.05621337890625, -0.05040740966796875, -0.0446014404296875, -0.03879547119140625, -0.032989501953125, -0.02718353271484375, -0.0213775634765625, -0.01557159423828125, -0.009765625, -0.00395965576171875, 0.0018463134765625, 0.00765228271484375, 0.013458251953125, 0.01926422119140625, 0.0250701904296875, 0.03087615966796875, 0.03668212890625, 0.04248809814453125, 0.0482940673828125, 0.05410003662109375, 0.059906005859375, 0.06571197509765625, 0.0715179443359375, 0.07732391357421875, 0.0831298828125, 0.08893585205078125, 0.0947418212890625, 0.10054779052734375, 0.106353759765625, 0.11215972900390625, 0.1179656982421875, 0.12377166748046875, 0.12957763671875, 0.13538360595703125, 0.1411895751953125, 0.14699554443359375, 0.152801513671875, 0.15860748291015625, 0.1644134521484375, 0.17021942138671875, 0.176025390625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 3.0, 3.0, 4.0, 4.0, 11.0, 9.0, 15.0, 10.0, 13.0, 16.0, 16.0, 21.0, 25.0, 31.0, 26.0, 42.0, 46.0, 50.0, 48.0, 47.0, 45.0, 66.0, 50.0, 48.0, 41.0, 38.0, 41.0, 32.0, 36.0, 25.0, 24.0, 19.0, 12.0, 16.0, 16.0, 8.0, 7.0, 8.0, 7.0, 5.0, 9.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.5751953125, -0.5583648681640625, -0.541534423828125, -0.5247039794921875, -0.50787353515625, -0.4910430908203125, -0.474212646484375, -0.4573822021484375, -0.4405517578125, -0.4237213134765625, -0.406890869140625, -0.3900604248046875, -0.37322998046875, -0.3563995361328125, -0.339569091796875, -0.3227386474609375, -0.305908203125, -0.2890777587890625, -0.272247314453125, -0.2554168701171875, -0.23858642578125, -0.2217559814453125, -0.204925537109375, -0.1880950927734375, -0.1712646484375, -0.1544342041015625, -0.137603759765625, -0.1207733154296875, -0.10394287109375, -0.0871124267578125, -0.070281982421875, -0.0534515380859375, -0.03662109375, -0.0197906494140625, -0.002960205078125, 0.0138702392578125, 0.03070068359375, 0.0475311279296875, 0.064361572265625, 0.0811920166015625, 0.0980224609375, 0.1148529052734375, 0.131683349609375, 0.1485137939453125, 0.16534423828125, 0.1821746826171875, 0.199005126953125, 0.2158355712890625, 0.232666015625, 0.2494964599609375, 0.266326904296875, 0.2831573486328125, 0.29998779296875, 0.3168182373046875, 0.333648681640625, 0.3504791259765625, 0.3673095703125, 0.3841400146484375, 0.400970458984375, 0.4178009033203125, 0.43463134765625, 0.4514617919921875, 0.468292236328125, 0.4851226806640625, 0.501953125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 5.0, 9.0, 11.0, 16.0, 16.0, 22.0, 30.0, 46.0, 68.0, 88.0, 132.0, 169.0, 307.0, 498.0, 857.0, 1675.0, 3383.0, 8053.0, 23192.0, 82676.0, 329508.0, 430971.0, 117701.0, 30394.0, 10217.0, 4136.0, 1933.0, 906.0, 542.0, 329.0, 211.0, 142.0, 84.0, 47.0, 51.0, 29.0, 22.0, 20.0, 11.0, 11.0, 4.0, 7.0, 5.0, 2.0, 3.0, 4.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.2359619140625, -0.2288379669189453, -0.22171401977539062, -0.21459007263183594, -0.20746612548828125, -0.20034217834472656, -0.19321823120117188, -0.1860942840576172, -0.1789703369140625, -0.1718463897705078, -0.16472244262695312, -0.15759849548339844, -0.15047454833984375, -0.14335060119628906, -0.13622665405273438, -0.1291027069091797, -0.121978759765625, -0.11485481262207031, -0.10773086547851562, -0.10060691833496094, -0.09348297119140625, -0.08635902404785156, -0.07923507690429688, -0.07211112976074219, -0.0649871826171875, -0.05786323547363281, -0.050739288330078125, -0.04361534118652344, -0.03649139404296875, -0.029367446899414062, -0.022243499755859375, -0.015119552612304688, -0.00799560546875, -0.0008716583251953125, 0.006252288818359375, 0.013376235961914062, 0.02050018310546875, 0.027624130249023438, 0.034748077392578125, 0.04187202453613281, 0.0489959716796875, 0.05611991882324219, 0.06324386596679688, 0.07036781311035156, 0.07749176025390625, 0.08461570739746094, 0.09173965454101562, 0.09886360168457031, 0.105987548828125, 0.11311149597167969, 0.12023544311523438, 0.12735939025878906, 0.13448333740234375, 0.14160728454589844, 0.14873123168945312, 0.1558551788330078, 0.1629791259765625, 0.1701030731201172, 0.17722702026367188, 0.18435096740722656, 0.19147491455078125, 0.19859886169433594, 0.20572280883789062, 0.2128467559814453, 0.219970703125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 7.0, 5.0, 1.0, 3.0, 3.0, 10.0, 15.0, 9.0, 22.0, 19.0, 15.0, 23.0, 28.0, 24.0, 29.0, 34.0, 30.0, 28.0, 51.0, 52.0, 57.0, 44.0, 36.0, 54.0, 56.0, 30.0, 35.0, 37.0, 45.0, 31.0, 29.0, 25.0, 19.0, 16.0, 14.0, 15.0, 10.0, 14.0, 9.0, 3.0, 2.0, 4.0, 4.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.236328125, -1.198699951171875, -1.16107177734375, -1.123443603515625, -1.0858154296875, -1.048187255859375, -1.01055908203125, -0.972930908203125, -0.935302734375, -0.897674560546875, -0.86004638671875, -0.822418212890625, -0.7847900390625, -0.747161865234375, -0.70953369140625, -0.671905517578125, -0.63427734375, -0.596649169921875, -0.55902099609375, -0.521392822265625, -0.4837646484375, -0.446136474609375, -0.40850830078125, -0.370880126953125, -0.333251953125, -0.295623779296875, -0.25799560546875, -0.220367431640625, -0.1827392578125, -0.145111083984375, -0.10748291015625, -0.069854736328125, -0.0322265625, 0.005401611328125, 0.04302978515625, 0.080657958984375, 0.1182861328125, 0.155914306640625, 0.19354248046875, 0.231170654296875, 0.268798828125, 0.306427001953125, 0.34405517578125, 0.381683349609375, 0.4193115234375, 0.456939697265625, 0.49456787109375, 0.532196044921875, 0.56982421875, 0.607452392578125, 0.64508056640625, 0.682708740234375, 0.7203369140625, 0.757965087890625, 0.79559326171875, 0.833221435546875, 0.870849609375, 0.908477783203125, 0.94610595703125, 0.983734130859375, 1.0213623046875, 1.058990478515625, 1.09661865234375, 1.134246826171875, 1.171875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 5.0, 5.0, 9.0, 22.0, 37.0, 46.0, 106.0, 179.0, 415.0, 949.0, 2486.0, 8529.0, 46110.0, 503689.0, 433384.0, 40981.0, 7680.0, 2304.0, 848.0, 355.0, 159.0, 91.0, 58.0, 36.0, 23.0, 18.0, 8.0, 3.0, 5.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.16015625, -0.15443038940429688, -0.14870452880859375, -0.14297866821289062, -0.1372528076171875, -0.13152694702148438, -0.12580108642578125, -0.12007522583007812, -0.114349365234375, -0.10862350463867188, -0.10289764404296875, -0.09717178344726562, -0.0914459228515625, -0.08572006225585938, -0.07999420166015625, -0.07426834106445312, -0.06854248046875, -0.06281661987304688, -0.05709075927734375, -0.051364898681640625, -0.0456390380859375, -0.039913177490234375, -0.03418731689453125, -0.028461456298828125, -0.022735595703125, -0.017009735107421875, -0.01128387451171875, -0.005558013916015625, 0.0001678466796875, 0.005893707275390625, 0.01161956787109375, 0.017345428466796875, 0.0230712890625, 0.028797149658203125, 0.03452301025390625, 0.040248870849609375, 0.0459747314453125, 0.051700592041015625, 0.05742645263671875, 0.06315231323242188, 0.068878173828125, 0.07460403442382812, 0.08032989501953125, 0.08605575561523438, 0.0917816162109375, 0.09750747680664062, 0.10323333740234375, 0.10895919799804688, 0.11468505859375, 0.12041091918945312, 0.12613677978515625, 0.13186264038085938, 0.1375885009765625, 0.14331436157226562, 0.14904022216796875, 0.15476608276367188, 0.160491943359375, 0.16621780395507812, 0.17194366455078125, 0.17766952514648438, 0.1833953857421875, 0.18912124633789062, 0.19484710693359375, 0.20057296752929688, 0.206298828125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 7.0, 1.0, 2.0, 3.0, 7.0, 6.0, 4.0, 4.0, 6.0, 12.0, 15.0, 17.0, 29.0, 37.0, 44.0, 47.0, 62.0, 84.0, 81.0, 106.0, 87.0, 76.0, 50.0, 41.0, 35.0, 25.0, 24.0, 18.0, 10.0, 13.0, 12.0, 3.0, 9.0, 6.0, 3.0, 4.0, 4.0, 0.0, 3.0, 2.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.61015510559082e-05, -6.427150219678879e-05, -6.244145333766937e-05, -6.061140447854996e-05, -5.878135561943054e-05, -5.695130676031113e-05, -5.512125790119171e-05, -5.3291209042072296e-05, -5.146116018295288e-05, -4.9631111323833466e-05, -4.780106246471405e-05, -4.5971013605594635e-05, -4.414096474647522e-05, -4.2310915887355804e-05, -4.048086702823639e-05, -3.8650818169116974e-05, -3.682076930999756e-05, -3.499072045087814e-05, -3.316067159175873e-05, -3.133062273263931e-05, -2.9500573873519897e-05, -2.7670525014400482e-05, -2.5840476155281067e-05, -2.401042729616165e-05, -2.2180378437042236e-05, -2.035032957792282e-05, -1.8520280718803406e-05, -1.669023185968399e-05, -1.4860183000564575e-05, -1.303013414144516e-05, -1.1200085282325745e-05, -9.37003642320633e-06, -7.539987564086914e-06, -5.709938704967499e-06, -3.8798898458480835e-06, -2.0498409867286682e-06, -2.1979212760925293e-07, 1.6102567315101624e-06, 3.4403055906295776e-06, 5.270354449748993e-06, 7.100403308868408e-06, 8.930452167987823e-06, 1.0760501027107239e-05, 1.2590549886226654e-05, 1.442059874534607e-05, 1.6250647604465485e-05, 1.80806964635849e-05, 1.9910745322704315e-05, 2.174079418182373e-05, 2.3570843040943146e-05, 2.540089190006256e-05, 2.7230940759181976e-05, 2.906098961830139e-05, 3.089103847742081e-05, 3.272108733654022e-05, 3.455113619565964e-05, 3.638118505477905e-05, 3.821123391389847e-05, 4.004128277301788e-05, 4.18713316321373e-05, 4.3701380491256714e-05, 4.553142935037613e-05, 4.7361478209495544e-05, 4.919152706861496e-05, 5.1021575927734375e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 4.0, 5.0, 8.0, 6.0, 5.0, 13.0, 12.0, 25.0, 31.0, 48.0, 95.0, 186.0, 331.0, 726.0, 1889.0, 5195.0, 15778.0, 55681.0, 247420.0, 527046.0, 142753.0, 34711.0, 10379.0, 3674.0, 1350.0, 544.0, 257.0, 147.0, 72.0, 54.0, 34.0, 26.0, 10.0, 12.0, 8.0, 4.0, 8.0, 6.0, 7.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.166748046875, -0.1621570587158203, -0.15756607055664062, -0.15297508239746094, -0.14838409423828125, -0.14379310607910156, -0.13920211791992188, -0.1346111297607422, -0.1300201416015625, -0.1254291534423828, -0.12083816528320312, -0.11624717712402344, -0.11165618896484375, -0.10706520080566406, -0.10247421264648438, -0.09788322448730469, -0.093292236328125, -0.08870124816894531, -0.08411026000976562, -0.07951927185058594, -0.07492828369140625, -0.07033729553222656, -0.06574630737304688, -0.06115531921386719, -0.0565643310546875, -0.05197334289550781, -0.047382354736328125, -0.04279136657714844, -0.03820037841796875, -0.03360939025878906, -0.029018402099609375, -0.024427413940429688, -0.01983642578125, -0.015245437622070312, -0.010654449462890625, -0.0060634613037109375, -0.00147247314453125, 0.0031185150146484375, 0.007709503173828125, 0.012300491333007812, 0.0168914794921875, 0.021482467651367188, 0.026073455810546875, 0.030664443969726562, 0.03525543212890625, 0.03984642028808594, 0.044437408447265625, 0.04902839660644531, 0.053619384765625, 0.05821037292480469, 0.06280136108398438, 0.06739234924316406, 0.07198333740234375, 0.07657432556152344, 0.08116531372070312, 0.08575630187988281, 0.0903472900390625, 0.09493827819824219, 0.09952926635742188, 0.10412025451660156, 0.10871124267578125, 0.11330223083496094, 0.11789321899414062, 0.12248420715332031, 0.1270751953125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 6.0, 0.0, 0.0, 4.0, 3.0, 3.0, 3.0, 6.0, 11.0, 9.0, 13.0, 7.0, 18.0, 18.0, 20.0, 29.0, 55.0, 65.0, 63.0, 100.0, 92.0, 97.0, 82.0, 70.0, 37.0, 44.0, 40.0, 24.0, 23.0, 18.0, 12.0, 11.0, 3.0, 7.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.037933349609375, -0.03681325912475586, -0.03569316864013672, -0.03457307815551758, -0.03345298767089844, -0.0323328971862793, -0.031212806701660156, -0.030092716217041016, -0.028972625732421875, -0.027852535247802734, -0.026732444763183594, -0.025612354278564453, -0.024492263793945312, -0.023372173309326172, -0.02225208282470703, -0.02113199234008789, -0.02001190185546875, -0.01889181137084961, -0.01777172088623047, -0.016651630401611328, -0.015531539916992188, -0.014411449432373047, -0.013291358947753906, -0.012171268463134766, -0.011051177978515625, -0.009931087493896484, -0.008810997009277344, -0.007690906524658203, -0.0065708160400390625, -0.005450725555419922, -0.004330635070800781, -0.0032105445861816406, -0.0020904541015625, -0.0009703636169433594, 0.00014972686767578125, 0.0012698173522949219, 0.0023899078369140625, 0.003509998321533203, 0.004630088806152344, 0.005750179290771484, 0.006870269775390625, 0.007990360260009766, 0.009110450744628906, 0.010230541229248047, 0.011350631713867188, 0.012470722198486328, 0.013590812683105469, 0.01471090316772461, 0.01583099365234375, 0.01695108413696289, 0.01807117462158203, 0.019191265106201172, 0.020311355590820312, 0.021431446075439453, 0.022551536560058594, 0.023671627044677734, 0.024791717529296875, 0.025911808013916016, 0.027031898498535156, 0.028151988983154297, 0.029272079467773438, 0.030392169952392578, 0.03151226043701172, 0.03263235092163086, 0.03375244140625]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 2.0, 3.0, 5.0, 8.0, 9.0, 14.0, 9.0, 22.0, 25.0, 25.0, 34.0, 37.0, 39.0, 43.0, 63.0, 62.0, 50.0, 59.0, 59.0, 68.0, 54.0, 69.0, 38.0, 40.0, 35.0, 24.0, 19.0, 17.0, 11.0, 7.0, 7.0, 8.0, 10.0, 6.0, 6.0, 2.0, 2.0, 4.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.5560969114303589, -0.5394974946975708, -0.5228980779647827, -0.5062986612319946, -0.48969921469688416, -0.4730997681617737, -0.4565003514289856, -0.4399009346961975, -0.4233015179634094, -0.40670210123062134, -0.39010265469551086, -0.3735032379627228, -0.3569038212299347, -0.3403043746948242, -0.32370495796203613, -0.30710554122924805, -0.2905060946941376, -0.2739066779613495, -0.257307231426239, -0.24070781469345093, -0.22410839796066284, -0.20750896632671356, -0.19090953469276428, -0.1743101179599762, -0.15771068632602692, -0.14111125469207764, -0.12451183795928955, -0.10791240632534027, -0.09131298214197159, -0.0747135579586029, -0.058114126324653625, -0.04151470214128494, -0.02491527795791626, -0.008315851911902428, 0.008283574134111404, 0.024883002042770386, 0.04148242622613907, 0.05808185040950775, 0.07468128204345703, 0.09128070622682571, 0.1078801304101944, 0.12447955459356308, 0.14107897877693176, 0.15767841041088104, 0.17427784204483032, 0.1908772587776184, 0.2074766904115677, 0.22407612204551697, 0.24067553877830505, 0.25727495551109314, 0.2738744020462036, 0.2904738187789917, 0.3070732355117798, 0.32367265224456787, 0.34027209877967834, 0.35687151551246643, 0.3734709620475769, 0.390070378780365, 0.40666982531547546, 0.42326924204826355, 0.43986865878105164, 0.4564681053161621, 0.4730675220489502, 0.4896669387817383, 0.5062663555145264]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 6.0, 5.0, 3.0, 13.0, 9.0, 6.0, 8.0, 17.0, 19.0, 18.0, 14.0, 25.0, 29.0, 22.0, 49.0, 45.0, 42.0, 56.0, 47.0, 41.0, 50.0, 40.0, 49.0, 55.0, 51.0, 47.0, 39.0, 25.0, 29.0, 20.0, 16.0, 27.0, 12.0, 18.0, 9.0, 8.0, 6.0, 5.0, 7.0, 5.0, 0.0, 5.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.5035885572433472, -0.4874865710735321, -0.47138458490371704, -0.455282598733902, -0.4391806125640869, -0.42307862639427185, -0.4069766402244568, -0.39087462425231934, -0.37477266788482666, -0.3586706817150116, -0.34256869554519653, -0.32646670937538147, -0.3103647232055664, -0.29426273703575134, -0.2781607508659363, -0.26205873489379883, -0.24595674872398376, -0.2298547625541687, -0.21375277638435364, -0.19765079021453857, -0.1815488040447235, -0.16544681787490845, -0.1493448168039322, -0.13324283063411713, -0.11714084446430206, -0.101038858294487, -0.08493687212467194, -0.06883487850427628, -0.05273289233446121, -0.03663090616464615, -0.02052891254425049, -0.004426926374435425, 0.011675059795379639, 0.02777704782783985, 0.043879035860300064, 0.059981025755405426, 0.07608301192522049, 0.09218499809503555, 0.10828699171543121, 0.12438897788524628, 0.14049096405506134, 0.1565929502248764, 0.17269493639469147, 0.18879693746566772, 0.2048989236354828, 0.22100090980529785, 0.23710289597511292, 0.253204882144928, 0.26930686831474304, 0.2854088544845581, 0.30151084065437317, 0.31761282682418823, 0.3337148129940033, 0.34981679916381836, 0.3659188151359558, 0.3820207715034485, 0.39812278747558594, 0.414224773645401, 0.43032675981521606, 0.44642874598503113, 0.4625307321548462, 0.47863271832466125, 0.4947347044944763, 0.5108367204666138, 0.5269386768341064]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 3.0, 3.0, 5.0, 6.0, 9.0, 10.0, 15.0, 14.0, 30.0, 38.0, 68.0, 99.0, 151.0, 265.0, 389.0, 584.0, 1093.0, 1952.0, 3541.0, 6581.0, 13252.0, 28082.0, 65329.0, 200999.0, 457261.0, 162421.0, 56601.0, 24678.0, 11895.0, 5883.0, 3080.0, 1707.0, 971.0, 563.0, 353.0, 219.0, 149.0, 87.0, 62.0, 27.0, 27.0, 23.0, 12.0, 7.0, 4.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.701171875, -0.6795425415039062, -0.6579132080078125, -0.6362838745117188, -0.614654541015625, -0.5930252075195312, -0.5713958740234375, -0.5497665405273438, -0.52813720703125, -0.5065078735351562, -0.4848785400390625, -0.46324920654296875, -0.441619873046875, -0.41999053955078125, -0.3983612060546875, -0.37673187255859375, -0.3551025390625, -0.33347320556640625, -0.3118438720703125, -0.29021453857421875, -0.268585205078125, -0.24695587158203125, -0.2253265380859375, -0.20369720458984375, -0.18206787109375, -0.16043853759765625, -0.1388092041015625, -0.11717987060546875, -0.095550537109375, -0.07392120361328125, -0.0522918701171875, -0.03066253662109375, -0.009033203125, 0.01259613037109375, 0.0342254638671875, 0.05585479736328125, 0.077484130859375, 0.09911346435546875, 0.1207427978515625, 0.14237213134765625, 0.16400146484375, 0.18563079833984375, 0.2072601318359375, 0.22888946533203125, 0.250518798828125, 0.27214813232421875, 0.2937774658203125, 0.31540679931640625, 0.3370361328125, 0.35866546630859375, 0.3802947998046875, 0.40192413330078125, 0.423553466796875, 0.44518280029296875, 0.4668121337890625, 0.48844146728515625, 0.51007080078125, 0.5317001342773438, 0.5533294677734375, 0.5749588012695312, 0.596588134765625, 0.6182174682617188, 0.6398468017578125, 0.6614761352539062, 0.68310546875]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 6.0, 5.0, 2.0, 5.0, 11.0, 12.0, 16.0, 10.0, 19.0, 14.0, 21.0, 23.0, 23.0, 41.0, 36.0, 37.0, 48.0, 41.0, 49.0, 57.0, 45.0, 49.0, 49.0, 62.0, 45.0, 41.0, 40.0, 41.0, 29.0, 30.0, 18.0, 9.0, 17.0, 6.0, 10.0, 9.0, 7.0, 8.0, 8.0, 2.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0], "bins": [-1.345703125, -1.3097000122070312, -1.2736968994140625, -1.2376937866210938, -1.201690673828125, -1.1656875610351562, -1.1296844482421875, -1.0936813354492188, -1.05767822265625, -1.0216751098632812, -0.9856719970703125, -0.9496688842773438, -0.913665771484375, -0.8776626586914062, -0.8416595458984375, -0.8056564331054688, -0.7696533203125, -0.7336502075195312, -0.6976470947265625, -0.6616439819335938, -0.625640869140625, -0.5896377563476562, -0.5536346435546875, -0.5176315307617188, -0.48162841796875, -0.44562530517578125, -0.4096221923828125, -0.37361907958984375, -0.337615966796875, -0.30161285400390625, -0.2656097412109375, -0.22960662841796875, -0.193603515625, -0.15760040283203125, -0.1215972900390625, -0.08559417724609375, -0.049591064453125, -0.01358795166015625, 0.0224151611328125, 0.05841827392578125, 0.09442138671875, 0.13042449951171875, 0.1664276123046875, 0.20243072509765625, 0.238433837890625, 0.27443695068359375, 0.3104400634765625, 0.34644317626953125, 0.3824462890625, 0.41844940185546875, 0.4544525146484375, 0.49045562744140625, 0.526458740234375, 0.5624618530273438, 0.5984649658203125, 0.6344680786132812, 0.67047119140625, 0.7064743041992188, 0.7424774169921875, 0.7784805297851562, 0.814483642578125, 0.8504867553710938, 0.8864898681640625, 0.9224929809570312, 0.95849609375]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 5.0, 2.0, 3.0, 7.0, 4.0, 7.0, 17.0, 10.0, 21.0, 45.0, 74.0, 155.0, 344.0, 977.0, 3512.0, 18285.0, 161522.0, 767009.0, 81711.0, 11138.0, 2423.0, 717.0, 294.0, 118.0, 48.0, 39.0, 24.0, 15.0, 7.0, 6.0, 6.0, 1.0, 7.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.701171875, -1.6486053466796875, -1.596038818359375, -1.5434722900390625, -1.49090576171875, -1.4383392333984375, -1.385772705078125, -1.3332061767578125, -1.2806396484375, -1.2280731201171875, -1.175506591796875, -1.1229400634765625, -1.07037353515625, -1.0178070068359375, -0.965240478515625, -0.9126739501953125, -0.860107421875, -0.8075408935546875, -0.754974365234375, -0.7024078369140625, -0.64984130859375, -0.5972747802734375, -0.544708251953125, -0.4921417236328125, -0.4395751953125, -0.3870086669921875, -0.334442138671875, -0.2818756103515625, -0.22930908203125, -0.1767425537109375, -0.124176025390625, -0.0716094970703125, -0.01904296875, 0.0335235595703125, 0.086090087890625, 0.1386566162109375, 0.19122314453125, 0.2437896728515625, 0.296356201171875, 0.3489227294921875, 0.4014892578125, 0.4540557861328125, 0.506622314453125, 0.5591888427734375, 0.61175537109375, 0.6643218994140625, 0.716888427734375, 0.7694549560546875, 0.822021484375, 0.8745880126953125, 0.927154541015625, 0.9797210693359375, 1.03228759765625, 1.0848541259765625, 1.137420654296875, 1.1899871826171875, 1.2425537109375, 1.2951202392578125, 1.347686767578125, 1.4002532958984375, 1.45281982421875, 1.5053863525390625, 1.557952880859375, 1.6105194091796875, 1.6630859375]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 1.0, 3.0, 12.0, 13.0, 18.0, 18.0, 25.0, 26.0, 33.0, 39.0, 36.0, 43.0, 51.0, 55.0, 64.0, 58.0, 56.0, 57.0, 59.0, 54.0, 45.0, 32.0, 37.0, 34.0, 16.0, 25.0, 20.0, 17.0, 8.0, 6.0, 11.0, 9.0, 5.0, 5.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3662109375, -1.3169708251953125, -1.267730712890625, -1.2184906005859375, -1.16925048828125, -1.1200103759765625, -1.070770263671875, -1.0215301513671875, -0.9722900390625, -0.9230499267578125, -0.873809814453125, -0.8245697021484375, -0.77532958984375, -0.7260894775390625, -0.676849365234375, -0.6276092529296875, -0.578369140625, -0.5291290283203125, -0.479888916015625, -0.4306488037109375, -0.38140869140625, -0.3321685791015625, -0.282928466796875, -0.2336883544921875, -0.1844482421875, -0.1352081298828125, -0.085968017578125, -0.0367279052734375, 0.01251220703125, 0.0617523193359375, 0.110992431640625, 0.1602325439453125, 0.20947265625, 0.2587127685546875, 0.307952880859375, 0.3571929931640625, 0.40643310546875, 0.4556732177734375, 0.504913330078125, 0.5541534423828125, 0.6033935546875, 0.6526336669921875, 0.701873779296875, 0.7511138916015625, 0.80035400390625, 0.8495941162109375, 0.898834228515625, 0.9480743408203125, 0.997314453125, 1.0465545654296875, 1.095794677734375, 1.1450347900390625, 1.19427490234375, 1.2435150146484375, 1.292755126953125, 1.3419952392578125, 1.3912353515625, 1.4404754638671875, 1.489715576171875, 1.5389556884765625, 1.58819580078125, 1.6374359130859375, 1.686676025390625, 1.7359161376953125, 1.78515625]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 3.0, 5.0, 5.0, 13.0, 15.0, 19.0, 34.0, 50.0, 76.0, 217.0, 617.0, 2070.0, 9028.0, 54447.0, 542867.0, 387132.0, 41860.0, 7333.0, 1767.0, 538.0, 201.0, 80.0, 58.0, 33.0, 27.0, 13.0, 14.0, 9.0, 5.0, 3.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3359375, -0.32471466064453125, -0.3134918212890625, -0.30226898193359375, -0.291046142578125, -0.27982330322265625, -0.2686004638671875, -0.25737762451171875, -0.24615478515625, -0.23493194580078125, -0.2237091064453125, -0.21248626708984375, -0.201263427734375, -0.19004058837890625, -0.1788177490234375, -0.16759490966796875, -0.1563720703125, -0.14514923095703125, -0.1339263916015625, -0.12270355224609375, -0.111480712890625, -0.10025787353515625, -0.0890350341796875, -0.07781219482421875, -0.06658935546875, -0.05536651611328125, -0.0441436767578125, -0.03292083740234375, -0.021697998046875, -0.01047515869140625, 0.0007476806640625, 0.01197052001953125, 0.023193359375, 0.03441619873046875, 0.0456390380859375, 0.05686187744140625, 0.068084716796875, 0.07930755615234375, 0.0905303955078125, 0.10175323486328125, 0.11297607421875, 0.12419891357421875, 0.1354217529296875, 0.14664459228515625, 0.157867431640625, 0.16909027099609375, 0.1803131103515625, 0.19153594970703125, 0.2027587890625, 0.21398162841796875, 0.2252044677734375, 0.23642730712890625, 0.247650146484375, 0.25887298583984375, 0.2700958251953125, 0.28131866455078125, 0.29254150390625, 0.30376434326171875, 0.3149871826171875, 0.32621002197265625, 0.337432861328125, 0.34865570068359375, 0.3598785400390625, 0.37110137939453125, 0.38232421875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 6.0, 3.0, 7.0, 8.0, 13.0, 10.0, 10.0, 16.0, 24.0, 34.0, 40.0, 54.0, 63.0, 88.0, 103.0, 114.0, 85.0, 79.0, 54.0, 47.0, 28.0, 32.0, 20.0, 15.0, 9.0, 9.0, 9.0, 3.0, 6.0, 2.0, 1.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.68952751159668e-05, -3.5626813769340515e-05, -3.4358352422714233e-05, -3.308989107608795e-05, -3.182142972946167e-05, -3.055296838283539e-05, -2.9284507036209106e-05, -2.8016045689582825e-05, -2.6747584342956543e-05, -2.547912299633026e-05, -2.421066164970398e-05, -2.2942200303077698e-05, -2.1673738956451416e-05, -2.0405277609825134e-05, -1.9136816263198853e-05, -1.786835491657257e-05, -1.659989356994629e-05, -1.5331432223320007e-05, -1.4062970876693726e-05, -1.2794509530067444e-05, -1.1526048183441162e-05, -1.025758683681488e-05, -8.989125490188599e-06, -7.720664143562317e-06, -6.452202796936035e-06, -5.183741450309753e-06, -3.915280103683472e-06, -2.64681875705719e-06, -1.3783574104309082e-06, -1.0989606380462646e-07, 1.1585652828216553e-06, 2.427026629447937e-06, 3.6954879760742188e-06, 4.9639493227005005e-06, 6.232410669326782e-06, 7.500872015953064e-06, 8.769333362579346e-06, 1.0037794709205627e-05, 1.130625605583191e-05, 1.2574717402458191e-05, 1.3843178749084473e-05, 1.5111640095710754e-05, 1.6380101442337036e-05, 1.7648562788963318e-05, 1.89170241355896e-05, 2.018548548221588e-05, 2.1453946828842163e-05, 2.2722408175468445e-05, 2.3990869522094727e-05, 2.5259330868721008e-05, 2.652779221534729e-05, 2.7796253561973572e-05, 2.9064714908599854e-05, 3.0333176255226135e-05, 3.160163760185242e-05, 3.28700989484787e-05, 3.413856029510498e-05, 3.540702164173126e-05, 3.6675482988357544e-05, 3.7943944334983826e-05, 3.921240568161011e-05, 4.048086702823639e-05, 4.174932837486267e-05, 4.301778972148895e-05, 4.4286251068115234e-05]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 9.0, 9.0, 16.0, 11.0, 12.0, 33.0, 62.0, 138.0, 333.0, 947.0, 2821.0, 10609.0, 60173.0, 532347.0, 382413.0, 46085.0, 8760.0, 2422.0, 824.0, 276.0, 129.0, 53.0, 26.0, 22.0, 6.0, 9.0, 1.0, 7.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4248046875, -0.41228485107421875, -0.3997650146484375, -0.38724517822265625, -0.374725341796875, -0.36220550537109375, -0.3496856689453125, -0.33716583251953125, -0.32464599609375, -0.31212615966796875, -0.2996063232421875, -0.28708648681640625, -0.274566650390625, -0.26204681396484375, -0.2495269775390625, -0.23700714111328125, -0.2244873046875, -0.21196746826171875, -0.1994476318359375, -0.18692779541015625, -0.174407958984375, -0.16188812255859375, -0.1493682861328125, -0.13684844970703125, -0.12432861328125, -0.11180877685546875, -0.0992889404296875, -0.08676910400390625, -0.074249267578125, -0.06172943115234375, -0.0492095947265625, -0.03668975830078125, -0.024169921875, -0.01165008544921875, 0.0008697509765625, 0.01338958740234375, 0.025909423828125, 0.03842926025390625, 0.0509490966796875, 0.06346893310546875, 0.07598876953125, 0.08850860595703125, 0.1010284423828125, 0.11354827880859375, 0.126068115234375, 0.13858795166015625, 0.1511077880859375, 0.16362762451171875, 0.1761474609375, 0.18866729736328125, 0.2011871337890625, 0.21370697021484375, 0.226226806640625, 0.23874664306640625, 0.2512664794921875, 0.26378631591796875, 0.27630615234375, 0.28882598876953125, 0.3013458251953125, 0.31386566162109375, 0.326385498046875, 0.33890533447265625, 0.3514251708984375, 0.36394500732421875, 0.37646484375]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 4.0, 3.0, 5.0, 12.0, 7.0, 11.0, 19.0, 20.0, 24.0, 35.0, 44.0, 80.0, 68.0, 87.0, 131.0, 96.0, 88.0, 67.0, 45.0, 35.0, 34.0, 13.0, 14.0, 14.0, 17.0, 11.0, 7.0, 4.0, 3.0, 1.0, 6.0, 7.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1474609375, -0.14249038696289062, -0.13751983642578125, -0.13254928588867188, -0.1275787353515625, -0.12260818481445312, -0.11763763427734375, -0.11266708374023438, -0.107696533203125, -0.10272598266601562, -0.09775543212890625, -0.09278488159179688, -0.0878143310546875, -0.08284378051757812, -0.07787322998046875, -0.07290267944335938, -0.06793212890625, -0.06296157836914062, -0.05799102783203125, -0.053020477294921875, -0.0480499267578125, -0.043079376220703125, -0.03810882568359375, -0.033138275146484375, -0.028167724609375, -0.023197174072265625, -0.01822662353515625, -0.013256072998046875, -0.0082855224609375, -0.003314971923828125, 0.00165557861328125, 0.006626129150390625, 0.0115966796875, 0.016567230224609375, 0.02153778076171875, 0.026508331298828125, 0.0314788818359375, 0.036449432373046875, 0.04141998291015625, 0.046390533447265625, 0.051361083984375, 0.056331634521484375, 0.06130218505859375, 0.06627273559570312, 0.0712432861328125, 0.07621383666992188, 0.08118438720703125, 0.08615493774414062, 0.09112548828125, 0.09609603881835938, 0.10106658935546875, 0.10603713989257812, 0.1110076904296875, 0.11597824096679688, 0.12094879150390625, 0.12591934204101562, 0.130889892578125, 0.13586044311523438, 0.14083099365234375, 0.14580154418945312, 0.1507720947265625, 0.15574264526367188, 0.16071319580078125, 0.16568374633789062, 0.170654296875]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 10.0, 19.0, 77.0, 213.0, 324.0, 254.0, 86.0, 24.0, 9.0], "bins": [-12.412637710571289, -12.204093933105469, -11.995550155639648, -11.787006378173828, -11.578463554382324, -11.369919776916504, -11.161375999450684, -10.952832221984863, -10.744288444519043, -10.535744667053223, -10.327200889587402, -10.118657112121582, -9.910114288330078, -9.701570510864258, -9.493026733398438, -9.284482955932617, -9.075939178466797, -8.867395401000977, -8.658851623535156, -8.450307846069336, -8.241765022277832, -8.033221244812012, -7.824677467346191, -7.616133689880371, -7.407590389251709, -7.199046611785889, -6.990503311157227, -6.781959533691406, -6.573415756225586, -6.364871978759766, -6.1563286781311035, -5.947784900665283, -5.739241600036621, -5.530697822570801, -5.322154521942139, -5.113610744476318, -4.905066967010498, -4.696523666381836, -4.487979888916016, -4.279436111450195, -4.070892333984375, -3.862348794937134, -3.6538050174713135, -3.4452614784240723, -3.236717700958252, -3.0281741619110107, -2.8196306228637695, -2.611086845397949, -2.402543067932129, -2.1939995288848877, -1.9854557514190674, -1.7769122123718262, -1.5683684349060059, -1.3598248958587646, -1.1512812376022339, -0.9427375793457031, -0.7341940402984619, -0.5256503820419312, -0.3171067535877228, -0.1085631251335144, 0.09998053312301636, 0.30852413177490234, 0.5170677900314331, 0.7256114482879639, 0.9341551065444946]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 6.0, 3.0, 3.0, 1.0, 6.0, 14.0, 9.0, 18.0, 12.0, 16.0, 24.0, 26.0, 24.0, 29.0, 31.0, 32.0, 27.0, 25.0, 40.0, 32.0, 32.0, 27.0, 42.0, 42.0, 32.0, 42.0, 38.0, 38.0, 31.0, 41.0, 33.0, 31.0, 24.0, 24.0, 18.0, 25.0, 13.0, 11.0, 18.0, 13.0, 10.0, 13.0, 3.0, 7.0, 8.0, 5.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.900421380996704, -1.8415392637252808, -1.7826571464538574, -1.7237751483917236, -1.6648930311203003, -1.606010913848877, -1.5471287965774536, -1.4882466793060303, -1.4293646812438965, -1.3704825639724731, -1.3116004467010498, -1.252718448638916, -1.1938363313674927, -1.1349542140960693, -1.076072096824646, -1.0171899795532227, -0.9583079218864441, -0.8994258046150208, -0.8405437469482422, -0.7816616296768188, -0.7227795720100403, -0.6638974547386169, -0.6050153970718384, -0.546133279800415, -0.4872511923313141, -0.42836910486221313, -0.3694870173931122, -0.31060492992401123, -0.2517228126525879, -0.19284072518348694, -0.133958637714386, -0.07507655024528503, -0.016194462776184082, 0.04268762841820717, 0.10156971961259842, 0.16045181453227997, 0.21933390200138092, 0.27821600437164307, 0.337098091840744, 0.39598017930984497, 0.4548622667789459, 0.5137443542480469, 0.5726264715194702, 0.6315085291862488, 0.6903906464576721, 0.7492727041244507, 0.808154821395874, 0.8670369386672974, 0.9259189963340759, 0.9848011136054993, 1.0436831712722778, 1.1025652885437012, 1.1614474058151245, 1.2203295230865479, 1.2792115211486816, 1.338093638420105, 1.3969757556915283, 1.4558578729629517, 1.514739990234375, 1.5736219882965088, 1.6325041055679321, 1.6913862228393555, 1.7502683401107788, 1.8091504573822021, 1.868032455444336]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 7.0, 6.0, 7.0, 14.0, 20.0, 29.0, 42.0, 48.0, 68.0, 107.0, 134.0, 186.0, 344.0, 645.0, 1268.0, 2816.0, 8438.0, 34890.0, 716187.0, 3319047.0, 86891.0, 14666.0, 4514.0, 1798.0, 804.0, 447.0, 258.0, 193.0, 113.0, 74.0, 64.0, 55.0, 25.0, 15.0, 13.0, 13.0, 9.0, 5.0, 8.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7548828125, -1.702056884765625, -1.64923095703125, -1.596405029296875, -1.5435791015625, -1.490753173828125, -1.43792724609375, -1.385101318359375, -1.332275390625, -1.279449462890625, -1.22662353515625, -1.173797607421875, -1.1209716796875, -1.068145751953125, -1.01531982421875, -0.962493896484375, -0.90966796875, -0.856842041015625, -0.80401611328125, -0.751190185546875, -0.6983642578125, -0.645538330078125, -0.59271240234375, -0.539886474609375, -0.487060546875, -0.434234619140625, -0.38140869140625, -0.328582763671875, -0.2757568359375, -0.222930908203125, -0.17010498046875, -0.117279052734375, -0.064453125, -0.011627197265625, 0.04119873046875, 0.094024658203125, 0.1468505859375, 0.199676513671875, 0.25250244140625, 0.305328369140625, 0.358154296875, 0.410980224609375, 0.46380615234375, 0.516632080078125, 0.5694580078125, 0.622283935546875, 0.67510986328125, 0.727935791015625, 0.78076171875, 0.833587646484375, 0.88641357421875, 0.939239501953125, 0.9920654296875, 1.044891357421875, 1.09771728515625, 1.150543212890625, 1.203369140625, 1.256195068359375, 1.30902099609375, 1.361846923828125, 1.4146728515625, 1.467498779296875, 1.52032470703125, 1.573150634765625, 1.6259765625]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 9.0, 10.0, 11.0, 11.0, 15.0, 22.0, 25.0, 30.0, 45.0, 46.0, 45.0, 62.0, 62.0, 77.0, 70.0, 59.0, 59.0, 60.0, 48.0, 47.0, 34.0, 27.0, 29.0, 25.0, 19.0, 8.0, 13.0, 6.0, 10.0, 6.0, 2.0, 2.0, 4.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.66748046875, -0.6475448608398438, -0.6276092529296875, -0.6076736450195312, -0.587738037109375, -0.5678024291992188, -0.5478668212890625, -0.5279312133789062, -0.50799560546875, -0.48805999755859375, -0.4681243896484375, -0.44818878173828125, -0.428253173828125, -0.40831756591796875, -0.3883819580078125, -0.36844635009765625, -0.3485107421875, -0.32857513427734375, -0.3086395263671875, -0.28870391845703125, -0.268768310546875, -0.24883270263671875, -0.2288970947265625, -0.20896148681640625, -0.18902587890625, -0.16909027099609375, -0.1491546630859375, -0.12921905517578125, -0.109283447265625, -0.08934783935546875, -0.0694122314453125, -0.04947662353515625, -0.029541015625, -0.00960540771484375, 0.0103302001953125, 0.03026580810546875, 0.050201416015625, 0.07013702392578125, 0.0900726318359375, 0.11000823974609375, 0.12994384765625, 0.14987945556640625, 0.1698150634765625, 0.18975067138671875, 0.209686279296875, 0.22962188720703125, 0.2495574951171875, 0.26949310302734375, 0.2894287109375, 0.30936431884765625, 0.3292999267578125, 0.34923553466796875, 0.369171142578125, 0.38910675048828125, 0.4090423583984375, 0.42897796630859375, 0.44891357421875, 0.46884918212890625, 0.4887847900390625, 0.5087203979492188, 0.528656005859375, 0.5485916137695312, 0.5685272216796875, 0.5884628295898438, 0.6083984375]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 6.0, 5.0, 7.0, 11.0, 12.0, 28.0, 36.0, 67.0, 108.0, 146.0, 274.0, 769.0, 5107.0, 110296.0, 3985741.0, 85647.0, 4624.0, 755.0, 256.0, 133.0, 81.0, 53.0, 43.0, 26.0, 15.0, 14.0, 7.0, 9.0, 9.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.44921875, -3.3660430908203125, -3.282867431640625, -3.1996917724609375, -3.11651611328125, -3.0333404541015625, -2.950164794921875, -2.8669891357421875, -2.7838134765625, -2.7006378173828125, -2.617462158203125, -2.5342864990234375, -2.45111083984375, -2.3679351806640625, -2.284759521484375, -2.2015838623046875, -2.118408203125, -2.0352325439453125, -1.952056884765625, -1.8688812255859375, -1.78570556640625, -1.7025299072265625, -1.619354248046875, -1.5361785888671875, -1.4530029296875, -1.3698272705078125, -1.286651611328125, -1.2034759521484375, -1.12030029296875, -1.0371246337890625, -0.953948974609375, -0.8707733154296875, -0.78759765625, -0.7044219970703125, -0.621246337890625, -0.5380706787109375, -0.45489501953125, -0.3717193603515625, -0.288543701171875, -0.2053680419921875, -0.1221923828125, -0.0390167236328125, 0.044158935546875, 0.1273345947265625, 0.21051025390625, 0.2936859130859375, 0.376861572265625, 0.4600372314453125, 0.543212890625, 0.6263885498046875, 0.709564208984375, 0.7927398681640625, 0.87591552734375, 0.9590911865234375, 1.042266845703125, 1.1254425048828125, 1.2086181640625, 1.2917938232421875, 1.374969482421875, 1.4581451416015625, 1.54132080078125, 1.6244964599609375, 1.707672119140625, 1.7908477783203125, 1.8740234375]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 0.0, 5.0, 6.0, 13.0, 16.0, 19.0, 36.0, 48.0, 63.0, 164.0, 310.0, 674.0, 1085.0, 786.0, 421.0, 175.0, 97.0, 72.0, 37.0, 28.0, 17.0, 6.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25634765625, -0.23998260498046875, -0.2236175537109375, -0.20725250244140625, -0.190887451171875, -0.17452239990234375, -0.1581573486328125, -0.14179229736328125, -0.12542724609375, -0.10906219482421875, -0.0926971435546875, -0.07633209228515625, -0.059967041015625, -0.04360198974609375, -0.0272369384765625, -0.01087188720703125, 0.0054931640625, 0.02185821533203125, 0.0382232666015625, 0.05458831787109375, 0.070953369140625, 0.08731842041015625, 0.1036834716796875, 0.12004852294921875, 0.13641357421875, 0.15277862548828125, 0.1691436767578125, 0.18550872802734375, 0.201873779296875, 0.21823883056640625, 0.2346038818359375, 0.25096893310546875, 0.267333984375, 0.28369903564453125, 0.3000640869140625, 0.31642913818359375, 0.332794189453125, 0.34915924072265625, 0.3655242919921875, 0.38188934326171875, 0.39825439453125, 0.41461944580078125, 0.4309844970703125, 0.44734954833984375, 0.463714599609375, 0.48007965087890625, 0.4964447021484375, 0.5128097534179688, 0.5291748046875, 0.5455398559570312, 0.5619049072265625, 0.5782699584960938, 0.594635009765625, 0.6110000610351562, 0.6273651123046875, 0.6437301635742188, 0.66009521484375, 0.6764602661132812, 0.6928253173828125, 0.7091903686523438, 0.725555419921875, 0.7419204711914062, 0.7582855224609375, 0.7746505737304688, 0.791015625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 5.0, 3.0, 7.0, 10.0, 12.0, 16.0, 16.0, 16.0, 17.0, 26.0, 30.0, 47.0, 27.0, 38.0, 41.0, 45.0, 56.0, 57.0, 48.0, 56.0, 54.0, 55.0, 44.0, 43.0, 34.0, 36.0, 32.0, 23.0, 21.0, 9.0, 13.0, 10.0, 11.0, 8.0, 7.0, 8.0, 3.0, 5.0, 7.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.7240012884140015, -0.7028717994689941, -0.6817423105239868, -0.6606128215789795, -0.6394833326339722, -0.6183538436889648, -0.5972243547439575, -0.5760948657989502, -0.5549653768539429, -0.5338358879089355, -0.5127063989639282, -0.4915769100189209, -0.4704474210739136, -0.44931793212890625, -0.42818841338157654, -0.4070589244365692, -0.3859294056892395, -0.3647999167442322, -0.34367042779922485, -0.32254093885421753, -0.3014114499092102, -0.2802819609642029, -0.25915244221687317, -0.23802295327186584, -0.21689346432685852, -0.1957639753818512, -0.17463448643684387, -0.15350498259067535, -0.13237549364566803, -0.1112460047006607, -0.09011650085449219, -0.06898701190948486, -0.04785752296447754, -0.026728030294179916, -0.005598537623882294, 0.015530958771705627, 0.03666044771671295, 0.057789936661720276, 0.0789194405078888, 0.10004892945289612, 0.12117841839790344, 0.14230790734291077, 0.1634373962879181, 0.1845669001340866, 0.20569638907909393, 0.22682587802410126, 0.24795538187026978, 0.2690848708152771, 0.2902143597602844, 0.31134384870529175, 0.3324733376502991, 0.3536028265953064, 0.3747323155403137, 0.39586180448532104, 0.41699132323265076, 0.4381208121776581, 0.4592503011226654, 0.48037979006767273, 0.5015093088150024, 0.5226387977600098, 0.5437682867050171, 0.5648977756500244, 0.5860272645950317, 0.6071567535400391, 0.6282862424850464]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 4.0, 3.0, 5.0, 2.0, 3.0, 10.0, 10.0, 7.0, 8.0, 20.0, 14.0, 19.0, 33.0, 37.0, 26.0, 29.0, 41.0, 48.0, 41.0, 41.0, 51.0, 47.0, 38.0, 43.0, 49.0, 47.0, 34.0, 43.0, 37.0, 23.0, 28.0, 29.0, 17.0, 18.0, 20.0, 15.0, 14.0, 13.0, 15.0, 3.0, 12.0, 7.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.637008547782898, -0.6161890625953674, -0.5953695774078369, -0.5745500922203064, -0.5537306070327759, -0.5329111218452454, -0.5120916366577148, -0.4912721514701843, -0.4704526662826538, -0.4496331810951233, -0.4288136959075928, -0.40799421072006226, -0.38717472553253174, -0.3663552403450012, -0.3455357551574707, -0.3247162699699402, -0.30389678478240967, -0.28307729959487915, -0.26225781440734863, -0.24143832921981812, -0.2206188440322876, -0.19979935884475708, -0.17897987365722656, -0.15816038846969604, -0.13734090328216553, -0.11652141809463501, -0.09570193290710449, -0.07488244771957397, -0.05406296253204346, -0.03324347734451294, -0.012423992156982422, 0.008395493030548096, 0.029214918613433838, 0.050034403800964355, 0.07085388898849487, 0.09167337417602539, 0.11249285936355591, 0.13331234455108643, 0.15413182973861694, 0.17495131492614746, 0.19577080011367798, 0.2165902853012085, 0.237409770488739, 0.25822925567626953, 0.27904874086380005, 0.29986822605133057, 0.3206877112388611, 0.3415071964263916, 0.3623266816139221, 0.38314616680145264, 0.40396565198898315, 0.42478513717651367, 0.4456046223640442, 0.4664241075515747, 0.4872435927391052, 0.5080630779266357, 0.5288825631141663, 0.5497020483016968, 0.5705215334892273, 0.5913410186767578, 0.6121605038642883, 0.6329799890518188, 0.6537994742393494, 0.6746189594268799, 0.6954384446144104]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 5.0, 13.0, 6.0, 16.0, 24.0, 38.0, 38.0, 67.0, 91.0, 109.0, 189.0, 263.0, 425.0, 721.0, 1266.0, 2483.0, 5236.0, 11565.0, 32241.0, 177892.0, 594440.0, 168036.0, 31287.0, 11246.0, 5098.0, 2544.0, 1285.0, 688.0, 399.0, 275.0, 163.0, 124.0, 73.0, 63.0, 48.0, 28.0, 18.0, 13.0, 9.0, 9.0, 8.0, 7.0, 2.0, 4.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.29736328125, -0.2892131805419922, -0.2810630798339844, -0.27291297912597656, -0.26476287841796875, -0.25661277770996094, -0.24846267700195312, -0.2403125762939453, -0.2321624755859375, -0.2240123748779297, -0.21586227416992188, -0.20771217346191406, -0.19956207275390625, -0.19141197204589844, -0.18326187133789062, -0.1751117706298828, -0.166961669921875, -0.1588115692138672, -0.15066146850585938, -0.14251136779785156, -0.13436126708984375, -0.12621116638183594, -0.11806106567382812, -0.10991096496582031, -0.1017608642578125, -0.09361076354980469, -0.08546066284179688, -0.07731056213378906, -0.06916046142578125, -0.06101036071777344, -0.052860260009765625, -0.04471015930175781, -0.03656005859375, -0.028409957885742188, -0.020259857177734375, -0.012109756469726562, -0.00395965576171875, 0.0041904449462890625, 0.012340545654296875, 0.020490646362304688, 0.0286407470703125, 0.03679084777832031, 0.044940948486328125, 0.05309104919433594, 0.06124114990234375, 0.06939125061035156, 0.07754135131835938, 0.08569145202636719, 0.093841552734375, 0.10199165344238281, 0.11014175415039062, 0.11829185485839844, 0.12644195556640625, 0.13459205627441406, 0.14274215698242188, 0.1508922576904297, 0.1590423583984375, 0.1671924591064453, 0.17534255981445312, 0.18349266052246094, 0.19164276123046875, 0.19979286193847656, 0.20794296264648438, 0.2160930633544922, 0.2242431640625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 6.0, 3.0, 9.0, 7.0, 9.0, 11.0, 13.0, 17.0, 15.0, 29.0, 27.0, 33.0, 42.0, 36.0, 51.0, 41.0, 57.0, 44.0, 46.0, 45.0, 48.0, 39.0, 51.0, 43.0, 43.0, 28.0, 37.0, 30.0, 21.0, 22.0, 17.0, 15.0, 20.0, 14.0, 7.0, 11.0, 2.0, 5.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.44384765625, -0.4286346435546875, -0.413421630859375, -0.3982086181640625, -0.38299560546875, -0.3677825927734375, -0.352569580078125, -0.3373565673828125, -0.3221435546875, -0.3069305419921875, -0.291717529296875, -0.2765045166015625, -0.26129150390625, -0.2460784912109375, -0.230865478515625, -0.2156524658203125, -0.200439453125, -0.1852264404296875, -0.170013427734375, -0.1548004150390625, -0.13958740234375, -0.1243743896484375, -0.109161376953125, -0.0939483642578125, -0.0787353515625, -0.0635223388671875, -0.048309326171875, -0.0330963134765625, -0.01788330078125, -0.0026702880859375, 0.012542724609375, 0.0277557373046875, 0.04296875, 0.0581817626953125, 0.073394775390625, 0.0886077880859375, 0.10382080078125, 0.1190338134765625, 0.134246826171875, 0.1494598388671875, 0.1646728515625, 0.1798858642578125, 0.195098876953125, 0.2103118896484375, 0.22552490234375, 0.2407379150390625, 0.255950927734375, 0.2711639404296875, 0.286376953125, 0.3015899658203125, 0.316802978515625, 0.3320159912109375, 0.34722900390625, 0.3624420166015625, 0.377655029296875, 0.3928680419921875, 0.4080810546875, 0.4232940673828125, 0.438507080078125, 0.4537200927734375, 0.46893310546875, 0.4841461181640625, 0.499359130859375, 0.5145721435546875, 0.52978515625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 4.0, 3.0, 3.0, 5.0, 12.0, 11.0, 7.0, 14.0, 29.0, 26.0, 43.0, 79.0, 173.0, 369.0, 856.0, 2440.0, 9663.0, 61441.0, 764969.0, 184841.0, 17260.0, 4009.0, 1290.0, 501.0, 206.0, 113.0, 54.0, 33.0, 22.0, 23.0, 17.0, 9.0, 9.0, 4.0, 6.0, 6.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.447265625, -0.4343719482421875, -0.421478271484375, -0.4085845947265625, -0.39569091796875, -0.3827972412109375, -0.369903564453125, -0.3570098876953125, -0.3441162109375, -0.3312225341796875, -0.318328857421875, -0.3054351806640625, -0.29254150390625, -0.2796478271484375, -0.266754150390625, -0.2538604736328125, -0.240966796875, -0.2280731201171875, -0.215179443359375, -0.2022857666015625, -0.18939208984375, -0.1764984130859375, -0.163604736328125, -0.1507110595703125, -0.1378173828125, -0.1249237060546875, -0.112030029296875, -0.0991363525390625, -0.08624267578125, -0.0733489990234375, -0.060455322265625, -0.0475616455078125, -0.03466796875, -0.0217742919921875, -0.008880615234375, 0.0040130615234375, 0.01690673828125, 0.0298004150390625, 0.042694091796875, 0.0555877685546875, 0.0684814453125, 0.0813751220703125, 0.094268798828125, 0.1071624755859375, 0.12005615234375, 0.1329498291015625, 0.145843505859375, 0.1587371826171875, 0.171630859375, 0.1845245361328125, 0.197418212890625, 0.2103118896484375, 0.22320556640625, 0.2360992431640625, 0.248992919921875, 0.2618865966796875, 0.2747802734375, 0.2876739501953125, 0.300567626953125, 0.3134613037109375, 0.32635498046875, 0.3392486572265625, 0.352142333984375, 0.3650360107421875, 0.3779296875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0, 6.0, 8.0, 5.0, 9.0, 4.0, 14.0, 5.0, 8.0, 14.0, 19.0, 18.0, 29.0, 13.0, 26.0, 33.0, 31.0, 31.0, 46.0, 39.0, 43.0, 40.0, 25.0, 37.0, 44.0, 53.0, 35.0, 37.0, 30.0, 39.0, 33.0, 25.0, 26.0, 25.0, 20.0, 20.0, 20.0, 11.0, 17.0, 15.0, 7.0, 14.0, 6.0, 6.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9658203125, -0.9337921142578125, -0.901763916015625, -0.8697357177734375, -0.83770751953125, -0.8056793212890625, -0.773651123046875, -0.7416229248046875, -0.7095947265625, -0.6775665283203125, -0.645538330078125, -0.6135101318359375, -0.58148193359375, -0.5494537353515625, -0.517425537109375, -0.4853973388671875, -0.453369140625, -0.4213409423828125, -0.389312744140625, -0.3572845458984375, -0.32525634765625, -0.2932281494140625, -0.261199951171875, -0.2291717529296875, -0.1971435546875, -0.1651153564453125, -0.133087158203125, -0.1010589599609375, -0.06903076171875, -0.0370025634765625, -0.004974365234375, 0.0270538330078125, 0.05908203125, 0.0911102294921875, 0.123138427734375, 0.1551666259765625, 0.18719482421875, 0.2192230224609375, 0.251251220703125, 0.2832794189453125, 0.3153076171875, 0.3473358154296875, 0.379364013671875, 0.4113922119140625, 0.44342041015625, 0.4754486083984375, 0.507476806640625, 0.5395050048828125, 0.571533203125, 0.6035614013671875, 0.635589599609375, 0.6676177978515625, 0.69964599609375, 0.7316741943359375, 0.763702392578125, 0.7957305908203125, 0.8277587890625, 0.8597869873046875, 0.891815185546875, 0.9238433837890625, 0.95587158203125, 0.9878997802734375, 1.019927978515625, 1.0519561767578125, 1.083984375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 4.0, 6.0, 5.0, 9.0, 6.0, 20.0, 16.0, 34.0, 38.0, 56.0, 83.0, 136.0, 214.0, 347.0, 657.0, 1177.0, 2369.0, 5304.0, 14225.0, 53921.0, 385649.0, 487761.0, 68148.0, 16553.0, 6045.0, 2681.0, 1338.0, 700.0, 365.0, 248.0, 118.0, 101.0, 64.0, 39.0, 25.0, 27.0, 17.0, 11.0, 16.0, 7.0, 4.0, 3.0, 3.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10552978515625, -0.102020263671875, -0.0985107421875, -0.095001220703125, -0.09149169921875, -0.087982177734375, -0.08447265625, -0.080963134765625, -0.07745361328125, -0.073944091796875, -0.0704345703125, -0.066925048828125, -0.06341552734375, -0.059906005859375, -0.056396484375, -0.052886962890625, -0.04937744140625, -0.045867919921875, -0.0423583984375, -0.038848876953125, -0.03533935546875, -0.031829833984375, -0.0283203125, -0.024810791015625, -0.02130126953125, -0.017791748046875, -0.0142822265625, -0.010772705078125, -0.00726318359375, -0.003753662109375, -0.000244140625, 0.003265380859375, 0.00677490234375, 0.010284423828125, 0.0137939453125, 0.017303466796875, 0.02081298828125, 0.024322509765625, 0.02783203125, 0.031341552734375, 0.03485107421875, 0.038360595703125, 0.0418701171875, 0.045379638671875, 0.04888916015625, 0.052398681640625, 0.055908203125, 0.059417724609375, 0.06292724609375, 0.066436767578125, 0.0699462890625, 0.073455810546875, 0.07696533203125, 0.080474853515625, 0.083984375, 0.087493896484375, 0.09100341796875, 0.094512939453125, 0.0980224609375, 0.101531982421875, 0.10504150390625, 0.108551025390625, 0.112060546875, 0.115570068359375, 0.11907958984375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 1.0, 1.0, 7.0, 4.0, 8.0, 12.0, 31.0, 29.0, 49.0, 70.0, 106.0, 151.0, 137.0, 128.0, 98.0, 52.0, 38.0, 23.0, 15.0, 16.0, 10.0, 8.0, 6.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.258487701416016e-05, -5.9992074966430664e-05, -5.739927291870117e-05, -5.480647087097168e-05, -5.221366882324219e-05, -4.9620866775512695e-05, -4.70280647277832e-05, -4.443526268005371e-05, -4.184246063232422e-05, -3.9249658584594727e-05, -3.6656856536865234e-05, -3.406405448913574e-05, -3.147125244140625e-05, -2.8878450393676758e-05, -2.6285648345947266e-05, -2.3692846298217773e-05, -2.110004425048828e-05, -1.850724220275879e-05, -1.5914440155029297e-05, -1.3321638107299805e-05, -1.0728836059570312e-05, -8.13603401184082e-06, -5.543231964111328e-06, -2.950429916381836e-06, -3.5762786865234375e-07, 2.2351741790771484e-06, 4.827976226806641e-06, 7.420778274536133e-06, 1.0013580322265625e-05, 1.2606382369995117e-05, 1.519918441772461e-05, 1.77919864654541e-05, 2.0384788513183594e-05, 2.2977590560913086e-05, 2.5570392608642578e-05, 2.816319465637207e-05, 3.075599670410156e-05, 3.3348798751831055e-05, 3.594160079956055e-05, 3.853440284729004e-05, 4.112720489501953e-05, 4.3720006942749023e-05, 4.6312808990478516e-05, 4.890561103820801e-05, 5.14984130859375e-05, 5.409121513366699e-05, 5.6684017181396484e-05, 5.9276819229125977e-05, 6.186962127685547e-05, 6.446242332458496e-05, 6.705522537231445e-05, 6.964802742004395e-05, 7.224082946777344e-05, 7.483363151550293e-05, 7.742643356323242e-05, 8.001923561096191e-05, 8.26120376586914e-05, 8.52048397064209e-05, 8.779764175415039e-05, 9.039044380187988e-05, 9.298324584960938e-05, 9.557604789733887e-05, 9.816884994506836e-05, 0.00010076165199279785, 0.00010335445404052734]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 7.0, 7.0, 10.0, 14.0, 22.0, 18.0, 36.0, 46.0, 57.0, 116.0, 175.0, 268.0, 410.0, 617.0, 1026.0, 1539.0, 2513.0, 4016.0, 6976.0, 12641.0, 26073.0, 62820.0, 166101.0, 340424.0, 248405.0, 96746.0, 37693.0, 17208.0, 8956.0, 4973.0, 3111.0, 1947.0, 1226.0, 786.0, 528.0, 338.0, 235.0, 158.0, 115.0, 59.0, 54.0, 32.0, 20.0, 10.0, 13.0, 7.0, 5.0, 7.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06036376953125, -0.05833244323730469, -0.056301116943359375, -0.05426979064941406, -0.05223846435546875, -0.05020713806152344, -0.048175811767578125, -0.04614448547363281, -0.0441131591796875, -0.04208183288574219, -0.040050506591796875, -0.03801918029785156, -0.03598785400390625, -0.03395652770996094, -0.031925201416015625, -0.029893875122070312, -0.027862548828125, -0.025831222534179688, -0.023799896240234375, -0.021768569946289062, -0.01973724365234375, -0.017705917358398438, -0.015674591064453125, -0.013643264770507812, -0.0116119384765625, -0.009580612182617188, -0.007549285888671875, -0.0055179595947265625, -0.00348663330078125, -0.0014553070068359375, 0.000576019287109375, 0.0026073455810546875, 0.004638671875, 0.0066699981689453125, 0.008701324462890625, 0.010732650756835938, 0.01276397705078125, 0.014795303344726562, 0.016826629638671875, 0.018857955932617188, 0.0208892822265625, 0.022920608520507812, 0.024951934814453125, 0.026983261108398438, 0.02901458740234375, 0.031045913696289062, 0.033077239990234375, 0.03510856628417969, 0.037139892578125, 0.03917121887207031, 0.041202545166015625, 0.04323387145996094, 0.04526519775390625, 0.04729652404785156, 0.049327850341796875, 0.05135917663574219, 0.0533905029296875, 0.05542182922363281, 0.057453155517578125, 0.05948448181152344, 0.06151580810546875, 0.06354713439941406, 0.06557846069335938, 0.06760978698730469, 0.06964111328125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 3.0, 2.0, 1.0, 8.0, 6.0, 7.0, 7.0, 10.0, 9.0, 22.0, 29.0, 37.0, 41.0, 35.0, 59.0, 60.0, 83.0, 83.0, 110.0, 89.0, 55.0, 57.0, 46.0, 25.0, 29.0, 17.0, 23.0, 10.0, 10.0, 3.0, 4.0, 8.0, 5.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0], "bins": [-0.0274505615234375, -0.0266568660736084, -0.025863170623779297, -0.025069475173950195, -0.024275779724121094, -0.023482084274291992, -0.02268838882446289, -0.02189469337463379, -0.021100997924804688, -0.020307302474975586, -0.019513607025146484, -0.018719911575317383, -0.01792621612548828, -0.01713252067565918, -0.016338825225830078, -0.015545129776000977, -0.014751434326171875, -0.013957738876342773, -0.013164043426513672, -0.01237034797668457, -0.011576652526855469, -0.010782957077026367, -0.009989261627197266, -0.009195566177368164, -0.008401870727539062, -0.007608175277709961, -0.006814479827880859, -0.006020784378051758, -0.005227088928222656, -0.004433393478393555, -0.003639698028564453, -0.0028460025787353516, -0.00205230712890625, -0.0012586116790771484, -0.0004649162292480469, 0.0003287792205810547, 0.0011224746704101562, 0.0019161701202392578, 0.0027098655700683594, 0.003503561019897461, 0.0042972564697265625, 0.005090951919555664, 0.005884647369384766, 0.006678342819213867, 0.007472038269042969, 0.00826573371887207, 0.009059429168701172, 0.009853124618530273, 0.010646820068359375, 0.011440515518188477, 0.012234210968017578, 0.01302790641784668, 0.013821601867675781, 0.014615297317504883, 0.015408992767333984, 0.016202688217163086, 0.016996383666992188, 0.01779007911682129, 0.01858377456665039, 0.019377470016479492, 0.020171165466308594, 0.020964860916137695, 0.021758556365966797, 0.0225522518157959, 0.023345947265625]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 1.0, 2.0, 6.0, 3.0, 5.0, 7.0, 6.0, 12.0, 24.0, 25.0, 26.0, 30.0, 34.0, 35.0, 72.0, 56.0, 51.0, 80.0, 71.0, 77.0, 59.0, 42.0, 52.0, 52.0, 31.0, 39.0, 27.0, 22.0, 12.0, 8.0, 13.0, 3.0, 5.0, 8.0, 4.0, 5.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4932290315628052, -0.4764740765094757, -0.45971912145614624, -0.4429641366004944, -0.4262091815471649, -0.40945422649383545, -0.3926992416381836, -0.3759442865848541, -0.35918933153152466, -0.3424343764781952, -0.3256794214248657, -0.30892443656921387, -0.2921694815158844, -0.27541452646255493, -0.2586595416069031, -0.2419045865535736, -0.22514963150024414, -0.20839467644691467, -0.191639706492424, -0.17488473653793335, -0.15812978148460388, -0.14137482643127441, -0.12461985647678375, -0.10786489397287369, -0.09110993146896362, -0.07435496896505356, -0.057600006461143494, -0.04084504395723343, -0.024090081453323364, -0.0073351189494132996, 0.009419843554496765, 0.02617480605840683, 0.04292970895767212, 0.059684671461582184, 0.07643963396549225, 0.09319459646940231, 0.10994955897331238, 0.12670451402664185, 0.1434594839811325, 0.16021445393562317, 0.17696940898895264, 0.1937243640422821, 0.21047933399677277, 0.22723430395126343, 0.2439892590045929, 0.26074421405792236, 0.2774991989135742, 0.2942541539669037, 0.31100910902023315, 0.3277640640735626, 0.3445190191268921, 0.36127400398254395, 0.3780289590358734, 0.3947839140892029, 0.41153889894485474, 0.4282938539981842, 0.44504880905151367, 0.46180376410484314, 0.4785587191581726, 0.49531370401382446, 0.5120686292648315, 0.5288236141204834, 0.5455785989761353, 0.5623335242271423, 0.5790885090827942]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 2.0, 2.0, 3.0, 11.0, 16.0, 13.0, 7.0, 16.0, 14.0, 31.0, 32.0, 37.0, 31.0, 45.0, 58.0, 41.0, 47.0, 56.0, 43.0, 59.0, 51.0, 53.0, 45.0, 47.0, 36.0, 27.0, 25.0, 23.0, 29.0, 20.0, 13.0, 11.0, 16.0, 17.0, 9.0, 5.0, 6.0, 5.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.45748579502105713, -0.44255614280700684, -0.42762649059295654, -0.41269683837890625, -0.39776718616485596, -0.38283753395080566, -0.36790788173675537, -0.3529782295227051, -0.3380485773086548, -0.3231189250946045, -0.3081892728805542, -0.2932596206665039, -0.2783299684524536, -0.2634003162384033, -0.24847067892551422, -0.23354102671146393, -0.21861138939857483, -0.20368173718452454, -0.18875208497047424, -0.17382243275642395, -0.15889278054237366, -0.14396312832832336, -0.12903349101543427, -0.11410383880138397, -0.09917418658733368, -0.08424453437328339, -0.0693148821592331, -0.0543852373957634, -0.039455585181713104, -0.02452593296766281, -0.009596288204193115, 0.005333364009857178, 0.02026301622390747, 0.035192668437957764, 0.05012231692671776, 0.06505196541547775, 0.07998161762952805, 0.09491126984357834, 0.10984091460704803, 0.12477056682109833, 0.13970021903514862, 0.1546298712491989, 0.1695595234632492, 0.1844891607761383, 0.1994188129901886, 0.2143484652042389, 0.22927811741828918, 0.24420776963233948, 0.25913742184638977, 0.27406707406044006, 0.28899672627449036, 0.30392637848854065, 0.31885603070259094, 0.33378568291664124, 0.34871530532836914, 0.36364495754241943, 0.3785746097564697, 0.39350426197052, 0.4084339141845703, 0.4233635663986206, 0.4382932186126709, 0.4532228708267212, 0.4681525230407715, 0.4830821752548218, 0.49801182746887207]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 3.0, 4.0, 5.0, 4.0, 13.0, 18.0, 28.0, 39.0, 63.0, 111.0, 174.0, 281.0, 439.0, 721.0, 1320.0, 2455.0, 4362.0, 8569.0, 17149.0, 37298.0, 95992.0, 341498.0, 361673.0, 100687.0, 38521.0, 17759.0, 8887.0, 4591.0, 2512.0, 1430.0, 762.0, 449.0, 278.0, 167.0, 108.0, 65.0, 61.0, 24.0, 11.0, 11.0, 10.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69775390625, -0.675262451171875, -0.65277099609375, -0.630279541015625, -0.6077880859375, -0.585296630859375, -0.56280517578125, -0.540313720703125, -0.517822265625, -0.495330810546875, -0.47283935546875, -0.450347900390625, -0.4278564453125, -0.405364990234375, -0.38287353515625, -0.360382080078125, -0.337890625, -0.315399169921875, -0.29290771484375, -0.270416259765625, -0.2479248046875, -0.225433349609375, -0.20294189453125, -0.180450439453125, -0.157958984375, -0.135467529296875, -0.11297607421875, -0.090484619140625, -0.0679931640625, -0.045501708984375, -0.02301025390625, -0.000518798828125, 0.02197265625, 0.044464111328125, 0.06695556640625, 0.089447021484375, 0.1119384765625, 0.134429931640625, 0.15692138671875, 0.179412841796875, 0.201904296875, 0.224395751953125, 0.24688720703125, 0.269378662109375, 0.2918701171875, 0.314361572265625, 0.33685302734375, 0.359344482421875, 0.3818359375, 0.404327392578125, 0.42681884765625, 0.449310302734375, 0.4718017578125, 0.494293212890625, 0.51678466796875, 0.539276123046875, 0.561767578125, 0.584259033203125, 0.60675048828125, 0.629241943359375, 0.6517333984375, 0.674224853515625, 0.69671630859375, 0.719207763671875, 0.74169921875]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 9.0, 11.0, 12.0, 7.0, 10.0, 18.0, 21.0, 27.0, 34.0, 50.0, 41.0, 58.0, 66.0, 57.0, 63.0, 60.0, 56.0, 52.0, 48.0, 49.0, 46.0, 34.0, 26.0, 32.0, 25.0, 12.0, 20.0, 14.0, 12.0, 9.0, 7.0, 3.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.93994140625, -0.9099655151367188, -0.8799896240234375, -0.8500137329101562, -0.820037841796875, -0.7900619506835938, -0.7600860595703125, -0.7301101684570312, -0.70013427734375, -0.6701583862304688, -0.6401824951171875, -0.6102066040039062, -0.580230712890625, -0.5502548217773438, -0.5202789306640625, -0.49030303955078125, -0.4603271484375, -0.43035125732421875, -0.4003753662109375, -0.37039947509765625, -0.340423583984375, -0.31044769287109375, -0.2804718017578125, -0.25049591064453125, -0.22052001953125, -0.19054412841796875, -0.1605682373046875, -0.13059234619140625, -0.100616455078125, -0.07064056396484375, -0.0406646728515625, -0.01068878173828125, 0.019287109375, 0.04926300048828125, 0.0792388916015625, 0.10921478271484375, 0.139190673828125, 0.16916656494140625, 0.1991424560546875, 0.22911834716796875, 0.25909423828125, 0.28907012939453125, 0.3190460205078125, 0.34902191162109375, 0.378997802734375, 0.40897369384765625, 0.4389495849609375, 0.46892547607421875, 0.4989013671875, 0.5288772583007812, 0.5588531494140625, 0.5888290405273438, 0.618804931640625, 0.6487808227539062, 0.6787567138671875, 0.7087326049804688, 0.73870849609375, 0.7686843872070312, 0.7986602783203125, 0.8286361694335938, 0.858612060546875, 0.8885879516601562, 0.9185638427734375, 0.9485397338867188, 0.978515625]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 5.0, 8.0, 13.0, 15.0, 21.0, 24.0, 50.0, 46.0, 74.0, 89.0, 124.0, 184.0, 320.0, 488.0, 872.0, 1452.0, 2815.0, 5565.0, 11742.0, 27575.0, 71230.0, 249451.0, 470139.0, 127225.0, 43881.0, 18252.0, 8027.0, 3875.0, 1920.0, 1106.0, 645.0, 431.0, 258.0, 215.0, 122.0, 95.0, 48.0, 42.0, 33.0, 24.0, 15.0, 9.0, 19.0, 6.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6875, -0.66400146484375, -0.6405029296875, -0.61700439453125, -0.593505859375, -0.57000732421875, -0.5465087890625, -0.52301025390625, -0.49951171875, -0.47601318359375, -0.4525146484375, -0.42901611328125, -0.405517578125, -0.38201904296875, -0.3585205078125, -0.33502197265625, -0.3115234375, -0.28802490234375, -0.2645263671875, -0.24102783203125, -0.217529296875, -0.19403076171875, -0.1705322265625, -0.14703369140625, -0.12353515625, -0.10003662109375, -0.0765380859375, -0.05303955078125, -0.029541015625, -0.00604248046875, 0.0174560546875, 0.04095458984375, 0.064453125, 0.08795166015625, 0.1114501953125, 0.13494873046875, 0.158447265625, 0.18194580078125, 0.2054443359375, 0.22894287109375, 0.25244140625, 0.27593994140625, 0.2994384765625, 0.32293701171875, 0.346435546875, 0.36993408203125, 0.3934326171875, 0.41693115234375, 0.4404296875, 0.46392822265625, 0.4874267578125, 0.51092529296875, 0.534423828125, 0.55792236328125, 0.5814208984375, 0.60491943359375, 0.62841796875, 0.65191650390625, 0.6754150390625, 0.69891357421875, 0.722412109375, 0.74591064453125, 0.7694091796875, 0.79290771484375, 0.81640625]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 2.0, 12.0, 8.0, 5.0, 11.0, 5.0, 17.0, 17.0, 16.0, 22.0, 28.0, 25.0, 36.0, 29.0, 40.0, 49.0, 44.0, 46.0, 62.0, 49.0, 50.0, 55.0, 46.0, 45.0, 45.0, 27.0, 43.0, 41.0, 28.0, 23.0, 12.0, 13.0, 8.0, 8.0, 8.0, 3.0, 10.0, 5.0, 3.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.0693359375, -1.0371170043945312, -1.0048980712890625, -0.9726791381835938, -0.940460205078125, -0.9082412719726562, -0.8760223388671875, -0.8438034057617188, -0.81158447265625, -0.7793655395507812, -0.7471466064453125, -0.7149276733398438, -0.682708740234375, -0.6504898071289062, -0.6182708740234375, -0.5860519409179688, -0.5538330078125, -0.5216140747070312, -0.4893951416015625, -0.45717620849609375, -0.424957275390625, -0.39273834228515625, -0.3605194091796875, -0.32830047607421875, -0.29608154296875, -0.26386260986328125, -0.2316436767578125, -0.19942474365234375, -0.167205810546875, -0.13498687744140625, -0.1027679443359375, -0.07054901123046875, -0.038330078125, -0.00611114501953125, 0.0261077880859375, 0.05832672119140625, 0.090545654296875, 0.12276458740234375, 0.1549835205078125, 0.18720245361328125, 0.21942138671875, 0.25164031982421875, 0.2838592529296875, 0.31607818603515625, 0.348297119140625, 0.38051605224609375, 0.4127349853515625, 0.44495391845703125, 0.4771728515625, 0.5093917846679688, 0.5416107177734375, 0.5738296508789062, 0.606048583984375, 0.6382675170898438, 0.6704864501953125, 0.7027053833007812, 0.73492431640625, 0.7671432495117188, 0.7993621826171875, 0.8315811157226562, 0.863800048828125, 0.8960189819335938, 0.9282379150390625, 0.9604568481445312, 0.99267578125]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 5.0, 4.0, 4.0, 7.0, 4.0, 13.0, 15.0, 33.0, 27.0, 37.0, 71.0, 105.0, 112.0, 181.0, 235.0, 372.0, 514.0, 817.0, 1307.0, 2091.0, 3468.0, 6048.0, 11885.0, 25462.0, 63669.0, 195267.0, 464890.0, 167704.0, 55984.0, 22793.0, 10916.0, 5615.0, 3253.0, 1982.0, 1174.0, 831.0, 485.0, 331.0, 261.0, 172.0, 94.0, 98.0, 69.0, 36.0, 26.0, 24.0, 28.0, 14.0, 9.0, 7.0, 8.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.152099609375, -0.14710235595703125, -0.1421051025390625, -0.13710784912109375, -0.132110595703125, -0.12711334228515625, -0.1221160888671875, -0.11711883544921875, -0.11212158203125, -0.10712432861328125, -0.1021270751953125, -0.09712982177734375, -0.092132568359375, -0.08713531494140625, -0.0821380615234375, -0.07714080810546875, -0.0721435546875, -0.06714630126953125, -0.0621490478515625, -0.05715179443359375, -0.052154541015625, -0.04715728759765625, -0.0421600341796875, -0.03716278076171875, -0.03216552734375, -0.02716827392578125, -0.0221710205078125, -0.01717376708984375, -0.012176513671875, -0.00717926025390625, -0.0021820068359375, 0.00281524658203125, 0.0078125, 0.01280975341796875, 0.0178070068359375, 0.02280426025390625, 0.027801513671875, 0.03279876708984375, 0.0377960205078125, 0.04279327392578125, 0.04779052734375, 0.05278778076171875, 0.0577850341796875, 0.06278228759765625, 0.067779541015625, 0.07277679443359375, 0.0777740478515625, 0.08277130126953125, 0.0877685546875, 0.09276580810546875, 0.0977630615234375, 0.10276031494140625, 0.107757568359375, 0.11275482177734375, 0.1177520751953125, 0.12274932861328125, 0.12774658203125, 0.13274383544921875, 0.1377410888671875, 0.14273834228515625, 0.147735595703125, 0.15273284912109375, 0.1577301025390625, 0.16272735595703125, 0.167724609375]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 9.0, 7.0, 7.0, 11.0, 11.0, 10.0, 26.0, 46.0, 76.0, 116.0, 186.0, 205.0, 116.0, 62.0, 37.0, 30.0, 16.0, 16.0, 6.0, 6.0, 1.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.186962127685547e-05, -5.939789116382599e-05, -5.692616105079651e-05, -5.445443093776703e-05, -5.198270082473755e-05, -4.951097071170807e-05, -4.703924059867859e-05, -4.456751048564911e-05, -4.209578037261963e-05, -3.962405025959015e-05, -3.715232014656067e-05, -3.468059003353119e-05, -3.220885992050171e-05, -2.973712980747223e-05, -2.726539969444275e-05, -2.479366958141327e-05, -2.232193946838379e-05, -1.985020935535431e-05, -1.737847924232483e-05, -1.4906749129295349e-05, -1.2435019016265869e-05, -9.96328890323639e-06, -7.491558790206909e-06, -5.019828677177429e-06, -2.5480985641479492e-06, -7.636845111846924e-08, 2.3953616619110107e-06, 4.867091774940491e-06, 7.338821887969971e-06, 9.81055200099945e-06, 1.228228211402893e-05, 1.475401222705841e-05, 1.722574234008789e-05, 1.969747245311737e-05, 2.216920256614685e-05, 2.464093267917633e-05, 2.711266279220581e-05, 2.958439290523529e-05, 3.205612301826477e-05, 3.452785313129425e-05, 3.699958324432373e-05, 3.947131335735321e-05, 4.194304347038269e-05, 4.441477358341217e-05, 4.688650369644165e-05, 4.935823380947113e-05, 5.182996392250061e-05, 5.430169403553009e-05, 5.677342414855957e-05, 5.924515426158905e-05, 6.171688437461853e-05, 6.418861448764801e-05, 6.666034460067749e-05, 6.913207471370697e-05, 7.160380482673645e-05, 7.407553493976593e-05, 7.654726505279541e-05, 7.901899516582489e-05, 8.149072527885437e-05, 8.396245539188385e-05, 8.643418550491333e-05, 8.890591561794281e-05, 9.137764573097229e-05, 9.384937584400177e-05, 9.632110595703125e-05]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 4.0, 1.0, 5.0, 7.0, 2.0, 5.0, 15.0, 9.0, 15.0, 11.0, 20.0, 31.0, 58.0, 61.0, 95.0, 164.0, 284.0, 460.0, 811.0, 1416.0, 3013.0, 6344.0, 16845.0, 64034.0, 545789.0, 336237.0, 47965.0, 13694.0, 5449.0, 2577.0, 1308.0, 716.0, 406.0, 222.0, 147.0, 97.0, 74.0, 38.0, 34.0, 23.0, 18.0, 14.0, 6.0, 8.0, 5.0, 9.0, 2.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.342041015625, -0.3309745788574219, -0.31990814208984375, -0.3088417053222656, -0.2977752685546875, -0.2867088317871094, -0.27564239501953125, -0.2645759582519531, -0.253509521484375, -0.24244308471679688, -0.23137664794921875, -0.22031021118164062, -0.2092437744140625, -0.19817733764648438, -0.18711090087890625, -0.17604446411132812, -0.16497802734375, -0.15391159057617188, -0.14284515380859375, -0.13177871704101562, -0.1207122802734375, -0.10964584350585938, -0.09857940673828125, -0.08751296997070312, -0.076446533203125, -0.06538009643554688, -0.05431365966796875, -0.043247222900390625, -0.0321807861328125, -0.021114349365234375, -0.01004791259765625, 0.001018524169921875, 0.0120849609375, 0.023151397705078125, 0.03421783447265625, 0.045284271240234375, 0.0563507080078125, 0.06741714477539062, 0.07848358154296875, 0.08955001831054688, 0.100616455078125, 0.11168289184570312, 0.12274932861328125, 0.13381576538085938, 0.1448822021484375, 0.15594863891601562, 0.16701507568359375, 0.17808151245117188, 0.18914794921875, 0.20021438598632812, 0.21128082275390625, 0.22234725952148438, 0.2334136962890625, 0.24448013305664062, 0.25554656982421875, 0.2666130065917969, 0.277679443359375, 0.2887458801269531, 0.29981231689453125, 0.3108787536621094, 0.3219451904296875, 0.3330116271972656, 0.34407806396484375, 0.3551445007324219, 0.3662109375]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 5.0, 5.0, 4.0, 9.0, 7.0, 13.0, 11.0, 21.0, 26.0, 44.0, 92.0, 134.0, 160.0, 156.0, 115.0, 68.0, 46.0, 41.0, 15.0, 8.0, 8.0, 5.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2783203125, -0.27133750915527344, -0.2643547058105469, -0.2573719024658203, -0.25038909912109375, -0.2434062957763672, -0.23642349243164062, -0.22944068908691406, -0.2224578857421875, -0.21547508239746094, -0.20849227905273438, -0.2015094757080078, -0.19452667236328125, -0.1875438690185547, -0.18056106567382812, -0.17357826232910156, -0.166595458984375, -0.15961265563964844, -0.15262985229492188, -0.1456470489501953, -0.13866424560546875, -0.1316814422607422, -0.12469863891601562, -0.11771583557128906, -0.1107330322265625, -0.10375022888183594, -0.09676742553710938, -0.08978462219238281, -0.08280181884765625, -0.07581901550292969, -0.06883621215820312, -0.06185340881347656, -0.05487060546875, -0.04788780212402344, -0.040904998779296875, -0.03392219543457031, -0.02693939208984375, -0.019956588745117188, -0.012973785400390625, -0.0059909820556640625, 0.0009918212890625, 0.007974624633789062, 0.014957427978515625, 0.021940231323242188, 0.02892303466796875, 0.03590583801269531, 0.042888641357421875, 0.04987144470214844, 0.056854248046875, 0.06383705139160156, 0.07081985473632812, 0.07780265808105469, 0.08478546142578125, 0.09176826477050781, 0.09875106811523438, 0.10573387145996094, 0.1127166748046875, 0.11969947814941406, 0.12668228149414062, 0.1336650848388672, 0.14064788818359375, 0.1476306915283203, 0.15461349487304688, 0.16159629821777344, 0.1685791015625]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 8.0, 11.0, 36.0, 49.0, 78.0, 122.0, 151.0, 167.0, 158.0, 92.0, 67.0, 19.0, 23.0, 11.0, 4.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0], "bins": [-4.432101726531982, -4.343398094177246, -4.25469446182251, -4.165990829467773, -4.077286720275879, -3.9885830879211426, -3.8998794555664062, -3.81117582321167, -3.7224719524383545, -3.633768320083618, -3.5450644493103027, -3.4563608169555664, -3.36765718460083, -3.2789533138275146, -3.1902496814727783, -3.101545810699463, -3.0128421783447266, -2.9241385459899902, -2.835434675216675, -2.7467310428619385, -2.658027410507202, -2.5693235397338867, -2.4806199073791504, -2.391916275024414, -2.3032126426696777, -2.2145090103149414, -2.125805139541626, -2.0371015071868896, -1.9483977556228638, -1.859694004058838, -1.7709903717041016, -1.6822866201400757, -1.5935829877853394, -1.5048792362213135, -1.4161756038665771, -1.3274718523025513, -1.2387681007385254, -1.150064468383789, -1.0613607168197632, -0.9726569652557373, -0.8839532732963562, -0.7952495813369751, -0.7065458297729492, -0.6178421378135681, -0.529138445854187, -0.44043469429016113, -0.35173100233078003, -0.26302725076675415, -0.17432355880737305, -0.08561984449625015, 0.0030838698148727417, 0.09178757667541504, 0.18049129843711853, 0.269195020198822, 0.3578987121582031, 0.446602463722229, 0.5353061556816101, 0.6240098476409912, 0.7127135992050171, 0.8014172911643982, 0.8901209831237793, 0.9788247346878052, 1.067528486251831, 1.1562321186065674, 1.2449358701705933]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 3.0, 3.0, 3.0, 7.0, 5.0, 3.0, 8.0, 8.0, 8.0, 18.0, 13.0, 20.0, 24.0, 29.0, 26.0, 26.0, 25.0, 35.0, 33.0, 37.0, 41.0, 49.0, 41.0, 56.0, 39.0, 52.0, 45.0, 38.0, 38.0, 27.0, 28.0, 22.0, 25.0, 22.0, 27.0, 30.0, 19.0, 15.0, 12.0, 8.0, 13.0, 9.0, 4.0, 5.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.5847102403640747, -1.5333341360092163, -1.4819579124450684, -1.43058180809021, -1.379205584526062, -1.3278294801712036, -1.2764532566070557, -1.2250771522521973, -1.1737009286880493, -1.122324824333191, -1.070948600769043, -1.0195724964141846, -0.9681962728500366, -0.9168201684951782, -0.8654439449310303, -0.8140678405761719, -0.7626916766166687, -0.7113155126571655, -0.6599393486976624, -0.6085631847381592, -0.557187020778656, -0.5058108568191528, -0.45443472266197205, -0.40305855870246887, -0.3516823947429657, -0.3003062307834625, -0.24893006682395935, -0.19755391776561737, -0.1461777538061142, -0.09480160474777222, -0.04342544078826904, 0.00795072317123413, 0.059326887130737305, 0.11070305109024048, 0.16207921504974365, 0.21345536410808563, 0.26483154296875, 0.3162076771259308, 0.36758384108543396, 0.41896000504493713, 0.4703361690044403, 0.5217123031616211, 0.5730884671211243, 0.6244646310806274, 0.6758407950401306, 0.7272169589996338, 0.778593122959137, 0.8299692869186401, 0.8813454508781433, 0.9327216148376465, 0.9840977787971497, 1.0354739427566528, 1.0868500471115112, 1.1382262706756592, 1.1896023750305176, 1.2409785985946655, 1.292354702949524, 1.3437308073043823, 1.3951070308685303, 1.4464831352233887, 1.4978593587875366, 1.549235463142395, 1.600611686706543, 1.6519877910614014, 1.7033640146255493]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 9.0, 14.0, 8.0, 11.0, 21.0, 13.0, 24.0, 32.0, 48.0, 46.0, 75.0, 94.0, 125.0, 141.0, 171.0, 242.0, 275.0, 314.0, 409.0, 451.0, 700.0, 1522.0, 1041724.0, 1139.0, 610.0, 461.0, 347.0, 292.0, 232.0, 227.0, 215.0, 140.0, 98.0, 90.0, 78.0, 50.0, 38.0, 33.0, 18.0, 16.0, 21.0, 8.0, 9.0, 5.0, 8.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0], "bins": [-2.468076467514038, -2.3940749168395996, -2.320073366165161, -2.2460715770721436, -2.172070026397705, -2.0980684757232666, -2.024066925048828, -1.9500653743743896, -1.8760637044906616, -1.8020621538162231, -1.7280604839324951, -1.6540589332580566, -1.5800573825836182, -1.5060557126998901, -1.4320541620254517, -1.3580524921417236, -1.2840509414672852, -1.2100493907928467, -1.1360477209091187, -1.0620461702346802, -0.9880445599555969, -0.9140429496765137, -0.8400413990020752, -0.7660397887229919, -0.6920381784439087, -0.6180365681648254, -0.5440349578857422, -0.4700334072113037, -0.39603179693222046, -0.3220301866531372, -0.24802860617637634, -0.17402702569961548, -0.10002517700195312, -0.026023581624031067, 0.04797801375389099, 0.12197960913181305, 0.1959812045097351, 0.26998281478881836, 0.3439843952655792, 0.4179859757423401, 0.49198758602142334, 0.5659891963005066, 0.6399908065795898, 0.7139923572540283, 0.7879939675331116, 0.8619955778121948, 0.9359971284866333, 1.0099987983703613, 1.0840003490447998, 1.1580018997192383, 1.2320035696029663, 1.3060051202774048, 1.3800067901611328, 1.4540083408355713, 1.5280098915100098, 1.6020114421844482, 1.6760131120681763, 1.7500146627426147, 1.8240163326263428, 1.8980178833007812, 1.9720194339752197, 2.046020984649658, 2.120022773742676, 2.1940243244171143, 2.2680258750915527]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 17.0, 21.0, 59.0, 131.0, 291.0, 694.0, 1976.0, 5616.0, 27854.0, 51421724.0, 8201.0, 2864.0, 1128.0, 428.0, 176.0, 75.0, 32.0, 14.0, 9.0, 6.0, 6.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.3125, -19.660493850708008, -19.008487701416016, -18.356481552124023, -17.70447540283203, -17.052467346191406, -16.400463104248047, -15.748455047607422, -15.09644889831543, -14.444442749023438, -13.792436599731445, -13.140430450439453, -12.488423347473145, -11.836417198181152, -11.18441104888916, -10.532403945922852, -9.880398750305176, -9.228392601013184, -8.576386451721191, -7.924379825592041, -7.272373199462891, -6.620367050170898, -5.968360900878906, -5.316354274749756, -4.664348125457764, -4.0123419761657715, -3.360335350036621, -2.708329200744629, -2.0563228130340576, -1.4043164253234863, -0.7523102760314941, -0.10030364990234375, 0.5517024993896484, 1.2037088871002197, 1.8557151556015015, 2.507721424102783, 3.1597278118133545, 3.811734199523926, 4.463740348815918, 5.115746974945068, 5.7677531242370605, 6.419759273529053, 7.071765899658203, 7.723772048950195, 8.375778198242188, 9.02778434753418, 9.679790496826172, 10.33179759979248, 10.983803749084473, 11.635809898376465, 12.287816047668457, 12.939823150634766, 13.591829299926758, 14.24383544921875, 14.895841598510742, 15.547847747802734, 16.199853897094727, 16.85186004638672, 17.50386619567871, 18.155872344970703, 18.807878494262695, 19.459884643554688, 20.111892700195312, 20.763898849487305, 21.415904998779297]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 5.0, 5.0, 12.0, 9.0, 15.0, 15.0, 25.0, 34.0, 50.0, 57.0, 119.0, 146.0, 230.0, 360.0, 558.0, 947.0, 1626.0, 2726.0, 4804.0, 9109.0, 18165.0, 37692.0, 81677.0, 190319.0, 431175.0, 1665238.0, 2929221.0, 505802.0, 225174.0, 97218.0, 44038.0, 20934.0, 10579.0, 5560.0, 3072.0, 1765.0, 1125.0, 643.0, 369.0, 244.0, 192.0, 126.0, 76.0, 55.0, 44.0, 18.0, 18.0, 13.0, 11.0, 12.0, 8.0, 3.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 3.0, 0.0, 2.0], "bins": [-1.337890625, -1.2919158935546875, -1.245941162109375, -1.1999664306640625, -1.15399169921875, -1.1080169677734375, -1.062042236328125, -1.0160675048828125, -0.9700927734375, -0.9241180419921875, -0.878143310546875, -0.8321685791015625, -0.78619384765625, -0.7402191162109375, -0.694244384765625, -0.6482696533203125, -0.602294921875, -0.5563201904296875, -0.510345458984375, -0.4643707275390625, -0.41839599609375, -0.3724212646484375, -0.326446533203125, -0.2804718017578125, -0.2344970703125, -0.1885223388671875, -0.142547607421875, -0.0965728759765625, -0.05059814453125, -0.0046234130859375, 0.041351318359375, 0.0873260498046875, 0.13330078125, 0.1792755126953125, 0.225250244140625, 0.2712249755859375, 0.31719970703125, 0.3631744384765625, 0.409149169921875, 0.4551239013671875, 0.5010986328125, 0.5470733642578125, 0.593048095703125, 0.6390228271484375, 0.68499755859375, 0.7309722900390625, 0.776947021484375, 0.8229217529296875, 0.868896484375, 0.9148712158203125, 0.960845947265625, 1.0068206787109375, 1.05279541015625, 1.0987701416015625, 1.144744873046875, 1.1907196044921875, 1.2366943359375, 1.2826690673828125, 1.328643798828125, 1.3746185302734375, 1.42059326171875, 1.4665679931640625, 1.512542724609375, 1.5585174560546875, 1.6044921875]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 7.0, 5.0, 9.0, 8.0, 8.0, 7.0, 11.0, 19.0, 16.0, 25.0, 27.0, 32.0, 42.0, 41.0, 40.0, 47.0, 46.0, 47.0, 113.0, 757.0, 276.0, 67.0, 33.0, 52.0, 41.0, 40.0, 28.0, 23.0, 29.0, 25.0, 18.0, 18.0, 15.0, 10.0, 15.0, 5.0, 10.0, 5.0, 5.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.890625, -8.5911865234375, -8.291748046875, -7.9923095703125, -7.69287109375, -7.3934326171875, -7.093994140625, -6.7945556640625, -6.4951171875, -6.1956787109375, -5.896240234375, -5.5968017578125, -5.29736328125, -4.9979248046875, -4.698486328125, -4.3990478515625, -4.099609375, -3.8001708984375, -3.500732421875, -3.2012939453125, -2.90185546875, -2.6024169921875, -2.302978515625, -2.0035400390625, -1.7041015625, -1.4046630859375, -1.105224609375, -0.8057861328125, -0.50634765625, -0.2069091796875, 0.092529296875, 0.3919677734375, 0.69140625, 0.9908447265625, 1.290283203125, 1.5897216796875, 1.88916015625, 2.1885986328125, 2.488037109375, 2.7874755859375, 3.0869140625, 3.3863525390625, 3.685791015625, 3.9852294921875, 4.28466796875, 4.5841064453125, 4.883544921875, 5.1829833984375, 5.482421875, 5.7818603515625, 6.081298828125, 6.3807373046875, 6.68017578125, 6.9796142578125, 7.279052734375, 7.5784912109375, 7.8779296875, 8.1773681640625, 8.476806640625, 8.7762451171875, 9.07568359375, 9.3751220703125, 9.674560546875, 9.9739990234375, 10.2734375]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 7.0, 7.0, 13.0, 18.0, 23.0, 44.0, 56.0, 64.0, 96.0, 173.0, 239.0, 429.0, 659.0, 1142.0, 1930.0, 3532.0, 6475.0, 12416.0, 24428.0, 48348.0, 96056.0, 182830.0, 321733.0, 523129.0, 3327077.0, 872249.0, 384373.0, 229625.0, 124225.0, 63224.0, 31552.0, 16287.0, 8616.0, 4401.0, 2471.0, 1397.0, 773.0, 458.0, 327.0, 190.0, 124.0, 76.0, 54.0, 32.0, 26.0, 14.0, 8.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.85009765625, -0.8240966796875, -0.798095703125, -0.7720947265625, -0.74609375, -0.7200927734375, -0.694091796875, -0.6680908203125, -0.64208984375, -0.6160888671875, -0.590087890625, -0.5640869140625, -0.5380859375, -0.5120849609375, -0.486083984375, -0.4600830078125, -0.43408203125, -0.4080810546875, -0.382080078125, -0.3560791015625, -0.330078125, -0.3040771484375, -0.278076171875, -0.2520751953125, -0.22607421875, -0.2000732421875, -0.174072265625, -0.1480712890625, -0.1220703125, -0.0960693359375, -0.070068359375, -0.0440673828125, -0.01806640625, 0.0079345703125, 0.033935546875, 0.0599365234375, 0.0859375, 0.1119384765625, 0.137939453125, 0.1639404296875, 0.18994140625, 0.2159423828125, 0.241943359375, 0.2679443359375, 0.2939453125, 0.3199462890625, 0.345947265625, 0.3719482421875, 0.39794921875, 0.4239501953125, 0.449951171875, 0.4759521484375, 0.501953125, 0.5279541015625, 0.553955078125, 0.5799560546875, 0.60595703125, 0.6319580078125, 0.657958984375, 0.6839599609375, 0.7099609375, 0.7359619140625, 0.761962890625, 0.7879638671875, 0.81396484375]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 9.0, 5.0, 10.0, 7.0, 9.0, 17.0, 22.0, 34.0, 33.0, 30.0, 45.0, 37.0, 44.0, 44.0, 50.0, 65.0, 695.0, 431.0, 49.0, 57.0, 43.0, 47.0, 46.0, 43.0, 26.0, 22.0, 23.0, 21.0, 18.0, 6.0, 11.0, 10.0, 9.0, 4.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.4140625, -9.1358642578125, -8.857666015625, -8.5794677734375, -8.30126953125, -8.0230712890625, -7.744873046875, -7.4666748046875, -7.1884765625, -6.9102783203125, -6.632080078125, -6.3538818359375, -6.07568359375, -5.7974853515625, -5.519287109375, -5.2410888671875, -4.962890625, -4.6846923828125, -4.406494140625, -4.1282958984375, -3.85009765625, -3.5718994140625, -3.293701171875, -3.0155029296875, -2.7373046875, -2.4591064453125, -2.180908203125, -1.9027099609375, -1.62451171875, -1.3463134765625, -1.068115234375, -0.7899169921875, -0.51171875, -0.2335205078125, 0.044677734375, 0.3228759765625, 0.60107421875, 0.8792724609375, 1.157470703125, 1.4356689453125, 1.7138671875, 1.9920654296875, 2.270263671875, 2.5484619140625, 2.82666015625, 3.1048583984375, 3.383056640625, 3.6612548828125, 3.939453125, 4.2176513671875, 4.495849609375, 4.7740478515625, 5.05224609375, 5.3304443359375, 5.608642578125, 5.8868408203125, 6.1650390625, 6.4432373046875, 6.721435546875, 6.9996337890625, 7.27783203125, 7.5560302734375, 7.834228515625, 8.1124267578125, 8.390625]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 1.0, 1.0, 8.0, 10.0, 15.0, 17.0, 14.0, 21.0, 41.0, 68.0, 100.0, 172.0, 244.0, 354.0, 562.0, 955.0, 1651.0, 3321.0, 7446.0, 20115.0, 67282.0, 250422.0, 852995.0, 4297649.0, 565066.0, 155023.0, 42395.0, 13905.0, 5424.0, 2607.0, 1384.0, 816.0, 470.0, 297.0, 175.0, 131.0, 104.0, 41.0, 41.0, 26.0, 24.0, 14.0, 8.0, 6.0, 0.0, 0.0, 4.0, 2.0, 2.0, 5.0, 3.0, 2.0], "bins": [-1.9208984375, -1.86651611328125, -1.8121337890625, -1.75775146484375, -1.703369140625, -1.64898681640625, -1.5946044921875, -1.54022216796875, -1.48583984375, -1.43145751953125, -1.3770751953125, -1.32269287109375, -1.268310546875, -1.21392822265625, -1.1595458984375, -1.10516357421875, -1.05078125, -0.99639892578125, -0.9420166015625, -0.88763427734375, -0.833251953125, -0.77886962890625, -0.7244873046875, -0.67010498046875, -0.61572265625, -0.56134033203125, -0.5069580078125, -0.45257568359375, -0.398193359375, -0.34381103515625, -0.2894287109375, -0.23504638671875, -0.1806640625, -0.12628173828125, -0.0718994140625, -0.01751708984375, 0.036865234375, 0.09124755859375, 0.1456298828125, 0.20001220703125, 0.25439453125, 0.30877685546875, 0.3631591796875, 0.41754150390625, 0.471923828125, 0.52630615234375, 0.5806884765625, 0.63507080078125, 0.689453125, 0.74383544921875, 0.7982177734375, 0.85260009765625, 0.906982421875, 0.96136474609375, 1.0157470703125, 1.07012939453125, 1.12451171875, 1.17889404296875, 1.2332763671875, 1.28765869140625, 1.342041015625, 1.39642333984375, 1.4508056640625, 1.50518798828125, 1.5595703125]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 8.0, 8.0, 12.0, 9.0, 8.0, 11.0, 12.0, 16.0, 17.0, 27.0, 22.0, 33.0, 30.0, 38.0, 49.0, 48.0, 47.0, 59.0, 443.0, 663.0, 47.0, 47.0, 51.0, 34.0, 38.0, 46.0, 36.0, 34.0, 25.0, 14.0, 18.0, 14.0, 9.0, 12.0, 17.0, 6.0, 5.0, 8.0, 2.0, 3.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.60546875, -7.33477783203125, -7.0640869140625, -6.79339599609375, -6.522705078125, -6.25201416015625, -5.9813232421875, -5.71063232421875, -5.43994140625, -5.16925048828125, -4.8985595703125, -4.62786865234375, -4.357177734375, -4.08648681640625, -3.8157958984375, -3.54510498046875, -3.2744140625, -3.00372314453125, -2.7330322265625, -2.46234130859375, -2.191650390625, -1.92095947265625, -1.6502685546875, -1.37957763671875, -1.10888671875, -0.83819580078125, -0.5675048828125, -0.29681396484375, -0.026123046875, 0.24456787109375, 0.5152587890625, 0.78594970703125, 1.056640625, 1.32733154296875, 1.5980224609375, 1.86871337890625, 2.139404296875, 2.41009521484375, 2.6807861328125, 2.95147705078125, 3.22216796875, 3.49285888671875, 3.7635498046875, 4.03424072265625, 4.304931640625, 4.57562255859375, 4.8463134765625, 5.11700439453125, 5.3876953125, 5.65838623046875, 5.9290771484375, 6.19976806640625, 6.470458984375, 6.74114990234375, 7.0118408203125, 7.28253173828125, 7.55322265625, 7.82391357421875, 8.0946044921875, 8.36529541015625, 8.635986328125, 8.90667724609375, 9.1773681640625, 9.44805908203125, 9.71875]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 14.0, 26.0, 111.0, 386.0, 335.0, 100.0, 25.0, 8.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.36328125, -30.56127166748047, -28.759262084960938, -26.957250595092773, -25.155241012573242, -23.35323143005371, -21.551219940185547, -19.749210357666016, -17.947200775146484, -16.145191192626953, -14.343180656433105, -12.541170120239258, -10.739160537719727, -8.937150955200195, -7.135140419006348, -5.3331298828125, -3.5311203002929688, -1.7291102409362793, 0.07289981842041016, 1.8749098777770996, 3.676919937133789, 5.47892951965332, 7.280940055847168, 9.082950592041016, 10.884960174560547, 12.686969757080078, 14.488980293273926, 16.290990829467773, 18.093000411987305, 19.895009994506836, 21.697021484375, 23.49903106689453, 25.301040649414062, 27.103050231933594, 28.905059814453125, 30.70707130432129, 32.50907897949219, 34.31108856201172, 36.113101959228516, 37.91511154174805, 39.71712112426758, 41.51913070678711, 43.32114028930664, 45.12314987182617, 46.92516326904297, 48.7271728515625, 50.52918243408203, 52.33119201660156, 54.133201599121094, 55.935211181640625, 57.737220764160156, 59.53923034667969, 61.34123992919922, 63.14324951171875, 64.94525909423828, 66.74726867675781, 68.54928588867188, 70.3512954711914, 72.15330505371094, 73.95531463623047, 75.75732421875, 77.55933380126953, 79.36134338378906, 81.16336059570312, 82.96536254882812]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 3.0, 8.0, 2.0, 8.0, 5.0, 15.0, 15.0, 14.0, 18.0, 28.0, 20.0, 30.0, 32.0, 30.0, 41.0, 47.0, 41.0, 46.0, 59.0, 62.0, 38.0, 48.0, 49.0, 49.0, 44.0, 41.0, 31.0, 29.0, 28.0, 17.0, 15.0, 18.0, 16.0, 9.0, 6.0, 7.0, 11.0, 6.0, 5.0, 4.0, 2.0, 1.0, 1.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.285354614257812, -25.48186683654785, -24.67837905883789, -23.87489128112793, -23.07140350341797, -22.26791763305664, -21.46442985534668, -20.66094207763672, -19.857454299926758, -19.053966522216797, -18.250478744506836, -17.446990966796875, -16.643505096435547, -15.84001636505127, -15.036529541015625, -14.233041763305664, -13.429553985595703, -12.626066207885742, -11.822578430175781, -11.019091606140137, -10.215603828430176, -9.412116050720215, -8.60862922668457, -7.805141448974609, -7.001653671264648, -6.1981658935546875, -5.394678592681885, -4.591191291809082, -3.787703514099121, -2.98421573638916, -2.1807284355163574, -1.3772411346435547, -0.5737552642822266, 0.22973227500915527, 1.033219814300537, 1.836707353591919, 2.640194892883301, 3.4436826705932617, 4.2471699714660645, 5.050657272338867, 5.854145050048828, 6.657632827758789, 7.461120128631592, 8.264607429504395, 9.068095207214355, 9.871582984924316, 10.675069808959961, 11.478557586669922, 12.282045364379883, 13.085533142089844, 13.889020919799805, 14.69250774383545, 15.49599552154541, 16.299484252929688, 17.102970123291016, 17.906457901000977, 18.709945678710938, 19.5134334564209, 20.31692123413086, 21.12040901184082, 21.92389678955078, 22.72738265991211, 23.53087043762207, 24.33435821533203, 25.137845993041992]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 5.0, 1.0, 4.0, 3.0, 6.0, 4.0, 10.0, 15.0, 20.0, 17.0, 23.0, 26.0, 41.0, 56.0, 67.0, 120.0, 172.0, 326.0, 737.0, 1418.0, 3717.0, 11713.0, 66768.0, 3581763.0, 493717.0, 22603.0, 6575.0, 2239.0, 929.0, 456.0, 244.0, 154.0, 85.0, 61.0, 37.0, 29.0, 22.0, 20.0, 21.0, 17.0, 14.0, 11.0, 8.0, 3.0, 3.0, 1.0, 2.0, 0.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.416015625, -0.4020233154296875, -0.388031005859375, -0.3740386962890625, -0.36004638671875, -0.3460540771484375, -0.332061767578125, -0.3180694580078125, -0.3040771484375, -0.2900848388671875, -0.276092529296875, -0.2621002197265625, -0.24810791015625, -0.2341156005859375, -0.220123291015625, -0.2061309814453125, -0.192138671875, -0.1781463623046875, -0.164154052734375, -0.1501617431640625, -0.13616943359375, -0.1221771240234375, -0.108184814453125, -0.0941925048828125, -0.0802001953125, -0.0662078857421875, -0.052215576171875, -0.0382232666015625, -0.02423095703125, -0.0102386474609375, 0.003753662109375, 0.0177459716796875, 0.03173828125, 0.0457305908203125, 0.059722900390625, 0.0737152099609375, 0.08770751953125, 0.1016998291015625, 0.115692138671875, 0.1296844482421875, 0.1436767578125, 0.1576690673828125, 0.171661376953125, 0.1856536865234375, 0.19964599609375, 0.2136383056640625, 0.227630615234375, 0.2416229248046875, 0.255615234375, 0.2696075439453125, 0.283599853515625, 0.2975921630859375, 0.31158447265625, 0.3255767822265625, 0.339569091796875, 0.3535614013671875, 0.3675537109375, 0.3815460205078125, 0.395538330078125, 0.4095306396484375, 0.42352294921875, 0.4375152587890625, 0.451507568359375, 0.4654998779296875, 0.4794921875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 4.0, 4.0, 6.0, 11.0, 9.0, 11.0, 23.0, 16.0, 20.0, 32.0, 28.0, 34.0, 42.0, 59.0, 51.0, 57.0, 36.0, 63.0, 60.0, 68.0, 56.0, 52.0, 36.0, 40.0, 39.0, 32.0, 23.0, 13.0, 17.0, 12.0, 8.0, 12.0, 8.0, 3.0, 3.0, 8.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.100341796875, -0.09696197509765625, -0.0935821533203125, -0.09020233154296875, -0.086822509765625, -0.08344268798828125, -0.0800628662109375, -0.07668304443359375, -0.07330322265625, -0.06992340087890625, -0.0665435791015625, -0.06316375732421875, -0.059783935546875, -0.05640411376953125, -0.0530242919921875, -0.04964447021484375, -0.0462646484375, -0.04288482666015625, -0.0395050048828125, -0.03612518310546875, -0.032745361328125, -0.02936553955078125, -0.0259857177734375, -0.02260589599609375, -0.01922607421875, -0.01584625244140625, -0.0124664306640625, -0.00908660888671875, -0.005706787109375, -0.00232696533203125, 0.0010528564453125, 0.00443267822265625, 0.0078125, 0.01119232177734375, 0.0145721435546875, 0.01795196533203125, 0.021331787109375, 0.02471160888671875, 0.0280914306640625, 0.03147125244140625, 0.03485107421875, 0.03823089599609375, 0.0416107177734375, 0.04499053955078125, 0.048370361328125, 0.05175018310546875, 0.0551300048828125, 0.05850982666015625, 0.0618896484375, 0.06526947021484375, 0.0686492919921875, 0.07202911376953125, 0.075408935546875, 0.07878875732421875, 0.0821685791015625, 0.08554840087890625, 0.08892822265625, 0.09230804443359375, 0.0956878662109375, 0.09906768798828125, 0.102447509765625, 0.10582733154296875, 0.1092071533203125, 0.11258697509765625, 0.115966796875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 4.0, 5.0, 5.0, 3.0, 12.0, 8.0, 7.0, 22.0, 18.0, 22.0, 64.0, 129.0, 518.0, 4046.0, 1203019.0, 2980143.0, 5312.0, 606.0, 177.0, 55.0, 37.0, 15.0, 12.0, 6.0, 8.0, 6.0, 6.0, 3.0, 6.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.66357421875, -0.6451644897460938, -0.6267547607421875, -0.6083450317382812, -0.589935302734375, -0.5715255737304688, -0.5531158447265625, -0.5347061157226562, -0.51629638671875, -0.49788665771484375, -0.4794769287109375, -0.46106719970703125, -0.442657470703125, -0.42424774169921875, -0.4058380126953125, -0.38742828369140625, -0.3690185546875, -0.35060882568359375, -0.3321990966796875, -0.31378936767578125, -0.295379638671875, -0.27696990966796875, -0.2585601806640625, -0.24015045166015625, -0.22174072265625, -0.20333099365234375, -0.1849212646484375, -0.16651153564453125, -0.148101806640625, -0.12969207763671875, -0.1112823486328125, -0.09287261962890625, -0.074462890625, -0.05605316162109375, -0.0376434326171875, -0.01923370361328125, -0.000823974609375, 0.01758575439453125, 0.0359954833984375, 0.05440521240234375, 0.07281494140625, 0.09122467041015625, 0.1096343994140625, 0.12804412841796875, 0.146453857421875, 0.16486358642578125, 0.1832733154296875, 0.20168304443359375, 0.2200927734375, 0.23850250244140625, 0.2569122314453125, 0.27532196044921875, 0.293731689453125, 0.31214141845703125, 0.3305511474609375, 0.34896087646484375, 0.36737060546875, 0.38578033447265625, 0.4041900634765625, 0.42259979248046875, 0.441009521484375, 0.45941925048828125, 0.4778289794921875, 0.49623870849609375, 0.5146484375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 15.0, 7.0, 12.0, 13.0, 18.0, 37.0, 83.0, 196.0, 408.0, 791.0, 1121.0, 710.0, 296.0, 151.0, 86.0, 37.0, 22.0, 12.0, 15.0, 13.0, 5.0, 7.0, 3.0, 0.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.160400390625, -0.15453720092773438, -0.14867401123046875, -0.14281082153320312, -0.1369476318359375, -0.13108444213867188, -0.12522125244140625, -0.11935806274414062, -0.113494873046875, -0.10763168334960938, -0.10176849365234375, -0.09590530395507812, -0.0900421142578125, -0.08417892456054688, -0.07831573486328125, -0.07245254516601562, -0.06658935546875, -0.060726165771484375, -0.05486297607421875, -0.048999786376953125, -0.0431365966796875, -0.037273406982421875, -0.03141021728515625, -0.025547027587890625, -0.019683837890625, -0.013820648193359375, -0.00795745849609375, -0.002094268798828125, 0.0037689208984375, 0.009632110595703125, 0.01549530029296875, 0.021358489990234375, 0.0272216796875, 0.033084869384765625, 0.03894805908203125, 0.044811248779296875, 0.0506744384765625, 0.056537628173828125, 0.06240081787109375, 0.06826400756835938, 0.074127197265625, 0.07999038696289062, 0.08585357666015625, 0.09171676635742188, 0.0975799560546875, 0.10344314575195312, 0.10930633544921875, 0.11516952514648438, 0.12103271484375, 0.12689590454101562, 0.13275909423828125, 0.13862228393554688, 0.1444854736328125, 0.15034866333007812, 0.15621185302734375, 0.16207504272460938, 0.167938232421875, 0.17380142211914062, 0.17966461181640625, 0.18552780151367188, 0.1913909912109375, 0.19725418090820312, 0.20311737060546875, 0.20898056030273438, 0.21484375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 10.0, 41.0, 156.0, 367.0, 296.0, 102.0, 27.0, 11.0, 2.0, 1.0, 2.0], "bins": [-2.7864437103271484, -2.737320899963379, -2.6881983280181885, -2.639075517654419, -2.5899527072906494, -2.540830135345459, -2.4917073249816895, -2.44258451461792, -2.3934619426727295, -2.34433913230896, -2.2952165603637695, -2.24609375, -2.1969709396362305, -2.14784836769104, -2.0987255573272705, -2.049602746963501, -2.0004801750183105, -1.9513574838638306, -1.902234673500061, -1.853111982345581, -1.803989291191101, -1.754866600036621, -1.7057437896728516, -1.6566210985183716, -1.6074981689453125, -1.5583754777908325, -1.509252667427063, -1.460129976272583, -1.411007285118103, -1.361884593963623, -1.3127617835998535, -1.2636390924453735, -1.2145164012908936, -1.1653937101364136, -1.116270899772644, -1.067148208618164, -1.018025517463684, -0.9689027667045593, -0.9197800159454346, -0.8706573247909546, -0.8215345740318298, -0.7724118232727051, -0.7232891321182251, -0.6741663813591003, -0.6250436305999756, -0.5759209394454956, -0.5267981886863708, -0.4776754677295685, -0.4285527467727661, -0.37943002581596375, -0.3303073048591614, -0.2811845541000366, -0.23206183314323425, -0.18293911218643188, -0.13381636142730713, -0.08469364047050476, -0.03557091951370239, 0.013551808893680573, 0.06267453730106354, 0.1117972731590271, 0.16091999411582947, 0.21004271507263184, 0.2591654658317566, 0.30828818678855896, 0.35741090774536133]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 7.0, 4.0, 5.0, 2.0, 7.0, 5.0, 6.0, 10.0, 16.0, 19.0, 15.0, 21.0, 24.0, 22.0, 28.0, 43.0, 30.0, 51.0, 49.0, 46.0, 46.0, 46.0, 49.0, 40.0, 37.0, 48.0, 45.0, 33.0, 26.0, 24.0, 22.0, 23.0, 23.0, 27.0, 23.0, 13.0, 5.0, 14.0, 10.0, 4.0, 6.0, 5.0, 11.0, 5.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0], "bins": [-0.3067113161087036, -0.29769620299339294, -0.2886810898780823, -0.2796659767627716, -0.27065086364746094, -0.26163575053215027, -0.2526206374168396, -0.24360552430152893, -0.23459041118621826, -0.2255752980709076, -0.21656018495559692, -0.20754507184028625, -0.19852995872497559, -0.18951484560966492, -0.18049973249435425, -0.17148461937904358, -0.16246949136257172, -0.15345437824726105, -0.14443926513195038, -0.1354241520166397, -0.12640903890132904, -0.11739392578601837, -0.1083788052201271, -0.09936369210481644, -0.09034857898950577, -0.0813334658741951, -0.07231835275888443, -0.06330323219299316, -0.054288122802972794, -0.045273009687662125, -0.03625789284706116, -0.02724277973175049, -0.01822766661643982, -0.009212552569806576, -0.00019743852317333221, 0.008817676454782486, 0.017832789570093155, 0.026847902685403824, 0.03586301952600479, 0.04487813264131546, 0.05389324575662613, 0.0629083588719368, 0.07192347198724747, 0.08093859255313873, 0.0899537056684494, 0.09896881878376007, 0.10798393189907074, 0.11699904501438141, 0.12601415812969208, 0.13502927124500275, 0.14404438436031342, 0.15305949747562408, 0.16207461059093475, 0.17108972370624542, 0.18010485172271729, 0.18911996483802795, 0.19813507795333862, 0.2071501910686493, 0.21616530418395996, 0.22518041729927063, 0.2341955304145813, 0.24321064352989197, 0.25222575664520264, 0.2612408697605133, 0.270255982875824]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 4.0, 6.0, 9.0, 13.0, 20.0, 24.0, 37.0, 43.0, 75.0, 91.0, 169.0, 257.0, 370.0, 615.0, 987.0, 2032.0, 4182.0, 11461.0, 68273.0, 862861.0, 75833.0, 12076.0, 4223.0, 2116.0, 1068.0, 616.0, 371.0, 229.0, 142.0, 104.0, 74.0, 48.0, 40.0, 16.0, 23.0, 6.0, 9.0, 10.0, 8.0, 6.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.50244140625, -0.48542022705078125, -0.4683990478515625, -0.45137786865234375, -0.434356689453125, -0.41733551025390625, -0.4003143310546875, -0.38329315185546875, -0.36627197265625, -0.34925079345703125, -0.3322296142578125, -0.31520843505859375, -0.298187255859375, -0.28116607666015625, -0.2641448974609375, -0.24712371826171875, -0.2301025390625, -0.21308135986328125, -0.1960601806640625, -0.17903900146484375, -0.162017822265625, -0.14499664306640625, -0.1279754638671875, -0.11095428466796875, -0.09393310546875, -0.07691192626953125, -0.0598907470703125, -0.04286956787109375, -0.025848388671875, -0.00882720947265625, 0.0081939697265625, 0.02521514892578125, 0.042236328125, 0.05925750732421875, 0.0762786865234375, 0.09329986572265625, 0.110321044921875, 0.12734222412109375, 0.1443634033203125, 0.16138458251953125, 0.17840576171875, 0.19542694091796875, 0.2124481201171875, 0.22946929931640625, 0.246490478515625, 0.26351165771484375, 0.2805328369140625, 0.29755401611328125, 0.3145751953125, 0.33159637451171875, 0.3486175537109375, 0.36563873291015625, 0.382659912109375, 0.39968109130859375, 0.4167022705078125, 0.43372344970703125, 0.45074462890625, 0.46776580810546875, 0.4847869873046875, 0.5018081665039062, 0.518829345703125, 0.5358505249023438, 0.5528717041015625, 0.5698928833007812, 0.5869140625]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 2.0, 3.0, 4.0, 4.0, 4.0, 10.0, 13.0, 13.0, 19.0, 26.0, 27.0, 41.0, 45.0, 51.0, 47.0, 58.0, 54.0, 69.0, 79.0, 77.0, 68.0, 54.0, 42.0, 41.0, 36.0, 29.0, 11.0, 14.0, 18.0, 11.0, 9.0, 9.0, 7.0, 4.0, 4.0, 0.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.135498046875, -0.13161468505859375, -0.1277313232421875, -0.12384796142578125, -0.119964599609375, -0.11608123779296875, -0.1121978759765625, -0.10831451416015625, -0.10443115234375, -0.10054779052734375, -0.0966644287109375, -0.09278106689453125, -0.088897705078125, -0.08501434326171875, -0.0811309814453125, -0.07724761962890625, -0.0733642578125, -0.06948089599609375, -0.0655975341796875, -0.06171417236328125, -0.057830810546875, -0.05394744873046875, -0.0500640869140625, -0.04618072509765625, -0.04229736328125, -0.03841400146484375, -0.0345306396484375, -0.03064727783203125, -0.026763916015625, -0.02288055419921875, -0.0189971923828125, -0.01511383056640625, -0.01123046875, -0.00734710693359375, -0.0034637451171875, 0.00041961669921875, 0.004302978515625, 0.00818634033203125, 0.0120697021484375, 0.01595306396484375, 0.01983642578125, 0.02371978759765625, 0.0276031494140625, 0.03148651123046875, 0.035369873046875, 0.03925323486328125, 0.0431365966796875, 0.04701995849609375, 0.0509033203125, 0.05478668212890625, 0.0586700439453125, 0.06255340576171875, 0.066436767578125, 0.07032012939453125, 0.0742034912109375, 0.07808685302734375, 0.08197021484375, 0.08585357666015625, 0.0897369384765625, 0.09362030029296875, 0.097503662109375, 0.10138702392578125, 0.1052703857421875, 0.10915374755859375, 0.113037109375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 4.0, 2.0, 6.0, 3.0, 6.0, 11.0, 19.0, 15.0, 24.0, 29.0, 36.0, 49.0, 80.0, 126.0, 207.0, 514.0, 2082.0, 14401.0, 223151.0, 726526.0, 72800.0, 6365.0, 1171.0, 388.0, 165.0, 88.0, 71.0, 44.0, 38.0, 24.0, 29.0, 20.0, 11.0, 8.0, 9.0, 13.0, 7.0, 3.0, 5.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.2548828125, -0.2469940185546875, -0.239105224609375, -0.2312164306640625, -0.22332763671875, -0.2154388427734375, -0.207550048828125, -0.1996612548828125, -0.1917724609375, -0.1838836669921875, -0.175994873046875, -0.1681060791015625, -0.16021728515625, -0.1523284912109375, -0.144439697265625, -0.1365509033203125, -0.128662109375, -0.1207733154296875, -0.112884521484375, -0.1049957275390625, -0.09710693359375, -0.0892181396484375, -0.081329345703125, -0.0734405517578125, -0.0655517578125, -0.0576629638671875, -0.049774169921875, -0.0418853759765625, -0.03399658203125, -0.0261077880859375, -0.018218994140625, -0.0103302001953125, -0.00244140625, 0.0054473876953125, 0.013336181640625, 0.0212249755859375, 0.02911376953125, 0.0370025634765625, 0.044891357421875, 0.0527801513671875, 0.0606689453125, 0.0685577392578125, 0.076446533203125, 0.0843353271484375, 0.09222412109375, 0.1001129150390625, 0.108001708984375, 0.1158905029296875, 0.123779296875, 0.1316680908203125, 0.139556884765625, 0.1474456787109375, 0.15533447265625, 0.1632232666015625, 0.171112060546875, 0.1790008544921875, 0.1868896484375, 0.1947784423828125, 0.202667236328125, 0.2105560302734375, 0.21844482421875, 0.2263336181640625, 0.234222412109375, 0.2421112060546875, 0.25]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 8.0, 2.0, 8.0, 8.0, 9.0, 7.0, 6.0, 13.0, 21.0, 20.0, 22.0, 24.0, 39.0, 42.0, 37.0, 42.0, 42.0, 45.0, 45.0, 46.0, 54.0, 46.0, 48.0, 39.0, 51.0, 36.0, 27.0, 33.0, 35.0, 25.0, 29.0, 23.0, 13.0, 13.0, 9.0, 7.0, 6.0, 9.0, 1.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.230712890625, -0.22384262084960938, -0.21697235107421875, -0.21010208129882812, -0.2032318115234375, -0.19636154174804688, -0.18949127197265625, -0.18262100219726562, -0.175750732421875, -0.16888046264648438, -0.16201019287109375, -0.15513992309570312, -0.1482696533203125, -0.14139938354492188, -0.13452911376953125, -0.12765884399414062, -0.12078857421875, -0.11391830444335938, -0.10704803466796875, -0.10017776489257812, -0.0933074951171875, -0.08643722534179688, -0.07956695556640625, -0.07269668579101562, -0.065826416015625, -0.058956146240234375, -0.05208587646484375, -0.045215606689453125, -0.0383453369140625, -0.031475067138671875, -0.02460479736328125, -0.017734527587890625, -0.0108642578125, -0.003993988037109375, 0.00287628173828125, 0.009746551513671875, 0.0166168212890625, 0.023487091064453125, 0.03035736083984375, 0.037227630615234375, 0.044097900390625, 0.050968170166015625, 0.05783843994140625, 0.06470870971679688, 0.0715789794921875, 0.07844924926757812, 0.08531951904296875, 0.09218978881835938, 0.09906005859375, 0.10593032836914062, 0.11280059814453125, 0.11967086791992188, 0.1265411376953125, 0.13341140747070312, 0.14028167724609375, 0.14715194702148438, 0.154022216796875, 0.16089248657226562, 0.16776275634765625, 0.17463302612304688, 0.1815032958984375, 0.18837356567382812, 0.19524383544921875, 0.20211410522460938, 0.208984375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 8.0, 4.0, 5.0, 15.0, 16.0, 27.0, 28.0, 48.0, 88.0, 122.0, 224.0, 409.0, 881.0, 1989.0, 5655.0, 23496.0, 239833.0, 681137.0, 76826.0, 11528.0, 3454.0, 1406.0, 619.0, 307.0, 169.0, 93.0, 52.0, 24.0, 30.0, 16.0, 13.0, 7.0, 9.0, 4.0, 8.0, 3.0, 1.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.067626953125, -0.06571006774902344, -0.06379318237304688, -0.06187629699707031, -0.05995941162109375, -0.05804252624511719, -0.056125640869140625, -0.05420875549316406, -0.0522918701171875, -0.05037498474121094, -0.048458099365234375, -0.04654121398925781, -0.04462432861328125, -0.04270744323730469, -0.040790557861328125, -0.03887367248535156, -0.036956787109375, -0.03503990173339844, -0.033123016357421875, -0.031206130981445312, -0.02928924560546875, -0.027372360229492188, -0.025455474853515625, -0.023538589477539062, -0.0216217041015625, -0.019704818725585938, -0.017787933349609375, -0.015871047973632812, -0.01395416259765625, -0.012037277221679688, -0.010120391845703125, -0.008203506469726562, -0.00628662109375, -0.0043697357177734375, -0.002452850341796875, -0.0005359649658203125, 0.00138092041015625, 0.0032978057861328125, 0.005214691162109375, 0.0071315765380859375, 0.0090484619140625, 0.010965347290039062, 0.012882232666015625, 0.014799118041992188, 0.01671600341796875, 0.018632888793945312, 0.020549774169921875, 0.022466659545898438, 0.024383544921875, 0.026300430297851562, 0.028217315673828125, 0.030134201049804688, 0.03205108642578125, 0.03396797180175781, 0.035884857177734375, 0.03780174255371094, 0.0397186279296875, 0.04163551330566406, 0.043552398681640625, 0.04546928405761719, 0.04738616943359375, 0.04930305480957031, 0.051219940185546875, 0.05313682556152344, 0.0550537109375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 4.0, 4.0, 6.0, 5.0, 6.0, 10.0, 9.0, 19.0, 12.0, 21.0, 34.0, 30.0, 48.0, 59.0, 54.0, 73.0, 80.0, 73.0, 104.0, 67.0, 59.0, 42.0, 46.0, 39.0, 33.0, 20.0, 12.0, 13.0, 8.0, 5.0, 4.0, 1.0, 5.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.827976226806641e-06, -4.64264303445816e-06, -4.45730984210968e-06, -4.2719766497612e-06, -4.08664345741272e-06, -3.9013102650642395e-06, -3.7159770727157593e-06, -3.530643880367279e-06, -3.345310688018799e-06, -3.1599774956703186e-06, -2.9746443033218384e-06, -2.789311110973358e-06, -2.603977918624878e-06, -2.4186447262763977e-06, -2.2333115339279175e-06, -2.0479783415794373e-06, -1.862645149230957e-06, -1.6773119568824768e-06, -1.4919787645339966e-06, -1.3066455721855164e-06, -1.1213123798370361e-06, -9.359791874885559e-07, -7.506459951400757e-07, -5.653128027915955e-07, -3.7997961044311523e-07, -1.94646418094635e-07, -9.313225746154785e-09, 1.7601996660232544e-07, 3.6135315895080566e-07, 5.466863512992859e-07, 7.320195436477661e-07, 9.173527359962463e-07, 1.1026859283447266e-06, 1.2880191206932068e-06, 1.473352313041687e-06, 1.6586855053901672e-06, 1.8440186977386475e-06, 2.0293518900871277e-06, 2.214685082435608e-06, 2.400018274784088e-06, 2.5853514671325684e-06, 2.7706846594810486e-06, 2.956017851829529e-06, 3.141351044178009e-06, 3.3266842365264893e-06, 3.5120174288749695e-06, 3.6973506212234497e-06, 3.88268381357193e-06, 4.06801700592041e-06, 4.25335019826889e-06, 4.438683390617371e-06, 4.624016582965851e-06, 4.809349775314331e-06, 4.994682967662811e-06, 5.1800161600112915e-06, 5.365349352359772e-06, 5.550682544708252e-06, 5.736015737056732e-06, 5.921348929405212e-06, 6.106682121753693e-06, 6.292015314102173e-06, 6.477348506450653e-06, 6.662681698799133e-06, 6.8480148911476135e-06, 7.033348083496094e-06]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 2.0, 8.0, 4.0, 11.0, 25.0, 36.0, 59.0, 119.0, 221.0, 388.0, 790.0, 1451.0, 2946.0, 6337.0, 18836.0, 157070.0, 745317.0, 90148.0, 14281.0, 5362.0, 2472.0, 1245.0, 649.0, 310.0, 178.0, 108.0, 53.0, 41.0, 23.0, 15.0, 18.0, 8.0, 7.0, 1.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.064453125, -0.062183380126953125, -0.05991363525390625, -0.057643890380859375, -0.0553741455078125, -0.053104400634765625, -0.05083465576171875, -0.048564910888671875, -0.046295166015625, -0.044025421142578125, -0.04175567626953125, -0.039485931396484375, -0.0372161865234375, -0.034946441650390625, -0.03267669677734375, -0.030406951904296875, -0.02813720703125, -0.025867462158203125, -0.02359771728515625, -0.021327972412109375, -0.0190582275390625, -0.016788482666015625, -0.01451873779296875, -0.012248992919921875, -0.009979248046875, -0.007709503173828125, -0.00543975830078125, -0.003170013427734375, -0.0009002685546875, 0.001369476318359375, 0.00363922119140625, 0.005908966064453125, 0.0081787109375, 0.010448455810546875, 0.01271820068359375, 0.014987945556640625, 0.0172576904296875, 0.019527435302734375, 0.02179718017578125, 0.024066925048828125, 0.026336669921875, 0.028606414794921875, 0.03087615966796875, 0.033145904541015625, 0.0354156494140625, 0.037685394287109375, 0.03995513916015625, 0.042224884033203125, 0.04449462890625, 0.046764373779296875, 0.04903411865234375, 0.051303863525390625, 0.0535736083984375, 0.055843353271484375, 0.05811309814453125, 0.060382843017578125, 0.062652587890625, 0.06492233276367188, 0.06719207763671875, 0.06946182250976562, 0.0717315673828125, 0.07400131225585938, 0.07627105712890625, 0.07854080200195312, 0.080810546875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 3.0, 5.0, 6.0, 8.0, 9.0, 11.0, 13.0, 12.0, 14.0, 22.0, 30.0, 43.0, 52.0, 68.0, 76.0, 93.0, 87.0, 87.0, 79.0, 73.0, 57.0, 42.0, 26.0, 20.0, 9.0, 7.0, 10.0, 3.0, 8.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 4.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04949951171875, -0.04797029495239258, -0.046441078186035156, -0.044911861419677734, -0.04338264465332031, -0.04185342788696289, -0.04032421112060547, -0.03879499435424805, -0.037265777587890625, -0.0357365608215332, -0.03420734405517578, -0.03267812728881836, -0.031148910522460938, -0.029619693756103516, -0.028090476989746094, -0.026561260223388672, -0.02503204345703125, -0.023502826690673828, -0.021973609924316406, -0.020444393157958984, -0.018915176391601562, -0.01738595962524414, -0.01585674285888672, -0.014327526092529297, -0.012798309326171875, -0.011269092559814453, -0.009739875793457031, -0.00821065902709961, -0.0066814422607421875, -0.005152225494384766, -0.0036230087280273438, -0.002093791961669922, -0.0005645751953125, 0.0009646415710449219, 0.0024938583374023438, 0.004023075103759766, 0.0055522918701171875, 0.007081508636474609, 0.008610725402832031, 0.010139942169189453, 0.011669158935546875, 0.013198375701904297, 0.014727592468261719, 0.01625680923461914, 0.017786026000976562, 0.019315242767333984, 0.020844459533691406, 0.022373676300048828, 0.02390289306640625, 0.025432109832763672, 0.026961326599121094, 0.028490543365478516, 0.030019760131835938, 0.03154897689819336, 0.03307819366455078, 0.0346074104309082, 0.036136627197265625, 0.03766584396362305, 0.03919506072998047, 0.04072427749633789, 0.04225349426269531, 0.043782711029052734, 0.045311927795410156, 0.04684114456176758, 0.048370361328125]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 32.0, 94.0, 216.0, 349.0, 208.0, 83.0, 16.0, 4.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3232911825180054, -1.264230489730835, -1.205169916152954, -1.1461093425750732, -1.0870486497879028, -1.0279879570007324, -0.9689273834228516, -0.9098667502403259, -0.8508061170578003, -0.7917454838752747, -0.732684850692749, -0.6736242175102234, -0.6145635843276978, -0.5555029511451721, -0.4964423179626465, -0.43738168478012085, -0.3783210515975952, -0.3192604184150696, -0.26019978523254395, -0.2011391520500183, -0.14207851886749268, -0.08301788568496704, -0.023957252502441406, 0.03510338068008423, 0.09416401386260986, 0.1532246470451355, 0.21228528022766113, 0.27134591341018677, 0.3304065465927124, 0.38946717977523804, 0.44852781295776367, 0.5075884461402893, 0.5666491985321045, 0.6257098317146301, 0.6847704648971558, 0.7438310980796814, 0.802891731262207, 0.8619523644447327, 0.9210129976272583, 0.9800736308097839, 1.0391342639923096, 1.0981948375701904, 1.1572555303573608, 1.2163162231445312, 1.275376796722412, 1.334437370300293, 1.3934980630874634, 1.4525587558746338, 1.5116193294525146, 1.5706799030303955, 1.629740595817566, 1.6888012886047363, 1.7478618621826172, 1.806922435760498, 1.8659831285476685, 1.9250438213348389, 1.9841043949127197, 2.0431649684906006, 2.1022257804870605, 2.1612863540649414, 2.2203469276428223, 2.279407501220703, 2.338468074798584, 2.397528886795044, 2.456589460372925]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 7.0, 6.0, 6.0, 15.0, 14.0, 15.0, 14.0, 13.0, 22.0, 22.0, 39.0, 29.0, 32.0, 47.0, 35.0, 40.0, 39.0, 34.0, 35.0, 45.0, 42.0, 43.0, 44.0, 43.0, 29.0, 39.0, 32.0, 34.0, 23.0, 28.0, 15.0, 24.0, 12.0, 15.0, 17.0, 9.0, 8.0, 6.0, 8.0, 5.0, 7.0, 1.0, 1.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8889521360397339, -0.8591723442077637, -0.8293926119804382, -0.799612820148468, -0.7698330879211426, -0.7400532960891724, -0.7102735042572021, -0.6804937720298767, -0.6507139801979065, -0.6209341883659363, -0.5911544561386108, -0.5613746643066406, -0.5315949320793152, -0.501815140247345, -0.47203537821769714, -0.4422556161880493, -0.4124758541584015, -0.38269609212875366, -0.35291633009910583, -0.323136568069458, -0.2933567762374878, -0.26357701420783997, -0.23379725217819214, -0.20401747524738312, -0.1742377132177353, -0.14445795118808746, -0.11467817425727844, -0.08489841222763062, -0.05511864274740219, -0.025338873267173767, 0.00444088876247406, 0.03422066569328308, 0.06400042772293091, 0.09378019720315933, 0.12355996668338776, 0.15333972871303558, 0.1831195056438446, 0.21289926767349243, 0.24267902970314026, 0.2724587917327881, 0.3022385835647583, 0.33201834559440613, 0.36179810762405396, 0.39157789945602417, 0.421357661485672, 0.4511374235153198, 0.48091718554496765, 0.5106969475746155, 0.5404766798019409, 0.5702564716339111, 0.6000362038612366, 0.6298159956932068, 0.6595957279205322, 0.6893755197525024, 0.7191553115844727, 0.7489350438117981, 0.7787148356437683, 0.8084946274757385, 0.838274359703064, 0.8680541515350342, 0.8978338837623596, 0.9276136755943298, 0.9573934078216553, 0.9871731996536255, 1.0169529914855957]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 0.0, 2.0, 1.0, 2.0, 11.0, 9.0, 11.0, 9.0, 15.0, 15.0, 26.0, 29.0, 32.0, 34.0, 47.0, 83.0, 183.0, 698.0, 4463.0, 4018186.0, 167172.0, 2391.0, 443.0, 145.0, 69.0, 45.0, 25.0, 23.0, 30.0, 18.0, 11.0, 9.0, 13.0, 11.0, 5.0, 8.0, 5.0, 5.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.3935546875, -1.3535614013671875, -1.313568115234375, -1.2735748291015625, -1.23358154296875, -1.1935882568359375, -1.153594970703125, -1.1136016845703125, -1.0736083984375, -1.0336151123046875, -0.993621826171875, -0.9536285400390625, -0.91363525390625, -0.8736419677734375, -0.833648681640625, -0.7936553955078125, -0.753662109375, -0.7136688232421875, -0.673675537109375, -0.6336822509765625, -0.59368896484375, -0.5536956787109375, -0.513702392578125, -0.4737091064453125, -0.4337158203125, -0.3937225341796875, -0.353729248046875, -0.3137359619140625, -0.27374267578125, -0.2337493896484375, -0.193756103515625, -0.1537628173828125, -0.11376953125, -0.0737762451171875, -0.033782958984375, 0.0062103271484375, 0.04620361328125, 0.0861968994140625, 0.126190185546875, 0.1661834716796875, 0.2061767578125, 0.2461700439453125, 0.286163330078125, 0.3261566162109375, 0.36614990234375, 0.4061431884765625, 0.446136474609375, 0.4861297607421875, 0.526123046875, 0.5661163330078125, 0.606109619140625, 0.6461029052734375, 0.68609619140625, 0.7260894775390625, 0.766082763671875, 0.8060760498046875, 0.8460693359375, 0.8860626220703125, 0.926055908203125, 0.9660491943359375, 1.00604248046875, 1.0460357666015625, 1.086029052734375, 1.1260223388671875, 1.166015625]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 3.0, 4.0, 8.0, 12.0, 15.0, 15.0, 22.0, 28.0, 32.0, 34.0, 41.0, 46.0, 54.0, 53.0, 60.0, 73.0, 80.0, 63.0, 48.0, 74.0, 48.0, 38.0, 36.0, 26.0, 20.0, 10.0, 10.0, 14.0, 11.0, 3.0, 3.0, 6.0, 8.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1300048828125, -0.12625789642333984, -0.12251091003417969, -0.11876392364501953, -0.11501693725585938, -0.11126995086669922, -0.10752296447753906, -0.1037759780883789, -0.10002899169921875, -0.0962820053100586, -0.09253501892089844, -0.08878803253173828, -0.08504104614257812, -0.08129405975341797, -0.07754707336425781, -0.07380008697509766, -0.0700531005859375, -0.06630611419677734, -0.06255912780761719, -0.05881214141845703, -0.055065155029296875, -0.05131816864013672, -0.04757118225097656, -0.043824195861816406, -0.04007720947265625, -0.036330223083496094, -0.03258323669433594, -0.02883625030517578, -0.025089263916015625, -0.02134227752685547, -0.017595291137695312, -0.013848304748535156, -0.010101318359375, -0.006354331970214844, -0.0026073455810546875, 0.0011396408081054688, 0.004886627197265625, 0.008633613586425781, 0.012380599975585938, 0.016127586364746094, 0.01987457275390625, 0.023621559143066406, 0.027368545532226562, 0.03111553192138672, 0.034862518310546875, 0.03860950469970703, 0.04235649108886719, 0.046103477478027344, 0.0498504638671875, 0.053597450256347656, 0.05734443664550781, 0.06109142303466797, 0.06483840942382812, 0.06858539581298828, 0.07233238220214844, 0.0760793685913086, 0.07982635498046875, 0.0835733413696289, 0.08732032775878906, 0.09106731414794922, 0.09481430053710938, 0.09856128692626953, 0.10230827331542969, 0.10605525970458984, 0.10980224609375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 0.0, 0.0, 3.0, 5.0, 7.0, 8.0, 11.0, 10.0, 29.0, 34.0, 45.0, 81.0, 170.0, 312.0, 657.0, 1626.0, 4654.0, 16496.0, 83184.0, 657998.0, 2914055.0, 435811.0, 60473.0, 12599.0, 3673.0, 1284.0, 491.0, 250.0, 107.0, 76.0, 46.0, 31.0, 15.0, 11.0, 8.0, 7.0, 7.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2362060546875, -0.2293415069580078, -0.22247695922851562, -0.21561241149902344, -0.20874786376953125, -0.20188331604003906, -0.19501876831054688, -0.1881542205810547, -0.1812896728515625, -0.1744251251220703, -0.16756057739257812, -0.16069602966308594, -0.15383148193359375, -0.14696693420410156, -0.14010238647460938, -0.1332378387451172, -0.126373291015625, -0.11950874328613281, -0.11264419555664062, -0.10577964782714844, -0.09891510009765625, -0.09205055236816406, -0.08518600463867188, -0.07832145690917969, -0.0714569091796875, -0.06459236145019531, -0.057727813720703125, -0.05086326599121094, -0.04399871826171875, -0.03713417053222656, -0.030269622802734375, -0.023405075073242188, -0.01654052734375, -0.009675979614257812, -0.002811431884765625, 0.0040531158447265625, 0.01091766357421875, 0.017782211303710938, 0.024646759033203125, 0.03151130676269531, 0.0383758544921875, 0.04524040222167969, 0.052104949951171875, 0.05896949768066406, 0.06583404541015625, 0.07269859313964844, 0.07956314086914062, 0.08642768859863281, 0.093292236328125, 0.10015678405761719, 0.10702133178710938, 0.11388587951660156, 0.12075042724609375, 0.12761497497558594, 0.13447952270507812, 0.1413440704345703, 0.1482086181640625, 0.1550731658935547, 0.16193771362304688, 0.16880226135253906, 0.17566680908203125, 0.18253135681152344, 0.18939590454101562, 0.1962604522705078, 0.203125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 3.0, 3.0, 3.0, 1.0, 10.0, 9.0, 17.0, 22.0, 32.0, 25.0, 54.0, 65.0, 92.0, 148.0, 168.0, 247.0, 374.0, 524.0, 685.0, 492.0, 316.0, 225.0, 148.0, 99.0, 82.0, 59.0, 44.0, 33.0, 19.0, 17.0, 15.0, 16.0, 10.0, 6.0, 5.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06365966796875, -0.06067371368408203, -0.05768775939941406, -0.054701805114746094, -0.051715850830078125, -0.048729896545410156, -0.04574394226074219, -0.04275798797607422, -0.03977203369140625, -0.03678607940673828, -0.03380012512207031, -0.030814170837402344, -0.027828216552734375, -0.024842262268066406, -0.021856307983398438, -0.01887035369873047, -0.0158843994140625, -0.012898445129394531, -0.009912490844726562, -0.006926536560058594, -0.003940582275390625, -0.0009546279907226562, 0.0020313262939453125, 0.005017280578613281, 0.00800323486328125, 0.010989189147949219, 0.013975143432617188, 0.016961097717285156, 0.019947052001953125, 0.022933006286621094, 0.025918960571289062, 0.02890491485595703, 0.031890869140625, 0.03487682342529297, 0.03786277770996094, 0.040848731994628906, 0.043834686279296875, 0.046820640563964844, 0.04980659484863281, 0.05279254913330078, 0.05577850341796875, 0.05876445770263672, 0.06175041198730469, 0.06473636627197266, 0.06772232055664062, 0.0707082748413086, 0.07369422912597656, 0.07668018341064453, 0.0796661376953125, 0.08265209197998047, 0.08563804626464844, 0.0886240005493164, 0.09160995483398438, 0.09459590911865234, 0.09758186340332031, 0.10056781768798828, 0.10355377197265625, 0.10653972625732422, 0.10952568054199219, 0.11251163482666016, 0.11549758911132812, 0.1184835433959961, 0.12146949768066406, 0.12445545196533203, 0.12744140625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 5.0, 8.0, 20.0, 30.0, 49.0, 91.0, 127.0, 165.0, 154.0, 123.0, 93.0, 64.0, 32.0, 19.0, 14.0, 0.0, 6.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36305975914001465, -0.3440004289150238, -0.32494112849235535, -0.3058817982673645, -0.28682249784469604, -0.2677631676197052, -0.24870385229587555, -0.2296445369720459, -0.21058522164821625, -0.1915259063243866, -0.17246659100055695, -0.1534072756767273, -0.13434794545173645, -0.1152886375784874, -0.09622931480407715, -0.0771699994802475, -0.05811068415641785, -0.039051368832588196, -0.019992049783468246, -0.0009327307343482971, 0.018126584589481354, 0.037185899913311005, 0.05624522268772125, 0.0753045380115509, 0.09436385333538055, 0.1134231686592102, 0.13248248398303986, 0.1515417993068695, 0.17060112953186035, 0.1896604299545288, 0.20871976017951965, 0.2277790755033493, 0.24683839082717896, 0.2658977210521698, 0.28495702147483826, 0.3040163516998291, 0.32307565212249756, 0.3421349823474884, 0.36119431257247925, 0.3802536129951477, 0.39931291341781616, 0.418372243642807, 0.43743154406547546, 0.4564908742904663, 0.47555017471313477, 0.4946095049381256, 0.5136688351631165, 0.5327281355857849, 0.5517874956130981, 0.5708467960357666, 0.5899061560630798, 0.6089654564857483, 0.6280247569084167, 0.6470840573310852, 0.6661434173583984, 0.6852027177810669, 0.7042620182037354, 0.7233213186264038, 0.742380678653717, 0.7614399790763855, 0.780499279499054, 0.7995585799217224, 0.8186179399490356, 0.8376772403717041, 0.8567365407943726]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 4.0, 7.0, 10.0, 16.0, 15.0, 10.0, 16.0, 14.0, 8.0, 22.0, 26.0, 33.0, 30.0, 29.0, 31.0, 43.0, 46.0, 36.0, 39.0, 40.0, 52.0, 51.0, 48.0, 39.0, 38.0, 37.0, 41.0, 32.0, 32.0, 28.0, 20.0, 26.0, 18.0, 14.0, 15.0, 9.0, 5.0, 3.0, 5.0, 5.0, 5.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.2704402804374695, -0.26254621148109436, -0.25465214252471924, -0.24675807356834412, -0.238864004611969, -0.23096993565559387, -0.22307586669921875, -0.21518179774284363, -0.2072877287864685, -0.19939365983009338, -0.19149959087371826, -0.18360552191734314, -0.17571145296096802, -0.1678173840045929, -0.15992331504821777, -0.15202924609184265, -0.14413517713546753, -0.1362411081790924, -0.12834703922271729, -0.12045297026634216, -0.11255890130996704, -0.10466483235359192, -0.0967707633972168, -0.08887669444084167, -0.08098262548446655, -0.07308855652809143, -0.06519448757171631, -0.057300418615341187, -0.049406349658966064, -0.04151228070259094, -0.03361821174621582, -0.025724142789840698, -0.017830073833465576, -0.009936004877090454, -0.002041935920715332, 0.00585213303565979, 0.013746201992034912, 0.021640270948410034, 0.029534339904785156, 0.03742840886116028, 0.0453224778175354, 0.05321654677391052, 0.061110615730285645, 0.06900468468666077, 0.07689875364303589, 0.08479282259941101, 0.09268689155578613, 0.10058096051216125, 0.10847502946853638, 0.1163690984249115, 0.12426316738128662, 0.13215723633766174, 0.14005130529403687, 0.147945374250412, 0.1558394432067871, 0.16373351216316223, 0.17162758111953735, 0.17952165007591248, 0.1874157190322876, 0.19530978798866272, 0.20320385694503784, 0.21109792590141296, 0.21899199485778809, 0.2268860638141632, 0.23478013277053833]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 3.0, 4.0, 5.0, 5.0, 8.0, 11.0, 17.0, 18.0, 36.0, 42.0, 60.0, 78.0, 102.0, 157.0, 216.0, 340.0, 536.0, 825.0, 1463.0, 2630.0, 5332.0, 12168.0, 33078.0, 109742.0, 353392.0, 358419.0, 111672.0, 33549.0, 12662.0, 5343.0, 2691.0, 1457.0, 855.0, 475.0, 353.0, 237.0, 165.0, 125.0, 75.0, 48.0, 47.0, 25.0, 18.0, 26.0, 14.0, 6.0, 6.0, 5.0, 5.0, 1.0, 2.0, 2.0, 3.0, 0.0, 4.0, 1.0, 2.0], "bins": [-0.2313232421875, -0.22409629821777344, -0.21686935424804688, -0.2096424102783203, -0.20241546630859375, -0.1951885223388672, -0.18796157836914062, -0.18073463439941406, -0.1735076904296875, -0.16628074645996094, -0.15905380249023438, -0.1518268585205078, -0.14459991455078125, -0.1373729705810547, -0.13014602661132812, -0.12291908264160156, -0.115692138671875, -0.10846519470214844, -0.10123825073242188, -0.09401130676269531, -0.08678436279296875, -0.07955741882324219, -0.07233047485351562, -0.06510353088378906, -0.0578765869140625, -0.05064964294433594, -0.043422698974609375, -0.03619575500488281, -0.02896881103515625, -0.021741867065429688, -0.014514923095703125, -0.0072879791259765625, -6.103515625e-05, 0.0071659088134765625, 0.014392852783203125, 0.021619796752929688, 0.02884674072265625, 0.03607368469238281, 0.043300628662109375, 0.05052757263183594, 0.0577545166015625, 0.06498146057128906, 0.07220840454101562, 0.07943534851074219, 0.08666229248046875, 0.09388923645019531, 0.10111618041992188, 0.10834312438964844, 0.115570068359375, 0.12279701232910156, 0.13002395629882812, 0.1372509002685547, 0.14447784423828125, 0.1517047882080078, 0.15893173217773438, 0.16615867614746094, 0.1733856201171875, 0.18061256408691406, 0.18783950805664062, 0.1950664520263672, 0.20229339599609375, 0.2095203399658203, 0.21674728393554688, 0.22397422790527344, 0.231201171875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 1.0, 3.0, 4.0, 8.0, 10.0, 14.0, 10.0, 15.0, 11.0, 20.0, 29.0, 35.0, 35.0, 36.0, 45.0, 37.0, 46.0, 55.0, 56.0, 49.0, 63.0, 51.0, 48.0, 59.0, 39.0, 42.0, 34.0, 26.0, 18.0, 23.0, 11.0, 14.0, 15.0, 9.0, 9.0, 3.0, 5.0, 3.0, 4.0, 4.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09429931640625, -0.0912027359008789, -0.08810615539550781, -0.08500957489013672, -0.08191299438476562, -0.07881641387939453, -0.07571983337402344, -0.07262325286865234, -0.06952667236328125, -0.06643009185791016, -0.06333351135253906, -0.06023693084716797, -0.057140350341796875, -0.05404376983642578, -0.05094718933105469, -0.047850608825683594, -0.0447540283203125, -0.041657447814941406, -0.03856086730957031, -0.03546428680419922, -0.032367706298828125, -0.02927112579345703, -0.026174545288085938, -0.023077964782714844, -0.01998138427734375, -0.016884803771972656, -0.013788223266601562, -0.010691642761230469, -0.007595062255859375, -0.004498481750488281, -0.0014019012451171875, 0.0016946792602539062, 0.004791259765625, 0.007887840270996094, 0.010984420776367188, 0.014081001281738281, 0.017177581787109375, 0.02027416229248047, 0.023370742797851562, 0.026467323303222656, 0.02956390380859375, 0.032660484313964844, 0.03575706481933594, 0.03885364532470703, 0.041950225830078125, 0.04504680633544922, 0.04814338684082031, 0.051239967346191406, 0.0543365478515625, 0.057433128356933594, 0.06052970886230469, 0.06362628936767578, 0.06672286987304688, 0.06981945037841797, 0.07291603088378906, 0.07601261138916016, 0.07910919189453125, 0.08220577239990234, 0.08530235290527344, 0.08839893341064453, 0.09149551391601562, 0.09459209442138672, 0.09768867492675781, 0.1007852554321289, 0.1038818359375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 5.0, 6.0, 8.0, 8.0, 9.0, 10.0, 19.0, 10.0, 11.0, 22.0, 20.0, 23.0, 25.0, 34.0, 36.0, 58.0, 93.0, 139.0, 266.0, 1185.0, 16058.0, 479930.0, 530501.0, 17945.0, 1285.0, 329.0, 122.0, 85.0, 58.0, 33.0, 32.0, 28.0, 22.0, 17.0, 13.0, 15.0, 13.0, 14.0, 15.0, 9.0, 7.0, 4.0, 8.0, 5.0, 5.0, 5.0, 3.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.5068359375, -0.48995208740234375, -0.4730682373046875, -0.45618438720703125, -0.439300537109375, -0.42241668701171875, -0.4055328369140625, -0.38864898681640625, -0.37176513671875, -0.35488128662109375, -0.3379974365234375, -0.32111358642578125, -0.304229736328125, -0.28734588623046875, -0.2704620361328125, -0.25357818603515625, -0.2366943359375, -0.21981048583984375, -0.2029266357421875, -0.18604278564453125, -0.169158935546875, -0.15227508544921875, -0.1353912353515625, -0.11850738525390625, -0.10162353515625, -0.08473968505859375, -0.0678558349609375, -0.05097198486328125, -0.034088134765625, -0.01720428466796875, -0.0003204345703125, 0.01656341552734375, 0.033447265625, 0.05033111572265625, 0.0672149658203125, 0.08409881591796875, 0.100982666015625, 0.11786651611328125, 0.1347503662109375, 0.15163421630859375, 0.16851806640625, 0.18540191650390625, 0.2022857666015625, 0.21916961669921875, 0.236053466796875, 0.25293731689453125, 0.2698211669921875, 0.28670501708984375, 0.3035888671875, 0.32047271728515625, 0.3373565673828125, 0.35424041748046875, 0.371124267578125, 0.38800811767578125, 0.4048919677734375, 0.42177581787109375, 0.43865966796875, 0.45554351806640625, 0.4724273681640625, 0.48931121826171875, 0.506195068359375, 0.5230789184570312, 0.5399627685546875, 0.5568466186523438, 0.57373046875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 1.0, 8.0, 5.0, 8.0, 13.0, 12.0, 3.0, 10.0, 15.0, 9.0, 32.0, 12.0, 17.0, 20.0, 23.0, 25.0, 34.0, 32.0, 32.0, 34.0, 38.0, 30.0, 45.0, 42.0, 38.0, 34.0, 51.0, 40.0, 32.0, 36.0, 29.0, 31.0, 24.0, 24.0, 24.0, 15.0, 18.0, 11.0, 16.0, 20.0, 12.0, 9.0, 8.0, 7.0, 7.0, 7.0, 5.0, 6.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.1566162109375, -0.15169525146484375, -0.1467742919921875, -0.14185333251953125, -0.136932373046875, -0.13201141357421875, -0.1270904541015625, -0.12216949462890625, -0.11724853515625, -0.11232757568359375, -0.1074066162109375, -0.10248565673828125, -0.097564697265625, -0.09264373779296875, -0.0877227783203125, -0.08280181884765625, -0.077880859375, -0.07295989990234375, -0.0680389404296875, -0.06311798095703125, -0.058197021484375, -0.05327606201171875, -0.0483551025390625, -0.04343414306640625, -0.03851318359375, -0.03359222412109375, -0.0286712646484375, -0.02375030517578125, -0.018829345703125, -0.01390838623046875, -0.0089874267578125, -0.00406646728515625, 0.0008544921875, 0.00577545166015625, 0.0106964111328125, 0.01561737060546875, 0.020538330078125, 0.02545928955078125, 0.0303802490234375, 0.03530120849609375, 0.04022216796875, 0.04514312744140625, 0.0500640869140625, 0.05498504638671875, 0.059906005859375, 0.06482696533203125, 0.0697479248046875, 0.07466888427734375, 0.07958984375, 0.08451080322265625, 0.0894317626953125, 0.09435272216796875, 0.099273681640625, 0.10419464111328125, 0.1091156005859375, 0.11403656005859375, 0.11895751953125, 0.12387847900390625, 0.1287994384765625, 0.13372039794921875, 0.138641357421875, 0.14356231689453125, 0.1484832763671875, 0.15340423583984375, 0.1583251953125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 0.0, 7.0, 11.0, 20.0, 41.0, 62.0, 119.0, 266.0, 485.0, 1095.0, 2720.0, 7306.0, 26486.0, 143163.0, 606323.0, 209085.0, 36153.0, 9447.0, 3336.0, 1324.0, 549.0, 268.0, 126.0, 71.0, 40.0, 27.0, 14.0, 10.0, 0.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13134765625, -0.1279449462890625, -0.124542236328125, -0.1211395263671875, -0.11773681640625, -0.1143341064453125, -0.110931396484375, -0.1075286865234375, -0.1041259765625, -0.1007232666015625, -0.097320556640625, -0.0939178466796875, -0.09051513671875, -0.0871124267578125, -0.083709716796875, -0.0803070068359375, -0.076904296875, -0.0735015869140625, -0.070098876953125, -0.0666961669921875, -0.06329345703125, -0.0598907470703125, -0.056488037109375, -0.0530853271484375, -0.0496826171875, -0.0462799072265625, -0.042877197265625, -0.0394744873046875, -0.03607177734375, -0.0326690673828125, -0.029266357421875, -0.0258636474609375, -0.0224609375, -0.0190582275390625, -0.015655517578125, -0.0122528076171875, -0.00885009765625, -0.0054473876953125, -0.002044677734375, 0.0013580322265625, 0.0047607421875, 0.0081634521484375, 0.011566162109375, 0.0149688720703125, 0.01837158203125, 0.0217742919921875, 0.025177001953125, 0.0285797119140625, 0.031982421875, 0.0353851318359375, 0.038787841796875, 0.0421905517578125, 0.04559326171875, 0.0489959716796875, 0.052398681640625, 0.0558013916015625, 0.0592041015625, 0.0626068115234375, 0.066009521484375, 0.0694122314453125, 0.07281494140625, 0.0762176513671875, 0.079620361328125, 0.0830230712890625, 0.08642578125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 6.0, 1.0, 6.0, 9.0, 11.0, 12.0, 20.0, 26.0, 30.0, 75.0, 101.0, 123.0, 146.0, 110.0, 93.0, 87.0, 55.0, 30.0, 14.0, 15.0, 8.0, 8.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.341104507446289e-05, -1.2867152690887451e-05, -1.2323260307312012e-05, -1.1779367923736572e-05, -1.1235475540161133e-05, -1.0691583156585693e-05, -1.0147690773010254e-05, -9.603798389434814e-06, -9.059906005859375e-06, -8.516013622283936e-06, -7.972121238708496e-06, -7.428228855133057e-06, -6.884336471557617e-06, -6.340444087982178e-06, -5.796551704406738e-06, -5.252659320831299e-06, -4.708766937255859e-06, -4.16487455368042e-06, -3.6209821701049805e-06, -3.077089786529541e-06, -2.5331974029541016e-06, -1.989305019378662e-06, -1.4454126358032227e-06, -9.015202522277832e-07, -3.5762786865234375e-07, 1.862645149230957e-07, 7.301568984985352e-07, 1.2740492820739746e-06, 1.817941665649414e-06, 2.3618340492248535e-06, 2.905726432800293e-06, 3.4496188163757324e-06, 3.993511199951172e-06, 4.537403583526611e-06, 5.081295967102051e-06, 5.62518835067749e-06, 6.16908073425293e-06, 6.712973117828369e-06, 7.256865501403809e-06, 7.800757884979248e-06, 8.344650268554688e-06, 8.888542652130127e-06, 9.432435035705566e-06, 9.976327419281006e-06, 1.0520219802856445e-05, 1.1064112186431885e-05, 1.1608004570007324e-05, 1.2151896953582764e-05, 1.2695789337158203e-05, 1.3239681720733643e-05, 1.3783574104309082e-05, 1.4327466487884521e-05, 1.4871358871459961e-05, 1.54152512550354e-05, 1.595914363861084e-05, 1.650303602218628e-05, 1.704692840576172e-05, 1.7590820789337158e-05, 1.8134713172912598e-05, 1.8678605556488037e-05, 1.9222497940063477e-05, 1.9766390323638916e-05, 2.0310282707214355e-05, 2.0854175090789795e-05, 2.1398067474365234e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 7.0, 4.0, 8.0, 4.0, 15.0, 15.0, 19.0, 26.0, 39.0, 66.0, 117.0, 304.0, 2311.0, 83335.0, 923462.0, 36847.0, 1432.0, 268.0, 84.0, 64.0, 37.0, 26.0, 17.0, 14.0, 8.0, 12.0, 6.0, 3.0, 4.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2242431640625, -0.21732330322265625, -0.2104034423828125, -0.20348358154296875, -0.196563720703125, -0.18964385986328125, -0.1827239990234375, -0.17580413818359375, -0.16888427734375, -0.16196441650390625, -0.1550445556640625, -0.14812469482421875, -0.141204833984375, -0.13428497314453125, -0.1273651123046875, -0.12044525146484375, -0.113525390625, -0.10660552978515625, -0.0996856689453125, -0.09276580810546875, -0.085845947265625, -0.07892608642578125, -0.0720062255859375, -0.06508636474609375, -0.05816650390625, -0.05124664306640625, -0.0443267822265625, -0.03740692138671875, -0.030487060546875, -0.02356719970703125, -0.0166473388671875, -0.00972747802734375, -0.0028076171875, 0.00411224365234375, 0.0110321044921875, 0.01795196533203125, 0.024871826171875, 0.03179168701171875, 0.0387115478515625, 0.04563140869140625, 0.05255126953125, 0.05947113037109375, 0.0663909912109375, 0.07331085205078125, 0.080230712890625, 0.08715057373046875, 0.0940704345703125, 0.10099029541015625, 0.10791015625, 0.11483001708984375, 0.1217498779296875, 0.12866973876953125, 0.135589599609375, 0.14250946044921875, 0.1494293212890625, 0.15634918212890625, 0.16326904296875, 0.17018890380859375, 0.1771087646484375, 0.18402862548828125, 0.190948486328125, 0.19786834716796875, 0.2047882080078125, 0.21170806884765625, 0.2186279296875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 7.0, 10.0, 25.0, 19.0, 27.0, 41.0, 53.0, 56.0, 83.0, 84.0, 89.0, 106.0, 87.0, 70.0, 69.0, 45.0, 32.0, 25.0, 34.0, 15.0, 6.0, 9.0, 8.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0438232421875, -0.04207134246826172, -0.04031944274902344, -0.038567543029785156, -0.036815643310546875, -0.035063743591308594, -0.03331184387207031, -0.03155994415283203, -0.02980804443359375, -0.02805614471435547, -0.026304244995117188, -0.024552345275878906, -0.022800445556640625, -0.021048545837402344, -0.019296646118164062, -0.01754474639892578, -0.0157928466796875, -0.014040946960449219, -0.012289047241210938, -0.010537147521972656, -0.008785247802734375, -0.007033348083496094, -0.0052814483642578125, -0.0035295486450195312, -0.00177764892578125, -2.574920654296875e-05, 0.0017261505126953125, 0.0034780502319335938, 0.005229949951171875, 0.006981849670410156, 0.008733749389648438, 0.010485649108886719, 0.012237548828125, 0.013989448547363281, 0.015741348266601562, 0.017493247985839844, 0.019245147705078125, 0.020997047424316406, 0.022748947143554688, 0.02450084686279297, 0.02625274658203125, 0.02800464630126953, 0.029756546020507812, 0.031508445739746094, 0.033260345458984375, 0.035012245178222656, 0.03676414489746094, 0.03851604461669922, 0.0402679443359375, 0.04201984405517578, 0.04377174377441406, 0.045523643493652344, 0.047275543212890625, 0.049027442932128906, 0.05077934265136719, 0.05253124237060547, 0.05428314208984375, 0.05603504180908203, 0.05778694152832031, 0.059538841247558594, 0.061290740966796875, 0.06304264068603516, 0.06479454040527344, 0.06654644012451172, 0.06829833984375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 4.0, 3.0, 19.0, 31.0, 84.0, 163.0, 234.0, 216.0, 146.0, 63.0, 26.0, 15.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3232850730419159, -0.29352620244026184, -0.2637673318386078, -0.23400846123695374, -0.20424959063529968, -0.17449072003364563, -0.14473184943199158, -0.11497297883033752, -0.08521410822868347, -0.05545523762702942, -0.025696367025375366, 0.0040625035762786865, 0.03382137417793274, 0.06358024477958679, 0.09333911538124084, 0.1230979859828949, 0.15285685658454895, 0.182615727186203, 0.21237459778785706, 0.2421334683895111, 0.27189233899116516, 0.3016512095928192, 0.33141008019447327, 0.3611689507961273, 0.39092782139778137, 0.4206866919994354, 0.4504455626010895, 0.48020443320274353, 0.5099632740020752, 0.539722204208374, 0.5694810152053833, 0.5992399454116821, 0.6289987564086914, 0.6587576270103455, 0.6885164976119995, 0.7182753682136536, 0.7480342388153076, 0.7777931094169617, 0.8075519800186157, 0.8373108506202698, 0.8670697212219238, 0.8968285918235779, 0.9265874624252319, 0.956346333026886, 0.98610520362854, 1.0158641338348389, 1.0456229448318481, 1.0753817558288574, 1.1051406860351562, 1.134899616241455, 1.1646584272384644, 1.1944172382354736, 1.2241761684417725, 1.2539350986480713, 1.2836939096450806, 1.3134527206420898, 1.3432116508483887, 1.3729705810546875, 1.4027293920516968, 1.432488203048706, 1.4622471332550049, 1.4920060634613037, 1.521764874458313, 1.5515236854553223, 1.581282615661621]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 7.0, 3.0, 1.0, 8.0, 9.0, 2.0, 17.0, 10.0, 21.0, 19.0, 13.0, 22.0, 27.0, 20.0, 33.0, 36.0, 30.0, 40.0, 40.0, 40.0, 27.0, 33.0, 39.0, 50.0, 42.0, 36.0, 29.0, 30.0, 32.0, 41.0, 29.0, 23.0, 28.0, 30.0, 16.0, 21.0, 12.0, 16.0, 17.0, 5.0, 14.0, 7.0, 3.0, 7.0, 6.0, 3.0, 4.0, 5.0, 2.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0], "bins": [-0.6098813414573669, -0.5910165309906006, -0.5721517205238342, -0.5532869100570679, -0.5344221591949463, -0.5155573487281799, -0.4966925382614136, -0.4778277277946472, -0.45896291732788086, -0.4400981068611145, -0.42123329639434814, -0.4023685157299042, -0.3835037052631378, -0.36463889479637146, -0.3457741141319275, -0.32690930366516113, -0.3080444931983948, -0.2891796827316284, -0.27031487226486206, -0.2514500916004181, -0.23258528113365173, -0.21372047066688538, -0.1948556751012802, -0.17599087953567505, -0.1571260690689087, -0.13826125860214233, -0.11939646303653717, -0.10053166002035141, -0.08166685700416565, -0.06280205398797989, -0.04393725097179413, -0.025072455406188965, -0.006207644939422607, 0.012657158076763153, 0.031521961092948914, 0.050386764109134674, 0.06925156712532043, 0.0881163701415062, 0.10698117315769196, 0.12584596872329712, 0.14471077919006348, 0.16357558965682983, 0.182440385222435, 0.20130518078804016, 0.22016999125480652, 0.23903480172157288, 0.25789958238601685, 0.2767643928527832, 0.29562920331954956, 0.3144940137863159, 0.3333588242530823, 0.35222360491752625, 0.3710884153842926, 0.38995322585105896, 0.40881800651550293, 0.4276828169822693, 0.44654762744903564, 0.465412437915802, 0.48427724838256836, 0.5031420588493347, 0.5220068693161011, 0.5408716201782227, 0.559736430644989, 0.5786012411117554, 0.5974660515785217]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 1.0, 3.0, 7.0, 7.0, 18.0, 10.0, 20.0, 21.0, 28.0, 44.0, 57.0, 79.0, 126.0, 168.0, 239.0, 377.0, 556.0, 946.0, 2050.0, 5797.0, 25683.0, 305619.0, 3390528.0, 417787.0, 32126.0, 6781.0, 2378.0, 1097.0, 593.0, 339.0, 220.0, 166.0, 109.0, 89.0, 53.0, 42.0, 30.0, 26.0, 17.0, 12.0, 10.0, 8.0, 6.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.2939453125, -0.2851829528808594, -0.27642059326171875, -0.2676582336425781, -0.2588958740234375, -0.2501335144042969, -0.24137115478515625, -0.23260879516601562, -0.223846435546875, -0.21508407592773438, -0.20632171630859375, -0.19755935668945312, -0.1887969970703125, -0.18003463745117188, -0.17127227783203125, -0.16250991821289062, -0.15374755859375, -0.14498519897460938, -0.13622283935546875, -0.12746047973632812, -0.1186981201171875, -0.10993576049804688, -0.10117340087890625, -0.09241104125976562, -0.083648681640625, -0.07488632202148438, -0.06612396240234375, -0.057361602783203125, -0.0485992431640625, -0.039836883544921875, -0.03107452392578125, -0.022312164306640625, -0.0135498046875, -0.004787445068359375, 0.00397491455078125, 0.012737274169921875, 0.0214996337890625, 0.030261993408203125, 0.03902435302734375, 0.047786712646484375, 0.056549072265625, 0.06531143188476562, 0.07407379150390625, 0.08283615112304688, 0.0915985107421875, 0.10036087036132812, 0.10912322998046875, 0.11788558959960938, 0.12664794921875, 0.13541030883789062, 0.14417266845703125, 0.15293502807617188, 0.1616973876953125, 0.17045974731445312, 0.17922210693359375, 0.18798446655273438, 0.196746826171875, 0.20550918579101562, 0.21427154541015625, 0.22303390502929688, 0.2317962646484375, 0.24055862426757812, 0.24932098388671875, 0.2580833435058594, 0.266845703125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 5.0, 3.0, 4.0, 6.0, 8.0, 11.0, 11.0, 12.0, 15.0, 34.0, 15.0, 31.0, 37.0, 39.0, 45.0, 39.0, 54.0, 51.0, 44.0, 63.0, 66.0, 53.0, 41.0, 56.0, 53.0, 41.0, 31.0, 28.0, 17.0, 17.0, 19.0, 13.0, 11.0, 7.0, 8.0, 5.0, 3.0, 1.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08782958984375, -0.08483695983886719, -0.08184432983398438, -0.07885169982910156, -0.07585906982421875, -0.07286643981933594, -0.06987380981445312, -0.06688117980957031, -0.0638885498046875, -0.06089591979980469, -0.057903289794921875, -0.05491065979003906, -0.05191802978515625, -0.04892539978027344, -0.045932769775390625, -0.04294013977050781, -0.039947509765625, -0.03695487976074219, -0.033962249755859375, -0.030969619750976562, -0.02797698974609375, -0.024984359741210938, -0.021991729736328125, -0.018999099731445312, -0.0160064697265625, -0.013013839721679688, -0.010021209716796875, -0.0070285797119140625, -0.00403594970703125, -0.0010433197021484375, 0.001949310302734375, 0.0049419403076171875, 0.0079345703125, 0.010927200317382812, 0.013919830322265625, 0.016912460327148438, 0.01990509033203125, 0.022897720336914062, 0.025890350341796875, 0.028882980346679688, 0.0318756103515625, 0.03486824035644531, 0.037860870361328125, 0.04085350036621094, 0.04384613037109375, 0.04683876037597656, 0.049831390380859375, 0.05282402038574219, 0.055816650390625, 0.05880928039550781, 0.061801910400390625, 0.06479454040527344, 0.06778717041015625, 0.07077980041503906, 0.07377243041992188, 0.07676506042480469, 0.0797576904296875, 0.08275032043457031, 0.08574295043945312, 0.08873558044433594, 0.09172821044921875, 0.09472084045410156, 0.09771347045898438, 0.10070610046386719, 0.10369873046875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 6.0, 10.0, 6.0, 15.0, 19.0, 10.0, 37.0, 51.0, 88.0, 128.0, 215.0, 355.0, 726.0, 1883.0, 5729.0, 22708.0, 122295.0, 873532.0, 2567913.0, 502562.0, 74163.0, 14919.0, 4112.0, 1475.0, 565.0, 261.0, 163.0, 120.0, 68.0, 40.0, 31.0, 22.0, 20.0, 7.0, 9.0, 6.0, 7.0, 6.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2008056640625, -0.1928882598876953, -0.18497085571289062, -0.17705345153808594, -0.16913604736328125, -0.16121864318847656, -0.15330123901367188, -0.1453838348388672, -0.1374664306640625, -0.1295490264892578, -0.12163162231445312, -0.11371421813964844, -0.10579681396484375, -0.09787940979003906, -0.08996200561523438, -0.08204460144042969, -0.074127197265625, -0.06620979309082031, -0.058292388916015625, -0.05037498474121094, -0.04245758056640625, -0.03454017639160156, -0.026622772216796875, -0.018705368041992188, -0.0107879638671875, -0.0028705596923828125, 0.005046844482421875, 0.012964248657226562, 0.02088165283203125, 0.028799057006835938, 0.036716461181640625, 0.04463386535644531, 0.05255126953125, 0.06046867370605469, 0.06838607788085938, 0.07630348205566406, 0.08422088623046875, 0.09213829040527344, 0.10005569458007812, 0.10797309875488281, 0.1158905029296875, 0.12380790710449219, 0.13172531127929688, 0.13964271545410156, 0.14756011962890625, 0.15547752380371094, 0.16339492797851562, 0.1713123321533203, 0.179229736328125, 0.1871471405029297, 0.19506454467773438, 0.20298194885253906, 0.21089935302734375, 0.21881675720214844, 0.22673416137695312, 0.2346515655517578, 0.2425689697265625, 0.2504863739013672, 0.2584037780761719, 0.26632118225097656, 0.27423858642578125, 0.28215599060058594, 0.2900733947753906, 0.2979907989501953, 0.305908203125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 3.0, 5.0, 6.0, 6.0, 15.0, 12.0, 14.0, 18.0, 31.0, 48.0, 33.0, 58.0, 72.0, 81.0, 123.0, 162.0, 197.0, 267.0, 261.0, 343.0, 422.0, 365.0, 301.0, 254.0, 165.0, 169.0, 125.0, 125.0, 74.0, 66.0, 51.0, 46.0, 31.0, 22.0, 29.0, 9.0, 20.0, 13.0, 12.0, 6.0, 2.0, 4.0, 1.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.079833984375, -0.0769510269165039, -0.07406806945800781, -0.07118511199951172, -0.06830215454101562, -0.06541919708251953, -0.06253623962402344, -0.059653282165527344, -0.05677032470703125, -0.053887367248535156, -0.05100440979003906, -0.04812145233154297, -0.045238494873046875, -0.04235553741455078, -0.03947257995605469, -0.036589622497558594, -0.0337066650390625, -0.030823707580566406, -0.027940750122070312, -0.02505779266357422, -0.022174835205078125, -0.01929187774658203, -0.016408920288085938, -0.013525962829589844, -0.01064300537109375, -0.007760047912597656, -0.0048770904541015625, -0.0019941329956054688, 0.000888824462890625, 0.0037717819213867188, 0.0066547393798828125, 0.009537696838378906, 0.012420654296875, 0.015303611755371094, 0.018186569213867188, 0.02106952667236328, 0.023952484130859375, 0.02683544158935547, 0.029718399047851562, 0.032601356506347656, 0.03548431396484375, 0.038367271423339844, 0.04125022888183594, 0.04413318634033203, 0.047016143798828125, 0.04989910125732422, 0.05278205871582031, 0.055665016174316406, 0.0585479736328125, 0.061430931091308594, 0.06431388854980469, 0.06719684600830078, 0.07007980346679688, 0.07296276092529297, 0.07584571838378906, 0.07872867584228516, 0.08161163330078125, 0.08449459075927734, 0.08737754821777344, 0.09026050567626953, 0.09314346313476562, 0.09602642059326172, 0.09890937805175781, 0.1017923355102539, 0.10467529296875]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 8.0, 12.0, 28.0, 53.0, 87.0, 132.0, 168.0, 175.0, 147.0, 90.0, 50.0, 29.0, 8.0, 9.0, 6.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.084836721420288, -1.0564169883728027, -1.0279972553253174, -0.999577522277832, -0.9711577892303467, -0.9427380561828613, -0.9143182635307312, -0.8858985304832458, -0.8574787974357605, -0.8290590643882751, -0.8006393313407898, -0.7722195982933044, -0.7437998056411743, -0.715380072593689, -0.6869603395462036, -0.6585406064987183, -0.6301208734512329, -0.6017011404037476, -0.5732814073562622, -0.5448616743087769, -0.5164419412612915, -0.48802217841148376, -0.459602415561676, -0.4311826825141907, -0.4027629494667053, -0.37434321641921997, -0.3459234833717346, -0.3175037205219269, -0.28908398747444153, -0.2606642544269562, -0.23224450647830963, -0.20382475852966309, -0.1754050850868225, -0.14698535203933716, -0.11856560409069061, -0.09014586359262466, -0.061726123094558716, -0.033306390047073364, -0.004886642098426819, 0.023533105850219727, 0.05195283889770508, 0.08037257939577103, 0.10879231989383698, 0.13721206784248352, 0.16563180088996887, 0.19405153393745422, 0.22247128188610077, 0.2508910298347473, 0.27931076288223267, 0.307730495929718, 0.33615022897720337, 0.3645699918270111, 0.39298972487449646, 0.4214094579219818, 0.44982922077178955, 0.4782489538192749, 0.5066686868667603, 0.5350884199142456, 0.563508152961731, 0.5919278860092163, 0.6203476190567017, 0.648767352104187, 0.6771871447563171, 0.7056068778038025, 0.7340266108512878]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 9.0, 1.0, 3.0, 8.0, 9.0, 13.0, 15.0, 26.0, 14.0, 29.0, 20.0, 30.0, 38.0, 27.0, 36.0, 22.0, 44.0, 49.0, 42.0, 36.0, 43.0, 42.0, 44.0, 37.0, 41.0, 43.0, 39.0, 30.0, 35.0, 27.0, 19.0, 25.0, 11.0, 18.0, 11.0, 14.0, 12.0, 13.0, 7.0, 7.0, 4.0, 6.0, 5.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.404066801071167, -0.39333009719848633, -0.3825933635234833, -0.3718566298484802, -0.36111992597579956, -0.3503832221031189, -0.33964648842811584, -0.3289097547531128, -0.31817305088043213, -0.30743634700775146, -0.2966996133327484, -0.28596287965774536, -0.2752261757850647, -0.26448947191238403, -0.253752738237381, -0.24301601946353912, -0.23227930068969727, -0.2215425819158554, -0.21080586314201355, -0.2000691443681717, -0.18933242559432983, -0.17859570682048798, -0.16785898804664612, -0.15712226927280426, -0.1463855504989624, -0.13564883172512054, -0.12491211295127869, -0.11417539417743683, -0.10343867540359497, -0.09270195662975311, -0.08196523785591125, -0.0712285190820694, -0.06049180030822754, -0.04975508153438568, -0.03901836276054382, -0.028281643986701965, -0.017544925212860107, -0.0068082064390182495, 0.003928512334823608, 0.014665231108665466, 0.025401949882507324, 0.03613866865634918, 0.04687538743019104, 0.0576121062040329, 0.06834882497787476, 0.07908554375171661, 0.08982226252555847, 0.10055898129940033, 0.11129570007324219, 0.12203241884708405, 0.1327691376209259, 0.14350585639476776, 0.15424257516860962, 0.16497929394245148, 0.17571601271629333, 0.1864527314901352, 0.19718945026397705, 0.2079261690378189, 0.21866288781166077, 0.22939960658550262, 0.24013632535934448, 0.25087302923202515, 0.2616097629070282, 0.27234649658203125, 0.2830832004547119]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 5.0, 6.0, 2.0, 1.0, 0.0, 4.0, 9.0, 3.0, 9.0, 7.0, 14.0, 13.0, 24.0, 62.0, 80.0, 172.0, 321.0, 632.0, 1472.0, 3548.0, 9431.0, 29977.0, 135445.0, 497043.0, 286490.0, 58308.0, 15739.0, 5557.0, 2192.0, 1014.0, 453.0, 212.0, 112.0, 61.0, 36.0, 26.0, 19.0, 20.0, 10.0, 7.0, 4.0, 4.0, 4.0, 4.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.318115234375, -0.3062171936035156, -0.29431915283203125, -0.2824211120605469, -0.2705230712890625, -0.2586250305175781, -0.24672698974609375, -0.23482894897460938, -0.222930908203125, -0.21103286743164062, -0.19913482666015625, -0.18723678588867188, -0.1753387451171875, -0.16344070434570312, -0.15154266357421875, -0.13964462280273438, -0.12774658203125, -0.11584854125976562, -0.10395050048828125, -0.09205245971679688, -0.0801544189453125, -0.06825637817382812, -0.05635833740234375, -0.044460296630859375, -0.032562255859375, -0.020664215087890625, -0.00876617431640625, 0.003131866455078125, 0.0150299072265625, 0.026927947998046875, 0.03882598876953125, 0.050724029541015625, 0.0626220703125, 0.07452011108398438, 0.08641815185546875, 0.09831619262695312, 0.1102142333984375, 0.12211227416992188, 0.13401031494140625, 0.14590835571289062, 0.157806396484375, 0.16970443725585938, 0.18160247802734375, 0.19350051879882812, 0.2053985595703125, 0.21729660034179688, 0.22919464111328125, 0.24109268188476562, 0.25299072265625, 0.2648887634277344, 0.27678680419921875, 0.2886848449707031, 0.3005828857421875, 0.3124809265136719, 0.32437896728515625, 0.3362770080566406, 0.348175048828125, 0.3600730895996094, 0.37197113037109375, 0.3838691711425781, 0.3957672119140625, 0.4076652526855469, 0.41956329345703125, 0.4314613342285156, 0.443359375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 5.0, 12.0, 14.0, 19.0, 23.0, 25.0, 24.0, 34.0, 36.0, 43.0, 52.0, 57.0, 63.0, 71.0, 61.0, 64.0, 53.0, 66.0, 49.0, 50.0, 37.0, 27.0, 27.0, 18.0, 16.0, 14.0, 10.0, 5.0, 7.0, 4.0, 6.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11376953125, -0.11033821105957031, -0.10690689086914062, -0.10347557067871094, -0.10004425048828125, -0.09661293029785156, -0.09318161010742188, -0.08975028991699219, -0.0863189697265625, -0.08288764953613281, -0.07945632934570312, -0.07602500915527344, -0.07259368896484375, -0.06916236877441406, -0.06573104858398438, -0.06229972839355469, -0.058868408203125, -0.05543708801269531, -0.052005767822265625, -0.04857444763183594, -0.04514312744140625, -0.04171180725097656, -0.038280487060546875, -0.03484916687011719, -0.0314178466796875, -0.027986526489257812, -0.024555206298828125, -0.021123886108398438, -0.01769256591796875, -0.014261245727539062, -0.010829925537109375, -0.0073986053466796875, -0.00396728515625, -0.0005359649658203125, 0.002895355224609375, 0.0063266754150390625, 0.00975799560546875, 0.013189315795898438, 0.016620635986328125, 0.020051956176757812, 0.0234832763671875, 0.026914596557617188, 0.030345916748046875, 0.03377723693847656, 0.03720855712890625, 0.04063987731933594, 0.044071197509765625, 0.04750251770019531, 0.050933837890625, 0.05436515808105469, 0.057796478271484375, 0.06122779846191406, 0.06465911865234375, 0.06809043884277344, 0.07152175903320312, 0.07495307922363281, 0.0783843994140625, 0.08181571960449219, 0.08524703979492188, 0.08867835998535156, 0.09210968017578125, 0.09554100036621094, 0.09897232055664062, 0.10240364074707031, 0.1058349609375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 3.0, 2.0, 6.0, 3.0, 6.0, 13.0, 12.0, 16.0, 17.0, 37.0, 49.0, 74.0, 146.0, 281.0, 712.0, 1947.0, 5726.0, 20231.0, 117076.0, 553569.0, 291371.0, 41947.0, 9976.0, 3192.0, 1154.0, 460.0, 201.0, 114.0, 63.0, 31.0, 34.0, 14.0, 15.0, 8.0, 10.0, 10.0, 6.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.4228515625, -0.4095268249511719, -0.39620208740234375, -0.3828773498535156, -0.3695526123046875, -0.3562278747558594, -0.34290313720703125, -0.3295783996582031, -0.316253662109375, -0.3029289245605469, -0.28960418701171875, -0.2762794494628906, -0.2629547119140625, -0.24962997436523438, -0.23630523681640625, -0.22298049926757812, -0.20965576171875, -0.19633102416992188, -0.18300628662109375, -0.16968154907226562, -0.1563568115234375, -0.14303207397460938, -0.12970733642578125, -0.11638259887695312, -0.103057861328125, -0.08973312377929688, -0.07640838623046875, -0.06308364868164062, -0.0497589111328125, -0.036434173583984375, -0.02310943603515625, -0.009784698486328125, 0.0035400390625, 0.016864776611328125, 0.03018951416015625, 0.043514251708984375, 0.0568389892578125, 0.07016372680664062, 0.08348846435546875, 0.09681320190429688, 0.110137939453125, 0.12346267700195312, 0.13678741455078125, 0.15011215209960938, 0.1634368896484375, 0.17676162719726562, 0.19008636474609375, 0.20341110229492188, 0.21673583984375, 0.23006057739257812, 0.24338531494140625, 0.2567100524902344, 0.2700347900390625, 0.2833595275878906, 0.29668426513671875, 0.3100090026855469, 0.323333740234375, 0.3366584777832031, 0.34998321533203125, 0.3633079528808594, 0.3766326904296875, 0.3899574279785156, 0.40328216552734375, 0.4166069030761719, 0.429931640625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 5.0, 10.0, 5.0, 10.0, 11.0, 17.0, 20.0, 19.0, 25.0, 25.0, 23.0, 44.0, 34.0, 55.0, 50.0, 47.0, 38.0, 47.0, 56.0, 66.0, 41.0, 39.0, 53.0, 46.0, 33.0, 32.0, 26.0, 25.0, 19.0, 12.0, 12.0, 10.0, 10.0, 8.0, 13.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.203857421875, -0.19766998291015625, -0.1914825439453125, -0.18529510498046875, -0.179107666015625, -0.17292022705078125, -0.1667327880859375, -0.16054534912109375, -0.15435791015625, -0.14817047119140625, -0.1419830322265625, -0.13579559326171875, -0.129608154296875, -0.12342071533203125, -0.1172332763671875, -0.11104583740234375, -0.1048583984375, -0.09867095947265625, -0.0924835205078125, -0.08629608154296875, -0.080108642578125, -0.07392120361328125, -0.0677337646484375, -0.06154632568359375, -0.05535888671875, -0.04917144775390625, -0.0429840087890625, -0.03679656982421875, -0.030609130859375, -0.02442169189453125, -0.0182342529296875, -0.01204681396484375, -0.005859375, 0.00032806396484375, 0.0065155029296875, 0.01270294189453125, 0.018890380859375, 0.02507781982421875, 0.0312652587890625, 0.03745269775390625, 0.04364013671875, 0.04982757568359375, 0.0560150146484375, 0.06220245361328125, 0.068389892578125, 0.07457733154296875, 0.0807647705078125, 0.08695220947265625, 0.0931396484375, 0.09932708740234375, 0.1055145263671875, 0.11170196533203125, 0.117889404296875, 0.12407684326171875, 0.1302642822265625, 0.13645172119140625, 0.14263916015625, 0.14882659912109375, 0.1550140380859375, 0.16120147705078125, 0.167388916015625, 0.17357635498046875, 0.1797637939453125, 0.18595123291015625, 0.192138671875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 8.0, 8.0, 23.0, 40.0, 87.0, 138.0, 222.0, 448.0, 837.0, 1653.0, 3475.0, 8280.0, 26240.0, 200426.0, 694897.0, 83456.0, 17076.0, 5912.0, 2580.0, 1272.0, 632.0, 376.0, 194.0, 127.0, 57.0, 32.0, 14.0, 13.0, 11.0, 9.0, 3.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.253173828125, -0.24232101440429688, -0.23146820068359375, -0.22061538696289062, -0.2097625732421875, -0.19890975952148438, -0.18805694580078125, -0.17720413208007812, -0.166351318359375, -0.15549850463867188, -0.14464569091796875, -0.13379287719726562, -0.1229400634765625, -0.11208724975585938, -0.10123443603515625, -0.09038162231445312, -0.07952880859375, -0.06867599487304688, -0.05782318115234375, -0.046970367431640625, -0.0361175537109375, -0.025264739990234375, -0.01441192626953125, -0.003559112548828125, 0.007293701171875, 0.018146514892578125, 0.02899932861328125, 0.039852142333984375, 0.0507049560546875, 0.061557769775390625, 0.07241058349609375, 0.08326339721679688, 0.0941162109375, 0.10496902465820312, 0.11582183837890625, 0.12667465209960938, 0.1375274658203125, 0.14838027954101562, 0.15923309326171875, 0.17008590698242188, 0.180938720703125, 0.19179153442382812, 0.20264434814453125, 0.21349716186523438, 0.2243499755859375, 0.23520278930664062, 0.24605560302734375, 0.2569084167480469, 0.26776123046875, 0.2786140441894531, 0.28946685791015625, 0.3003196716308594, 0.3111724853515625, 0.3220252990722656, 0.33287811279296875, 0.3437309265136719, 0.354583740234375, 0.3654365539550781, 0.37628936767578125, 0.3871421813964844, 0.3979949951171875, 0.4088478088378906, 0.41970062255859375, 0.4305534362792969, 0.44140625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 6.0, 1.0, 4.0, 8.0, 6.0, 9.0, 12.0, 13.0, 19.0, 44.0, 68.0, 128.0, 157.0, 197.0, 143.0, 84.0, 38.0, 11.0, 9.0, 7.0, 8.0, 12.0, 1.0, 2.0, 6.0, 1.0, 3.0, 3.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.1113624572753906e-05, -3.0081719160079956e-05, -2.9049813747406006e-05, -2.8017908334732056e-05, -2.6986002922058105e-05, -2.5954097509384155e-05, -2.4922192096710205e-05, -2.3890286684036255e-05, -2.2858381271362305e-05, -2.1826475858688354e-05, -2.0794570446014404e-05, -1.9762665033340454e-05, -1.8730759620666504e-05, -1.7698854207992554e-05, -1.6666948795318604e-05, -1.5635043382644653e-05, -1.4603137969970703e-05, -1.3571232557296753e-05, -1.2539327144622803e-05, -1.1507421731948853e-05, -1.0475516319274902e-05, -9.443610906600952e-06, -8.411705493927002e-06, -7.379800081253052e-06, -6.3478946685791016e-06, -5.315989255905151e-06, -4.284083843231201e-06, -3.252178430557251e-06, -2.2202730178833008e-06, -1.1883676052093506e-06, -1.564621925354004e-07, 8.754432201385498e-07, 1.9073486328125e-06, 2.93925404548645e-06, 3.9711594581604e-06, 5.003064870834351e-06, 6.034970283508301e-06, 7.066875696182251e-06, 8.098781108856201e-06, 9.130686521530151e-06, 1.0162591934204102e-05, 1.1194497346878052e-05, 1.2226402759552002e-05, 1.3258308172225952e-05, 1.4290213584899902e-05, 1.5322118997573853e-05, 1.6354024410247803e-05, 1.7385929822921753e-05, 1.8417835235595703e-05, 1.9449740648269653e-05, 2.0481646060943604e-05, 2.1513551473617554e-05, 2.2545456886291504e-05, 2.3577362298965454e-05, 2.4609267711639404e-05, 2.5641173124313354e-05, 2.6673078536987305e-05, 2.7704983949661255e-05, 2.8736889362335205e-05, 2.9768794775009155e-05, 3.0800700187683105e-05, 3.1832605600357056e-05, 3.2864511013031006e-05, 3.3896416425704956e-05, 3.4928321838378906e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 3.0, 7.0, 12.0, 11.0, 15.0, 17.0, 24.0, 41.0, 56.0, 110.0, 175.0, 333.0, 644.0, 1401.0, 3212.0, 8328.0, 24966.0, 110449.0, 472963.0, 333340.0, 64731.0, 16945.0, 6073.0, 2431.0, 1093.0, 515.0, 260.0, 144.0, 76.0, 50.0, 32.0, 26.0, 13.0, 12.0, 13.0, 10.0, 8.0, 1.0, 3.0, 4.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0], "bins": [-0.2196044921875, -0.2133007049560547, -0.20699691772460938, -0.20069313049316406, -0.19438934326171875, -0.18808555603027344, -0.18178176879882812, -0.1754779815673828, -0.1691741943359375, -0.1628704071044922, -0.15656661987304688, -0.15026283264160156, -0.14395904541015625, -0.13765525817871094, -0.13135147094726562, -0.1250476837158203, -0.118743896484375, -0.11244010925292969, -0.10613632202148438, -0.09983253479003906, -0.09352874755859375, -0.08722496032714844, -0.08092117309570312, -0.07461738586425781, -0.0683135986328125, -0.06200981140136719, -0.055706024169921875, -0.04940223693847656, -0.04309844970703125, -0.03679466247558594, -0.030490875244140625, -0.024187088012695312, -0.01788330078125, -0.011579513549804688, -0.005275726318359375, 0.0010280609130859375, 0.00733184814453125, 0.013635635375976562, 0.019939422607421875, 0.026243209838867188, 0.0325469970703125, 0.03885078430175781, 0.045154571533203125, 0.05145835876464844, 0.05776214599609375, 0.06406593322753906, 0.07036972045898438, 0.07667350769042969, 0.082977294921875, 0.08928108215332031, 0.09558486938476562, 0.10188865661621094, 0.10819244384765625, 0.11449623107910156, 0.12080001831054688, 0.1271038055419922, 0.1334075927734375, 0.1397113800048828, 0.14601516723632812, 0.15231895446777344, 0.15862274169921875, 0.16492652893066406, 0.17123031616210938, 0.1775341033935547, 0.183837890625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 5.0, 3.0, 2.0, 3.0, 4.0, 4.0, 6.0, 5.0, 15.0, 11.0, 20.0, 21.0, 27.0, 52.0, 63.0, 70.0, 84.0, 117.0, 106.0, 96.0, 64.0, 49.0, 43.0, 31.0, 27.0, 10.0, 11.0, 17.0, 7.0, 7.0, 8.0, 3.0, 6.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0], "bins": [-0.12371826171875, -0.12010383605957031, -0.11648941040039062, -0.11287498474121094, -0.10926055908203125, -0.10564613342285156, -0.10203170776367188, -0.09841728210449219, -0.0948028564453125, -0.09118843078613281, -0.08757400512695312, -0.08395957946777344, -0.08034515380859375, -0.07673072814941406, -0.07311630249023438, -0.06950187683105469, -0.065887451171875, -0.06227302551269531, -0.058658599853515625, -0.05504417419433594, -0.05142974853515625, -0.04781532287597656, -0.044200897216796875, -0.04058647155761719, -0.0369720458984375, -0.03335762023925781, -0.029743194580078125, -0.026128768920898438, -0.02251434326171875, -0.018899917602539062, -0.015285491943359375, -0.011671066284179688, -0.008056640625, -0.0044422149658203125, -0.000827789306640625, 0.0027866363525390625, 0.00640106201171875, 0.010015487670898438, 0.013629913330078125, 0.017244338989257812, 0.0208587646484375, 0.024473190307617188, 0.028087615966796875, 0.03170204162597656, 0.03531646728515625, 0.03893089294433594, 0.042545318603515625, 0.04615974426269531, 0.049774169921875, 0.05338859558105469, 0.057003021240234375, 0.06061744689941406, 0.06423187255859375, 0.06784629821777344, 0.07146072387695312, 0.07507514953613281, 0.0786895751953125, 0.08230400085449219, 0.08591842651367188, 0.08953285217285156, 0.09314727783203125, 0.09676170349121094, 0.10037612915039062, 0.10399055480957031, 0.10760498046875]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 2.0, 13.0, 24.0, 28.0, 52.0, 72.0, 78.0, 111.0, 99.0, 123.0, 97.0, 83.0, 64.0, 52.0, 27.0, 29.0, 14.0, 9.0, 1.0, 4.0, 7.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7169004678726196, -0.6929519176483154, -0.6690033078193665, -0.6450547575950623, -0.6211062073707581, -0.5971575975418091, -0.5732090473175049, -0.5492604970932007, -0.5253118872642517, -0.5013633370399475, -0.4774147570133209, -0.45346617698669434, -0.42951759696006775, -0.40556901693344116, -0.38162046670913696, -0.3576718866825104, -0.3337233364582062, -0.3097747564315796, -0.2858262062072754, -0.2618776261806488, -0.23792904615402222, -0.21398048102855682, -0.19003191590309143, -0.16608333587646484, -0.14213477075099945, -0.11818619817495346, -0.09423762559890747, -0.07028906047344208, -0.04634048789739609, -0.022391915321350098, 0.0015566498041152954, 0.025505229830741882, 0.049453794956207275, 0.07340236753225327, 0.09735094010829926, 0.12129950523376465, 0.14524808526039124, 0.16919665038585663, 0.19314521551132202, 0.2170937955379486, 0.241042360663414, 0.2649909257888794, 0.288939505815506, 0.31288808584213257, 0.33683663606643677, 0.36078521609306335, 0.38473379611968994, 0.40868234634399414, 0.4326309263706207, 0.4565795063972473, 0.4805280566215515, 0.5044766664505005, 0.5284252166748047, 0.5523737668991089, 0.5763223171234131, 0.6002709269523621, 0.6242194771766663, 0.6481680274009705, 0.6721166372299194, 0.6960651874542236, 0.7200137376785278, 0.7439623475074768, 0.767910897731781, 0.79185950756073, 0.8158080577850342]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 1.0, 4.0, 4.0, 5.0, 6.0, 10.0, 13.0, 15.0, 11.0, 25.0, 27.0, 20.0, 28.0, 34.0, 21.0, 37.0, 31.0, 24.0, 32.0, 43.0, 35.0, 44.0, 38.0, 49.0, 40.0, 42.0, 29.0, 39.0, 35.0, 32.0, 34.0, 27.0, 24.0, 21.0, 20.0, 14.0, 10.0, 14.0, 10.0, 18.0, 11.0, 8.0, 2.0, 3.0, 2.0, 3.0, 6.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.481259822845459, -0.46627500653266907, -0.45129022002220154, -0.4363054037094116, -0.4213206171989441, -0.4063358008861542, -0.39135098457336426, -0.37636619806289673, -0.3613813817501068, -0.3463965654373169, -0.33141177892684937, -0.31642696261405945, -0.30144214630126953, -0.286457359790802, -0.2714725434780121, -0.25648772716522217, -0.24150294065475464, -0.22651813924312592, -0.2115333378314972, -0.19654852151870728, -0.18156372010707855, -0.16657891869544983, -0.1515941023826599, -0.1366093009710312, -0.12162449955940247, -0.10663969814777374, -0.09165488928556442, -0.0766700804233551, -0.06168527901172638, -0.046700477600097656, -0.031715668737888336, -0.016730859875679016, -0.001746058464050293, 0.013238746672868729, 0.02822355180978775, 0.04320835694670677, 0.05819316208362579, 0.07317796349525452, 0.08816277235746384, 0.10314758121967316, 0.11813238263130188, 0.1331171840429306, 0.14810198545455933, 0.16308680176734924, 0.17807160317897797, 0.1930564045906067, 0.2080412209033966, 0.22302602231502533, 0.23801082372665405, 0.25299564003944397, 0.2679804265499115, 0.2829652428627014, 0.29795002937316895, 0.31293484568595886, 0.3279196619987488, 0.3429044485092163, 0.3578892648220062, 0.37287408113479614, 0.38785886764526367, 0.4028436839580536, 0.4178285002708435, 0.43281328678131104, 0.44779810309410095, 0.46278291940689087, 0.4777677059173584]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 5.0, 6.0, 4.0, 17.0, 17.0, 27.0, 42.0, 65.0, 94.0, 133.0, 217.0, 381.0, 650.0, 1338.0, 3052.0, 9677.0, 43827.0, 408569.0, 2840694.0, 793488.0, 70450.0, 14057.0, 4177.0, 1670.0, 754.0, 381.0, 201.0, 122.0, 62.0, 44.0, 29.0, 15.0, 8.0, 3.0, 4.0, 5.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.279052734375, -0.27234840393066406, -0.2656440734863281, -0.2589397430419922, -0.25223541259765625, -0.2455310821533203, -0.23882675170898438, -0.23212242126464844, -0.2254180908203125, -0.21871376037597656, -0.21200942993164062, -0.2053050994873047, -0.19860076904296875, -0.1918964385986328, -0.18519210815429688, -0.17848777770996094, -0.171783447265625, -0.16507911682128906, -0.15837478637695312, -0.1516704559326172, -0.14496612548828125, -0.1382617950439453, -0.13155746459960938, -0.12485313415527344, -0.1181488037109375, -0.11144447326660156, -0.10474014282226562, -0.09803581237792969, -0.09133148193359375, -0.08462715148925781, -0.07792282104492188, -0.07121849060058594, -0.06451416015625, -0.05780982971191406, -0.051105499267578125, -0.04440116882324219, -0.03769683837890625, -0.030992507934570312, -0.024288177490234375, -0.017583847045898438, -0.0108795166015625, -0.0041751861572265625, 0.002529144287109375, 0.009233474731445312, 0.01593780517578125, 0.022642135620117188, 0.029346466064453125, 0.03605079650878906, 0.042755126953125, 0.04945945739746094, 0.056163787841796875, 0.06286811828613281, 0.06957244873046875, 0.07627677917480469, 0.08298110961914062, 0.08968544006347656, 0.0963897705078125, 0.10309410095214844, 0.10979843139648438, 0.11650276184082031, 0.12320709228515625, 0.1299114227294922, 0.13661575317382812, 0.14332008361816406, 0.1500244140625]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 2.0, 10.0, 15.0, 14.0, 21.0, 25.0, 39.0, 44.0, 48.0, 54.0, 68.0, 66.0, 68.0, 53.0, 67.0, 58.0, 62.0, 59.0, 48.0, 43.0, 36.0, 22.0, 24.0, 14.0, 11.0, 11.0, 3.0, 6.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1285400390625, -0.12481021881103516, -0.12108039855957031, -0.11735057830810547, -0.11362075805664062, -0.10989093780517578, -0.10616111755371094, -0.1024312973022461, -0.09870147705078125, -0.0949716567993164, -0.09124183654785156, -0.08751201629638672, -0.08378219604492188, -0.08005237579345703, -0.07632255554199219, -0.07259273529052734, -0.0688629150390625, -0.06513309478759766, -0.06140327453613281, -0.05767345428466797, -0.053943634033203125, -0.05021381378173828, -0.04648399353027344, -0.042754173278808594, -0.03902435302734375, -0.035294532775878906, -0.03156471252441406, -0.02783489227294922, -0.024105072021484375, -0.02037525177001953, -0.016645431518554688, -0.012915611267089844, -0.009185791015625, -0.005455970764160156, -0.0017261505126953125, 0.0020036697387695312, 0.005733489990234375, 0.009463310241699219, 0.013193130493164062, 0.016922950744628906, 0.02065277099609375, 0.024382591247558594, 0.028112411499023438, 0.03184223175048828, 0.035572052001953125, 0.03930187225341797, 0.04303169250488281, 0.046761512756347656, 0.0504913330078125, 0.054221153259277344, 0.05795097351074219, 0.06168079376220703, 0.06541061401367188, 0.06914043426513672, 0.07287025451660156, 0.0766000747680664, 0.08032989501953125, 0.0840597152709961, 0.08778953552246094, 0.09151935577392578, 0.09524917602539062, 0.09897899627685547, 0.10270881652832031, 0.10643863677978516, 0.11016845703125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 3.0, 2.0, 4.0, 4.0, 10.0, 9.0, 28.0, 43.0, 70.0, 87.0, 206.0, 333.0, 639.0, 1435.0, 3891.0, 14811.0, 80518.0, 596769.0, 2480177.0, 872259.0, 114942.0, 19880.0, 4891.0, 1656.0, 698.0, 373.0, 192.0, 129.0, 76.0, 46.0, 25.0, 25.0, 18.0, 7.0, 11.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2078857421875, -0.20086097717285156, -0.19383621215820312, -0.1868114471435547, -0.17978668212890625, -0.1727619171142578, -0.16573715209960938, -0.15871238708496094, -0.1516876220703125, -0.14466285705566406, -0.13763809204101562, -0.1306133270263672, -0.12358856201171875, -0.11656379699707031, -0.10953903198242188, -0.10251426696777344, -0.095489501953125, -0.08846473693847656, -0.08143997192382812, -0.07441520690917969, -0.06739044189453125, -0.06036567687988281, -0.053340911865234375, -0.04631614685058594, -0.0392913818359375, -0.03226661682128906, -0.025241851806640625, -0.018217086791992188, -0.01119232177734375, -0.0041675567626953125, 0.002857208251953125, 0.009881973266601562, 0.01690673828125, 0.023931503295898438, 0.030956268310546875, 0.03798103332519531, 0.04500579833984375, 0.05203056335449219, 0.059055328369140625, 0.06608009338378906, 0.0731048583984375, 0.08012962341308594, 0.08715438842773438, 0.09417915344238281, 0.10120391845703125, 0.10822868347167969, 0.11525344848632812, 0.12227821350097656, 0.129302978515625, 0.13632774353027344, 0.14335250854492188, 0.1503772735595703, 0.15740203857421875, 0.1644268035888672, 0.17145156860351562, 0.17847633361816406, 0.1855010986328125, 0.19252586364746094, 0.19955062866210938, 0.2065753936767578, 0.21360015869140625, 0.2206249237060547, 0.22764968872070312, 0.23467445373535156, 0.24169921875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 5.0, 2.0, 5.0, 7.0, 14.0, 19.0, 21.0, 25.0, 32.0, 32.0, 65.0, 56.0, 99.0, 132.0, 167.0, 193.0, 240.0, 267.0, 296.0, 303.0, 322.0, 308.0, 284.0, 257.0, 199.0, 165.0, 126.0, 108.0, 84.0, 56.0, 53.0, 40.0, 18.0, 16.0, 19.0, 12.0, 9.0, 2.0, 8.0, 3.0, 1.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.1339111328125, -0.13019943237304688, -0.12648773193359375, -0.12277603149414062, -0.1190643310546875, -0.11535263061523438, -0.11164093017578125, -0.10792922973632812, -0.104217529296875, -0.10050582885742188, -0.09679412841796875, -0.09308242797851562, -0.0893707275390625, -0.08565902709960938, -0.08194732666015625, -0.07823562622070312, -0.07452392578125, -0.07081222534179688, -0.06710052490234375, -0.06338882446289062, -0.0596771240234375, -0.055965423583984375, -0.05225372314453125, -0.048542022705078125, -0.044830322265625, -0.041118621826171875, -0.03740692138671875, -0.033695220947265625, -0.0299835205078125, -0.026271820068359375, -0.02256011962890625, -0.018848419189453125, -0.01513671875, -0.011425018310546875, -0.00771331787109375, -0.004001617431640625, -0.0002899169921875, 0.003421783447265625, 0.00713348388671875, 0.010845184326171875, 0.014556884765625, 0.018268585205078125, 0.02198028564453125, 0.025691986083984375, 0.0294036865234375, 0.033115386962890625, 0.03682708740234375, 0.040538787841796875, 0.04425048828125, 0.047962188720703125, 0.05167388916015625, 0.055385589599609375, 0.0590972900390625, 0.06280899047851562, 0.06652069091796875, 0.07023239135742188, 0.073944091796875, 0.07765579223632812, 0.08136749267578125, 0.08507919311523438, 0.0887908935546875, 0.09250259399414062, 0.09621429443359375, 0.09992599487304688, 0.1036376953125]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 7.0, 12.0, 25.0, 52.0, 105.0, 160.0, 198.0, 177.0, 116.0, 80.0, 35.0, 24.0, 9.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6479070782661438, -0.6116114258766174, -0.5753157734870911, -0.5390201210975647, -0.5027244687080383, -0.46642881631851196, -0.4301331341266632, -0.39383748173713684, -0.3575418293476105, -0.3212461769580841, -0.28495052456855774, -0.24865485727787018, -0.2123592048883438, -0.17606355249881744, -0.13976788520812988, -0.10347223281860352, -0.06717658042907715, -0.030880924314260483, 0.005414731800556183, 0.04171039164066315, 0.07800604403018951, 0.11430169641971588, 0.15059736371040344, 0.1868930160999298, 0.22318866848945618, 0.25948432087898254, 0.2957799732685089, 0.33207565546035767, 0.36837130784988403, 0.4046669602394104, 0.44096261262893677, 0.47725826501846313, 0.5135539770126343, 0.5498496294021606, 0.586145281791687, 0.6224409341812134, 0.6587365865707397, 0.6950322389602661, 0.7313278913497925, 0.7676235437393188, 0.8039191961288452, 0.8402148485183716, 0.876510500907898, 0.9128061532974243, 0.9491018056869507, 0.985397458076477, 1.0216931104660034, 1.0579887628555298, 1.0942845344543457, 1.130580186843872, 1.1668758392333984, 1.2031714916229248, 1.2394671440124512, 1.2757627964019775, 1.312058448791504, 1.3483541011810303, 1.3846497535705566, 1.420945405960083, 1.4572410583496094, 1.4935367107391357, 1.529832363128662, 1.5661280155181885, 1.6024236679077148, 1.6387193202972412, 1.6750149726867676]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 9.0, 4.0, 9.0, 5.0, 11.0, 8.0, 12.0, 20.0, 29.0, 22.0, 27.0, 23.0, 32.0, 43.0, 37.0, 35.0, 39.0, 57.0, 35.0, 35.0, 39.0, 50.0, 51.0, 38.0, 35.0, 46.0, 37.0, 29.0, 32.0, 26.0, 23.0, 22.0, 16.0, 19.0, 5.0, 9.0, 5.0, 11.0, 6.0, 6.0, 1.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.447887659072876, -0.4334411919116974, -0.4189947247505188, -0.4045482873916626, -0.390101820230484, -0.3756553530693054, -0.36120888590812683, -0.34676241874694824, -0.33231598138809204, -0.31786951422691345, -0.30342304706573486, -0.28897660970687866, -0.2745301425457001, -0.2600836753845215, -0.2456372082233429, -0.2311907559633255, -0.2167442888021469, -0.20229782164096832, -0.18785136938095093, -0.17340490221977234, -0.15895844995975494, -0.14451198279857635, -0.13006553053855896, -0.11561906337738037, -0.10117260366678238, -0.08672614395618439, -0.0722796842455864, -0.057833220809698105, -0.04338676109910011, -0.028940297663211823, -0.01449383795261383, -4.737824201583862e-05, 0.014399081468582153, 0.028845541179180145, 0.04329200088977814, 0.05773846432566643, 0.07218492031097412, 0.08663138747215271, 0.1010778471827507, 0.1155243068933487, 0.1299707591533661, 0.14441722631454468, 0.15886367857456207, 0.17331014573574066, 0.18775659799575806, 0.20220306515693665, 0.21664953231811523, 0.23109598457813263, 0.24554245173931122, 0.2599889039993286, 0.2744353711605072, 0.2888818383216858, 0.3033283054828644, 0.31777477264404297, 0.33222121000289917, 0.34666767716407776, 0.36111414432525635, 0.37556061148643494, 0.3900070786476135, 0.4044535160064697, 0.4188999831676483, 0.4333464503288269, 0.4477929174900055, 0.4622393846511841, 0.4766858220100403]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 7.0, 10.0, 16.0, 16.0, 16.0, 11.0, 17.0, 34.0, 48.0, 46.0, 74.0, 149.0, 194.0, 396.0, 860.0, 2164.0, 6288.0, 19362.0, 66000.0, 226633.0, 426919.0, 210811.0, 60742.0, 17905.0, 5937.0, 2108.0, 818.0, 376.0, 170.0, 119.0, 75.0, 61.0, 50.0, 32.0, 19.0, 19.0, 12.0, 13.0, 9.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.297119140625, -0.28668212890625, -0.2762451171875, -0.26580810546875, -0.25537109375, -0.24493408203125, -0.2344970703125, -0.22406005859375, -0.213623046875, -0.20318603515625, -0.1927490234375, -0.18231201171875, -0.171875, -0.16143798828125, -0.1510009765625, -0.14056396484375, -0.130126953125, -0.11968994140625, -0.1092529296875, -0.09881591796875, -0.08837890625, -0.07794189453125, -0.0675048828125, -0.05706787109375, -0.046630859375, -0.03619384765625, -0.0257568359375, -0.01531982421875, -0.0048828125, 0.00555419921875, 0.0159912109375, 0.02642822265625, 0.036865234375, 0.04730224609375, 0.0577392578125, 0.06817626953125, 0.07861328125, 0.08905029296875, 0.0994873046875, 0.10992431640625, 0.120361328125, 0.13079833984375, 0.1412353515625, 0.15167236328125, 0.162109375, 0.17254638671875, 0.1829833984375, 0.19342041015625, 0.203857421875, 0.21429443359375, 0.2247314453125, 0.23516845703125, 0.24560546875, 0.25604248046875, 0.2664794921875, 0.27691650390625, 0.287353515625, 0.29779052734375, 0.3082275390625, 0.31866455078125, 0.3291015625, 0.33953857421875, 0.3499755859375, 0.36041259765625, 0.370849609375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 5.0, 4.0, 5.0, 5.0, 8.0, 19.0, 16.0, 27.0, 34.0, 23.0, 54.0, 50.0, 46.0, 48.0, 63.0, 69.0, 68.0, 59.0, 54.0, 51.0, 54.0, 58.0, 35.0, 38.0, 29.0, 28.0, 15.0, 7.0, 8.0, 11.0, 7.0, 6.0, 1.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.12445068359375, -0.12103843688964844, -0.11762619018554688, -0.11421394348144531, -0.11080169677734375, -0.10738945007324219, -0.10397720336914062, -0.10056495666503906, -0.0971527099609375, -0.09374046325683594, -0.09032821655273438, -0.08691596984863281, -0.08350372314453125, -0.08009147644042969, -0.07667922973632812, -0.07326698303222656, -0.069854736328125, -0.06644248962402344, -0.06303024291992188, -0.05961799621582031, -0.05620574951171875, -0.05279350280761719, -0.049381256103515625, -0.04596900939941406, -0.0425567626953125, -0.03914451599121094, -0.035732269287109375, -0.03232002258300781, -0.02890777587890625, -0.025495529174804688, -0.022083282470703125, -0.018671035766601562, -0.0152587890625, -0.011846542358398438, -0.008434295654296875, -0.0050220489501953125, -0.00160980224609375, 0.0018024444580078125, 0.005214691162109375, 0.008626937866210938, 0.0120391845703125, 0.015451431274414062, 0.018863677978515625, 0.022275924682617188, 0.02568817138671875, 0.029100418090820312, 0.032512664794921875, 0.03592491149902344, 0.039337158203125, 0.04274940490722656, 0.046161651611328125, 0.04957389831542969, 0.05298614501953125, 0.05639839172363281, 0.059810638427734375, 0.06322288513183594, 0.0666351318359375, 0.07004737854003906, 0.07345962524414062, 0.07687187194824219, 0.08028411865234375, 0.08369636535644531, 0.08710861206054688, 0.09052085876464844, 0.09393310546875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 9.0, 8.0, 8.0, 12.0, 9.0, 11.0, 21.0, 42.0, 58.0, 111.0, 171.0, 377.0, 722.0, 1710.0, 4630.0, 12226.0, 34475.0, 98695.0, 251417.0, 348641.0, 188660.0, 68528.0, 23784.0, 8371.0, 3255.0, 1343.0, 607.0, 262.0, 155.0, 68.0, 49.0, 37.0, 19.0, 15.0, 14.0, 8.0, 8.0, 5.0, 3.0, 6.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.284912109375, -0.2755165100097656, -0.26612091064453125, -0.2567253112792969, -0.2473297119140625, -0.23793411254882812, -0.22853851318359375, -0.21914291381835938, -0.209747314453125, -0.20035171508789062, -0.19095611572265625, -0.18156051635742188, -0.1721649169921875, -0.16276931762695312, -0.15337371826171875, -0.14397811889648438, -0.13458251953125, -0.12518692016601562, -0.11579132080078125, -0.10639572143554688, -0.0970001220703125, -0.08760452270507812, -0.07820892333984375, -0.06881332397460938, -0.059417724609375, -0.050022125244140625, -0.04062652587890625, -0.031230926513671875, -0.0218353271484375, -0.012439727783203125, -0.00304412841796875, 0.006351470947265625, 0.0157470703125, 0.025142669677734375, 0.03453826904296875, 0.043933868408203125, 0.0533294677734375, 0.06272506713867188, 0.07212066650390625, 0.08151626586914062, 0.090911865234375, 0.10030746459960938, 0.10970306396484375, 0.11909866333007812, 0.1284942626953125, 0.13788986206054688, 0.14728546142578125, 0.15668106079101562, 0.16607666015625, 0.17547225952148438, 0.18486785888671875, 0.19426345825195312, 0.2036590576171875, 0.21305465698242188, 0.22245025634765625, 0.23184585571289062, 0.241241455078125, 0.2506370544433594, 0.26003265380859375, 0.2694282531738281, 0.2788238525390625, 0.2882194519042969, 0.29761505126953125, 0.3070106506347656, 0.31640625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 3.0, 6.0, 4.0, 12.0, 12.0, 10.0, 17.0, 19.0, 22.0, 38.0, 31.0, 31.0, 27.0, 41.0, 50.0, 50.0, 52.0, 53.0, 57.0, 47.0, 39.0, 53.0, 43.0, 32.0, 41.0, 20.0, 35.0, 25.0, 28.0, 16.0, 22.0, 14.0, 8.0, 7.0, 12.0, 7.0, 6.0, 5.0, 5.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.248046875, -0.2407054901123047, -0.23336410522460938, -0.22602272033691406, -0.21868133544921875, -0.21133995056152344, -0.20399856567382812, -0.1966571807861328, -0.1893157958984375, -0.1819744110107422, -0.17463302612304688, -0.16729164123535156, -0.15995025634765625, -0.15260887145996094, -0.14526748657226562, -0.1379261016845703, -0.130584716796875, -0.12324333190917969, -0.11590194702148438, -0.10856056213378906, -0.10121917724609375, -0.09387779235839844, -0.08653640747070312, -0.07919502258300781, -0.0718536376953125, -0.06451225280761719, -0.057170867919921875, -0.04982948303222656, -0.04248809814453125, -0.03514671325683594, -0.027805328369140625, -0.020463943481445312, -0.01312255859375, -0.0057811737060546875, 0.001560211181640625, 0.008901596069335938, 0.01624298095703125, 0.023584365844726562, 0.030925750732421875, 0.03826713562011719, 0.0456085205078125, 0.05294990539550781, 0.060291290283203125, 0.06763267517089844, 0.07497406005859375, 0.08231544494628906, 0.08965682983398438, 0.09699821472167969, 0.104339599609375, 0.11168098449707031, 0.11902236938476562, 0.12636375427246094, 0.13370513916015625, 0.14104652404785156, 0.14838790893554688, 0.1557292938232422, 0.1630706787109375, 0.1704120635986328, 0.17775344848632812, 0.18509483337402344, 0.19243621826171875, 0.19977760314941406, 0.20711898803710938, 0.2144603729248047, 0.2218017578125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 7.0, 13.0, 9.0, 16.0, 38.0, 68.0, 130.0, 238.0, 615.0, 2061.0, 8885.0, 61067.0, 458580.0, 446650.0, 58388.0, 8590.0, 2044.0, 609.0, 253.0, 151.0, 57.0, 41.0, 20.0, 11.0, 4.0, 3.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.298828125, -0.2888641357421875, -0.278900146484375, -0.2689361572265625, -0.25897216796875, -0.2490081787109375, -0.239044189453125, -0.2290802001953125, -0.2191162109375, -0.2091522216796875, -0.199188232421875, -0.1892242431640625, -0.17926025390625, -0.1692962646484375, -0.159332275390625, -0.1493682861328125, -0.139404296875, -0.1294403076171875, -0.119476318359375, -0.1095123291015625, -0.09954833984375, -0.0895843505859375, -0.079620361328125, -0.0696563720703125, -0.0596923828125, -0.0497283935546875, -0.039764404296875, -0.0298004150390625, -0.01983642578125, -0.0098724365234375, 9.1552734375e-05, 0.0100555419921875, 0.02001953125, 0.0299835205078125, 0.039947509765625, 0.0499114990234375, 0.05987548828125, 0.0698394775390625, 0.079803466796875, 0.0897674560546875, 0.0997314453125, 0.1096954345703125, 0.119659423828125, 0.1296234130859375, 0.13958740234375, 0.1495513916015625, 0.159515380859375, 0.1694793701171875, 0.179443359375, 0.1894073486328125, 0.199371337890625, 0.2093353271484375, 0.21929931640625, 0.2292633056640625, 0.239227294921875, 0.2491912841796875, 0.2591552734375, 0.2691192626953125, 0.279083251953125, 0.2890472412109375, 0.29901123046875, 0.3089752197265625, 0.318939208984375, 0.3289031982421875, 0.3388671875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 8.0, 6.0, 15.0, 38.0, 42.0, 118.0, 160.0, 209.0, 182.0, 100.0, 53.0, 33.0, 15.0, 10.0, 6.0, 3.0, 3.0, 1.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.894899368286133e-05, -5.729403346776962e-05, -5.563907325267792e-05, -5.398411303758621e-05, -5.232915282249451e-05, -5.06741926074028e-05, -4.9019232392311096e-05, -4.736427217721939e-05, -4.5709311962127686e-05, -4.405435174703598e-05, -4.2399391531944275e-05, -4.074443131685257e-05, -3.9089471101760864e-05, -3.743451088666916e-05, -3.5779550671577454e-05, -3.412459045648575e-05, -3.246963024139404e-05, -3.081467002630234e-05, -2.9159709811210632e-05, -2.7504749596118927e-05, -2.584978938102722e-05, -2.4194829165935516e-05, -2.253986895084381e-05, -2.0884908735752106e-05, -1.92299485206604e-05, -1.7574988305568695e-05, -1.592002809047699e-05, -1.4265067875385284e-05, -1.2610107660293579e-05, -1.0955147445201874e-05, -9.300187230110168e-06, -7.645227015018463e-06, -5.990266799926758e-06, -4.3353065848350525e-06, -2.680346369743347e-06, -1.0253861546516418e-06, 6.295740604400635e-07, 2.284534275531769e-06, 3.939494490623474e-06, 5.5944547057151794e-06, 7.249414920806885e-06, 8.90437513589859e-06, 1.0559335350990295e-05, 1.2214295566082e-05, 1.3869255781173706e-05, 1.552421599626541e-05, 1.7179176211357117e-05, 1.8834136426448822e-05, 2.0489096641540527e-05, 2.2144056856632233e-05, 2.3799017071723938e-05, 2.5453977286815643e-05, 2.710893750190735e-05, 2.8763897716999054e-05, 3.041885793209076e-05, 3.2073818147182465e-05, 3.372877836227417e-05, 3.5383738577365875e-05, 3.703869879245758e-05, 3.8693659007549286e-05, 4.034861922264099e-05, 4.2003579437732697e-05, 4.36585396528244e-05, 4.531349986791611e-05, 4.696846008300781e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 4.0, 4.0, 4.0, 8.0, 9.0, 10.0, 30.0, 33.0, 47.0, 79.0, 101.0, 171.0, 274.0, 457.0, 785.0, 1354.0, 2668.0, 5483.0, 12214.0, 27556.0, 64120.0, 138294.0, 237338.0, 254256.0, 162370.0, 77857.0, 34120.0, 14780.0, 6833.0, 3327.0, 1610.0, 937.0, 535.0, 327.0, 194.0, 121.0, 77.0, 57.0, 28.0, 23.0, 20.0, 16.0, 7.0, 7.0, 7.0, 5.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.098388671875, -0.09522724151611328, -0.09206581115722656, -0.08890438079833984, -0.08574295043945312, -0.0825815200805664, -0.07942008972167969, -0.07625865936279297, -0.07309722900390625, -0.06993579864501953, -0.06677436828613281, -0.0636129379272461, -0.060451507568359375, -0.057290077209472656, -0.05412864685058594, -0.05096721649169922, -0.0478057861328125, -0.04464435577392578, -0.04148292541503906, -0.038321495056152344, -0.035160064697265625, -0.031998634338378906, -0.028837203979492188, -0.02567577362060547, -0.02251434326171875, -0.01935291290283203, -0.016191482543945312, -0.013030052185058594, -0.009868621826171875, -0.006707191467285156, -0.0035457611083984375, -0.00038433074951171875, 0.002777099609375, 0.005938529968261719, 0.009099960327148438, 0.012261390686035156, 0.015422821044921875, 0.018584251403808594, 0.021745681762695312, 0.02490711212158203, 0.02806854248046875, 0.03122997283935547, 0.03439140319824219, 0.037552833557128906, 0.040714263916015625, 0.043875694274902344, 0.04703712463378906, 0.05019855499267578, 0.0533599853515625, 0.05652141571044922, 0.05968284606933594, 0.06284427642822266, 0.06600570678710938, 0.0691671371459961, 0.07232856750488281, 0.07548999786376953, 0.07865142822265625, 0.08181285858154297, 0.08497428894042969, 0.0881357192993164, 0.09129714965820312, 0.09445858001708984, 0.09762001037597656, 0.10078144073486328, 0.10394287109375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 3.0, 0.0, 3.0, 2.0, 4.0, 4.0, 4.0, 7.0, 7.0, 7.0, 10.0, 15.0, 15.0, 11.0, 22.0, 25.0, 30.0, 30.0, 47.0, 49.0, 54.0, 52.0, 61.0, 51.0, 50.0, 61.0, 44.0, 51.0, 36.0, 37.0, 39.0, 27.0, 26.0, 23.0, 20.0, 17.0, 20.0, 15.0, 3.0, 6.0, 5.0, 6.0, 2.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07275390625, -0.07041168212890625, -0.0680694580078125, -0.06572723388671875, -0.063385009765625, -0.06104278564453125, -0.0587005615234375, -0.05635833740234375, -0.05401611328125, -0.05167388916015625, -0.0493316650390625, -0.04698944091796875, -0.044647216796875, -0.04230499267578125, -0.0399627685546875, -0.03762054443359375, -0.0352783203125, -0.03293609619140625, -0.0305938720703125, -0.02825164794921875, -0.025909423828125, -0.02356719970703125, -0.0212249755859375, -0.01888275146484375, -0.01654052734375, -0.01419830322265625, -0.0118560791015625, -0.00951385498046875, -0.007171630859375, -0.00482940673828125, -0.0024871826171875, -0.00014495849609375, 0.002197265625, 0.00453948974609375, 0.0068817138671875, 0.00922393798828125, 0.011566162109375, 0.01390838623046875, 0.0162506103515625, 0.01859283447265625, 0.02093505859375, 0.02327728271484375, 0.0256195068359375, 0.02796173095703125, 0.030303955078125, 0.03264617919921875, 0.0349884033203125, 0.03733062744140625, 0.0396728515625, 0.04201507568359375, 0.0443572998046875, 0.04669952392578125, 0.049041748046875, 0.05138397216796875, 0.0537261962890625, 0.05606842041015625, 0.05841064453125, 0.06075286865234375, 0.0630950927734375, 0.06543731689453125, 0.067779541015625, 0.07012176513671875, 0.0724639892578125, 0.07480621337890625, 0.0771484375]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 14.0, 49.0, 109.0, 261.0, 288.0, 166.0, 89.0, 20.0, 8.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.7388163805007935, -0.666898787021637, -0.5949811935424805, -0.5230635404586792, -0.4511459767818451, -0.3792283833026886, -0.3073107600212097, -0.23539316654205322, -0.16347557306289673, -0.09155797213315964, -0.019640371203422546, 0.05227723717689514, 0.12419483065605164, 0.19611242413520813, 0.268030047416687, 0.3399476408958435, 0.411865234375, 0.4837828278541565, 0.555700421333313, 0.6276180744171143, 0.699535608291626, 0.7714532613754272, 0.8433708548545837, 0.9152884483337402, 0.9872060418128967, 1.0591236352920532, 1.1310412883758545, 1.2029588222503662, 1.2748764753341675, 1.3467940092086792, 1.4187116622924805, 1.4906291961669922, 1.562546968460083, 1.6344646215438843, 1.706382155418396, 1.7782998085021973, 1.850217342376709, 1.9221349954605103, 1.9940526485443115, 2.0659701824188232, 2.137887716293335, 2.2098052501678467, 2.2817230224609375, 2.353640556335449, 2.425558090209961, 2.4974756240844727, 2.5693933963775635, 2.641310930252075, 2.713228702545166, 2.7851462364196777, 2.8570640087127686, 2.9289815425872803, 3.000899076461792, 3.0728166103363037, 3.1447343826293945, 3.2166519165039062, 3.288569450378418, 3.3604869842529297, 3.4324047565460205, 3.5043222904205322, 3.576239824295044, 3.6481573581695557, 3.7200751304626465, 3.791992664337158, 3.86391019821167]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 3.0, 1.0, 13.0, 5.0, 9.0, 6.0, 18.0, 15.0, 20.0, 18.0, 33.0, 17.0, 24.0, 41.0, 42.0, 32.0, 34.0, 44.0, 47.0, 40.0, 43.0, 41.0, 51.0, 34.0, 44.0, 38.0, 26.0, 33.0, 34.0, 36.0, 24.0, 22.0, 15.0, 13.0, 12.0, 14.0, 14.0, 8.0, 5.0, 12.0, 5.0, 4.0, 1.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.7177101969718933, -0.6973289847373962, -0.676947832107544, -0.6565666198730469, -0.6361854076385498, -0.6158042550086975, -0.5954230427742004, -0.5750418901443481, -0.5546606779098511, -0.534279465675354, -0.5138983130455017, -0.49351710081100464, -0.47313591837882996, -0.4527547359466553, -0.4323735237121582, -0.4119923412799835, -0.39161115884780884, -0.37122997641563416, -0.3508487939834595, -0.3304675817489624, -0.3100863993167877, -0.28970521688461304, -0.26932400465011597, -0.24894282221794128, -0.2285616397857666, -0.20818045735359192, -0.18779926002025604, -0.16741806268692017, -0.14703688025474548, -0.1266556978225708, -0.10627450048923492, -0.08589330315589905, -0.06551212072372437, -0.045130930840969086, -0.024749740958213806, -0.004368551075458527, 0.016012638807296753, 0.03639382869005203, 0.05677501857280731, 0.07715621590614319, 0.09753739833831787, 0.11791858822107315, 0.13829977810382843, 0.1586809754371643, 0.179062157869339, 0.19944334030151367, 0.21982453763484955, 0.24020573496818542, 0.2605869174003601, 0.2809680998325348, 0.3013492822647095, 0.32173049449920654, 0.3421116769313812, 0.3624928593635559, 0.382874071598053, 0.40325525403022766, 0.42363643646240234, 0.444017618894577, 0.4643988013267517, 0.4847800135612488, 0.5051611661911011, 0.5255423784255981, 0.5459235906600952, 0.5663048028945923, 0.5866859555244446]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 7.0, 11.0, 8.0, 10.0, 17.0, 27.0, 40.0, 48.0, 87.0, 102.0, 115.0, 197.0, 251.0, 413.0, 843.0, 2327.0, 9275.0, 77006.0, 1577467.0, 2370620.0, 135864.0, 14011.0, 3149.0, 1085.0, 475.0, 263.0, 167.0, 118.0, 90.0, 53.0, 49.0, 22.0, 28.0, 10.0, 14.0, 5.0, 9.0, 3.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.318115234375, -0.3103752136230469, -0.30263519287109375, -0.2948951721191406, -0.2871551513671875, -0.2794151306152344, -0.27167510986328125, -0.2639350891113281, -0.256195068359375, -0.24845504760742188, -0.24071502685546875, -0.23297500610351562, -0.2252349853515625, -0.21749496459960938, -0.20975494384765625, -0.20201492309570312, -0.19427490234375, -0.18653488159179688, -0.17879486083984375, -0.17105484008789062, -0.1633148193359375, -0.15557479858398438, -0.14783477783203125, -0.14009475708007812, -0.132354736328125, -0.12461471557617188, -0.11687469482421875, -0.10913467407226562, -0.1013946533203125, -0.09365463256835938, -0.08591461181640625, -0.07817459106445312, -0.0704345703125, -0.06269454956054688, -0.05495452880859375, -0.047214508056640625, -0.0394744873046875, -0.031734466552734375, -0.02399444580078125, -0.016254425048828125, -0.008514404296875, -0.000774383544921875, 0.00696563720703125, 0.014705657958984375, 0.0224456787109375, 0.030185699462890625, 0.03792572021484375, 0.045665740966796875, 0.05340576171875, 0.061145782470703125, 0.06888580322265625, 0.07662582397460938, 0.0843658447265625, 0.09210586547851562, 0.09984588623046875, 0.10758590698242188, 0.115325927734375, 0.12306594848632812, 0.13080596923828125, 0.13854598999023438, 0.1462860107421875, 0.15402603149414062, 0.16176605224609375, 0.16950607299804688, 0.17724609375]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 5.0, 8.0, 9.0, 6.0, 8.0, 13.0, 20.0, 21.0, 15.0, 29.0, 27.0, 25.0, 35.0, 44.0, 45.0, 47.0, 58.0, 54.0, 56.0, 56.0, 48.0, 42.0, 39.0, 45.0, 37.0, 40.0, 37.0, 29.0, 21.0, 27.0, 13.0, 9.0, 9.0, 6.0, 7.0, 5.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08612060546875, -0.08310413360595703, -0.08008766174316406, -0.0770711898803711, -0.07405471801757812, -0.07103824615478516, -0.06802177429199219, -0.06500530242919922, -0.06198883056640625, -0.05897235870361328, -0.05595588684082031, -0.052939414978027344, -0.049922943115234375, -0.046906471252441406, -0.04388999938964844, -0.04087352752685547, -0.0378570556640625, -0.03484058380126953, -0.03182411193847656, -0.028807640075683594, -0.025791168212890625, -0.022774696350097656, -0.019758224487304688, -0.01674175262451172, -0.01372528076171875, -0.010708808898925781, -0.0076923370361328125, -0.004675865173339844, -0.001659393310546875, 0.0013570785522460938, 0.0043735504150390625, 0.007390022277832031, 0.010406494140625, 0.013422966003417969, 0.016439437866210938, 0.019455909729003906, 0.022472381591796875, 0.025488853454589844, 0.028505325317382812, 0.03152179718017578, 0.03453826904296875, 0.03755474090576172, 0.04057121276855469, 0.043587684631347656, 0.046604156494140625, 0.049620628356933594, 0.05263710021972656, 0.05565357208251953, 0.0586700439453125, 0.06168651580810547, 0.06470298767089844, 0.0677194595336914, 0.07073593139648438, 0.07375240325927734, 0.07676887512207031, 0.07978534698486328, 0.08280181884765625, 0.08581829071044922, 0.08883476257324219, 0.09185123443603516, 0.09486770629882812, 0.0978841781616211, 0.10090065002441406, 0.10391712188720703, 0.10693359375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 5.0, 2.0, 5.0, 9.0, 6.0, 10.0, 11.0, 26.0, 36.0, 43.0, 65.0, 121.0, 187.0, 359.0, 790.0, 1929.0, 6696.0, 33113.0, 242572.0, 1856412.0, 1780631.0, 229524.0, 31590.0, 6501.0, 1987.0, 736.0, 389.0, 188.0, 106.0, 75.0, 36.0, 47.0, 30.0, 9.0, 12.0, 10.0, 6.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.25244140625, -0.2452259063720703, -0.23801040649414062, -0.23079490661621094, -0.22357940673828125, -0.21636390686035156, -0.20914840698242188, -0.2019329071044922, -0.1947174072265625, -0.1875019073486328, -0.18028640747070312, -0.17307090759277344, -0.16585540771484375, -0.15863990783691406, -0.15142440795898438, -0.1442089080810547, -0.136993408203125, -0.1297779083251953, -0.12256240844726562, -0.11534690856933594, -0.10813140869140625, -0.10091590881347656, -0.09370040893554688, -0.08648490905761719, -0.0792694091796875, -0.07205390930175781, -0.06483840942382812, -0.05762290954589844, -0.05040740966796875, -0.04319190979003906, -0.035976409912109375, -0.028760910034179688, -0.02154541015625, -0.014329910278320312, -0.007114410400390625, 0.0001010894775390625, 0.00731658935546875, 0.014532089233398438, 0.021747589111328125, 0.028963088989257812, 0.0361785888671875, 0.04339408874511719, 0.050609588623046875, 0.05782508850097656, 0.06504058837890625, 0.07225608825683594, 0.07947158813476562, 0.08668708801269531, 0.093902587890625, 0.10111808776855469, 0.10833358764648438, 0.11554908752441406, 0.12276458740234375, 0.12998008728027344, 0.13719558715820312, 0.1444110870361328, 0.1516265869140625, 0.1588420867919922, 0.16605758666992188, 0.17327308654785156, 0.18048858642578125, 0.18770408630371094, 0.19491958618164062, 0.2021350860595703, 0.2093505859375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 3.0, 6.0, 6.0, 7.0, 8.0, 11.0, 17.0, 30.0, 45.0, 47.0, 70.0, 86.0, 129.0, 132.0, 219.0, 265.0, 333.0, 327.0, 369.0, 342.0, 342.0, 276.0, 234.0, 192.0, 128.0, 127.0, 80.0, 70.0, 56.0, 26.0, 24.0, 22.0, 14.0, 8.0, 8.0, 7.0, 3.0, 2.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1309814453125, -0.1268768310546875, -0.122772216796875, -0.1186676025390625, -0.11456298828125, -0.1104583740234375, -0.106353759765625, -0.1022491455078125, -0.09814453125, -0.0940399169921875, -0.089935302734375, -0.0858306884765625, -0.08172607421875, -0.0776214599609375, -0.073516845703125, -0.0694122314453125, -0.0653076171875, -0.0612030029296875, -0.057098388671875, -0.0529937744140625, -0.04888916015625, -0.0447845458984375, -0.040679931640625, -0.0365753173828125, -0.032470703125, -0.0283660888671875, -0.024261474609375, -0.0201568603515625, -0.01605224609375, -0.0119476318359375, -0.007843017578125, -0.0037384033203125, 0.0003662109375, 0.0044708251953125, 0.008575439453125, 0.0126800537109375, 0.01678466796875, 0.0208892822265625, 0.024993896484375, 0.0290985107421875, 0.033203125, 0.0373077392578125, 0.041412353515625, 0.0455169677734375, 0.04962158203125, 0.0537261962890625, 0.057830810546875, 0.0619354248046875, 0.0660400390625, 0.0701446533203125, 0.074249267578125, 0.0783538818359375, 0.08245849609375, 0.0865631103515625, 0.090667724609375, 0.0947723388671875, 0.098876953125, 0.1029815673828125, 0.107086181640625, 0.1111907958984375, 0.11529541015625, 0.1194000244140625, 0.123504638671875, 0.1276092529296875, 0.1317138671875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 7.0, 17.0, 53.0, 108.0, 160.0, 211.0, 197.0, 128.0, 64.0, 35.0, 16.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7270771265029907, -0.685883104801178, -0.6446890830993652, -0.6034950613975525, -0.5623010396957397, -0.521107017993927, -0.47991299629211426, -0.4387189745903015, -0.39752495288848877, -0.356330931186676, -0.3151369094848633, -0.27394288778305054, -0.2327488660812378, -0.19155484437942505, -0.1503608226776123, -0.10916680097579956, -0.06797277927398682, -0.026778757572174072, 0.014415264129638672, 0.055609285831451416, 0.09680330753326416, 0.1379973292350769, 0.17919135093688965, 0.2203853726387024, 0.26157939434051514, 0.3027734160423279, 0.3439674377441406, 0.38516145944595337, 0.4263554811477661, 0.46754950284957886, 0.5087435245513916, 0.5499375462532043, 0.5911314487457275, 0.6323254704475403, 0.673519492149353, 0.7147135138511658, 0.7559075355529785, 0.7971015572547913, 0.838295578956604, 0.8794896006584167, 0.9206836223602295, 0.9618776440620422, 1.003071665763855, 1.0442657470703125, 1.0854597091674805, 1.1266536712646484, 1.167847752571106, 1.2090418338775635, 1.2502357959747314, 1.2914297580718994, 1.332623839378357, 1.3738179206848145, 1.4150118827819824, 1.4562058448791504, 1.497399926185608, 1.5385940074920654, 1.5797879695892334, 1.6209819316864014, 1.6621760129928589, 1.7033700942993164, 1.7445640563964844, 1.7857580184936523, 1.8269520998001099, 1.8681461811065674, 1.9093401432037354]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 1.0, 2.0, 2.0, 8.0, 8.0, 15.0, 14.0, 7.0, 12.0, 18.0, 17.0, 35.0, 20.0, 42.0, 39.0, 45.0, 33.0, 55.0, 45.0, 40.0, 47.0, 44.0, 48.0, 45.0, 50.0, 37.0, 36.0, 41.0, 39.0, 27.0, 16.0, 24.0, 23.0, 14.0, 7.0, 9.0, 6.0, 11.0, 7.0, 8.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.5296045541763306, -0.5143976807594299, -0.4991908371448517, -0.48398396372795105, -0.4687771201133728, -0.45357024669647217, -0.43836337327957153, -0.4231565296649933, -0.40794968605041504, -0.3927428126335144, -0.37753596901893616, -0.3623290956020355, -0.3471222519874573, -0.33191537857055664, -0.316708505153656, -0.30150166153907776, -0.2862947881221771, -0.2710879147052765, -0.25588107109069824, -0.2406741976737976, -0.22546735405921936, -0.21026048064231873, -0.19505362212657928, -0.17984676361083984, -0.1646399050951004, -0.14943304657936096, -0.13422618806362152, -0.11901932209730148, -0.10381246358156204, -0.0886056050658226, -0.07339873909950256, -0.05819188058376312, -0.04298502206802368, -0.02777816168963909, -0.012571301311254501, 0.002635560929775238, 0.01784241944551468, 0.03304927796125412, 0.04825614392757416, 0.0634630024433136, 0.07866986095905304, 0.09387671947479248, 0.10908357799053192, 0.12429044395685196, 0.139497309923172, 0.15470415353775024, 0.16991102695465088, 0.18511788547039032, 0.20032474398612976, 0.2155316025018692, 0.23073846101760864, 0.24594533443450928, 0.2611521780490875, 0.27635905146598816, 0.2915658950805664, 0.30677276849746704, 0.3219796419143677, 0.3371865153312683, 0.35239335894584656, 0.3676002323627472, 0.38280707597732544, 0.3980139493942261, 0.4132208228111267, 0.42842766642570496, 0.4436345100402832]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 6.0, 6.0, 14.0, 16.0, 28.0, 37.0, 41.0, 83.0, 137.0, 274.0, 555.0, 1501.0, 4227.0, 13159.0, 45942.0, 204837.0, 509357.0, 202985.0, 45467.0, 12946.0, 4189.0, 1500.0, 592.0, 278.0, 128.0, 82.0, 34.0, 39.0, 24.0, 21.0, 15.0, 11.0, 6.0, 6.0, 7.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.348876953125, -0.33618927001953125, -0.3235015869140625, -0.31081390380859375, -0.298126220703125, -0.28543853759765625, -0.2727508544921875, -0.26006317138671875, -0.24737548828125, -0.23468780517578125, -0.2220001220703125, -0.20931243896484375, -0.196624755859375, -0.18393707275390625, -0.1712493896484375, -0.15856170654296875, -0.1458740234375, -0.13318634033203125, -0.1204986572265625, -0.10781097412109375, -0.095123291015625, -0.08243560791015625, -0.0697479248046875, -0.05706024169921875, -0.04437255859375, -0.03168487548828125, -0.0189971923828125, -0.00630950927734375, 0.006378173828125, 0.01906585693359375, 0.0317535400390625, 0.04444122314453125, 0.05712890625, 0.06981658935546875, 0.0825042724609375, 0.09519195556640625, 0.107879638671875, 0.12056732177734375, 0.1332550048828125, 0.14594268798828125, 0.15863037109375, 0.17131805419921875, 0.1840057373046875, 0.19669342041015625, 0.209381103515625, 0.22206878662109375, 0.2347564697265625, 0.24744415283203125, 0.2601318359375, 0.27281951904296875, 0.2855072021484375, 0.29819488525390625, 0.310882568359375, 0.32357025146484375, 0.3362579345703125, 0.34894561767578125, 0.36163330078125, 0.37432098388671875, 0.3870086669921875, 0.39969635009765625, 0.412384033203125, 0.42507171630859375, 0.4377593994140625, 0.45044708251953125, 0.463134765625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 7.0, 4.0, 5.0, 5.0, 15.0, 18.0, 24.0, 17.0, 31.0, 34.0, 34.0, 45.0, 47.0, 53.0, 68.0, 52.0, 72.0, 50.0, 63.0, 53.0, 55.0, 50.0, 45.0, 38.0, 34.0, 24.0, 20.0, 14.0, 8.0, 6.0, 3.0, 4.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11834716796875, -0.11490154266357422, -0.11145591735839844, -0.10801029205322266, -0.10456466674804688, -0.1011190414428711, -0.09767341613769531, -0.09422779083251953, -0.09078216552734375, -0.08733654022216797, -0.08389091491699219, -0.0804452896118164, -0.07699966430664062, -0.07355403900146484, -0.07010841369628906, -0.06666278839111328, -0.0632171630859375, -0.05977153778076172, -0.05632591247558594, -0.052880287170410156, -0.049434661865234375, -0.045989036560058594, -0.04254341125488281, -0.03909778594970703, -0.03565216064453125, -0.03220653533935547, -0.028760910034179688, -0.025315284729003906, -0.021869659423828125, -0.018424034118652344, -0.014978408813476562, -0.011532783508300781, -0.008087158203125, -0.004641532897949219, -0.0011959075927734375, 0.0022497177124023438, 0.005695343017578125, 0.009140968322753906, 0.012586593627929688, 0.01603221893310547, 0.01947784423828125, 0.02292346954345703, 0.026369094848632812, 0.029814720153808594, 0.033260345458984375, 0.036705970764160156, 0.04015159606933594, 0.04359722137451172, 0.0470428466796875, 0.05048847198486328, 0.05393409729003906, 0.057379722595214844, 0.060825347900390625, 0.0642709732055664, 0.06771659851074219, 0.07116222381591797, 0.07460784912109375, 0.07805347442626953, 0.08149909973144531, 0.0849447250366211, 0.08839035034179688, 0.09183597564697266, 0.09528160095214844, 0.09872722625732422, 0.1021728515625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 6.0, 13.0, 13.0, 24.0, 32.0, 37.0, 46.0, 66.0, 102.0, 169.0, 295.0, 481.0, 1026.0, 2246.0, 5251.0, 12650.0, 32171.0, 83381.0, 201621.0, 319652.0, 227688.0, 98150.0, 37575.0, 14662.0, 5942.0, 2661.0, 1160.0, 584.0, 330.0, 176.0, 99.0, 64.0, 42.0, 33.0, 28.0, 18.0, 10.0, 12.0, 13.0, 9.0, 5.0, 5.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.225341796875, -0.2179737091064453, -0.21060562133789062, -0.20323753356933594, -0.19586944580078125, -0.18850135803222656, -0.18113327026367188, -0.1737651824951172, -0.1663970947265625, -0.1590290069580078, -0.15166091918945312, -0.14429283142089844, -0.13692474365234375, -0.12955665588378906, -0.12218856811523438, -0.11482048034667969, -0.107452392578125, -0.10008430480957031, -0.09271621704101562, -0.08534812927246094, -0.07798004150390625, -0.07061195373535156, -0.06324386596679688, -0.05587577819824219, -0.0485076904296875, -0.04113960266113281, -0.033771514892578125, -0.026403427124023438, -0.01903533935546875, -0.011667251586914062, -0.004299163818359375, 0.0030689239501953125, 0.01043701171875, 0.017805099487304688, 0.025173187255859375, 0.03254127502441406, 0.03990936279296875, 0.04727745056152344, 0.054645538330078125, 0.06201362609863281, 0.0693817138671875, 0.07674980163574219, 0.08411788940429688, 0.09148597717285156, 0.09885406494140625, 0.10622215270996094, 0.11359024047851562, 0.12095832824707031, 0.128326416015625, 0.1356945037841797, 0.14306259155273438, 0.15043067932128906, 0.15779876708984375, 0.16516685485839844, 0.17253494262695312, 0.1799030303955078, 0.1872711181640625, 0.1946392059326172, 0.20200729370117188, 0.20937538146972656, 0.21674346923828125, 0.22411155700683594, 0.23147964477539062, 0.2388477325439453, 0.2462158203125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 1.0, 7.0, 1.0, 3.0, 3.0, 11.0, 9.0, 14.0, 7.0, 9.0, 15.0, 19.0, 37.0, 27.0, 29.0, 24.0, 29.0, 43.0, 38.0, 43.0, 58.0, 47.0, 38.0, 45.0, 35.0, 43.0, 36.0, 38.0, 44.0, 33.0, 35.0, 25.0, 19.0, 31.0, 20.0, 20.0, 16.0, 8.0, 10.0, 15.0, 3.0, 6.0, 2.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.2401123046875, -0.2333965301513672, -0.22668075561523438, -0.21996498107910156, -0.21324920654296875, -0.20653343200683594, -0.19981765747070312, -0.1931018829345703, -0.1863861083984375, -0.1796703338623047, -0.17295455932617188, -0.16623878479003906, -0.15952301025390625, -0.15280723571777344, -0.14609146118164062, -0.1393756866455078, -0.132659912109375, -0.1259441375732422, -0.11922836303710938, -0.11251258850097656, -0.10579681396484375, -0.09908103942871094, -0.09236526489257812, -0.08564949035644531, -0.0789337158203125, -0.07221794128417969, -0.06550216674804688, -0.05878639221191406, -0.05207061767578125, -0.04535484313964844, -0.038639068603515625, -0.03192329406738281, -0.02520751953125, -0.018491744995117188, -0.011775970458984375, -0.0050601959228515625, 0.00165557861328125, 0.008371353149414062, 0.015087127685546875, 0.021802902221679688, 0.0285186767578125, 0.03523445129394531, 0.041950225830078125, 0.04866600036621094, 0.05538177490234375, 0.06209754943847656, 0.06881332397460938, 0.07552909851074219, 0.082244873046875, 0.08896064758300781, 0.09567642211914062, 0.10239219665527344, 0.10910797119140625, 0.11582374572753906, 0.12253952026367188, 0.1292552947998047, 0.1359710693359375, 0.1426868438720703, 0.14940261840820312, 0.15611839294433594, 0.16283416748046875, 0.16954994201660156, 0.17626571655273438, 0.1829814910888672, 0.189697265625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 8.0, 6.0, 8.0, 5.0, 18.0, 29.0, 41.0, 73.0, 107.0, 171.0, 287.0, 570.0, 974.0, 1715.0, 3258.0, 6510.0, 13657.0, 28955.0, 64736.0, 139170.0, 241429.0, 253155.0, 156026.0, 73829.0, 33280.0, 15333.0, 7220.0, 3656.0, 1856.0, 1042.0, 590.0, 341.0, 197.0, 120.0, 62.0, 52.0, 24.0, 12.0, 16.0, 8.0, 5.0, 5.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08233642578125, -0.07959938049316406, -0.07686233520507812, -0.07412528991699219, -0.07138824462890625, -0.06865119934082031, -0.06591415405273438, -0.06317710876464844, -0.0604400634765625, -0.05770301818847656, -0.054965972900390625, -0.05222892761230469, -0.04949188232421875, -0.04675483703613281, -0.044017791748046875, -0.04128074645996094, -0.038543701171875, -0.03580665588378906, -0.033069610595703125, -0.030332565307617188, -0.02759552001953125, -0.024858474731445312, -0.022121429443359375, -0.019384384155273438, -0.0166473388671875, -0.013910293579101562, -0.011173248291015625, -0.008436203002929688, -0.00569915771484375, -0.0029621124267578125, -0.000225067138671875, 0.0025119781494140625, 0.0052490234375, 0.007986068725585938, 0.010723114013671875, 0.013460159301757812, 0.01619720458984375, 0.018934249877929688, 0.021671295166015625, 0.024408340454101562, 0.0271453857421875, 0.029882431030273438, 0.032619476318359375, 0.03535652160644531, 0.03809356689453125, 0.04083061218261719, 0.043567657470703125, 0.04630470275878906, 0.049041748046875, 0.05177879333496094, 0.054515838623046875, 0.05725288391113281, 0.05998992919921875, 0.06272697448730469, 0.06546401977539062, 0.06820106506347656, 0.0709381103515625, 0.07367515563964844, 0.07641220092773438, 0.07914924621582031, 0.08188629150390625, 0.08462333679199219, 0.08736038208007812, 0.09009742736816406, 0.09283447265625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 5.0, 4.0, 9.0, 11.0, 13.0, 15.0, 29.0, 24.0, 37.0, 55.0, 81.0, 99.0, 91.0, 104.0, 106.0, 95.0, 65.0, 41.0, 29.0, 30.0, 19.0, 6.0, 8.0, 11.0, 6.0, 1.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.6404857635498047e-05, -2.5696121156215668e-05, -2.498738467693329e-05, -2.427864819765091e-05, -2.356991171836853e-05, -2.286117523908615e-05, -2.2152438759803772e-05, -2.1443702280521393e-05, -2.0734965801239014e-05, -2.0026229321956635e-05, -1.9317492842674255e-05, -1.8608756363391876e-05, -1.7900019884109497e-05, -1.7191283404827118e-05, -1.648254692554474e-05, -1.577381044626236e-05, -1.506507396697998e-05, -1.4356337487697601e-05, -1.3647601008415222e-05, -1.2938864529132843e-05, -1.2230128049850464e-05, -1.1521391570568085e-05, -1.0812655091285706e-05, -1.0103918612003326e-05, -9.395182132720947e-06, -8.686445653438568e-06, -7.977709174156189e-06, -7.26897269487381e-06, -6.560236215591431e-06, -5.8514997363090515e-06, -5.142763257026672e-06, -4.434026777744293e-06, -3.725290298461914e-06, -3.016553819179535e-06, -2.3078173398971558e-06, -1.5990808606147766e-06, -8.903443813323975e-07, -1.816079020500183e-07, 5.271285772323608e-07, 1.23586505651474e-06, 1.944601535797119e-06, 2.6533380150794983e-06, 3.3620744943618774e-06, 4.070810973644257e-06, 4.779547452926636e-06, 5.488283932209015e-06, 6.197020411491394e-06, 6.905756890773773e-06, 7.614493370056152e-06, 8.323229849338531e-06, 9.03196632862091e-06, 9.74070280790329e-06, 1.0449439287185669e-05, 1.1158175766468048e-05, 1.1866912245750427e-05, 1.2575648725032806e-05, 1.3284385204315186e-05, 1.3993121683597565e-05, 1.4701858162879944e-05, 1.5410594642162323e-05, 1.6119331121444702e-05, 1.682806760072708e-05, 1.753680408000946e-05, 1.824554055929184e-05, 1.895427703857422e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 9.0, 14.0, 19.0, 24.0, 25.0, 45.0, 77.0, 98.0, 221.0, 328.0, 489.0, 905.0, 1652.0, 3170.0, 6049.0, 12174.0, 26118.0, 57864.0, 127414.0, 229356.0, 259360.0, 170756.0, 81714.0, 36666.0, 16798.0, 8132.0, 4106.0, 2126.0, 1115.0, 691.0, 393.0, 213.0, 147.0, 94.0, 50.0, 47.0, 38.0, 15.0, 21.0, 6.0, 9.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0867919921875, -0.08417892456054688, -0.08156585693359375, -0.07895278930664062, -0.0763397216796875, -0.07372665405273438, -0.07111358642578125, -0.06850051879882812, -0.065887451171875, -0.06327438354492188, -0.06066131591796875, -0.058048248291015625, -0.0554351806640625, -0.052822113037109375, -0.05020904541015625, -0.047595977783203125, -0.04498291015625, -0.042369842529296875, -0.03975677490234375, -0.037143707275390625, -0.0345306396484375, -0.031917572021484375, -0.02930450439453125, -0.026691436767578125, -0.024078369140625, -0.021465301513671875, -0.01885223388671875, -0.016239166259765625, -0.0136260986328125, -0.011013031005859375, -0.00839996337890625, -0.005786895751953125, -0.003173828125, -0.000560760498046875, 0.00205230712890625, 0.004665374755859375, 0.0072784423828125, 0.009891510009765625, 0.01250457763671875, 0.015117645263671875, 0.017730712890625, 0.020343780517578125, 0.02295684814453125, 0.025569915771484375, 0.0281829833984375, 0.030796051025390625, 0.03340911865234375, 0.036022186279296875, 0.03863525390625, 0.041248321533203125, 0.04386138916015625, 0.046474456787109375, 0.0490875244140625, 0.051700592041015625, 0.05431365966796875, 0.056926727294921875, 0.059539794921875, 0.062152862548828125, 0.06476593017578125, 0.06737899780273438, 0.0699920654296875, 0.07260513305664062, 0.07521820068359375, 0.07783126831054688, 0.0804443359375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 6.0, 5.0, 8.0, 6.0, 10.0, 9.0, 10.0, 10.0, 10.0, 16.0, 23.0, 39.0, 29.0, 45.0, 39.0, 43.0, 43.0, 49.0, 54.0, 55.0, 59.0, 43.0, 50.0, 56.0, 50.0, 48.0, 24.0, 34.0, 22.0, 25.0, 13.0, 14.0, 9.0, 7.0, 6.0, 9.0, 4.0, 4.0, 2.0, 6.0, 2.0, 3.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0693359375, -0.06720256805419922, -0.06506919860839844, -0.06293582916259766, -0.060802459716796875, -0.058669090270996094, -0.05653572082519531, -0.05440235137939453, -0.05226898193359375, -0.05013561248779297, -0.04800224304199219, -0.045868873596191406, -0.043735504150390625, -0.041602134704589844, -0.03946876525878906, -0.03733539581298828, -0.0352020263671875, -0.03306865692138672, -0.030935287475585938, -0.028801918029785156, -0.026668548583984375, -0.024535179138183594, -0.022401809692382812, -0.02026844024658203, -0.01813507080078125, -0.01600170135498047, -0.013868331909179688, -0.011734962463378906, -0.009601593017578125, -0.007468223571777344, -0.0053348541259765625, -0.0032014846801757812, -0.001068115234375, 0.0010652542114257812, 0.0031986236572265625, 0.005331993103027344, 0.007465362548828125, 0.009598731994628906, 0.011732101440429688, 0.013865470886230469, 0.01599884033203125, 0.01813220977783203, 0.020265579223632812, 0.022398948669433594, 0.024532318115234375, 0.026665687561035156, 0.028799057006835938, 0.03093242645263672, 0.0330657958984375, 0.03519916534423828, 0.03733253479003906, 0.039465904235839844, 0.041599273681640625, 0.043732643127441406, 0.04586601257324219, 0.04799938201904297, 0.05013275146484375, 0.05226612091064453, 0.05439949035644531, 0.056532859802246094, 0.058666229248046875, 0.060799598693847656, 0.06293296813964844, 0.06506633758544922, 0.06719970703125]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 13.0, 32.0, 61.0, 130.0, 185.0, 213.0, 175.0, 101.0, 53.0, 25.0, 10.0, 8.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.159815549850464, -2.1062066555023193, -2.052597999572754, -1.9989891052246094, -1.9453802108764648, -1.8917714357376099, -1.8381626605987549, -1.7845537662506104, -1.7309448719024658, -1.6773360967636108, -1.6237272024154663, -1.5701184272766113, -1.5165095329284668, -1.4629007577896118, -1.4092919826507568, -1.3556830883026123, -1.3020743131637573, -1.2484655380249023, -1.1948566436767578, -1.1412478685379028, -1.0876389741897583, -1.0340301990509033, -0.9804213643074036, -0.9268125295639038, -0.873203694820404, -0.8195948600769043, -0.7659860253334045, -0.7123771905899048, -0.6587684154510498, -0.6051595211029053, -0.5515507459640503, -0.49794191122055054, -0.4443330764770508, -0.390724241733551, -0.33711540699005127, -0.2835066020488739, -0.22989776730537415, -0.1762889325618744, -0.12268012762069702, -0.06907129287719727, -0.01546245813369751, 0.03814636915922165, 0.09175519645214081, 0.14536401629447937, 0.19897285103797913, 0.2525816857814789, 0.30619049072265625, 0.359799325466156, 0.41340816020965576, 0.4670169949531555, 0.5206258296966553, 0.5742346048355103, 0.6278434991836548, 0.6814522743225098, 0.7350611090660095, 0.7886699438095093, 0.842278778553009, 0.8958876132965088, 0.9494964480400085, 1.0031052827835083, 1.0567140579223633, 1.1103229522705078, 1.1639317274093628, 1.2175405025482178, 1.2711493968963623]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 5.0, 1.0, 4.0, 3.0, 7.0, 7.0, 6.0, 13.0, 15.0, 8.0, 14.0, 17.0, 19.0, 23.0, 26.0, 29.0, 27.0, 28.0, 32.0, 29.0, 20.0, 33.0, 30.0, 32.0, 35.0, 45.0, 33.0, 35.0, 46.0, 28.0, 37.0, 38.0, 34.0, 23.0, 26.0, 34.0, 25.0, 20.0, 13.0, 14.0, 13.0, 14.0, 8.0, 13.0, 12.0, 3.0, 7.0, 11.0, 1.0, 5.0, 2.0, 1.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.4883461594581604, -0.4716911315917969, -0.45503610372543335, -0.4383810758590698, -0.4217260479927063, -0.4050710201263428, -0.38841602206230164, -0.3717609941959381, -0.3551059663295746, -0.33845093846321106, -0.32179591059684753, -0.305140882730484, -0.28848588466644287, -0.27183085680007935, -0.2551758289337158, -0.2385208010673523, -0.22186577320098877, -0.20521074533462524, -0.18855571746826172, -0.1719007045030594, -0.15524567663669586, -0.13859064877033234, -0.12193562835454941, -0.10528060793876648, -0.08862558007240295, -0.07197055220603943, -0.0553155317902565, -0.03866050764918327, -0.022005483508110046, -0.005350455641746521, 0.011304564774036407, 0.027959585189819336, 0.04461461305618286, 0.06126963719725609, 0.07792466133832932, 0.09457968175411224, 0.11123470962047577, 0.1278897374868393, 0.14454475045204163, 0.16119977831840515, 0.17785480618476868, 0.1945098340511322, 0.21116486191749573, 0.22781987488269806, 0.24447490274906158, 0.2611299157142639, 0.27778494358062744, 0.29443997144699097, 0.3110949993133545, 0.327750027179718, 0.34440505504608154, 0.36106008291244507, 0.3777151107788086, 0.3943701386451721, 0.41102513670921326, 0.4276801645755768, 0.4443351924419403, 0.46099022030830383, 0.47764524817466736, 0.4943002760410309, 0.510955274105072, 0.5276103019714355, 0.5442653298377991, 0.5609203577041626, 0.5775753855705261]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 4.0, 6.0, 4.0, 5.0, 12.0, 11.0, 10.0, 15.0, 24.0, 26.0, 37.0, 58.0, 70.0, 95.0, 166.0, 216.0, 345.0, 524.0, 978.0, 1732.0, 3824.0, 9412.0, 28058.0, 112653.0, 628026.0, 2097322.0, 1053481.0, 188863.0, 43952.0, 13835.0, 5298.0, 2357.0, 1207.0, 629.0, 347.0, 246.0, 135.0, 89.0, 67.0, 42.0, 34.0, 21.0, 11.0, 14.0, 8.0, 8.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.1552734375, -0.15091896057128906, -0.14656448364257812, -0.1422100067138672, -0.13785552978515625, -0.1335010528564453, -0.12914657592773438, -0.12479209899902344, -0.1204376220703125, -0.11608314514160156, -0.11172866821289062, -0.10737419128417969, -0.10301971435546875, -0.09866523742675781, -0.09431076049804688, -0.08995628356933594, -0.085601806640625, -0.08124732971191406, -0.07689285278320312, -0.07253837585449219, -0.06818389892578125, -0.06382942199707031, -0.059474945068359375, -0.05512046813964844, -0.0507659912109375, -0.04641151428222656, -0.042057037353515625, -0.03770256042480469, -0.03334808349609375, -0.028993606567382812, -0.024639129638671875, -0.020284652709960938, -0.01593017578125, -0.011575698852539062, -0.007221221923828125, -0.0028667449951171875, 0.00148773193359375, 0.0058422088623046875, 0.010196685791015625, 0.014551162719726562, 0.0189056396484375, 0.023260116577148438, 0.027614593505859375, 0.03196907043457031, 0.03632354736328125, 0.04067802429199219, 0.045032501220703125, 0.04938697814941406, 0.053741455078125, 0.05809593200683594, 0.062450408935546875, 0.06680488586425781, 0.07115936279296875, 0.07551383972167969, 0.07986831665039062, 0.08422279357910156, 0.0885772705078125, 0.09293174743652344, 0.09728622436523438, 0.10164070129394531, 0.10599517822265625, 0.11034965515136719, 0.11470413208007812, 0.11905860900878906, 0.1234130859375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 4.0, 5.0, 4.0, 8.0, 4.0, 16.0, 16.0, 24.0, 25.0, 37.0, 27.0, 33.0, 35.0, 46.0, 41.0, 45.0, 59.0, 62.0, 43.0, 59.0, 61.0, 45.0, 40.0, 33.0, 29.0, 38.0, 39.0, 27.0, 25.0, 15.0, 19.0, 9.0, 7.0, 11.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09197998046875, -0.089019775390625, -0.0860595703125, -0.083099365234375, -0.08013916015625, -0.077178955078125, -0.07421875, -0.071258544921875, -0.06829833984375, -0.065338134765625, -0.0623779296875, -0.059417724609375, -0.05645751953125, -0.053497314453125, -0.050537109375, -0.047576904296875, -0.04461669921875, -0.041656494140625, -0.0386962890625, -0.035736083984375, -0.03277587890625, -0.029815673828125, -0.02685546875, -0.023895263671875, -0.02093505859375, -0.017974853515625, -0.0150146484375, -0.012054443359375, -0.00909423828125, -0.006134033203125, -0.003173828125, -0.000213623046875, 0.00274658203125, 0.005706787109375, 0.0086669921875, 0.011627197265625, 0.01458740234375, 0.017547607421875, 0.0205078125, 0.023468017578125, 0.02642822265625, 0.029388427734375, 0.0323486328125, 0.035308837890625, 0.03826904296875, 0.041229248046875, 0.044189453125, 0.047149658203125, 0.05010986328125, 0.053070068359375, 0.0560302734375, 0.058990478515625, 0.06195068359375, 0.064910888671875, 0.06787109375, 0.070831298828125, 0.07379150390625, 0.076751708984375, 0.0797119140625, 0.082672119140625, 0.08563232421875, 0.088592529296875, 0.091552734375, 0.094512939453125, 0.09747314453125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 1.0, 4.0, 1.0, 3.0, 7.0, 6.0, 10.0, 6.0, 22.0, 23.0, 28.0, 39.0, 52.0, 79.0, 131.0, 222.0, 493.0, 1055.0, 3258.0, 14033.0, 93543.0, 936266.0, 2673141.0, 413854.0, 46082.0, 8096.0, 2209.0, 748.0, 379.0, 184.0, 111.0, 63.0, 34.0, 24.0, 10.0, 14.0, 14.0, 10.0, 4.0, 4.0, 4.0, 2.0, 10.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.25244140625, -0.24463272094726562, -0.23682403564453125, -0.22901535034179688, -0.2212066650390625, -0.21339797973632812, -0.20558929443359375, -0.19778060913085938, -0.189971923828125, -0.18216323852539062, -0.17435455322265625, -0.16654586791992188, -0.1587371826171875, -0.15092849731445312, -0.14311981201171875, -0.13531112670898438, -0.12750244140625, -0.11969375610351562, -0.11188507080078125, -0.10407638549804688, -0.0962677001953125, -0.08845901489257812, -0.08065032958984375, -0.07284164428710938, -0.065032958984375, -0.057224273681640625, -0.04941558837890625, -0.041606903076171875, -0.0337982177734375, -0.025989532470703125, -0.01818084716796875, -0.010372161865234375, -0.0025634765625, 0.005245208740234375, 0.01305389404296875, 0.020862579345703125, 0.0286712646484375, 0.036479949951171875, 0.04428863525390625, 0.052097320556640625, 0.059906005859375, 0.06771469116210938, 0.07552337646484375, 0.08333206176757812, 0.0911407470703125, 0.09894943237304688, 0.10675811767578125, 0.11456680297851562, 0.12237548828125, 0.13018417358398438, 0.13799285888671875, 0.14580154418945312, 0.1536102294921875, 0.16141891479492188, 0.16922760009765625, 0.17703628540039062, 0.184844970703125, 0.19265365600585938, 0.20046234130859375, 0.20827102661132812, 0.2160797119140625, 0.22388839721679688, 0.23169708251953125, 0.23950576782226562, 0.247314453125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 5.0, 4.0, 4.0, 3.0, 9.0, 7.0, 8.0, 6.0, 13.0, 19.0, 23.0, 28.0, 50.0, 51.0, 59.0, 66.0, 119.0, 146.0, 163.0, 214.0, 290.0, 314.0, 359.0, 309.0, 290.0, 274.0, 237.0, 212.0, 185.0, 120.0, 111.0, 88.0, 59.0, 45.0, 36.0, 34.0, 30.0, 12.0, 21.0, 15.0, 10.0, 7.0, 2.0, 4.0, 3.0, 4.0, 4.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1021728515625, -0.09877967834472656, -0.09538650512695312, -0.09199333190917969, -0.08860015869140625, -0.08520698547363281, -0.08181381225585938, -0.07842063903808594, -0.0750274658203125, -0.07163429260253906, -0.06824111938476562, -0.06484794616699219, -0.06145477294921875, -0.05806159973144531, -0.054668426513671875, -0.05127525329589844, -0.047882080078125, -0.04448890686035156, -0.041095733642578125, -0.03770256042480469, -0.03430938720703125, -0.030916213989257812, -0.027523040771484375, -0.024129867553710938, -0.0207366943359375, -0.017343521118164062, -0.013950347900390625, -0.010557174682617188, -0.00716400146484375, -0.0037708282470703125, -0.000377655029296875, 0.0030155181884765625, 0.00640869140625, 0.009801864624023438, 0.013195037841796875, 0.016588211059570312, 0.01998138427734375, 0.023374557495117188, 0.026767730712890625, 0.030160903930664062, 0.0335540771484375, 0.03694725036621094, 0.040340423583984375, 0.04373359680175781, 0.04712677001953125, 0.05051994323730469, 0.053913116455078125, 0.05730628967285156, 0.060699462890625, 0.06409263610839844, 0.06748580932617188, 0.07087898254394531, 0.07427215576171875, 0.07766532897949219, 0.08105850219726562, 0.08445167541503906, 0.0878448486328125, 0.09123802185058594, 0.09463119506835938, 0.09802436828613281, 0.10141754150390625, 0.10481071472167969, 0.10820388793945312, 0.11159706115722656, 0.114990234375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 5.0, 19.0, 15.0, 33.0, 39.0, 57.0, 106.0, 116.0, 136.0, 127.0, 99.0, 92.0, 64.0, 45.0, 22.0, 14.0, 9.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0224627256393433, -0.9937094449996948, -0.9649561643600464, -0.9362028241157532, -0.9074495434761047, -0.8786962628364563, -0.8499429821968079, -0.8211896419525146, -0.7924363613128662, -0.7636830806732178, -0.7349298000335693, -0.7061764597892761, -0.6774231791496277, -0.6486698985099792, -0.6199166178703308, -0.5911632776260376, -0.5624099969863892, -0.5336567163467407, -0.5049034357070923, -0.47615012526512146, -0.44739681482315063, -0.4186435341835022, -0.38989025354385376, -0.36113694310188293, -0.3323836922645569, -0.30363041162490845, -0.2748771011829376, -0.24612382054328918, -0.21737051010131836, -0.18861722946166992, -0.1598639339208603, -0.13111063838005066, -0.10235732793807983, -0.0736040323972702, -0.04485074058175087, -0.016097448766231537, 0.012655846774578094, 0.04140913486480713, 0.07016243040561676, 0.09891572594642639, 0.12766902148723602, 0.15642231702804565, 0.18517561256885529, 0.21392890810966492, 0.24268218874931335, 0.2714354991912842, 0.3001887798309326, 0.32894206047058105, 0.3576953709125519, 0.3864486515522003, 0.41520196199417114, 0.4439552426338196, 0.4727085530757904, 0.5014618635177612, 0.5302151441574097, 0.5589684247970581, 0.5877217054367065, 0.616474986076355, 0.6452282667160034, 0.6739816069602966, 0.7027348875999451, 0.7314881682395935, 0.7602414488792419, 0.7889947891235352, 0.8177480697631836]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 2.0, 6.0, 2.0, 5.0, 6.0, 8.0, 12.0, 8.0, 18.0, 15.0, 22.0, 17.0, 18.0, 19.0, 26.0, 27.0, 21.0, 38.0, 22.0, 27.0, 44.0, 46.0, 43.0, 41.0, 32.0, 40.0, 47.0, 38.0, 49.0, 20.0, 41.0, 31.0, 30.0, 27.0, 19.0, 15.0, 18.0, 19.0, 17.0, 11.0, 9.0, 9.0, 8.0, 9.0, 4.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.4364579916000366, -0.42261484265327454, -0.40877172350883484, -0.39492857456207275, -0.38108542561531067, -0.3672422766685486, -0.3533991575241089, -0.3395560085773468, -0.3257128596305847, -0.31186971068382263, -0.29802659153938293, -0.28418344259262085, -0.27034029364585876, -0.2564971446990967, -0.24265402555465698, -0.2288108766078949, -0.2149677574634552, -0.2011246234178543, -0.18728147447109222, -0.17343834042549133, -0.15959519147872925, -0.14575205743312836, -0.13190892338752747, -0.11806578189134598, -0.10422264039516449, -0.090379498898983, -0.07653635740280151, -0.06269322335720062, -0.048850081861019135, -0.035006940364837646, -0.021163806319236755, -0.007320664823055267, 0.006522476673126221, 0.02036561630666256, 0.0342087559401989, 0.04805189371109009, 0.061895035207271576, 0.07573817670345306, 0.08958131074905396, 0.10342445224523544, 0.11726759374141693, 0.13111072778701782, 0.1449538767337799, 0.1587970107793808, 0.1726401448249817, 0.18648329377174377, 0.20032642781734467, 0.21416956186294556, 0.22801271080970764, 0.24185584485530853, 0.2556989789009094, 0.2695421278476715, 0.2833852767944336, 0.2972283959388733, 0.3110715448856354, 0.32491469383239746, 0.33875781297683716, 0.35260096192359924, 0.36644408106803894, 0.380287230014801, 0.3941303789615631, 0.4079735279083252, 0.4218166470527649, 0.435659795999527, 0.44950294494628906]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 1.0, 8.0, 5.0, 6.0, 12.0, 8.0, 21.0, 23.0, 24.0, 39.0, 45.0, 73.0, 122.0, 179.0, 364.0, 689.0, 1524.0, 3892.0, 10504.0, 31224.0, 96859.0, 281210.0, 373873.0, 166686.0, 53280.0, 17134.0, 6110.0, 2373.0, 984.0, 514.0, 273.0, 171.0, 105.0, 73.0, 34.0, 34.0, 16.0, 11.0, 10.0, 10.0, 10.0, 8.0, 7.0, 5.0, 1.0, 1.0, 2.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.269287109375, -0.2597503662109375, -0.250213623046875, -0.2406768798828125, -0.23114013671875, -0.2216033935546875, -0.212066650390625, -0.2025299072265625, -0.1929931640625, -0.1834564208984375, -0.173919677734375, -0.1643829345703125, -0.15484619140625, -0.1453094482421875, -0.135772705078125, -0.1262359619140625, -0.11669921875, -0.1071624755859375, -0.097625732421875, -0.0880889892578125, -0.07855224609375, -0.0690155029296875, -0.059478759765625, -0.0499420166015625, -0.0404052734375, -0.0308685302734375, -0.021331787109375, -0.0117950439453125, -0.00225830078125, 0.0072784423828125, 0.016815185546875, 0.0263519287109375, 0.035888671875, 0.0454254150390625, 0.054962158203125, 0.0644989013671875, 0.07403564453125, 0.0835723876953125, 0.093109130859375, 0.1026458740234375, 0.1121826171875, 0.1217193603515625, 0.131256103515625, 0.1407928466796875, 0.15032958984375, 0.1598663330078125, 0.169403076171875, 0.1789398193359375, 0.1884765625, 0.1980133056640625, 0.207550048828125, 0.2170867919921875, 0.22662353515625, 0.2361602783203125, 0.245697021484375, 0.2552337646484375, 0.2647705078125, 0.2743072509765625, 0.283843994140625, 0.2933807373046875, 0.30291748046875, 0.3124542236328125, 0.321990966796875, 0.3315277099609375, 0.341064453125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 4.0, 4.0, 7.0, 10.0, 14.0, 13.0, 20.0, 25.0, 39.0, 34.0, 45.0, 47.0, 58.0, 55.0, 50.0, 74.0, 46.0, 68.0, 56.0, 51.0, 52.0, 43.0, 45.0, 41.0, 32.0, 22.0, 15.0, 7.0, 6.0, 5.0, 6.0, 2.0, 2.0, 4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.1290283203125, -0.12563323974609375, -0.1222381591796875, -0.11884307861328125, -0.115447998046875, -0.11205291748046875, -0.1086578369140625, -0.10526275634765625, -0.10186767578125, -0.09847259521484375, -0.0950775146484375, -0.09168243408203125, -0.088287353515625, -0.08489227294921875, -0.0814971923828125, -0.07810211181640625, -0.07470703125, -0.07131195068359375, -0.0679168701171875, -0.06452178955078125, -0.061126708984375, -0.05773162841796875, -0.0543365478515625, -0.05094146728515625, -0.04754638671875, -0.04415130615234375, -0.0407562255859375, -0.03736114501953125, -0.033966064453125, -0.03057098388671875, -0.0271759033203125, -0.02378082275390625, -0.0203857421875, -0.01699066162109375, -0.0135955810546875, -0.01020050048828125, -0.006805419921875, -0.00341033935546875, -1.52587890625e-05, 0.00337982177734375, 0.00677490234375, 0.01016998291015625, 0.0135650634765625, 0.01696014404296875, 0.020355224609375, 0.02375030517578125, 0.0271453857421875, 0.03054046630859375, 0.033935546875, 0.03733062744140625, 0.0407257080078125, 0.04412078857421875, 0.047515869140625, 0.05091094970703125, 0.0543060302734375, 0.05770111083984375, 0.06109619140625, 0.06449127197265625, 0.0678863525390625, 0.07128143310546875, 0.074676513671875, 0.07807159423828125, 0.0814666748046875, 0.08486175537109375, 0.0882568359375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 1.0, 6.0, 8.0, 9.0, 22.0, 15.0, 11.0, 23.0, 35.0, 50.0, 75.0, 116.0, 196.0, 429.0, 1072.0, 2512.0, 6499.0, 16827.0, 41228.0, 98559.0, 208185.0, 291958.0, 210447.0, 99985.0, 41966.0, 16964.0, 6564.0, 2647.0, 1100.0, 446.0, 204.0, 122.0, 85.0, 29.0, 39.0, 30.0, 22.0, 8.0, 11.0, 8.0, 9.0, 10.0, 5.0, 6.0, 0.0, 6.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0], "bins": [-0.242919921875, -0.2356700897216797, -0.22842025756835938, -0.22117042541503906, -0.21392059326171875, -0.20667076110839844, -0.19942092895507812, -0.1921710968017578, -0.1849212646484375, -0.1776714324951172, -0.17042160034179688, -0.16317176818847656, -0.15592193603515625, -0.14867210388183594, -0.14142227172851562, -0.1341724395751953, -0.126922607421875, -0.11967277526855469, -0.11242294311523438, -0.10517311096191406, -0.09792327880859375, -0.09067344665527344, -0.08342361450195312, -0.07617378234863281, -0.0689239501953125, -0.06167411804199219, -0.054424285888671875, -0.04717445373535156, -0.03992462158203125, -0.03267478942871094, -0.025424957275390625, -0.018175125122070312, -0.01092529296875, -0.0036754608154296875, 0.003574371337890625, 0.010824203491210938, 0.01807403564453125, 0.025323867797851562, 0.032573699951171875, 0.03982353210449219, 0.0470733642578125, 0.05432319641113281, 0.061573028564453125, 0.06882286071777344, 0.07607269287109375, 0.08332252502441406, 0.09057235717773438, 0.09782218933105469, 0.105072021484375, 0.11232185363769531, 0.11957168579101562, 0.12682151794433594, 0.13407135009765625, 0.14132118225097656, 0.14857101440429688, 0.1558208465576172, 0.1630706787109375, 0.1703205108642578, 0.17757034301757812, 0.18482017517089844, 0.19207000732421875, 0.19931983947753906, 0.20656967163085938, 0.2138195037841797, 0.2210693359375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 5.0, 5.0, 0.0, 3.0, 3.0, 3.0, 7.0, 7.0, 12.0, 10.0, 13.0, 16.0, 21.0, 16.0, 26.0, 22.0, 25.0, 32.0, 13.0, 28.0, 41.0, 42.0, 48.0, 35.0, 42.0, 33.0, 50.0, 35.0, 34.0, 46.0, 34.0, 42.0, 31.0, 30.0, 20.0, 32.0, 22.0, 29.0, 17.0, 17.0, 13.0, 8.0, 11.0, 10.0, 3.0, 5.0, 4.0, 5.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.19970703125, -0.19327545166015625, -0.1868438720703125, -0.18041229248046875, -0.173980712890625, -0.16754913330078125, -0.1611175537109375, -0.15468597412109375, -0.14825439453125, -0.14182281494140625, -0.1353912353515625, -0.12895965576171875, -0.122528076171875, -0.11609649658203125, -0.1096649169921875, -0.10323333740234375, -0.0968017578125, -0.09037017822265625, -0.0839385986328125, -0.07750701904296875, -0.071075439453125, -0.06464385986328125, -0.0582122802734375, -0.05178070068359375, -0.04534912109375, -0.03891754150390625, -0.0324859619140625, -0.02605438232421875, -0.019622802734375, -0.01319122314453125, -0.0067596435546875, -0.00032806396484375, 0.006103515625, 0.01253509521484375, 0.0189666748046875, 0.02539825439453125, 0.031829833984375, 0.03826141357421875, 0.0446929931640625, 0.05112457275390625, 0.05755615234375, 0.06398773193359375, 0.0704193115234375, 0.07685089111328125, 0.083282470703125, 0.08971405029296875, 0.0961456298828125, 0.10257720947265625, 0.1090087890625, 0.11544036865234375, 0.1218719482421875, 0.12830352783203125, 0.134735107421875, 0.14116668701171875, 0.1475982666015625, 0.15402984619140625, 0.16046142578125, 0.16689300537109375, 0.1733245849609375, 0.17975616455078125, 0.186187744140625, 0.19261932373046875, 0.1990509033203125, 0.20548248291015625, 0.2119140625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 9.0, 21.0, 28.0, 38.0, 73.0, 60.0, 131.0, 149.0, 240.0, 382.0, 533.0, 927.0, 1449.0, 2283.0, 4008.0, 6949.0, 12038.0, 20787.0, 36671.0, 61685.0, 99364.0, 141702.0, 168992.0, 161653.0, 125500.0, 82898.0, 50752.0, 29018.0, 16904.0, 9499.0, 5409.0, 3137.0, 1921.0, 1192.0, 735.0, 483.0, 288.0, 202.0, 149.0, 84.0, 54.0, 49.0, 34.0, 23.0, 16.0, 8.0, 11.0, 8.0, 4.0, 3.0, 0.0, 4.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.053985595703125, -0.05223274230957031, -0.050479888916015625, -0.04872703552246094, -0.04697418212890625, -0.04522132873535156, -0.043468475341796875, -0.04171562194824219, -0.0399627685546875, -0.03820991516113281, -0.036457061767578125, -0.03470420837402344, -0.03295135498046875, -0.031198501586914062, -0.029445648193359375, -0.027692794799804688, -0.02593994140625, -0.024187088012695312, -0.022434234619140625, -0.020681381225585938, -0.01892852783203125, -0.017175674438476562, -0.015422821044921875, -0.013669967651367188, -0.0119171142578125, -0.010164260864257812, -0.008411407470703125, -0.0066585540771484375, -0.00490570068359375, -0.0031528472900390625, -0.001399993896484375, 0.0003528594970703125, 0.002105712890625, 0.0038585662841796875, 0.005611419677734375, 0.0073642730712890625, 0.00911712646484375, 0.010869979858398438, 0.012622833251953125, 0.014375686645507812, 0.0161285400390625, 0.017881393432617188, 0.019634246826171875, 0.021387100219726562, 0.02313995361328125, 0.024892807006835938, 0.026645660400390625, 0.028398513793945312, 0.0301513671875, 0.03190422058105469, 0.033657073974609375, 0.03540992736816406, 0.03716278076171875, 0.03891563415527344, 0.040668487548828125, 0.04242134094238281, 0.0441741943359375, 0.04592704772949219, 0.047679901123046875, 0.04943275451660156, 0.05118560791015625, 0.05293846130371094, 0.054691314697265625, 0.05644416809082031, 0.058197021484375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 0.0, 3.0, 2.0, 2.0, 1.0, 9.0, 3.0, 2.0, 10.0, 5.0, 10.0, 10.0, 11.0, 21.0, 21.0, 25.0, 21.0, 34.0, 49.0, 47.0, 58.0, 71.0, 58.0, 69.0, 64.0, 51.0, 68.0, 51.0, 33.0, 36.0, 28.0, 21.0, 22.0, 19.0, 16.0, 10.0, 11.0, 8.0, 3.0, 5.0, 4.0, 6.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.52587890625e-05, -1.477077603340149e-05, -1.4282763004302979e-05, -1.3794749975204468e-05, -1.3306736946105957e-05, -1.2818723917007446e-05, -1.2330710887908936e-05, -1.1842697858810425e-05, -1.1354684829711914e-05, -1.0866671800613403e-05, -1.0378658771514893e-05, -9.890645742416382e-06, -9.402632713317871e-06, -8.91461968421936e-06, -8.42660665512085e-06, -7.938593626022339e-06, -7.450580596923828e-06, -6.962567567825317e-06, -6.474554538726807e-06, -5.986541509628296e-06, -5.498528480529785e-06, -5.010515451431274e-06, -4.522502422332764e-06, -4.034489393234253e-06, -3.546476364135742e-06, -3.0584633350372314e-06, -2.5704503059387207e-06, -2.08243727684021e-06, -1.5944242477416992e-06, -1.1064112186431885e-06, -6.183981895446777e-07, -1.30385160446167e-07, 3.5762786865234375e-07, 8.456408977508545e-07, 1.3336539268493652e-06, 1.821666955947876e-06, 2.3096799850463867e-06, 2.7976930141448975e-06, 3.285706043243408e-06, 3.773719072341919e-06, 4.26173210144043e-06, 4.7497451305389404e-06, 5.237758159637451e-06, 5.725771188735962e-06, 6.213784217834473e-06, 6.701797246932983e-06, 7.189810276031494e-06, 7.677823305130005e-06, 8.165836334228516e-06, 8.653849363327026e-06, 9.141862392425537e-06, 9.629875421524048e-06, 1.0117888450622559e-05, 1.060590147972107e-05, 1.109391450881958e-05, 1.158192753791809e-05, 1.2069940567016602e-05, 1.2557953596115112e-05, 1.3045966625213623e-05, 1.3533979654312134e-05, 1.4021992683410645e-05, 1.4510005712509155e-05, 1.4998018741607666e-05, 1.5486031770706177e-05, 1.5974044799804688e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 7.0, 6.0, 6.0, 18.0, 34.0, 49.0, 85.0, 175.0, 353.0, 643.0, 1288.0, 2863.0, 6305.0, 14605.0, 36140.0, 86026.0, 177654.0, 260847.0, 231524.0, 130142.0, 57901.0, 23823.0, 9874.0, 4271.0, 1963.0, 918.0, 491.0, 241.0, 124.0, 78.0, 37.0, 21.0, 10.0, 7.0, 10.0, 7.0, 4.0, 3.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07720947265625, -0.074615478515625, -0.072021484375, -0.069427490234375, -0.06683349609375, -0.064239501953125, -0.0616455078125, -0.059051513671875, -0.05645751953125, -0.053863525390625, -0.05126953125, -0.048675537109375, -0.04608154296875, -0.043487548828125, -0.0408935546875, -0.038299560546875, -0.03570556640625, -0.033111572265625, -0.030517578125, -0.027923583984375, -0.02532958984375, -0.022735595703125, -0.0201416015625, -0.017547607421875, -0.01495361328125, -0.012359619140625, -0.009765625, -0.007171630859375, -0.00457763671875, -0.001983642578125, 0.0006103515625, 0.003204345703125, 0.00579833984375, 0.008392333984375, 0.010986328125, 0.013580322265625, 0.01617431640625, 0.018768310546875, 0.0213623046875, 0.023956298828125, 0.02655029296875, 0.029144287109375, 0.03173828125, 0.034332275390625, 0.03692626953125, 0.039520263671875, 0.0421142578125, 0.044708251953125, 0.04730224609375, 0.049896240234375, 0.052490234375, 0.055084228515625, 0.05767822265625, 0.060272216796875, 0.0628662109375, 0.065460205078125, 0.06805419921875, 0.070648193359375, 0.0732421875, 0.075836181640625, 0.07843017578125, 0.081024169921875, 0.0836181640625, 0.086212158203125, 0.08880615234375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 4.0, 7.0, 7.0, 12.0, 7.0, 13.0, 17.0, 23.0, 19.0, 23.0, 47.0, 36.0, 47.0, 42.0, 55.0, 53.0, 59.0, 58.0, 51.0, 62.0, 45.0, 61.0, 46.0, 37.0, 36.0, 17.0, 27.0, 14.0, 18.0, 22.0, 8.0, 10.0, 4.0, 7.0, 5.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.07830810546875, -0.076171875, -0.07403564453125, -0.0718994140625, -0.06976318359375, -0.067626953125, -0.06549072265625, -0.0633544921875, -0.06121826171875, -0.05908203125, -0.05694580078125, -0.0548095703125, -0.05267333984375, -0.050537109375, -0.04840087890625, -0.0462646484375, -0.04412841796875, -0.0419921875, -0.03985595703125, -0.0377197265625, -0.03558349609375, -0.033447265625, -0.03131103515625, -0.0291748046875, -0.02703857421875, -0.02490234375, -0.02276611328125, -0.0206298828125, -0.01849365234375, -0.016357421875, -0.01422119140625, -0.0120849609375, -0.00994873046875, -0.0078125, -0.00567626953125, -0.0035400390625, -0.00140380859375, 0.000732421875, 0.00286865234375, 0.0050048828125, 0.00714111328125, 0.00927734375, 0.01141357421875, 0.0135498046875, 0.01568603515625, 0.017822265625, 0.01995849609375, 0.0220947265625, 0.02423095703125, 0.0263671875, 0.02850341796875, 0.0306396484375, 0.03277587890625, 0.034912109375, 0.03704833984375, 0.0391845703125, 0.04132080078125, 0.04345703125, 0.04559326171875, 0.0477294921875, 0.04986572265625, 0.052001953125, 0.05413818359375, 0.0562744140625, 0.05841064453125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 8.0, 7.0, 20.0, 25.0, 65.0, 71.0, 100.0, 156.0, 154.0, 121.0, 107.0, 81.0, 48.0, 15.0, 22.0, 8.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7180291414260864, -0.6769859790802002, -0.6359428763389587, -0.5948997139930725, -0.553856611251831, -0.5128134489059448, -0.4717702865600586, -0.43072715401649475, -0.3896840214729309, -0.34864088892936707, -0.3075977563858032, -0.266554594039917, -0.22551146149635315, -0.1844683289527893, -0.14342518150806427, -0.10238203406333923, -0.06133890151977539, -0.02029576152563095, 0.02074737846851349, 0.06179051846265793, 0.10283365845680237, 0.1438767910003662, 0.18491993844509125, 0.22596308588981628, 0.2670062184333801, 0.30804935097694397, 0.3490924835205078, 0.39013564586639404, 0.4311787784099579, 0.47222191095352173, 0.513265073299408, 0.5543081760406494, 0.5953513383865356, 0.6363945007324219, 0.6774376034736633, 0.7184807658195496, 0.759523868560791, 0.8005670309066772, 0.8416101932525635, 0.8826533555984497, 0.9236964583396912, 0.9647396206855774, 1.0057827234268188, 1.046825885772705, 1.0878690481185913, 1.1289122104644775, 1.1699552536010742, 1.2109984159469604, 1.2520415782928467, 1.293084740638733, 1.3341279029846191, 1.3751709461212158, 1.416214108467102, 1.4572572708129883, 1.4983004331588745, 1.5393435955047607, 1.5803866386413574, 1.6214298009872437, 1.6624729633331299, 1.7035160064697266, 1.7445591688156128, 1.785602331161499, 1.8266454935073853, 1.8676886558532715, 1.9087318181991577]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 7.0, 5.0, 3.0, 12.0, 13.0, 11.0, 18.0, 11.0, 19.0, 23.0, 23.0, 18.0, 27.0, 27.0, 19.0, 30.0, 42.0, 41.0, 49.0, 55.0, 47.0, 46.0, 39.0, 45.0, 34.0, 48.0, 25.0, 26.0, 27.0, 29.0, 34.0, 30.0, 22.0, 15.0, 12.0, 17.0, 6.0, 10.0, 11.0, 10.0, 4.0, 7.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.6619657874107361, -0.6400976181030273, -0.6182293891906738, -0.5963612198829651, -0.5744930505752563, -0.5526248216629028, -0.5307566523551941, -0.5088884830474854, -0.48702025413513184, -0.4651520550251007, -0.44328388571739197, -0.42141568660736084, -0.3995474874973297, -0.3776792883872986, -0.35581111907958984, -0.3339429199695587, -0.31207475066185, -0.29020655155181885, -0.2683383822441101, -0.24647018313407898, -0.22460198402404785, -0.20273379981517792, -0.18086561560630798, -0.15899741649627686, -0.13712923228740692, -0.11526104062795639, -0.09339284896850586, -0.07152466475963593, -0.049656473100185394, -0.027788281440734863, -0.005920097231864929, 0.0159481018781662, 0.03781628608703613, 0.059684477746486664, 0.0815526694059372, 0.10342085361480713, 0.12528905272483826, 0.1471572369337082, 0.16902542114257812, 0.19089362025260925, 0.2127618044614792, 0.23462998867034912, 0.25649818778038025, 0.2783663868904114, 0.3002345561981201, 0.32210275530815125, 0.3439709544181824, 0.3658391237258911, 0.38770732283592224, 0.40957552194595337, 0.4314436912536621, 0.45331189036369324, 0.47518008947372437, 0.4970482587814331, 0.5189164876937866, 0.5407846570014954, 0.5626528263092041, 0.5845209956169128, 0.6063892245292664, 0.6282573938369751, 0.6501255631446838, 0.6719937920570374, 0.6938619613647461, 0.7157301902770996, 0.7375983595848083]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 8.0, 2.0, 10.0, 13.0, 18.0, 25.0, 35.0, 43.0, 60.0, 137.0, 207.0, 301.0, 768.0, 1864.0, 6819.0, 43054.0, 846595.0, 3082390.0, 187660.0, 18401.0, 3763.0, 1180.0, 435.0, 202.0, 111.0, 72.0, 43.0, 29.0, 14.0, 12.0, 5.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.404296875, -0.3949546813964844, -0.38561248779296875, -0.3762702941894531, -0.3669281005859375, -0.3575859069824219, -0.34824371337890625, -0.3389015197753906, -0.329559326171875, -0.3202171325683594, -0.31087493896484375, -0.3015327453613281, -0.2921905517578125, -0.2828483581542969, -0.27350616455078125, -0.2641639709472656, -0.25482177734375, -0.24547958374023438, -0.23613739013671875, -0.22679519653320312, -0.2174530029296875, -0.20811080932617188, -0.19876861572265625, -0.18942642211914062, -0.180084228515625, -0.17074203491210938, -0.16139984130859375, -0.15205764770507812, -0.1427154541015625, -0.13337326049804688, -0.12403106689453125, -0.11468887329101562, -0.1053466796875, -0.09600448608398438, -0.08666229248046875, -0.07732009887695312, -0.0679779052734375, -0.058635711669921875, -0.04929351806640625, -0.039951324462890625, -0.030609130859375, -0.021266937255859375, -0.01192474365234375, -0.002582550048828125, 0.0067596435546875, 0.016101837158203125, 0.02544403076171875, 0.034786224365234375, 0.04412841796875, 0.053470611572265625, 0.06281280517578125, 0.07215499877929688, 0.0814971923828125, 0.09083938598632812, 0.10018157958984375, 0.10952377319335938, 0.118865966796875, 0.12820816040039062, 0.13755035400390625, 0.14689254760742188, 0.1562347412109375, 0.16557693481445312, 0.17491912841796875, 0.18426132202148438, 0.193603515625]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 3.0, 9.0, 7.0, 20.0, 12.0, 23.0, 23.0, 36.0, 39.0, 40.0, 42.0, 51.0, 62.0, 60.0, 59.0, 61.0, 70.0, 53.0, 56.0, 57.0, 49.0, 47.0, 26.0, 25.0, 26.0, 13.0, 10.0, 7.0, 7.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.1416015625, -0.13797664642333984, -0.1343517303466797, -0.13072681427001953, -0.12710189819335938, -0.12347698211669922, -0.11985206604003906, -0.1162271499633789, -0.11260223388671875, -0.1089773178100586, -0.10535240173339844, -0.10172748565673828, -0.09810256958007812, -0.09447765350341797, -0.09085273742675781, -0.08722782135009766, -0.0836029052734375, -0.07997798919677734, -0.07635307312011719, -0.07272815704345703, -0.06910324096679688, -0.06547832489013672, -0.06185340881347656, -0.058228492736816406, -0.05460357666015625, -0.050978660583496094, -0.04735374450683594, -0.04372882843017578, -0.040103912353515625, -0.03647899627685547, -0.03285408020019531, -0.029229164123535156, -0.025604248046875, -0.021979331970214844, -0.018354415893554688, -0.014729499816894531, -0.011104583740234375, -0.007479667663574219, -0.0038547515869140625, -0.00022983551025390625, 0.00339508056640625, 0.007019996643066406, 0.010644912719726562, 0.014269828796386719, 0.017894744873046875, 0.02151966094970703, 0.025144577026367188, 0.028769493103027344, 0.0323944091796875, 0.036019325256347656, 0.03964424133300781, 0.04326915740966797, 0.046894073486328125, 0.05051898956298828, 0.05414390563964844, 0.057768821716308594, 0.06139373779296875, 0.0650186538696289, 0.06864356994628906, 0.07226848602294922, 0.07589340209960938, 0.07951831817626953, 0.08314323425292969, 0.08676815032958984, 0.09039306640625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 3.0, 6.0, 9.0, 13.0, 11.0, 21.0, 22.0, 44.0, 106.0, 187.0, 387.0, 927.0, 2491.0, 11088.0, 97861.0, 1918669.0, 2041131.0, 105488.0, 11420.0, 2624.0, 943.0, 379.0, 174.0, 113.0, 69.0, 28.0, 21.0, 13.0, 8.0, 7.0, 7.0, 1.0, 3.0, 5.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35888671875, -0.34833526611328125, -0.3377838134765625, -0.32723236083984375, -0.316680908203125, -0.30612945556640625, -0.2955780029296875, -0.28502655029296875, -0.27447509765625, -0.26392364501953125, -0.2533721923828125, -0.24282073974609375, -0.232269287109375, -0.22171783447265625, -0.2111663818359375, -0.20061492919921875, -0.1900634765625, -0.17951202392578125, -0.1689605712890625, -0.15840911865234375, -0.147857666015625, -0.13730621337890625, -0.1267547607421875, -0.11620330810546875, -0.10565185546875, -0.09510040283203125, -0.0845489501953125, -0.07399749755859375, -0.063446044921875, -0.05289459228515625, -0.0423431396484375, -0.03179168701171875, -0.021240234375, -0.01068878173828125, -0.0001373291015625, 0.01041412353515625, 0.020965576171875, 0.03151702880859375, 0.0420684814453125, 0.05261993408203125, 0.06317138671875, 0.07372283935546875, 0.0842742919921875, 0.09482574462890625, 0.105377197265625, 0.11592864990234375, 0.1264801025390625, 0.13703155517578125, 0.1475830078125, 0.15813446044921875, 0.1686859130859375, 0.17923736572265625, 0.189788818359375, 0.20034027099609375, 0.2108917236328125, 0.22144317626953125, 0.23199462890625, 0.24254608154296875, 0.2530975341796875, 0.26364898681640625, 0.274200439453125, 0.28475189208984375, 0.2953033447265625, 0.30585479736328125, 0.31640625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 3.0, 9.0, 8.0, 10.0, 8.0, 19.0, 23.0, 31.0, 51.0, 76.0, 79.0, 137.0, 184.0, 222.0, 295.0, 405.0, 471.0, 466.0, 358.0, 337.0, 259.0, 182.0, 134.0, 83.0, 62.0, 40.0, 34.0, 25.0, 11.0, 16.0, 11.0, 6.0, 4.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.127197265625, -0.122650146484375, -0.11810302734375, -0.113555908203125, -0.1090087890625, -0.104461669921875, -0.09991455078125, -0.095367431640625, -0.0908203125, -0.086273193359375, -0.08172607421875, -0.077178955078125, -0.0726318359375, -0.068084716796875, -0.06353759765625, -0.058990478515625, -0.054443359375, -0.049896240234375, -0.04534912109375, -0.040802001953125, -0.0362548828125, -0.031707763671875, -0.02716064453125, -0.022613525390625, -0.01806640625, -0.013519287109375, -0.00897216796875, -0.004425048828125, 0.0001220703125, 0.004669189453125, 0.00921630859375, 0.013763427734375, 0.018310546875, 0.022857666015625, 0.02740478515625, 0.031951904296875, 0.0364990234375, 0.041046142578125, 0.04559326171875, 0.050140380859375, 0.0546875, 0.059234619140625, 0.06378173828125, 0.068328857421875, 0.0728759765625, 0.077423095703125, 0.08197021484375, 0.086517333984375, 0.091064453125, 0.095611572265625, 0.10015869140625, 0.104705810546875, 0.1092529296875, 0.113800048828125, 0.11834716796875, 0.122894287109375, 0.12744140625, 0.131988525390625, 0.13653564453125, 0.141082763671875, 0.1456298828125, 0.150177001953125, 0.15472412109375, 0.159271240234375, 0.163818359375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 13.0, 13.0, 21.0, 31.0, 30.0, 62.0, 65.0, 71.0, 98.0, 103.0, 80.0, 90.0, 72.0, 63.0, 67.0, 39.0, 19.0, 20.0, 18.0, 7.0, 10.0, 4.0, 3.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.7866369485855103, -0.764180064201355, -0.7417231798171997, -0.7192662954330444, -0.6968094110488892, -0.6743525862693787, -0.6518957018852234, -0.6294388175010681, -0.6069819331169128, -0.5845250487327576, -0.5620681643486023, -0.539611279964447, -0.5171544551849365, -0.49469754099845886, -0.472240686416626, -0.4497838020324707, -0.42732691764831543, -0.40487003326416016, -0.3824131488800049, -0.359956294298172, -0.3374994099140167, -0.31504252552986145, -0.29258567094802856, -0.2701287865638733, -0.24767190217971802, -0.22521501779556274, -0.20275814831256866, -0.18030127882957458, -0.1578443944454193, -0.13538751006126404, -0.11293064057826996, -0.09047377109527588, -0.0680168867111206, -0.04556000977754593, -0.023103132843971252, -0.0006462559103965759, 0.0218106210231781, 0.04426749795675278, 0.06672437489032745, 0.08918124437332153, 0.1116381287574768, 0.13409501314163208, 0.15655188262462616, 0.17900875210762024, 0.2014656364917755, 0.2239225208759308, 0.24637939035892487, 0.26883625984191895, 0.2912931442260742, 0.3137500286102295, 0.33620691299438477, 0.35866376757621765, 0.3811206519603729, 0.4035775363445282, 0.4260343909263611, 0.44849127531051636, 0.47094815969467163, 0.4934050440788269, 0.5158619284629822, 0.5383188128471375, 0.560775637626648, 0.5832325220108032, 0.6056894063949585, 0.6281462907791138, 0.650603175163269]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 5.0, 7.0, 8.0, 9.0, 9.0, 15.0, 18.0, 16.0, 21.0, 21.0, 41.0, 33.0, 26.0, 37.0, 43.0, 45.0, 41.0, 46.0, 52.0, 43.0, 44.0, 43.0, 37.0, 48.0, 37.0, 32.0, 34.0, 33.0, 30.0, 19.0, 29.0, 19.0, 12.0, 8.0, 13.0, 4.0, 8.0, 9.0, 6.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.48170560598373413, -0.46622613072395325, -0.45074665546417236, -0.4352671802043915, -0.4197877049446106, -0.4043082296848297, -0.38882875442504883, -0.37334927916526794, -0.35786980390548706, -0.3423903286457062, -0.3269108533859253, -0.3114313781261444, -0.2959519028663635, -0.28047242760658264, -0.26499295234680176, -0.24951347708702087, -0.23403401672840118, -0.2185545414686203, -0.20307506620883942, -0.18759559094905853, -0.17211611568927765, -0.15663665533065796, -0.14115718007087708, -0.1256777048110962, -0.11019822210073471, -0.09471874684095383, -0.07923927158117294, -0.06375980377197266, -0.048280324786901474, -0.03280085325241089, -0.017321377992630005, -0.001841902732849121, 0.013637572526931763, 0.029117047786712646, 0.04459652304649353, 0.060075994580984116, 0.0755554735660553, 0.09103494137525558, 0.10651441663503647, 0.12199389189481735, 0.13747337460517883, 0.15295284986495972, 0.1684323251247406, 0.18391180038452148, 0.19939127564430237, 0.21487075090408325, 0.23035022616386414, 0.24582970142364502, 0.2613091468811035, 0.2767886221408844, 0.2922680974006653, 0.30774757266044617, 0.32322704792022705, 0.33870652318000793, 0.3541859984397888, 0.3696654736995697, 0.3851449489593506, 0.40062442421913147, 0.41610389947891235, 0.43158337473869324, 0.4470628499984741, 0.462542325258255, 0.4780218005180359, 0.4935012757778168, 0.5089807510375977]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 2.0, 10.0, 10.0, 19.0, 21.0, 36.0, 41.0, 91.0, 137.0, 270.0, 596.0, 1570.0, 5261.0, 18565.0, 83018.0, 376660.0, 429201.0, 101571.0, 22434.0, 5836.0, 1794.0, 654.0, 307.0, 164.0, 87.0, 67.0, 43.0, 18.0, 21.0, 13.0, 9.0, 5.0, 7.0, 3.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5888671875, -0.567108154296875, -0.54534912109375, -0.523590087890625, -0.5018310546875, -0.480072021484375, -0.45831298828125, -0.436553955078125, -0.414794921875, -0.393035888671875, -0.37127685546875, -0.349517822265625, -0.3277587890625, -0.305999755859375, -0.28424072265625, -0.262481689453125, -0.24072265625, -0.218963623046875, -0.19720458984375, -0.175445556640625, -0.1536865234375, -0.131927490234375, -0.11016845703125, -0.088409423828125, -0.066650390625, -0.044891357421875, -0.02313232421875, -0.001373291015625, 0.0203857421875, 0.042144775390625, 0.06390380859375, 0.085662841796875, 0.107421875, 0.129180908203125, 0.15093994140625, 0.172698974609375, 0.1944580078125, 0.216217041015625, 0.23797607421875, 0.259735107421875, 0.281494140625, 0.303253173828125, 0.32501220703125, 0.346771240234375, 0.3685302734375, 0.390289306640625, 0.41204833984375, 0.433807373046875, 0.45556640625, 0.477325439453125, 0.49908447265625, 0.520843505859375, 0.5426025390625, 0.564361572265625, 0.58612060546875, 0.607879638671875, 0.629638671875, 0.651397705078125, 0.67315673828125, 0.694915771484375, 0.7166748046875, 0.738433837890625, 0.76019287109375, 0.781951904296875, 0.8037109375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 7.0, 9.0, 11.0, 14.0, 20.0, 22.0, 27.0, 39.0, 38.0, 42.0, 54.0, 55.0, 64.0, 79.0, 55.0, 61.0, 55.0, 49.0, 61.0, 51.0, 55.0, 33.0, 31.0, 18.0, 16.0, 17.0, 7.0, 5.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.144287109375, -0.14061927795410156, -0.13695144653320312, -0.1332836151123047, -0.12961578369140625, -0.1259479522705078, -0.12228012084960938, -0.11861228942871094, -0.1149444580078125, -0.11127662658691406, -0.10760879516601562, -0.10394096374511719, -0.10027313232421875, -0.09660530090332031, -0.09293746948242188, -0.08926963806152344, -0.085601806640625, -0.08193397521972656, -0.07826614379882812, -0.07459831237792969, -0.07093048095703125, -0.06726264953613281, -0.06359481811523438, -0.05992698669433594, -0.0562591552734375, -0.05259132385253906, -0.048923492431640625, -0.04525566101074219, -0.04158782958984375, -0.03791999816894531, -0.034252166748046875, -0.030584335327148438, -0.02691650390625, -0.023248672485351562, -0.019580841064453125, -0.015913009643554688, -0.01224517822265625, -0.008577346801757812, -0.004909515380859375, -0.0012416839599609375, 0.0024261474609375, 0.0060939788818359375, 0.009761810302734375, 0.013429641723632812, 0.01709747314453125, 0.020765304565429688, 0.024433135986328125, 0.028100967407226562, 0.031768798828125, 0.03543663024902344, 0.039104461669921875, 0.04277229309082031, 0.04644012451171875, 0.05010795593261719, 0.053775787353515625, 0.05744361877441406, 0.0611114501953125, 0.06477928161621094, 0.06844711303710938, 0.07211494445800781, 0.07578277587890625, 0.07945060729980469, 0.08311843872070312, 0.08678627014160156, 0.0904541015625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 10.0, 9.0, 14.0, 17.0, 24.0, 43.0, 54.0, 106.0, 147.0, 228.0, 442.0, 852.0, 1552.0, 2969.0, 5760.0, 12044.0, 26606.0, 61398.0, 136852.0, 246079.0, 262443.0, 157971.0, 73243.0, 31481.0, 14233.0, 6716.0, 3319.0, 1751.0, 900.0, 545.0, 297.0, 155.0, 99.0, 70.0, 37.0, 29.0, 21.0, 14.0, 12.0, 11.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.330078125, -0.3206748962402344, -0.31127166748046875, -0.3018684387207031, -0.2924652099609375, -0.2830619812011719, -0.27365875244140625, -0.2642555236816406, -0.254852294921875, -0.24544906616210938, -0.23604583740234375, -0.22664260864257812, -0.2172393798828125, -0.20783615112304688, -0.19843292236328125, -0.18902969360351562, -0.17962646484375, -0.17022323608398438, -0.16082000732421875, -0.15141677856445312, -0.1420135498046875, -0.13261032104492188, -0.12320709228515625, -0.11380386352539062, -0.104400634765625, -0.09499740600585938, -0.08559417724609375, -0.07619094848632812, -0.0667877197265625, -0.057384490966796875, -0.04798126220703125, -0.038578033447265625, -0.0291748046875, -0.019771575927734375, -0.01036834716796875, -0.000965118408203125, 0.0084381103515625, 0.017841339111328125, 0.02724456787109375, 0.036647796630859375, 0.046051025390625, 0.055454254150390625, 0.06485748291015625, 0.07426071166992188, 0.0836639404296875, 0.09306716918945312, 0.10247039794921875, 0.11187362670898438, 0.12127685546875, 0.13068008422851562, 0.14008331298828125, 0.14948654174804688, 0.1588897705078125, 0.16829299926757812, 0.17769622802734375, 0.18709945678710938, 0.196502685546875, 0.20590591430664062, 0.21530914306640625, 0.22471237182617188, 0.2341156005859375, 0.24351882934570312, 0.25292205810546875, 0.2623252868652344, 0.271728515625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 1.0, 3.0, 4.0, 5.0, 5.0, 14.0, 11.0, 12.0, 15.0, 18.0, 16.0, 24.0, 32.0, 39.0, 48.0, 38.0, 45.0, 47.0, 50.0, 43.0, 50.0, 52.0, 50.0, 40.0, 50.0, 44.0, 53.0, 27.0, 33.0, 29.0, 24.0, 16.0, 10.0, 11.0, 6.0, 6.0, 9.0, 8.0, 1.0, 2.0, 1.0, 1.0, 7.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.299072265625, -0.2906494140625, -0.2822265625, -0.2738037109375, -0.265380859375, -0.2569580078125, -0.24853515625, -0.2401123046875, -0.231689453125, -0.2232666015625, -0.21484375, -0.2064208984375, -0.197998046875, -0.1895751953125, -0.18115234375, -0.1727294921875, -0.164306640625, -0.1558837890625, -0.1474609375, -0.1390380859375, -0.130615234375, -0.1221923828125, -0.11376953125, -0.1053466796875, -0.096923828125, -0.0885009765625, -0.080078125, -0.0716552734375, -0.063232421875, -0.0548095703125, -0.04638671875, -0.0379638671875, -0.029541015625, -0.0211181640625, -0.0126953125, -0.0042724609375, 0.004150390625, 0.0125732421875, 0.02099609375, 0.0294189453125, 0.037841796875, 0.0462646484375, 0.0546875, 0.0631103515625, 0.071533203125, 0.0799560546875, 0.08837890625, 0.0968017578125, 0.105224609375, 0.1136474609375, 0.1220703125, 0.1304931640625, 0.138916015625, 0.1473388671875, 0.15576171875, 0.1641845703125, 0.172607421875, 0.1810302734375, 0.189453125, 0.1978759765625, 0.206298828125, 0.2147216796875, 0.22314453125, 0.2315673828125, 0.239990234375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 3.0, 9.0, 7.0, 4.0, 13.0, 13.0, 29.0, 35.0, 47.0, 86.0, 104.0, 156.0, 238.0, 389.0, 633.0, 967.0, 1369.0, 2029.0, 3380.0, 5593.0, 9479.0, 16290.0, 29163.0, 54236.0, 105865.0, 194091.0, 247094.0, 174305.0, 92384.0, 47923.0, 25599.0, 14699.0, 8479.0, 5124.0, 3074.0, 1952.0, 1263.0, 821.0, 519.0, 345.0, 230.0, 169.0, 122.0, 79.0, 41.0, 35.0, 23.0, 16.0, 13.0, 13.0, 4.0, 3.0, 2.0, 4.0, 2.0], "bins": [-0.1322021484375, -0.12846755981445312, -0.12473297119140625, -0.12099838256835938, -0.1172637939453125, -0.11352920532226562, -0.10979461669921875, -0.10606002807617188, -0.102325439453125, -0.09859085083007812, -0.09485626220703125, -0.09112167358398438, -0.0873870849609375, -0.08365249633789062, -0.07991790771484375, -0.07618331909179688, -0.07244873046875, -0.06871414184570312, -0.06497955322265625, -0.061244964599609375, -0.0575103759765625, -0.053775787353515625, -0.05004119873046875, -0.046306610107421875, -0.042572021484375, -0.038837432861328125, -0.03510284423828125, -0.031368255615234375, -0.0276336669921875, -0.023899078369140625, -0.02016448974609375, -0.016429901123046875, -0.0126953125, -0.008960723876953125, -0.00522613525390625, -0.001491546630859375, 0.0022430419921875, 0.005977630615234375, 0.00971221923828125, 0.013446807861328125, 0.017181396484375, 0.020915985107421875, 0.02465057373046875, 0.028385162353515625, 0.0321197509765625, 0.035854339599609375, 0.03958892822265625, 0.043323516845703125, 0.04705810546875, 0.050792694091796875, 0.05452728271484375, 0.058261871337890625, 0.0619964599609375, 0.06573104858398438, 0.06946563720703125, 0.07320022583007812, 0.076934814453125, 0.08066940307617188, 0.08440399169921875, 0.08813858032226562, 0.0918731689453125, 0.09560775756835938, 0.09934234619140625, 0.10307693481445312, 0.1068115234375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 4.0, 1.0, 4.0, 3.0, 5.0, 4.0, 2.0, 2.0, 6.0, 7.0, 17.0, 9.0, 12.0, 23.0, 27.0, 45.0, 52.0, 66.0, 81.0, 102.0, 104.0, 81.0, 67.0, 66.0, 52.0, 36.0, 24.0, 23.0, 12.0, 13.0, 7.0, 10.0, 8.0, 5.0, 7.0, 5.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-4.291534423828125e-05, -4.173722118139267e-05, -4.055909812450409e-05, -3.938097506761551e-05, -3.820285201072693e-05, -3.702472895383835e-05, -3.584660589694977e-05, -3.466848284006119e-05, -3.349035978317261e-05, -3.231223672628403e-05, -3.113411366939545e-05, -2.9955990612506866e-05, -2.8777867555618286e-05, -2.7599744498729706e-05, -2.6421621441841125e-05, -2.5243498384952545e-05, -2.4065375328063965e-05, -2.2887252271175385e-05, -2.1709129214286804e-05, -2.0531006157398224e-05, -1.9352883100509644e-05, -1.8174760043621063e-05, -1.6996636986732483e-05, -1.5818513929843903e-05, -1.4640390872955322e-05, -1.3462267816066742e-05, -1.2284144759178162e-05, -1.1106021702289581e-05, -9.927898645401001e-06, -8.74977558851242e-06, -7.57165253162384e-06, -6.39352947473526e-06, -5.21540641784668e-06, -4.037283360958099e-06, -2.859160304069519e-06, -1.6810372471809387e-06, -5.029141902923584e-07, 6.752088665962219e-07, 1.8533319234848022e-06, 3.0314549803733826e-06, 4.209578037261963e-06, 5.387701094150543e-06, 6.5658241510391235e-06, 7.743947207927704e-06, 8.922070264816284e-06, 1.0100193321704865e-05, 1.1278316378593445e-05, 1.2456439435482025e-05, 1.3634562492370605e-05, 1.4812685549259186e-05, 1.5990808606147766e-05, 1.7168931663036346e-05, 1.8347054719924927e-05, 1.9525177776813507e-05, 2.0703300833702087e-05, 2.1881423890590668e-05, 2.3059546947479248e-05, 2.423767000436783e-05, 2.541579306125641e-05, 2.659391611814499e-05, 2.777203917503357e-05, 2.895016223192215e-05, 3.012828528881073e-05, 3.130640834569931e-05, 3.248453140258789e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 10.0, 16.0, 11.0, 23.0, 30.0, 66.0, 127.0, 182.0, 327.0, 505.0, 922.0, 1738.0, 3235.0, 6356.0, 13474.0, 30193.0, 76493.0, 211442.0, 368032.0, 204893.0, 74513.0, 29594.0, 13064.0, 6291.0, 3215.0, 1667.0, 907.0, 517.0, 290.0, 162.0, 102.0, 70.0, 33.0, 25.0, 16.0, 11.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1602783203125, -0.15518760681152344, -0.15009689331054688, -0.1450061798095703, -0.13991546630859375, -0.1348247528076172, -0.12973403930664062, -0.12464332580566406, -0.1195526123046875, -0.11446189880371094, -0.10937118530273438, -0.10428047180175781, -0.09918975830078125, -0.09409904479980469, -0.08900833129882812, -0.08391761779785156, -0.078826904296875, -0.07373619079589844, -0.06864547729492188, -0.06355476379394531, -0.05846405029296875, -0.05337333679199219, -0.048282623291015625, -0.04319190979003906, -0.0381011962890625, -0.03301048278808594, -0.027919769287109375, -0.022829055786132812, -0.01773834228515625, -0.012647628784179688, -0.007556915283203125, -0.0024662017822265625, 0.00262451171875, 0.0077152252197265625, 0.012805938720703125, 0.017896652221679688, 0.02298736572265625, 0.028078079223632812, 0.033168792724609375, 0.03825950622558594, 0.0433502197265625, 0.04844093322753906, 0.053531646728515625, 0.05862236022949219, 0.06371307373046875, 0.06880378723144531, 0.07389450073242188, 0.07898521423339844, 0.084075927734375, 0.08916664123535156, 0.09425735473632812, 0.09934806823730469, 0.10443878173828125, 0.10952949523925781, 0.11462020874023438, 0.11971092224121094, 0.1248016357421875, 0.12989234924316406, 0.13498306274414062, 0.1400737762451172, 0.14516448974609375, 0.1502552032470703, 0.15534591674804688, 0.16043663024902344, 0.16552734375]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 7.0, 3.0, 5.0, 5.0, 8.0, 8.0, 4.0, 11.0, 15.0, 20.0, 11.0, 20.0, 22.0, 40.0, 34.0, 43.0, 59.0, 86.0, 71.0, 61.0, 67.0, 65.0, 67.0, 41.0, 41.0, 29.0, 22.0, 27.0, 21.0, 20.0, 14.0, 12.0, 10.0, 6.0, 8.0, 2.0, 9.0, 4.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0972900390625, -0.09389114379882812, -0.09049224853515625, -0.08709335327148438, -0.0836944580078125, -0.08029556274414062, -0.07689666748046875, -0.07349777221679688, -0.070098876953125, -0.06669998168945312, -0.06330108642578125, -0.059902191162109375, -0.0565032958984375, -0.053104400634765625, -0.04970550537109375, -0.046306610107421875, -0.04290771484375, -0.039508819580078125, -0.03610992431640625, -0.032711029052734375, -0.0293121337890625, -0.025913238525390625, -0.02251434326171875, -0.019115447998046875, -0.015716552734375, -0.012317657470703125, -0.00891876220703125, -0.005519866943359375, -0.0021209716796875, 0.001277923583984375, 0.00467681884765625, 0.008075714111328125, 0.011474609375, 0.014873504638671875, 0.01827239990234375, 0.021671295166015625, 0.0250701904296875, 0.028469085693359375, 0.03186798095703125, 0.035266876220703125, 0.038665771484375, 0.042064666748046875, 0.04546356201171875, 0.048862457275390625, 0.0522613525390625, 0.055660247802734375, 0.05905914306640625, 0.062458038330078125, 0.06585693359375, 0.06925582885742188, 0.07265472412109375, 0.07605361938476562, 0.0794525146484375, 0.08285140991210938, 0.08625030517578125, 0.08964920043945312, 0.093048095703125, 0.09644699096679688, 0.09984588623046875, 0.10324478149414062, 0.1066436767578125, 0.11004257202148438, 0.11344146728515625, 0.11684036254882812, 0.1202392578125]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 6.0, 6.0, 4.0, 8.0, 12.0, 6.0, 11.0, 15.0, 22.0, 25.0, 29.0, 34.0, 31.0, 38.0, 48.0, 62.0, 37.0, 52.0, 56.0, 46.0, 58.0, 42.0, 39.0, 48.0, 33.0, 31.0, 32.0, 17.0, 35.0, 24.0, 15.0, 18.0, 11.0, 11.0, 11.0, 3.0, 9.0, 3.0, 2.0, 3.0, 7.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.7316516041755676, -0.7075401544570923, -0.6834287047386169, -0.6593172550201416, -0.6352058053016663, -0.6110943555831909, -0.5869829654693604, -0.5628714561462402, -0.5387600660324097, -0.5146486163139343, -0.490537166595459, -0.46642571687698364, -0.4423142671585083, -0.41820281744003296, -0.39409139752388, -0.36997994780540466, -0.34586846828460693, -0.3217570185661316, -0.29764556884765625, -0.2735341191291809, -0.24942268431186676, -0.22531123459339142, -0.20119979977607727, -0.17708835005760193, -0.1529769003391266, -0.12886545062065125, -0.1047540083527565, -0.08064256608486176, -0.056531116366386414, -0.03241966664791107, -0.008308231830596924, 0.015803217887878418, 0.039914608001708984, 0.06402605772018433, 0.08813749998807907, 0.11224894225597382, 0.13636039197444916, 0.1604718416929245, 0.18458327651023865, 0.208694726228714, 0.23280617594718933, 0.2569176256656647, 0.28102907538414, 0.30514049530029297, 0.3292519450187683, 0.35336339473724365, 0.377474844455719, 0.40158629417419434, 0.4256977438926697, 0.449809193611145, 0.47392064332962036, 0.4980320930480957, 0.522143542766571, 0.5462549924850464, 0.570366382598877, 0.5944778919219971, 0.6185892820358276, 0.642700731754303, 0.6668121814727783, 0.6909236311912537, 0.715035080909729, 0.7391465306282043, 0.7632579803466797, 0.7873693704605103, 0.8114808797836304]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 1.0, 3.0, 4.0, 3.0, 8.0, 3.0, 10.0, 18.0, 13.0, 12.0, 16.0, 12.0, 21.0, 22.0, 22.0, 32.0, 27.0, 27.0, 29.0, 44.0, 44.0, 36.0, 44.0, 43.0, 54.0, 35.0, 37.0, 35.0, 26.0, 32.0, 33.0, 34.0, 36.0, 23.0, 18.0, 29.0, 22.0, 16.0, 15.0, 14.0, 12.0, 4.0, 6.0, 6.0, 8.0, 5.0, 6.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8565925359725952, -0.8306374549865723, -0.8046824336051941, -0.7787273526191711, -0.7527722716331482, -0.72681725025177, -0.7008621692657471, -0.6749070882797241, -0.6489520072937012, -0.6229969263076782, -0.5970419049263, -0.5710868239402771, -0.5451317429542542, -0.519176721572876, -0.493221640586853, -0.4672665596008301, -0.4413115382194519, -0.41535648703575134, -0.3894014060497284, -0.36344635486602783, -0.3374912738800049, -0.3115362226963043, -0.28558117151260376, -0.2596260905265808, -0.23367103934288025, -0.2077159732580185, -0.18176090717315674, -0.15580585598945618, -0.12985078990459442, -0.10389572381973267, -0.0779406726360321, -0.05198560655117035, -0.02603048086166382, -7.541850209236145e-05, 0.025879643857479095, 0.051834702491760254, 0.07778976857662201, 0.10374483466148376, 0.12969988584518433, 0.15565495193004608, 0.18161001801490784, 0.2075650840997696, 0.23352015018463135, 0.2594752013683319, 0.28543025255203247, 0.3113853335380554, 0.337340384721756, 0.36329543590545654, 0.3892505168914795, 0.41520556807518005, 0.441160649061203, 0.46711570024490356, 0.4930707812309265, 0.5190258026123047, 0.5449808835983276, 0.5709359645843506, 0.5968910455703735, 0.6228461265563965, 0.6488011479377747, 0.6747562289237976, 0.7007113099098206, 0.7266663312911987, 0.7526214122772217, 0.7785764932632446, 0.8045315146446228]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 5.0, 3.0, 1.0, 13.0, 13.0, 10.0, 16.0, 27.0, 30.0, 53.0, 100.0, 198.0, 325.0, 608.0, 1149.0, 2439.0, 5836.0, 16675.0, 61946.0, 365248.0, 2215881.0, 1294115.0, 174440.0, 36688.0, 10986.0, 4091.0, 1739.0, 770.0, 427.0, 200.0, 106.0, 48.0, 40.0, 19.0, 20.0, 10.0, 7.0, 2.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.22265625, -0.21565628051757812, -0.20865631103515625, -0.20165634155273438, -0.1946563720703125, -0.18765640258789062, -0.18065643310546875, -0.17365646362304688, -0.166656494140625, -0.15965652465820312, -0.15265655517578125, -0.14565658569335938, -0.1386566162109375, -0.13165664672851562, -0.12465667724609375, -0.11765670776367188, -0.11065673828125, -0.10365676879882812, -0.09665679931640625, -0.08965682983398438, -0.0826568603515625, -0.07565689086914062, -0.06865692138671875, -0.061656951904296875, -0.054656982421875, -0.047657012939453125, -0.04065704345703125, -0.033657073974609375, -0.0266571044921875, -0.019657135009765625, -0.01265716552734375, -0.005657196044921875, 0.0013427734375, 0.008342742919921875, 0.01534271240234375, 0.022342681884765625, 0.0293426513671875, 0.036342620849609375, 0.04334259033203125, 0.050342559814453125, 0.057342529296875, 0.06434249877929688, 0.07134246826171875, 0.07834243774414062, 0.0853424072265625, 0.09234237670898438, 0.09934234619140625, 0.10634231567382812, 0.11334228515625, 0.12034225463867188, 0.12734222412109375, 0.13434219360351562, 0.1413421630859375, 0.14834213256835938, 0.15534210205078125, 0.16234207153320312, 0.169342041015625, 0.17634201049804688, 0.18334197998046875, 0.19034194946289062, 0.1973419189453125, 0.20434188842773438, 0.21134185791015625, 0.21834182739257812, 0.225341796875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 1.0, 6.0, 3.0, 15.0, 4.0, 6.0, 16.0, 20.0, 22.0, 34.0, 17.0, 24.0, 29.0, 30.0, 29.0, 42.0, 36.0, 42.0, 41.0, 48.0, 50.0, 38.0, 43.0, 49.0, 48.0, 37.0, 38.0, 34.0, 37.0, 36.0, 20.0, 25.0, 16.0, 15.0, 11.0, 12.0, 6.0, 11.0, 7.0, 3.0, 4.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.12335205078125, -0.11998939514160156, -0.11662673950195312, -0.11326408386230469, -0.10990142822265625, -0.10653877258300781, -0.10317611694335938, -0.09981346130371094, -0.0964508056640625, -0.09308815002441406, -0.08972549438476562, -0.08636283874511719, -0.08300018310546875, -0.07963752746582031, -0.07627487182617188, -0.07291221618652344, -0.069549560546875, -0.06618690490722656, -0.06282424926757812, -0.05946159362792969, -0.05609893798828125, -0.05273628234863281, -0.049373626708984375, -0.04601097106933594, -0.0426483154296875, -0.03928565979003906, -0.035923004150390625, -0.03256034851074219, -0.02919769287109375, -0.025835037231445312, -0.022472381591796875, -0.019109725952148438, -0.0157470703125, -0.012384414672851562, -0.009021759033203125, -0.0056591033935546875, -0.00229644775390625, 0.0010662078857421875, 0.004428863525390625, 0.0077915191650390625, 0.0111541748046875, 0.014516830444335938, 0.017879486083984375, 0.021242141723632812, 0.02460479736328125, 0.027967453002929688, 0.031330108642578125, 0.03469276428222656, 0.038055419921875, 0.04141807556152344, 0.044780731201171875, 0.04814338684082031, 0.05150604248046875, 0.05486869812011719, 0.058231353759765625, 0.06159400939941406, 0.0649566650390625, 0.06831932067871094, 0.07168197631835938, 0.07504463195800781, 0.07840728759765625, 0.08176994323730469, 0.08513259887695312, 0.08849525451660156, 0.09185791015625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 9.0, 12.0, 14.0, 28.0, 49.0, 41.0, 105.0, 154.0, 294.0, 495.0, 932.0, 2096.0, 5236.0, 16595.0, 70697.0, 491795.0, 2669869.0, 799141.0, 103242.0, 21801.0, 6654.0, 2542.0, 1072.0, 598.0, 307.0, 175.0, 116.0, 71.0, 49.0, 31.0, 26.0, 15.0, 5.0, 4.0, 3.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.374755859375, -0.3650493621826172, -0.3553428649902344, -0.34563636779785156, -0.33592987060546875, -0.32622337341308594, -0.3165168762207031, -0.3068103790283203, -0.2971038818359375, -0.2873973846435547, -0.2776908874511719, -0.26798439025878906, -0.25827789306640625, -0.24857139587402344, -0.23886489868164062, -0.2291584014892578, -0.219451904296875, -0.2097454071044922, -0.20003890991210938, -0.19033241271972656, -0.18062591552734375, -0.17091941833496094, -0.16121292114257812, -0.1515064239501953, -0.1417999267578125, -0.1320934295654297, -0.12238693237304688, -0.11268043518066406, -0.10297393798828125, -0.09326744079589844, -0.08356094360351562, -0.07385444641113281, -0.06414794921875, -0.05444145202636719, -0.044734954833984375, -0.03502845764160156, -0.02532196044921875, -0.015615463256835938, -0.005908966064453125, 0.0037975311279296875, 0.0135040283203125, 0.023210525512695312, 0.032917022705078125, 0.04262351989746094, 0.05233001708984375, 0.06203651428222656, 0.07174301147460938, 0.08144950866699219, 0.091156005859375, 0.10086250305175781, 0.11056900024414062, 0.12027549743652344, 0.12998199462890625, 0.13968849182128906, 0.14939498901367188, 0.1591014862060547, 0.1688079833984375, 0.1785144805908203, 0.18822097778320312, 0.19792747497558594, 0.20763397216796875, 0.21734046936035156, 0.22704696655273438, 0.2367534637451172, 0.2464599609375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 7.0, 8.0, 4.0, 12.0, 18.0, 24.0, 45.0, 65.0, 87.0, 127.0, 203.0, 323.0, 460.0, 613.0, 676.0, 492.0, 309.0, 217.0, 125.0, 87.0, 61.0, 32.0, 20.0, 17.0, 14.0, 10.0, 5.0, 5.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1785888671875, -0.1704883575439453, -0.16238784790039062, -0.15428733825683594, -0.14618682861328125, -0.13808631896972656, -0.12998580932617188, -0.12188529968261719, -0.1137847900390625, -0.10568428039550781, -0.09758377075195312, -0.08948326110839844, -0.08138275146484375, -0.07328224182128906, -0.06518173217773438, -0.05708122253417969, -0.048980712890625, -0.04088020324707031, -0.032779693603515625, -0.024679183959960938, -0.01657867431640625, -0.008478164672851562, -0.000377655029296875, 0.0077228546142578125, 0.0158233642578125, 0.023923873901367188, 0.032024383544921875, 0.04012489318847656, 0.04822540283203125, 0.05632591247558594, 0.06442642211914062, 0.07252693176269531, 0.08062744140625, 0.08872795104980469, 0.09682846069335938, 0.10492897033691406, 0.11302947998046875, 0.12112998962402344, 0.12923049926757812, 0.1373310089111328, 0.1454315185546875, 0.1535320281982422, 0.16163253784179688, 0.16973304748535156, 0.17783355712890625, 0.18593406677246094, 0.19403457641601562, 0.2021350860595703, 0.210235595703125, 0.2183361053466797, 0.22643661499023438, 0.23453712463378906, 0.24263763427734375, 0.25073814392089844, 0.2588386535644531, 0.2669391632080078, 0.2750396728515625, 0.2831401824951172, 0.2912406921386719, 0.29934120178222656, 0.30744171142578125, 0.31554222106933594, 0.3236427307128906, 0.3317432403564453, 0.33984375]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 11.0, 7.0, 16.0, 22.0, 24.0, 32.0, 45.0, 58.0, 88.0, 76.0, 87.0, 88.0, 72.0, 59.0, 55.0, 57.0, 45.0, 42.0, 35.0, 26.0, 17.0, 17.0, 12.0, 5.0, 5.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.111814022064209, -1.0807040929794312, -1.0495940446853638, -1.018484115600586, -0.9873741269111633, -0.9562641978263855, -0.9251542091369629, -0.8940442800521851, -0.8629342913627625, -0.8318243026733398, -0.800714373588562, -0.7696043848991394, -0.7384943962097168, -0.707384467124939, -0.6762744784355164, -0.6451644897460938, -0.6140545606613159, -0.5829445719718933, -0.5518346428871155, -0.5207246541976929, -0.48961469531059265, -0.45850473642349243, -0.4273947477340698, -0.3962847888469696, -0.3651747703552246, -0.3340648114681244, -0.3029548227787018, -0.27184486389160156, -0.24073490500450134, -0.20962493121623993, -0.17851495742797852, -0.1474049985408783, -0.11629503965377808, -0.08518507331609726, -0.054075103253126144, -0.02296513319015503, 0.008144833147525787, 0.039254799485206604, 0.07036477327346802, 0.10147473216056824, 0.13258470594882965, 0.16369467973709106, 0.19480463862419128, 0.2259146124124527, 0.2570245862007141, 0.28813454508781433, 0.31924450397491455, 0.35035449266433716, 0.3814644515514374, 0.4125744104385376, 0.4436843991279602, 0.4747943580150604, 0.5059043169021606, 0.5370143055915833, 0.5681242942810059, 0.5992342233657837, 0.6303442120552063, 0.6614542007446289, 0.6925641298294067, 0.7236741185188293, 0.754784107208252, 0.7858940362930298, 0.8170040249824524, 0.848114013671875, 0.8792239427566528]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 2.0, 6.0, 11.0, 8.0, 11.0, 14.0, 11.0, 14.0, 11.0, 16.0, 22.0, 22.0, 30.0, 27.0, 28.0, 33.0, 50.0, 31.0, 33.0, 43.0, 37.0, 42.0, 43.0, 40.0, 52.0, 42.0, 34.0, 34.0, 32.0, 35.0, 26.0, 22.0, 25.0, 23.0, 16.0, 10.0, 13.0, 9.0, 5.0, 9.0, 8.0, 7.0, 3.0, 5.0, 3.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0], "bins": [-0.6481337547302246, -0.6289836168289185, -0.6098334193229675, -0.5906832814216614, -0.5715330839157104, -0.5523829460144043, -0.5332328081130981, -0.5140826106071472, -0.49493247270584106, -0.4757823050022125, -0.456632137298584, -0.43748199939727783, -0.4183318316936493, -0.39918166399002075, -0.3800314962863922, -0.36088132858276367, -0.34173116087913513, -0.3225809931755066, -0.30343082547187805, -0.2842806577682495, -0.26513051986694336, -0.24598035216331482, -0.22683018445968628, -0.20768003165721893, -0.1885298639535904, -0.16937969624996185, -0.1502295434474945, -0.13107937574386597, -0.11192921549081802, -0.09277905523777008, -0.07362888753414154, -0.054478734731674194, -0.035328567028045654, -0.016178404912352562, 0.0029717572033405304, 0.022121921181678772, 0.041272081434726715, 0.06042224168777466, 0.0795724093914032, 0.09872256219387054, 0.11787272989749908, 0.13702289760112762, 0.15617305040359497, 0.1753232181072235, 0.19447338581085205, 0.2136235386133194, 0.23277370631694794, 0.2519238591194153, 0.2710740268230438, 0.29022419452667236, 0.3093743622303009, 0.32852452993392944, 0.3476746678352356, 0.36682483553886414, 0.3859750032424927, 0.40512514114379883, 0.42427533864974976, 0.4434255063533783, 0.46257567405700684, 0.481725811958313, 0.5008760094642639, 0.5200261473655701, 0.539176344871521, 0.5583264827728271, 0.5774766206741333]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 8.0, 6.0, 4.0, 5.0, 9.0, 20.0, 27.0, 42.0, 73.0, 114.0, 177.0, 318.0, 618.0, 1329.0, 3456.0, 9100.0, 26690.0, 94663.0, 367052.0, 394327.0, 104604.0, 29514.0, 9770.0, 3666.0, 1474.0, 643.0, 364.0, 172.0, 116.0, 70.0, 39.0, 23.0, 28.0, 10.0, 5.0, 7.0, 3.0, 5.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.48583984375, -0.46910858154296875, -0.4523773193359375, -0.43564605712890625, -0.418914794921875, -0.40218353271484375, -0.3854522705078125, -0.36872100830078125, -0.35198974609375, -0.33525848388671875, -0.3185272216796875, -0.30179595947265625, -0.285064697265625, -0.26833343505859375, -0.2516021728515625, -0.23487091064453125, -0.2181396484375, -0.20140838623046875, -0.1846771240234375, -0.16794586181640625, -0.151214599609375, -0.13448333740234375, -0.1177520751953125, -0.10102081298828125, -0.08428955078125, -0.06755828857421875, -0.0508270263671875, -0.03409576416015625, -0.017364501953125, -0.00063323974609375, 0.0160980224609375, 0.03282928466796875, 0.049560546875, 0.06629180908203125, 0.0830230712890625, 0.09975433349609375, 0.116485595703125, 0.13321685791015625, 0.1499481201171875, 0.16667938232421875, 0.18341064453125, 0.20014190673828125, 0.2168731689453125, 0.23360443115234375, 0.250335693359375, 0.26706695556640625, 0.2837982177734375, 0.30052947998046875, 0.3172607421875, 0.33399200439453125, 0.3507232666015625, 0.36745452880859375, 0.384185791015625, 0.40091705322265625, 0.4176483154296875, 0.43437957763671875, 0.45111083984375, 0.46784210205078125, 0.4845733642578125, 0.5013046264648438, 0.518035888671875, 0.5347671508789062, 0.5514984130859375, 0.5682296752929688, 0.5849609375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 7.0, 5.0, 10.0, 11.0, 15.0, 22.0, 20.0, 28.0, 31.0, 44.0, 35.0, 40.0, 50.0, 68.0, 55.0, 51.0, 61.0, 66.0, 51.0, 54.0, 45.0, 47.0, 41.0, 31.0, 27.0, 22.0, 15.0, 11.0, 14.0, 9.0, 9.0, 7.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1766357421875, -0.17232036590576172, -0.16800498962402344, -0.16368961334228516, -0.15937423706054688, -0.1550588607788086, -0.1507434844970703, -0.14642810821533203, -0.14211273193359375, -0.13779735565185547, -0.1334819793701172, -0.1291666030883789, -0.12485122680664062, -0.12053585052490234, -0.11622047424316406, -0.11190509796142578, -0.1075897216796875, -0.10327434539794922, -0.09895896911621094, -0.09464359283447266, -0.09032821655273438, -0.0860128402709961, -0.08169746398925781, -0.07738208770751953, -0.07306671142578125, -0.06875133514404297, -0.06443595886230469, -0.060120582580566406, -0.055805206298828125, -0.051489830017089844, -0.04717445373535156, -0.04285907745361328, -0.038543701171875, -0.03422832489013672, -0.029912948608398438, -0.025597572326660156, -0.021282196044921875, -0.016966819763183594, -0.012651443481445312, -0.008336067199707031, -0.00402069091796875, 0.00029468536376953125, 0.0046100616455078125, 0.008925437927246094, 0.013240814208984375, 0.017556190490722656, 0.021871566772460938, 0.02618694305419922, 0.0305023193359375, 0.03481769561767578, 0.03913307189941406, 0.043448448181152344, 0.047763824462890625, 0.052079200744628906, 0.05639457702636719, 0.06070995330810547, 0.06502532958984375, 0.06934070587158203, 0.07365608215332031, 0.0779714584350586, 0.08228683471679688, 0.08660221099853516, 0.09091758728027344, 0.09523296356201172, 0.09954833984375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 5.0, 2.0, 7.0, 10.0, 10.0, 15.0, 16.0, 22.0, 28.0, 61.0, 99.0, 191.0, 335.0, 647.0, 1382.0, 3356.0, 8501.0, 22118.0, 63681.0, 200686.0, 407246.0, 227363.0, 71776.0, 25145.0, 9254.0, 3523.0, 1575.0, 736.0, 308.0, 160.0, 101.0, 71.0, 49.0, 33.0, 11.0, 11.0, 11.0, 4.0, 3.0, 4.0, 3.0, 0.0, 3.0, 0.0, 4.0, 2.0, 0.0, 1.0], "bins": [-0.45751953125, -0.4450035095214844, -0.43248748779296875, -0.4199714660644531, -0.4074554443359375, -0.3949394226074219, -0.38242340087890625, -0.3699073791503906, -0.357391357421875, -0.3448753356933594, -0.33235931396484375, -0.3198432922363281, -0.3073272705078125, -0.2948112487792969, -0.28229522705078125, -0.2697792053222656, -0.25726318359375, -0.24474716186523438, -0.23223114013671875, -0.21971511840820312, -0.2071990966796875, -0.19468307495117188, -0.18216705322265625, -0.16965103149414062, -0.157135009765625, -0.14461898803710938, -0.13210296630859375, -0.11958694458007812, -0.1070709228515625, -0.09455490112304688, -0.08203887939453125, -0.06952285766601562, -0.0570068359375, -0.044490814208984375, -0.03197479248046875, -0.019458770751953125, -0.0069427490234375, 0.005573272705078125, 0.01808929443359375, 0.030605316162109375, 0.043121337890625, 0.055637359619140625, 0.06815338134765625, 0.08066940307617188, 0.0931854248046875, 0.10570144653320312, 0.11821746826171875, 0.13073348999023438, 0.14324951171875, 0.15576553344726562, 0.16828155517578125, 0.18079757690429688, 0.1933135986328125, 0.20582962036132812, 0.21834564208984375, 0.23086166381835938, 0.243377685546875, 0.2558937072753906, 0.26840972900390625, 0.2809257507324219, 0.2934417724609375, 0.3059577941894531, 0.31847381591796875, 0.3309898376464844, 0.343505859375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 8.0, 8.0, 7.0, 11.0, 20.0, 12.0, 11.0, 17.0, 27.0, 22.0, 31.0, 39.0, 34.0, 37.0, 37.0, 48.0, 44.0, 60.0, 41.0, 46.0, 53.0, 42.0, 44.0, 40.0, 42.0, 28.0, 35.0, 19.0, 21.0, 25.0, 27.0, 16.0, 10.0, 5.0, 6.0, 7.0, 8.0, 4.0, 1.0, 2.0, 1.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.322021484375, -0.3114356994628906, -0.30084991455078125, -0.2902641296386719, -0.2796783447265625, -0.2690925598144531, -0.25850677490234375, -0.24792098999023438, -0.237335205078125, -0.22674942016601562, -0.21616363525390625, -0.20557785034179688, -0.1949920654296875, -0.18440628051757812, -0.17382049560546875, -0.16323471069335938, -0.15264892578125, -0.14206314086914062, -0.13147735595703125, -0.12089157104492188, -0.1103057861328125, -0.09972000122070312, -0.08913421630859375, -0.07854843139648438, -0.067962646484375, -0.057376861572265625, -0.04679107666015625, -0.036205291748046875, -0.0256195068359375, -0.015033721923828125, -0.00444793701171875, 0.006137847900390625, 0.0167236328125, 0.027309417724609375, 0.03789520263671875, 0.048480987548828125, 0.0590667724609375, 0.06965255737304688, 0.08023834228515625, 0.09082412719726562, 0.101409912109375, 0.11199569702148438, 0.12258148193359375, 0.13316726684570312, 0.1437530517578125, 0.15433883666992188, 0.16492462158203125, 0.17551040649414062, 0.18609619140625, 0.19668197631835938, 0.20726776123046875, 0.21785354614257812, 0.2284393310546875, 0.23902511596679688, 0.24961090087890625, 0.2601966857910156, 0.270782470703125, 0.2813682556152344, 0.29195404052734375, 0.3025398254394531, 0.3131256103515625, 0.3237113952636719, 0.33429718017578125, 0.3448829650878906, 0.35546875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 6.0, 2.0, 9.0, 9.0, 24.0, 30.0, 40.0, 66.0, 74.0, 119.0, 196.0, 321.0, 478.0, 756.0, 1214.0, 1913.0, 3085.0, 5008.0, 7873.0, 12412.0, 19490.0, 31356.0, 50297.0, 83322.0, 138857.0, 191942.0, 182667.0, 123061.0, 73808.0, 45141.0, 27546.0, 17593.0, 11146.0, 6948.0, 4467.0, 2747.0, 1706.0, 1040.0, 656.0, 406.0, 249.0, 171.0, 114.0, 71.0, 53.0, 32.0, 20.0, 11.0, 8.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09149169921875, -0.08852863311767578, -0.08556556701660156, -0.08260250091552734, -0.07963943481445312, -0.0766763687133789, -0.07371330261230469, -0.07075023651123047, -0.06778717041015625, -0.06482410430908203, -0.06186103820800781, -0.058897972106933594, -0.055934906005859375, -0.052971839904785156, -0.05000877380371094, -0.04704570770263672, -0.0440826416015625, -0.04111957550048828, -0.03815650939941406, -0.035193443298339844, -0.032230377197265625, -0.029267311096191406, -0.026304244995117188, -0.02334117889404297, -0.02037811279296875, -0.01741504669189453, -0.014451980590820312, -0.011488914489746094, -0.008525848388671875, -0.005562782287597656, -0.0025997161865234375, 0.00036334991455078125, 0.003326416015625, 0.006289482116699219, 0.009252548217773438, 0.012215614318847656, 0.015178680419921875, 0.018141746520996094, 0.021104812622070312, 0.02406787872314453, 0.02703094482421875, 0.02999401092529297, 0.03295707702636719, 0.035920143127441406, 0.038883209228515625, 0.041846275329589844, 0.04480934143066406, 0.04777240753173828, 0.0507354736328125, 0.05369853973388672, 0.05666160583496094, 0.059624671936035156, 0.06258773803710938, 0.0655508041381836, 0.06851387023925781, 0.07147693634033203, 0.07444000244140625, 0.07740306854248047, 0.08036613464355469, 0.0833292007446289, 0.08629226684570312, 0.08925533294677734, 0.09221839904785156, 0.09518146514892578, 0.09814453125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 5.0, 4.0, 4.0, 6.0, 6.0, 5.0, 15.0, 11.0, 25.0, 20.0, 17.0, 22.0, 41.0, 41.0, 78.0, 110.0, 88.0, 108.0, 87.0, 67.0, 52.0, 39.0, 35.0, 20.0, 18.0, 13.0, 8.0, 10.0, 12.0, 7.0, 6.0, 4.0, 2.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.38690185546875e-05, -4.271510988473892e-05, -4.1561201214790344e-05, -4.0407292544841766e-05, -3.925338387489319e-05, -3.809947520494461e-05, -3.694556653499603e-05, -3.5791657865047455e-05, -3.463774919509888e-05, -3.34838405251503e-05, -3.232993185520172e-05, -3.117602318525314e-05, -3.0022114515304565e-05, -2.8868205845355988e-05, -2.771429717540741e-05, -2.6560388505458832e-05, -2.5406479835510254e-05, -2.4252571165561676e-05, -2.3098662495613098e-05, -2.194475382566452e-05, -2.0790845155715942e-05, -1.9636936485767365e-05, -1.8483027815818787e-05, -1.732911914587021e-05, -1.617521047592163e-05, -1.5021301805973053e-05, -1.3867393136024475e-05, -1.2713484466075897e-05, -1.155957579612732e-05, -1.0405667126178741e-05, -9.251758456230164e-06, -8.097849786281586e-06, -6.943941116333008e-06, -5.79003244638443e-06, -4.636123776435852e-06, -3.482215106487274e-06, -2.3283064365386963e-06, -1.1743977665901184e-06, -2.0489096641540527e-08, 1.1334195733070374e-06, 2.2873282432556152e-06, 3.441236913204193e-06, 4.595145583152771e-06, 5.749054253101349e-06, 6.902962923049927e-06, 8.056871592998505e-06, 9.210780262947083e-06, 1.036468893289566e-05, 1.1518597602844238e-05, 1.2672506272792816e-05, 1.3826414942741394e-05, 1.4980323612689972e-05, 1.613423228263855e-05, 1.7288140952587128e-05, 1.8442049622535706e-05, 1.9595958292484283e-05, 2.074986696243286e-05, 2.190377563238144e-05, 2.3057684302330017e-05, 2.4211592972278595e-05, 2.5365501642227173e-05, 2.651941031217575e-05, 2.767331898212433e-05, 2.8827227652072906e-05, 2.9981136322021484e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 7.0, 1.0, 5.0, 13.0, 8.0, 13.0, 24.0, 35.0, 42.0, 70.0, 113.0, 171.0, 244.0, 424.0, 687.0, 1179.0, 1991.0, 3624.0, 6137.0, 11153.0, 19338.0, 34637.0, 63599.0, 125512.0, 235856.0, 247460.0, 140058.0, 70079.0, 37319.0, 20877.0, 11763.0, 6736.0, 3819.0, 2181.0, 1324.0, 722.0, 482.0, 289.0, 182.0, 132.0, 79.0, 52.0, 24.0, 32.0, 29.0, 14.0, 9.0, 6.0, 4.0, 5.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10455322265625, -0.10107612609863281, -0.09759902954101562, -0.09412193298339844, -0.09064483642578125, -0.08716773986816406, -0.08369064331054688, -0.08021354675292969, -0.0767364501953125, -0.07325935363769531, -0.06978225708007812, -0.06630516052246094, -0.06282806396484375, -0.05935096740722656, -0.055873870849609375, -0.05239677429199219, -0.048919677734375, -0.04544258117675781, -0.041965484619140625, -0.03848838806152344, -0.03501129150390625, -0.03153419494628906, -0.028057098388671875, -0.024580001831054688, -0.0211029052734375, -0.017625808715820312, -0.014148712158203125, -0.010671615600585938, -0.00719451904296875, -0.0037174224853515625, -0.000240325927734375, 0.0032367706298828125, 0.0067138671875, 0.010190963745117188, 0.013668060302734375, 0.017145156860351562, 0.02062225341796875, 0.024099349975585938, 0.027576446533203125, 0.031053543090820312, 0.0345306396484375, 0.03800773620605469, 0.041484832763671875, 0.04496192932128906, 0.04843902587890625, 0.05191612243652344, 0.055393218994140625, 0.05887031555175781, 0.062347412109375, 0.06582450866699219, 0.06930160522460938, 0.07277870178222656, 0.07625579833984375, 0.07973289489746094, 0.08320999145507812, 0.08668708801269531, 0.0901641845703125, 0.09364128112792969, 0.09711837768554688, 0.10059547424316406, 0.10407257080078125, 0.10754966735839844, 0.11102676391601562, 0.11450386047363281, 0.11798095703125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 11.0, 7.0, 8.0, 9.0, 15.0, 16.0, 31.0, 23.0, 17.0, 23.0, 44.0, 35.0, 56.0, 49.0, 69.0, 67.0, 56.0, 48.0, 60.0, 44.0, 52.0, 41.0, 50.0, 28.0, 32.0, 19.0, 9.0, 10.0, 14.0, 7.0, 4.0, 9.0, 9.0, 6.0, 6.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.1256103515625, -0.1221628189086914, -0.11871528625488281, -0.11526775360107422, -0.11182022094726562, -0.10837268829345703, -0.10492515563964844, -0.10147762298583984, -0.09803009033203125, -0.09458255767822266, -0.09113502502441406, -0.08768749237060547, -0.08423995971679688, -0.08079242706298828, -0.07734489440917969, -0.0738973617553711, -0.0704498291015625, -0.0670022964477539, -0.06355476379394531, -0.06010723114013672, -0.056659698486328125, -0.05321216583251953, -0.04976463317871094, -0.046317100524902344, -0.04286956787109375, -0.039422035217285156, -0.03597450256347656, -0.03252696990966797, -0.029079437255859375, -0.02563190460205078, -0.022184371948242188, -0.018736839294433594, -0.015289306640625, -0.011841773986816406, -0.008394241333007812, -0.004946708679199219, -0.001499176025390625, 0.0019483566284179688, 0.0053958892822265625, 0.008843421936035156, 0.01229095458984375, 0.015738487243652344, 0.019186019897460938, 0.02263355255126953, 0.026081085205078125, 0.02952861785888672, 0.03297615051269531, 0.036423683166503906, 0.0398712158203125, 0.043318748474121094, 0.04676628112792969, 0.05021381378173828, 0.053661346435546875, 0.05710887908935547, 0.06055641174316406, 0.06400394439697266, 0.06745147705078125, 0.07089900970458984, 0.07434654235839844, 0.07779407501220703, 0.08124160766601562, 0.08468914031982422, 0.08813667297363281, 0.0915842056274414, 0.09503173828125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 7.0, 8.0, 17.0, 34.0, 53.0, 71.0, 93.0, 140.0, 126.0, 126.0, 117.0, 88.0, 59.0, 37.0, 18.0, 12.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7507119178771973, -2.6893022060394287, -2.6278927326202393, -2.5664830207824707, -2.505073308944702, -2.4436638355255127, -2.382254123687744, -2.3208444118499756, -2.259434938430786, -2.1980252265930176, -2.136615753173828, -2.0752060413360596, -2.013796329498291, -1.9523868560791016, -1.890977144241333, -1.829567551612854, -1.7681578397750854, -1.7067482471466064, -1.645338535308838, -1.5839289426803589, -1.5225193500518799, -1.4611096382141113, -1.3997000455856323, -1.3382904529571533, -1.2768807411193848, -1.2154711484909058, -1.1540614366531372, -1.0926518440246582, -1.0312422513961792, -0.9698325991630554, -0.9084229469299316, -0.8470133543014526, -0.7856036424636841, -0.7241939902305603, -0.6627843976020813, -0.6013747453689575, -0.5399651527404785, -0.47855550050735474, -0.41714584827423096, -0.35573622584342957, -0.2943266034126282, -0.23291698098182678, -0.1715073436498642, -0.11009770631790161, -0.04868808388710022, 0.012721538543701172, 0.07413119077682495, 0.13554081320762634, 0.19695043563842773, 0.2583600580692291, 0.3197696805000305, 0.3811793327331543, 0.4425889551639557, 0.5039985775947571, 0.5654082298278809, 0.6268178224563599, 0.6882274746894836, 0.7496371269226074, 0.8110467195510864, 0.8724563717842102, 0.933866024017334, 0.995275616645813, 1.056685209274292, 1.1180949211120605, 1.1795045137405396]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 6.0, 1.0, 0.0, 4.0, 2.0, 7.0, 5.0, 7.0, 14.0, 14.0, 17.0, 16.0, 18.0, 26.0, 23.0, 30.0, 35.0, 29.0, 35.0, 33.0, 37.0, 46.0, 37.0, 51.0, 27.0, 33.0, 43.0, 44.0, 39.0, 39.0, 35.0, 35.0, 28.0, 31.0, 28.0, 20.0, 21.0, 13.0, 18.0, 12.0, 15.0, 8.0, 5.0, 6.0, 1.0, 5.0, 2.0, 4.0, 2.0, 3.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9121192097663879, -0.8830252885818481, -0.8539313673973083, -0.8248374462127686, -0.7957435250282288, -0.766649603843689, -0.7375556826591492, -0.7084617614746094, -0.6793678402900696, -0.6502739191055298, -0.62117999792099, -0.5920860767364502, -0.5629921555519104, -0.5338982343673706, -0.5048043131828308, -0.475710391998291, -0.4466164708137512, -0.4175225496292114, -0.38842862844467163, -0.35933470726013184, -0.33024078607559204, -0.30114686489105225, -0.27205294370651245, -0.24295902252197266, -0.21386510133743286, -0.18477118015289307, -0.15567725896835327, -0.12658333778381348, -0.09748941659927368, -0.06839549541473389, -0.03930157423019409, -0.010207653045654297, 0.018886327743530273, 0.04798024892807007, 0.07707417011260986, 0.10616809129714966, 0.13526201248168945, 0.16435593366622925, 0.19344985485076904, 0.22254377603530884, 0.25163769721984863, 0.2807316184043884, 0.3098255395889282, 0.338919460773468, 0.3680133819580078, 0.3971073031425476, 0.4262012243270874, 0.4552951455116272, 0.484389066696167, 0.5134829878807068, 0.5425769090652466, 0.5716708302497864, 0.6007647514343262, 0.629858672618866, 0.6589525938034058, 0.6880465149879456, 0.7171404361724854, 0.7462343573570251, 0.7753282785415649, 0.8044221997261047, 0.8335161209106445, 0.8626100420951843, 0.8917039632797241, 0.9207978844642639, 0.9498918056488037]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 1.0, 9.0, 3.0, 7.0, 5.0, 8.0, 16.0, 11.0, 30.0, 56.0, 99.0, 187.0, 390.0, 1002.0, 2721.0, 8961.0, 39448.0, 320352.0, 2871599.0, 851932.0, 76791.0, 14756.0, 3903.0, 1255.0, 463.0, 162.0, 63.0, 25.0, 19.0, 9.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.387451171875, -0.3762779235839844, -0.36510467529296875, -0.3539314270019531, -0.3427581787109375, -0.3315849304199219, -0.32041168212890625, -0.3092384338378906, -0.298065185546875, -0.2868919372558594, -0.27571868896484375, -0.2645454406738281, -0.2533721923828125, -0.24219894409179688, -0.23102569580078125, -0.21985244750976562, -0.20867919921875, -0.19750595092773438, -0.18633270263671875, -0.17515945434570312, -0.1639862060546875, -0.15281295776367188, -0.14163970947265625, -0.13046646118164062, -0.119293212890625, -0.10811996459960938, -0.09694671630859375, -0.08577346801757812, -0.0746002197265625, -0.06342697143554688, -0.05225372314453125, -0.041080474853515625, -0.0299072265625, -0.018733978271484375, -0.00756072998046875, 0.003612518310546875, 0.0147857666015625, 0.025959014892578125, 0.03713226318359375, 0.048305511474609375, 0.059478759765625, 0.07065200805664062, 0.08182525634765625, 0.09299850463867188, 0.1041717529296875, 0.11534500122070312, 0.12651824951171875, 0.13769149780273438, 0.14886474609375, 0.16003799438476562, 0.17121124267578125, 0.18238449096679688, 0.1935577392578125, 0.20473098754882812, 0.21590423583984375, 0.22707748413085938, 0.238250732421875, 0.24942398071289062, 0.26059722900390625, 0.2717704772949219, 0.2829437255859375, 0.2941169738769531, 0.30529022216796875, 0.3164634704589844, 0.32763671875]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 6.0, 3.0, 4.0, 12.0, 16.0, 16.0, 18.0, 24.0, 31.0, 25.0, 43.0, 27.0, 30.0, 41.0, 39.0, 51.0, 56.0, 54.0, 59.0, 48.0, 51.0, 48.0, 47.0, 32.0, 37.0, 45.0, 33.0, 30.0, 15.0, 17.0, 8.0, 10.0, 10.0, 6.0, 6.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0], "bins": [-0.171875, -0.16766071319580078, -0.16344642639160156, -0.15923213958740234, -0.15501785278320312, -0.1508035659790039, -0.1465892791748047, -0.14237499237060547, -0.13816070556640625, -0.13394641876220703, -0.1297321319580078, -0.1255178451538086, -0.12130355834960938, -0.11708927154541016, -0.11287498474121094, -0.10866069793701172, -0.1044464111328125, -0.10023212432861328, -0.09601783752441406, -0.09180355072021484, -0.08758926391601562, -0.0833749771118164, -0.07916069030761719, -0.07494640350341797, -0.07073211669921875, -0.06651782989501953, -0.06230354309082031, -0.058089256286621094, -0.053874969482421875, -0.049660682678222656, -0.04544639587402344, -0.04123210906982422, -0.037017822265625, -0.03280353546142578, -0.028589248657226562, -0.024374961853027344, -0.020160675048828125, -0.015946388244628906, -0.011732101440429688, -0.007517814636230469, -0.00330352783203125, 0.0009107589721679688, 0.0051250457763671875, 0.009339332580566406, 0.013553619384765625, 0.017767906188964844, 0.021982192993164062, 0.02619647979736328, 0.0304107666015625, 0.03462505340576172, 0.03883934020996094, 0.043053627014160156, 0.047267913818359375, 0.051482200622558594, 0.05569648742675781, 0.05991077423095703, 0.06412506103515625, 0.06833934783935547, 0.07255363464355469, 0.0767679214477539, 0.08098220825195312, 0.08519649505615234, 0.08941078186035156, 0.09362506866455078, 0.09783935546875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 3.0, 8.0, 10.0, 12.0, 29.0, 25.0, 26.0, 63.0, 68.0, 96.0, 173.0, 238.0, 343.0, 518.0, 816.0, 1401.0, 2505.0, 5332.0, 12618.0, 35459.0, 127713.0, 624814.0, 2201955.0, 924323.0, 180236.0, 46339.0, 15428.0, 6434.0, 3042.0, 1564.0, 895.0, 587.0, 375.0, 225.0, 170.0, 128.0, 78.0, 74.0, 34.0, 45.0, 25.0, 18.0, 16.0, 9.0, 5.0, 2.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.271484375, -0.2623176574707031, -0.25315093994140625, -0.24398422241210938, -0.2348175048828125, -0.22565078735351562, -0.21648406982421875, -0.20731735229492188, -0.198150634765625, -0.18898391723632812, -0.17981719970703125, -0.17065048217773438, -0.1614837646484375, -0.15231704711914062, -0.14315032958984375, -0.13398361206054688, -0.12481689453125, -0.11565017700195312, -0.10648345947265625, -0.09731674194335938, -0.0881500244140625, -0.07898330688476562, -0.06981658935546875, -0.060649871826171875, -0.051483154296875, -0.042316436767578125, -0.03314971923828125, -0.023983001708984375, -0.0148162841796875, -0.005649566650390625, 0.00351715087890625, 0.012683868408203125, 0.0218505859375, 0.031017303466796875, 0.04018402099609375, 0.049350738525390625, 0.0585174560546875, 0.06768417358398438, 0.07685089111328125, 0.08601760864257812, 0.095184326171875, 0.10435104370117188, 0.11351776123046875, 0.12268447875976562, 0.1318511962890625, 0.14101791381835938, 0.15018463134765625, 0.15935134887695312, 0.16851806640625, 0.17768478393554688, 0.18685150146484375, 0.19601821899414062, 0.2051849365234375, 0.21435165405273438, 0.22351837158203125, 0.23268508911132812, 0.241851806640625, 0.2510185241699219, 0.26018524169921875, 0.2693519592285156, 0.2785186767578125, 0.2876853942871094, 0.29685211181640625, 0.3060188293457031, 0.315185546875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 9.0, 8.0, 6.0, 11.0, 7.0, 16.0, 27.0, 35.0, 53.0, 63.0, 102.0, 158.0, 217.0, 278.0, 401.0, 559.0, 554.0, 460.0, 359.0, 216.0, 165.0, 114.0, 66.0, 43.0, 32.0, 35.0, 24.0, 14.0, 11.0, 7.0, 4.0, 7.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2919921875, -0.28347015380859375, -0.2749481201171875, -0.26642608642578125, -0.257904052734375, -0.24938201904296875, -0.2408599853515625, -0.23233795166015625, -0.22381591796875, -0.21529388427734375, -0.2067718505859375, -0.19824981689453125, -0.189727783203125, -0.18120574951171875, -0.1726837158203125, -0.16416168212890625, -0.1556396484375, -0.14711761474609375, -0.1385955810546875, -0.13007354736328125, -0.121551513671875, -0.11302947998046875, -0.1045074462890625, -0.09598541259765625, -0.08746337890625, -0.07894134521484375, -0.0704193115234375, -0.06189727783203125, -0.053375244140625, -0.04485321044921875, -0.0363311767578125, -0.02780914306640625, -0.019287109375, -0.01076507568359375, -0.0022430419921875, 0.00627899169921875, 0.014801025390625, 0.02332305908203125, 0.0318450927734375, 0.04036712646484375, 0.04888916015625, 0.05741119384765625, 0.0659332275390625, 0.07445526123046875, 0.082977294921875, 0.09149932861328125, 0.1000213623046875, 0.10854339599609375, 0.1170654296875, 0.12558746337890625, 0.1341094970703125, 0.14263153076171875, 0.151153564453125, 0.15967559814453125, 0.1681976318359375, 0.17671966552734375, 0.18524169921875, 0.19376373291015625, 0.2022857666015625, 0.21080780029296875, 0.219329833984375, 0.22785186767578125, 0.2363739013671875, 0.24489593505859375, 0.25341796875]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 5.0, 13.0, 27.0, 57.0, 91.0, 195.0, 200.0, 177.0, 142.0, 65.0, 23.0, 14.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.663661479949951, -5.556789398193359, -5.449916839599609, -5.343044281005859, -5.236172199249268, -5.129300117492676, -5.022427558898926, -4.915555000305176, -4.808682918548584, -4.701810836791992, -4.594938278198242, -4.488065719604492, -4.3811936378479, -4.274321556091309, -4.167448997497559, -4.060576438903809, -3.953704357147217, -3.846832036972046, -3.739959716796875, -3.633087396621704, -3.526215076446533, -3.4193427562713623, -3.3124704360961914, -3.2055981159210205, -3.0987257957458496, -2.9918534755706787, -2.884981155395508, -2.778108835220337, -2.671236515045166, -2.564364194869995, -2.457491874694824, -2.3506195545196533, -2.2437474727630615, -2.1368751525878906, -2.0300028324127197, -1.9231305122375488, -1.816258192062378, -1.709385871887207, -1.6025135517120361, -1.4956412315368652, -1.3887689113616943, -1.2818965911865234, -1.1750242710113525, -1.0681519508361816, -0.9612796306610107, -0.8544073104858398, -0.747534990310669, -0.640662670135498, -0.5337903499603271, -0.42691802978515625, -0.32004570960998535, -0.21317338943481445, -0.10630106925964355, 0.0005712509155273438, 0.10744357109069824, 0.21431589126586914, 0.32118821144104004, 0.42806053161621094, 0.5349328517913818, 0.6418051719665527, 0.7486774921417236, 0.8555498123168945, 0.9624221324920654, 1.0692944526672363, 1.1761667728424072]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 5.0, 6.0, 3.0, 7.0, 9.0, 5.0, 13.0, 17.0, 16.0, 20.0, 22.0, 21.0, 28.0, 20.0, 15.0, 26.0, 23.0, 34.0, 28.0, 34.0, 35.0, 35.0, 31.0, 34.0, 37.0, 36.0, 35.0, 38.0, 28.0, 28.0, 32.0, 31.0, 39.0, 18.0, 17.0, 19.0, 19.0, 11.0, 25.0, 17.0, 15.0, 18.0, 15.0, 8.0, 7.0, 10.0, 8.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.8857031464576721, -0.8588928580284119, -0.8320825099945068, -0.8052722215652466, -0.7784619331359863, -0.7516515851020813, -0.724841296672821, -0.698030948638916, -0.6712206602096558, -0.6444103717803955, -0.6176000237464905, -0.5907897353172302, -0.56397944688797, -0.5371690988540649, -0.5103588104248047, -0.48354849219322205, -0.4567382037639618, -0.42992788553237915, -0.4031175971031189, -0.37630727887153625, -0.3494969606399536, -0.32268667221069336, -0.2958763539791107, -0.2690660357475281, -0.24225573241710663, -0.21544542908668518, -0.18863511085510254, -0.1618248075246811, -0.13501450419425964, -0.108204185962677, -0.08139388263225555, -0.05458356440067291, -0.027773261070251465, -0.0009629521518945694, 0.025847356766462326, 0.05265766382217407, 0.07946797460317612, 0.10627828538417816, 0.1330885887145996, 0.15989890694618225, 0.1867092102766037, 0.21351951360702515, 0.2403298318386078, 0.26714015007019043, 0.2939504384994507, 0.3207607567310333, 0.34757107496261597, 0.3743813633918762, 0.40119168162345886, 0.4280019998550415, 0.45481228828430176, 0.4816226065158844, 0.508432924747467, 0.5352432131767273, 0.5620535612106323, 0.5888638496398926, 0.6156741380691528, 0.6424844264984131, 0.6692947745323181, 0.6961050629615784, 0.7229153513908386, 0.7497256994247437, 0.7765359878540039, 0.8033462762832642, 0.8301566243171692]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 6.0, 5.0, 5.0, 15.0, 16.0, 23.0, 27.0, 57.0, 60.0, 103.0, 169.0, 314.0, 563.0, 1192.0, 2247.0, 4561.0, 9804.0, 20896.0, 45859.0, 105319.0, 239222.0, 312647.0, 170961.0, 73423.0, 32231.0, 14856.0, 6972.0, 3357.0, 1654.0, 851.0, 437.0, 255.0, 144.0, 95.0, 71.0, 40.0, 24.0, 15.0, 13.0, 10.0, 6.0, 6.0, 5.0, 2.0, 5.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.39208984375, -0.37994384765625, -0.3677978515625, -0.35565185546875, -0.343505859375, -0.33135986328125, -0.3192138671875, -0.30706787109375, -0.294921875, -0.28277587890625, -0.2706298828125, -0.25848388671875, -0.246337890625, -0.23419189453125, -0.2220458984375, -0.20989990234375, -0.19775390625, -0.18560791015625, -0.1734619140625, -0.16131591796875, -0.149169921875, -0.13702392578125, -0.1248779296875, -0.11273193359375, -0.1005859375, -0.08843994140625, -0.0762939453125, -0.06414794921875, -0.052001953125, -0.03985595703125, -0.0277099609375, -0.01556396484375, -0.00341796875, 0.00872802734375, 0.0208740234375, 0.03302001953125, 0.045166015625, 0.05731201171875, 0.0694580078125, 0.08160400390625, 0.09375, 0.10589599609375, 0.1180419921875, 0.13018798828125, 0.142333984375, 0.15447998046875, 0.1666259765625, 0.17877197265625, 0.19091796875, 0.20306396484375, 0.2152099609375, 0.22735595703125, 0.239501953125, 0.25164794921875, 0.2637939453125, 0.27593994140625, 0.2880859375, 0.30023193359375, 0.3123779296875, 0.32452392578125, 0.336669921875, 0.34881591796875, 0.3609619140625, 0.37310791015625, 0.38525390625]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 7.0, 4.0, 7.0, 12.0, 11.0, 15.0, 20.0, 20.0, 21.0, 31.0, 39.0, 29.0, 37.0, 42.0, 47.0, 57.0, 48.0, 63.0, 46.0, 46.0, 50.0, 63.0, 38.0, 44.0, 37.0, 29.0, 35.0, 16.0, 17.0, 21.0, 11.0, 12.0, 12.0, 8.0, 5.0, 4.0, 2.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1658935546875, -0.1612873077392578, -0.15668106079101562, -0.15207481384277344, -0.14746856689453125, -0.14286231994628906, -0.13825607299804688, -0.1336498260498047, -0.1290435791015625, -0.12443733215332031, -0.11983108520507812, -0.11522483825683594, -0.11061859130859375, -0.10601234436035156, -0.10140609741210938, -0.09679985046386719, -0.092193603515625, -0.08758735656738281, -0.08298110961914062, -0.07837486267089844, -0.07376861572265625, -0.06916236877441406, -0.06455612182617188, -0.05994987487792969, -0.0553436279296875, -0.05073738098144531, -0.046131134033203125, -0.04152488708496094, -0.03691864013671875, -0.03231239318847656, -0.027706146240234375, -0.023099899291992188, -0.01849365234375, -0.013887405395507812, -0.009281158447265625, -0.0046749114990234375, -6.866455078125e-05, 0.0045375823974609375, 0.009143829345703125, 0.013750076293945312, 0.0183563232421875, 0.022962570190429688, 0.027568817138671875, 0.03217506408691406, 0.03678131103515625, 0.04138755798339844, 0.045993804931640625, 0.05060005187988281, 0.055206298828125, 0.05981254577636719, 0.06441879272460938, 0.06902503967285156, 0.07363128662109375, 0.07823753356933594, 0.08284378051757812, 0.08745002746582031, 0.0920562744140625, 0.09666252136230469, 0.10126876831054688, 0.10587501525878906, 0.11048126220703125, 0.11508750915527344, 0.11969375610351562, 0.12430000305175781, 0.12890625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 4.0, 2.0, 6.0, 6.0, 8.0, 19.0, 45.0, 57.0, 113.0, 233.0, 583.0, 1345.0, 4024.0, 11872.0, 36581.0, 126989.0, 416376.0, 323123.0, 87377.0, 26388.0, 8544.0, 2954.0, 1071.0, 434.0, 209.0, 68.0, 52.0, 22.0, 21.0, 8.0, 10.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51904296875, -0.49971771240234375, -0.4803924560546875, -0.46106719970703125, -0.441741943359375, -0.42241668701171875, -0.4030914306640625, -0.38376617431640625, -0.36444091796875, -0.34511566162109375, -0.3257904052734375, -0.30646514892578125, -0.287139892578125, -0.26781463623046875, -0.2484893798828125, -0.22916412353515625, -0.2098388671875, -0.19051361083984375, -0.1711883544921875, -0.15186309814453125, -0.132537841796875, -0.11321258544921875, -0.0938873291015625, -0.07456207275390625, -0.05523681640625, -0.03591156005859375, -0.0165863037109375, 0.00273895263671875, 0.022064208984375, 0.04138946533203125, 0.0607147216796875, 0.08003997802734375, 0.099365234375, 0.11869049072265625, 0.1380157470703125, 0.15734100341796875, 0.176666259765625, 0.19599151611328125, 0.2153167724609375, 0.23464202880859375, 0.25396728515625, 0.27329254150390625, 0.2926177978515625, 0.31194305419921875, 0.331268310546875, 0.35059356689453125, 0.3699188232421875, 0.38924407958984375, 0.4085693359375, 0.42789459228515625, 0.4472198486328125, 0.46654510498046875, 0.485870361328125, 0.5051956176757812, 0.5245208740234375, 0.5438461303710938, 0.56317138671875, 0.5824966430664062, 0.6018218994140625, 0.6211471557617188, 0.640472412109375, 0.6597976684570312, 0.6791229248046875, 0.6984481811523438, 0.7177734375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 6.0, 9.0, 14.0, 8.0, 18.0, 24.0, 26.0, 28.0, 24.0, 56.0, 49.0, 49.0, 57.0, 63.0, 72.0, 62.0, 57.0, 56.0, 53.0, 52.0, 47.0, 31.0, 25.0, 27.0, 23.0, 16.0, 8.0, 16.0, 10.0, 9.0, 5.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6640625, -0.64453125, -0.625, -0.60546875, -0.5859375, -0.56640625, -0.546875, -0.52734375, -0.5078125, -0.48828125, -0.46875, -0.44921875, -0.4296875, -0.41015625, -0.390625, -0.37109375, -0.3515625, -0.33203125, -0.3125, -0.29296875, -0.2734375, -0.25390625, -0.234375, -0.21484375, -0.1953125, -0.17578125, -0.15625, -0.13671875, -0.1171875, -0.09765625, -0.078125, -0.05859375, -0.0390625, -0.01953125, 0.0, 0.01953125, 0.0390625, 0.05859375, 0.078125, 0.09765625, 0.1171875, 0.13671875, 0.15625, 0.17578125, 0.1953125, 0.21484375, 0.234375, 0.25390625, 0.2734375, 0.29296875, 0.3125, 0.33203125, 0.3515625, 0.37109375, 0.390625, 0.41015625, 0.4296875, 0.44921875, 0.46875, 0.48828125, 0.5078125, 0.52734375, 0.546875, 0.56640625, 0.5859375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 6.0, 7.0, 11.0, 16.0, 30.0, 28.0, 38.0, 98.0, 163.0, 276.0, 441.0, 671.0, 1256.0, 2213.0, 3994.0, 7531.0, 13937.0, 26421.0, 48797.0, 92230.0, 173310.0, 245409.0, 198093.0, 109183.0, 57687.0, 30936.0, 16337.0, 8792.0, 4582.0, 2491.0, 1456.0, 824.0, 501.0, 301.0, 189.0, 119.0, 68.0, 56.0, 30.0, 16.0, 5.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.1583251953125, -0.153472900390625, -0.14862060546875, -0.143768310546875, -0.138916015625, -0.134063720703125, -0.12921142578125, -0.124359130859375, -0.1195068359375, -0.114654541015625, -0.10980224609375, -0.104949951171875, -0.10009765625, -0.095245361328125, -0.09039306640625, -0.085540771484375, -0.0806884765625, -0.075836181640625, -0.07098388671875, -0.066131591796875, -0.061279296875, -0.056427001953125, -0.05157470703125, -0.046722412109375, -0.0418701171875, -0.037017822265625, -0.03216552734375, -0.027313232421875, -0.0224609375, -0.017608642578125, -0.01275634765625, -0.007904052734375, -0.0030517578125, 0.001800537109375, 0.00665283203125, 0.011505126953125, 0.016357421875, 0.021209716796875, 0.02606201171875, 0.030914306640625, 0.0357666015625, 0.040618896484375, 0.04547119140625, 0.050323486328125, 0.05517578125, 0.060028076171875, 0.06488037109375, 0.069732666015625, 0.0745849609375, 0.079437255859375, 0.08428955078125, 0.089141845703125, 0.093994140625, 0.098846435546875, 0.10369873046875, 0.108551025390625, 0.1134033203125, 0.118255615234375, 0.12310791015625, 0.127960205078125, 0.1328125, 0.137664794921875, 0.14251708984375, 0.147369384765625, 0.1522216796875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 4.0, 4.0, 6.0, 14.0, 13.0, 11.0, 18.0, 23.0, 32.0, 46.0, 51.0, 92.0, 96.0, 124.0, 118.0, 77.0, 75.0, 45.0, 35.0, 26.0, 24.0, 14.0, 11.0, 11.0, 4.0, 6.0, 7.0, 4.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-6.592273712158203e-05, -6.429571658372879e-05, -6.266869604587555e-05, -6.104167550802231e-05, -5.941465497016907e-05, -5.7787634432315826e-05, -5.6160613894462585e-05, -5.4533593356609344e-05, -5.2906572818756104e-05, -5.127955228090286e-05, -4.965253174304962e-05, -4.802551120519638e-05, -4.639849066734314e-05, -4.47714701294899e-05, -4.314444959163666e-05, -4.151742905378342e-05, -3.9890408515930176e-05, -3.8263387978076935e-05, -3.6636367440223694e-05, -3.500934690237045e-05, -3.338232636451721e-05, -3.175530582666397e-05, -3.012828528881073e-05, -2.850126475095749e-05, -2.6874244213104248e-05, -2.5247223675251007e-05, -2.3620203137397766e-05, -2.1993182599544525e-05, -2.0366162061691284e-05, -1.8739141523838043e-05, -1.7112120985984802e-05, -1.548510044813156e-05, -1.385807991027832e-05, -1.223105937242508e-05, -1.0604038834571838e-05, -8.977018296718597e-06, -7.3499977588653564e-06, -5.7229772210121155e-06, -4.0959566831588745e-06, -2.4689361453056335e-06, -8.419156074523926e-07, 7.851049304008484e-07, 2.4121254682540894e-06, 4.03914600610733e-06, 5.666166543960571e-06, 7.293187081813812e-06, 8.920207619667053e-06, 1.0547228157520294e-05, 1.2174248695373535e-05, 1.3801269233226776e-05, 1.5428289771080017e-05, 1.7055310308933258e-05, 1.86823308467865e-05, 2.030935138463974e-05, 2.193637192249298e-05, 2.3563392460346222e-05, 2.5190412998199463e-05, 2.6817433536052704e-05, 2.8444454073905945e-05, 3.0071474611759186e-05, 3.169849514961243e-05, 3.332551568746567e-05, 3.495253622531891e-05, 3.657955676317215e-05, 3.820657730102539e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 7.0, 7.0, 11.0, 8.0, 9.0, 16.0, 29.0, 33.0, 39.0, 85.0, 111.0, 155.0, 225.0, 388.0, 607.0, 953.0, 1621.0, 2796.0, 5064.0, 8980.0, 16392.0, 30918.0, 59286.0, 116687.0, 213775.0, 250630.0, 162819.0, 82992.0, 42880.0, 22609.0, 12232.0, 6724.0, 3856.0, 2199.0, 1272.0, 783.0, 466.0, 295.0, 198.0, 149.0, 79.0, 47.0, 32.0, 27.0, 17.0, 17.0, 9.0, 12.0, 6.0, 5.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.1544189453125, -0.14963150024414062, -0.14484405517578125, -0.14005661010742188, -0.1352691650390625, -0.13048171997070312, -0.12569427490234375, -0.12090682983398438, -0.116119384765625, -0.11133193969726562, -0.10654449462890625, -0.10175704956054688, -0.0969696044921875, -0.09218215942382812, -0.08739471435546875, -0.08260726928710938, -0.07781982421875, -0.07303237915039062, -0.06824493408203125, -0.06345748901367188, -0.0586700439453125, -0.053882598876953125, -0.04909515380859375, -0.044307708740234375, -0.039520263671875, -0.034732818603515625, -0.02994537353515625, -0.025157928466796875, -0.0203704833984375, -0.015583038330078125, -0.01079559326171875, -0.006008148193359375, -0.001220703125, 0.003566741943359375, 0.00835418701171875, 0.013141632080078125, 0.0179290771484375, 0.022716522216796875, 0.02750396728515625, 0.032291412353515625, 0.037078857421875, 0.041866302490234375, 0.04665374755859375, 0.051441192626953125, 0.0562286376953125, 0.061016082763671875, 0.06580352783203125, 0.07059097290039062, 0.07537841796875, 0.08016586303710938, 0.08495330810546875, 0.08974075317382812, 0.0945281982421875, 0.09931564331054688, 0.10410308837890625, 0.10889053344726562, 0.113677978515625, 0.11846542358398438, 0.12325286865234375, 0.12804031372070312, 0.1328277587890625, 0.13761520385742188, 0.14240264892578125, 0.14719009399414062, 0.1519775390625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 6.0, 10.0, 7.0, 11.0, 13.0, 8.0, 10.0, 18.0, 30.0, 32.0, 38.0, 42.0, 58.0, 58.0, 75.0, 81.0, 73.0, 72.0, 77.0, 46.0, 37.0, 46.0, 31.0, 29.0, 12.0, 18.0, 12.0, 17.0, 7.0, 11.0, 7.0, 3.0, 4.0, 3.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.203369140625, -0.1975555419921875, -0.191741943359375, -0.1859283447265625, -0.18011474609375, -0.1743011474609375, -0.168487548828125, -0.1626739501953125, -0.1568603515625, -0.1510467529296875, -0.145233154296875, -0.1394195556640625, -0.13360595703125, -0.1277923583984375, -0.121978759765625, -0.1161651611328125, -0.1103515625, -0.1045379638671875, -0.098724365234375, -0.0929107666015625, -0.08709716796875, -0.0812835693359375, -0.075469970703125, -0.0696563720703125, -0.0638427734375, -0.0580291748046875, -0.052215576171875, -0.0464019775390625, -0.04058837890625, -0.0347747802734375, -0.028961181640625, -0.0231475830078125, -0.017333984375, -0.0115203857421875, -0.005706787109375, 0.0001068115234375, 0.00592041015625, 0.0117340087890625, 0.017547607421875, 0.0233612060546875, 0.0291748046875, 0.0349884033203125, 0.040802001953125, 0.0466156005859375, 0.05242919921875, 0.0582427978515625, 0.064056396484375, 0.0698699951171875, 0.07568359375, 0.0814971923828125, 0.087310791015625, 0.0931243896484375, 0.09893798828125, 0.1047515869140625, 0.110565185546875, 0.1163787841796875, 0.1221923828125, 0.1280059814453125, 0.133819580078125, 0.1396331787109375, 0.14544677734375, 0.1512603759765625, 0.157073974609375, 0.1628875732421875, 0.168701171875]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 10.0, 18.0, 41.0, 91.0, 166.0, 221.0, 185.0, 147.0, 71.0, 35.0, 12.0, 13.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.599320411682129, -2.469660758972168, -2.340000867843628, -2.210341215133667, -2.080681324005127, -1.951021671295166, -1.821362018585205, -1.6917022466659546, -1.562042474746704, -1.4323827028274536, -1.3027229309082031, -1.1730632781982422, -1.0434035062789917, -0.9137437343597412, -0.7840840220451355, -0.6544243097305298, -0.5247645378112793, -0.3951047956943512, -0.2654450535774231, -0.135785311460495, -0.0061255693435668945, 0.1235342025756836, 0.2531939148902893, 0.382853627204895, 0.5125133991241455, 0.642173171043396, 0.7718328833580017, 0.9014925956726074, 1.031152367591858, 1.1608121395111084, 1.2904717922210693, 1.4201315641403198, 1.5497918128967285, 1.679451584815979, 1.8091113567352295, 1.9387710094451904, 2.0684309005737305, 2.1980905532836914, 2.3277502059936523, 2.4574098587036133, 2.5870697498321533, 2.7167294025421143, 2.8463892936706543, 2.9760489463806152, 3.105708599090576, 3.235368490219116, 3.365028142929077, 3.494688034057617, 3.624347686767578, 3.754007339477539, 3.883667230606079, 4.013327121734619, 4.14298677444458, 4.272646427154541, 4.402306079864502, 4.531965732574463, 4.661625862121582, 4.791285514831543, 4.920945167541504, 5.050605297088623, 5.180264949798584, 5.309924602508545, 5.439584255218506, 5.569243907928467, 5.698903560638428]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 6.0, 6.0, 7.0, 5.0, 9.0, 17.0, 10.0, 15.0, 17.0, 17.0, 17.0, 24.0, 34.0, 36.0, 39.0, 41.0, 46.0, 31.0, 40.0, 39.0, 37.0, 40.0, 44.0, 48.0, 29.0, 46.0, 38.0, 22.0, 30.0, 34.0, 22.0, 27.0, 23.0, 16.0, 15.0, 18.0, 10.0, 9.0, 9.0, 6.0, 5.0, 5.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.205600619316101, -1.1674000024795532, -1.129199504852295, -1.090998888015747, -1.0527982711791992, -1.0145976543426514, -0.9763971567153931, -0.9381965398788452, -0.8999959826469421, -0.8617954254150391, -0.8235948085784912, -0.7853942513465881, -0.7471936941146851, -0.7089930772781372, -0.6707925200462341, -0.632591962814331, -0.5943913459777832, -0.5561907887458801, -0.5179901719093323, -0.4797896146774292, -0.44158902764320374, -0.40338844060897827, -0.3651878833770752, -0.32698729634284973, -0.28878670930862427, -0.2505861222743988, -0.21238555014133453, -0.17418497800827026, -0.1359843909740448, -0.09778380393981934, -0.059583231806755066, -0.021382659673690796, 0.016817808151245117, 0.055018387734889984, 0.09321896731853485, 0.13141953945159912, 0.16962012648582458, 0.20782071352005005, 0.24602128565311432, 0.2842218577861786, 0.32242244482040405, 0.3606230318546295, 0.398823618888855, 0.43702417612075806, 0.4752247631549835, 0.513425350189209, 0.5516259074211121, 0.5898264646530151, 0.628027081489563, 0.6662276387214661, 0.7044282555580139, 0.742628812789917, 0.7808294296264648, 0.8190299868583679, 0.857230544090271, 0.8954311609268188, 0.9336317181587219, 0.971832275390625, 1.0100328922271729, 1.0482335090637207, 1.086434006690979, 1.1246346235275269, 1.1628352403640747, 1.201035737991333, 1.2392363548278809]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 4.0, 6.0, 12.0, 11.0, 11.0, 22.0, 18.0, 27.0, 31.0, 31.0, 56.0, 82.0, 128.0, 220.0, 390.0, 697.0, 1517.0, 3395.0, 8630.0, 26072.0, 98000.0, 532733.0, 2435617.0, 882634.0, 149704.0, 35838.0, 11056.0, 4064.0, 1647.0, 786.0, 342.0, 183.0, 106.0, 63.0, 42.0, 22.0, 20.0, 18.0, 15.0, 10.0, 12.0, 4.0, 1.0, 3.0, 3.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.324951171875, -0.3152885437011719, -0.30562591552734375, -0.2959632873535156, -0.2863006591796875, -0.2766380310058594, -0.26697540283203125, -0.2573127746582031, -0.247650146484375, -0.23798751831054688, -0.22832489013671875, -0.21866226196289062, -0.2089996337890625, -0.19933700561523438, -0.18967437744140625, -0.18001174926757812, -0.17034912109375, -0.16068649291992188, -0.15102386474609375, -0.14136123657226562, -0.1316986083984375, -0.12203598022460938, -0.11237335205078125, -0.10271072387695312, -0.093048095703125, -0.08338546752929688, -0.07372283935546875, -0.06406021118164062, -0.0543975830078125, -0.044734954833984375, -0.03507232666015625, -0.025409698486328125, -0.0157470703125, -0.006084442138671875, 0.00357818603515625, 0.013240814208984375, 0.0229034423828125, 0.032566070556640625, 0.04222869873046875, 0.051891326904296875, 0.061553955078125, 0.07121658325195312, 0.08087921142578125, 0.09054183959960938, 0.1002044677734375, 0.10986709594726562, 0.11952972412109375, 0.12919235229492188, 0.13885498046875, 0.14851760864257812, 0.15818023681640625, 0.16784286499023438, 0.1775054931640625, 0.18716812133789062, 0.19683074951171875, 0.20649337768554688, 0.216156005859375, 0.22581863403320312, 0.23548126220703125, 0.24514389038085938, 0.2548065185546875, 0.2644691467285156, 0.27413177490234375, 0.2837944030761719, 0.29345703125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 6.0, 5.0, 6.0, 10.0, 10.0, 12.0, 28.0, 17.0, 20.0, 31.0, 31.0, 25.0, 37.0, 35.0, 45.0, 40.0, 44.0, 53.0, 40.0, 45.0, 53.0, 43.0, 48.0, 52.0, 39.0, 34.0, 32.0, 29.0, 21.0, 26.0, 22.0, 11.0, 16.0, 7.0, 12.0, 4.0, 3.0, 6.0, 4.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.169189453125, -0.1644763946533203, -0.15976333618164062, -0.15505027770996094, -0.15033721923828125, -0.14562416076660156, -0.14091110229492188, -0.1361980438232422, -0.1314849853515625, -0.1267719268798828, -0.12205886840820312, -0.11734580993652344, -0.11263275146484375, -0.10791969299316406, -0.10320663452148438, -0.09849357604980469, -0.093780517578125, -0.08906745910644531, -0.08435440063476562, -0.07964134216308594, -0.07492828369140625, -0.07021522521972656, -0.06550216674804688, -0.06078910827636719, -0.0560760498046875, -0.05136299133300781, -0.046649932861328125, -0.04193687438964844, -0.03722381591796875, -0.03251075744628906, -0.027797698974609375, -0.023084640502929688, -0.01837158203125, -0.013658523559570312, -0.008945465087890625, -0.0042324066162109375, 0.00048065185546875, 0.0051937103271484375, 0.009906768798828125, 0.014619827270507812, 0.0193328857421875, 0.024045944213867188, 0.028759002685546875, 0.03347206115722656, 0.03818511962890625, 0.04289817810058594, 0.047611236572265625, 0.05232429504394531, 0.057037353515625, 0.06175041198730469, 0.06646347045898438, 0.07117652893066406, 0.07588958740234375, 0.08060264587402344, 0.08531570434570312, 0.09002876281738281, 0.0947418212890625, 0.09945487976074219, 0.10416793823242188, 0.10888099670410156, 0.11359405517578125, 0.11830711364746094, 0.12302017211914062, 0.1277332305908203, 0.1324462890625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 6.0, 6.0, 13.0, 13.0, 23.0, 36.0, 36.0, 73.0, 105.0, 180.0, 247.0, 412.0, 793.0, 1704.0, 4059.0, 12924.0, 59629.0, 512882.0, 2935257.0, 579188.0, 65277.0, 13416.0, 4206.0, 1713.0, 814.0, 466.0, 272.0, 165.0, 134.0, 58.0, 48.0, 37.0, 32.0, 20.0, 11.0, 10.0, 4.0, 8.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.70458984375, -0.6841812133789062, -0.6637725830078125, -0.6433639526367188, -0.622955322265625, -0.6025466918945312, -0.5821380615234375, -0.5617294311523438, -0.54132080078125, -0.5209121704101562, -0.5005035400390625, -0.48009490966796875, -0.459686279296875, -0.43927764892578125, -0.4188690185546875, -0.39846038818359375, -0.3780517578125, -0.35764312744140625, -0.3372344970703125, -0.31682586669921875, -0.296417236328125, -0.27600860595703125, -0.2555999755859375, -0.23519134521484375, -0.21478271484375, -0.19437408447265625, -0.1739654541015625, -0.15355682373046875, -0.133148193359375, -0.11273956298828125, -0.0923309326171875, -0.07192230224609375, -0.051513671875, -0.03110504150390625, -0.0106964111328125, 0.00971221923828125, 0.030120849609375, 0.05052947998046875, 0.0709381103515625, 0.09134674072265625, 0.11175537109375, 0.13216400146484375, 0.1525726318359375, 0.17298126220703125, 0.193389892578125, 0.21379852294921875, 0.2342071533203125, 0.25461578369140625, 0.2750244140625, 0.29543304443359375, 0.3158416748046875, 0.33625030517578125, 0.356658935546875, 0.37706756591796875, 0.3974761962890625, 0.41788482666015625, 0.43829345703125, 0.45870208740234375, 0.4791107177734375, 0.49951934814453125, 0.519927978515625, 0.5403366088867188, 0.5607452392578125, 0.5811538696289062, 0.6015625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 5.0, 6.0, 3.0, 4.0, 11.0, 16.0, 33.0, 45.0, 71.0, 138.0, 248.0, 412.0, 614.0, 829.0, 663.0, 402.0, 233.0, 136.0, 89.0, 45.0, 23.0, 15.0, 15.0, 6.0, 9.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51513671875, -0.49976348876953125, -0.4843902587890625, -0.46901702880859375, -0.453643798828125, -0.43827056884765625, -0.4228973388671875, -0.40752410888671875, -0.39215087890625, -0.37677764892578125, -0.3614044189453125, -0.34603118896484375, -0.330657958984375, -0.31528472900390625, -0.2999114990234375, -0.28453826904296875, -0.2691650390625, -0.25379180908203125, -0.2384185791015625, -0.22304534912109375, -0.207672119140625, -0.19229888916015625, -0.1769256591796875, -0.16155242919921875, -0.14617919921875, -0.13080596923828125, -0.1154327392578125, -0.10005950927734375, -0.084686279296875, -0.06931304931640625, -0.0539398193359375, -0.03856658935546875, -0.023193359375, -0.00782012939453125, 0.0075531005859375, 0.02292633056640625, 0.038299560546875, 0.05367279052734375, 0.0690460205078125, 0.08441925048828125, 0.09979248046875, 0.11516571044921875, 0.1305389404296875, 0.14591217041015625, 0.161285400390625, 0.17665863037109375, 0.1920318603515625, 0.20740509033203125, 0.2227783203125, 0.23815155029296875, 0.2535247802734375, 0.26889801025390625, 0.284271240234375, 0.29964447021484375, 0.3150177001953125, 0.33039093017578125, 0.34576416015625, 0.36113739013671875, 0.3765106201171875, 0.39188385009765625, 0.407257080078125, 0.42263031005859375, 0.4380035400390625, 0.45337677001953125, 0.46875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 5.0, 5.0, 7.0, 12.0, 12.0, 23.0, 19.0, 22.0, 28.0, 30.0, 35.0, 40.0, 53.0, 64.0, 65.0, 69.0, 69.0, 62.0, 50.0, 57.0, 46.0, 48.0, 30.0, 31.0, 24.0, 24.0, 16.0, 9.0, 18.0, 4.0, 6.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.393176794052124, -1.3568590879440308, -1.3205413818359375, -1.2842235565185547, -1.2479058504104614, -1.2115881443023682, -1.175270438194275, -1.1389527320861816, -1.1026349067687988, -1.0663172006607056, -1.0299994945526123, -0.9936817288398743, -0.9573639631271362, -0.921046257019043, -0.8847285509109497, -0.8484107851982117, -0.8120930790901184, -0.7757753729820251, -0.7394576072692871, -0.7031399011611938, -0.6668221354484558, -0.6305044293403625, -0.5941866636276245, -0.5578689575195312, -0.521551251411438, -0.48523351550102234, -0.4489157795906067, -0.4125980734825134, -0.3762803077697754, -0.33996260166168213, -0.3036448657512665, -0.26732712984085083, -0.2310093641281128, -0.19469162821769714, -0.1583738923072815, -0.12205617129802704, -0.08573843538761139, -0.04942069947719574, -0.013102978467941284, 0.023214757442474365, 0.059532493352890015, 0.09585022926330566, 0.1321679651737213, 0.16848568618297577, 0.20480342209339142, 0.24112115800380707, 0.2774388790130615, 0.3137566149234772, 0.3500743508338928, 0.38639208674430847, 0.4227098226547241, 0.4590275287628174, 0.4953452944755554, 0.5316630005836487, 0.5679807662963867, 0.60429847240448, 0.6406161785125732, 0.6769338846206665, 0.7132516503334045, 0.7495693564414978, 0.7858871221542358, 0.8222048282623291, 0.8585225343704224, 0.8948403000831604, 0.9311580657958984]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 4.0, 7.0, 7.0, 9.0, 9.0, 17.0, 8.0, 17.0, 15.0, 15.0, 15.0, 18.0, 22.0, 30.0, 31.0, 32.0, 27.0, 45.0, 31.0, 37.0, 35.0, 52.0, 30.0, 46.0, 47.0, 25.0, 37.0, 38.0, 32.0, 38.0, 26.0, 38.0, 25.0, 15.0, 15.0, 14.0, 12.0, 9.0, 10.0, 17.0, 9.0, 4.0, 9.0, 5.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.945117175579071, -0.9140474796295166, -0.8829777836799622, -0.8519080877304077, -0.8208383917808533, -0.7897686958312988, -0.7586989402770996, -0.7276293039321899, -0.6965595483779907, -0.6654898524284363, -0.6344201564788818, -0.6033504605293274, -0.572280764579773, -0.5412110686302185, -0.5101413726806641, -0.47907164692878723, -0.4480019807815552, -0.41693228483200073, -0.3858625888824463, -0.35479289293289185, -0.3237231969833374, -0.29265350103378296, -0.26158377528190613, -0.23051407933235168, -0.19944438338279724, -0.1683746874332428, -0.13730499148368835, -0.10623528063297272, -0.07516558468341827, -0.04409588873386383, -0.013026177883148193, 0.01804351806640625, 0.04911315441131592, 0.08018285036087036, 0.1112525537610054, 0.14232225716114044, 0.17339195311069489, 0.20446164906024933, 0.23553135991096497, 0.2666010558605194, 0.29767075181007385, 0.3287404477596283, 0.35981014370918274, 0.39087986946105957, 0.421949565410614, 0.45301926136016846, 0.4840889573097229, 0.5151586532592773, 0.5462283492088318, 0.5772980451583862, 0.6083677411079407, 0.6394374370574951, 0.6705071330070496, 0.701576828956604, 0.7326465845108032, 0.7637162208557129, 0.7947859764099121, 0.8258556723594666, 0.856925368309021, 0.8879950642585754, 0.9190647602081299, 0.9501344561576843, 0.9812041521072388, 1.012273907661438, 1.0433435440063477]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 1.0, 4.0, 1.0, 2.0, 8.0, 5.0, 14.0, 14.0, 17.0, 26.0, 54.0, 65.0, 106.0, 179.0, 266.0, 412.0, 768.0, 1239.0, 2327.0, 4298.0, 8059.0, 15918.0, 31647.0, 67986.0, 174405.0, 349759.0, 225553.0, 86257.0, 38664.0, 19121.0, 9812.0, 5112.0, 2718.0, 1538.0, 910.0, 514.0, 304.0, 183.0, 108.0, 67.0, 44.0, 26.0, 11.0, 10.0, 12.0, 9.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.339599609375, -0.3281402587890625, -0.316680908203125, -0.3052215576171875, -0.29376220703125, -0.2823028564453125, -0.270843505859375, -0.2593841552734375, -0.2479248046875, -0.2364654541015625, -0.225006103515625, -0.2135467529296875, -0.20208740234375, -0.1906280517578125, -0.179168701171875, -0.1677093505859375, -0.15625, -0.1447906494140625, -0.133331298828125, -0.1218719482421875, -0.11041259765625, -0.0989532470703125, -0.087493896484375, -0.0760345458984375, -0.0645751953125, -0.0531158447265625, -0.041656494140625, -0.0301971435546875, -0.01873779296875, -0.0072784423828125, 0.004180908203125, 0.0156402587890625, 0.027099609375, 0.0385589599609375, 0.050018310546875, 0.0614776611328125, 0.07293701171875, 0.0843963623046875, 0.095855712890625, 0.1073150634765625, 0.1187744140625, 0.1302337646484375, 0.141693115234375, 0.1531524658203125, 0.16461181640625, 0.1760711669921875, 0.187530517578125, 0.1989898681640625, 0.21044921875, 0.2219085693359375, 0.233367919921875, 0.2448272705078125, 0.25628662109375, 0.2677459716796875, 0.279205322265625, 0.2906646728515625, 0.3021240234375, 0.3135833740234375, 0.325042724609375, 0.3365020751953125, 0.34796142578125, 0.3594207763671875, 0.370880126953125, 0.3823394775390625, 0.393798828125]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 3.0, 5.0, 6.0, 9.0, 7.0, 10.0, 17.0, 20.0, 14.0, 17.0, 26.0, 27.0, 27.0, 36.0, 40.0, 41.0, 46.0, 48.0, 52.0, 50.0, 49.0, 48.0, 49.0, 43.0, 39.0, 30.0, 25.0, 34.0, 25.0, 23.0, 24.0, 25.0, 18.0, 20.0, 16.0, 9.0, 13.0, 3.0, 5.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.189697265625, -0.18456268310546875, -0.1794281005859375, -0.17429351806640625, -0.169158935546875, -0.16402435302734375, -0.1588897705078125, -0.15375518798828125, -0.14862060546875, -0.14348602294921875, -0.1383514404296875, -0.13321685791015625, -0.128082275390625, -0.12294769287109375, -0.1178131103515625, -0.11267852783203125, -0.1075439453125, -0.10240936279296875, -0.0972747802734375, -0.09214019775390625, -0.087005615234375, -0.08187103271484375, -0.0767364501953125, -0.07160186767578125, -0.06646728515625, -0.06133270263671875, -0.0561981201171875, -0.05106353759765625, -0.045928955078125, -0.04079437255859375, -0.0356597900390625, -0.03052520751953125, -0.025390625, -0.02025604248046875, -0.0151214599609375, -0.00998687744140625, -0.004852294921875, 0.00028228759765625, 0.0054168701171875, 0.01055145263671875, 0.01568603515625, 0.02082061767578125, 0.0259552001953125, 0.03108978271484375, 0.036224365234375, 0.04135894775390625, 0.0464935302734375, 0.05162811279296875, 0.0567626953125, 0.06189727783203125, 0.0670318603515625, 0.07216644287109375, 0.077301025390625, 0.08243560791015625, 0.0875701904296875, 0.09270477294921875, 0.09783935546875, 0.10297393798828125, 0.1081085205078125, 0.11324310302734375, 0.118377685546875, 0.12351226806640625, 0.1286468505859375, 0.13378143310546875, 0.138916015625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 4.0, 4.0, 9.0, 17.0, 37.0, 39.0, 58.0, 153.0, 249.0, 434.0, 988.0, 2209.0, 5333.0, 14164.0, 44277.0, 210256.0, 595644.0, 124652.0, 31689.0, 10762.0, 4118.0, 1783.0, 794.0, 389.0, 225.0, 123.0, 51.0, 30.0, 24.0, 15.0, 6.0, 7.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.80322265625, -0.77984619140625, -0.7564697265625, -0.73309326171875, -0.709716796875, -0.68634033203125, -0.6629638671875, -0.63958740234375, -0.6162109375, -0.59283447265625, -0.5694580078125, -0.54608154296875, -0.522705078125, -0.49932861328125, -0.4759521484375, -0.45257568359375, -0.42919921875, -0.40582275390625, -0.3824462890625, -0.35906982421875, -0.335693359375, -0.31231689453125, -0.2889404296875, -0.26556396484375, -0.2421875, -0.21881103515625, -0.1954345703125, -0.17205810546875, -0.148681640625, -0.12530517578125, -0.1019287109375, -0.07855224609375, -0.05517578125, -0.03179931640625, -0.0084228515625, 0.01495361328125, 0.038330078125, 0.06170654296875, 0.0850830078125, 0.10845947265625, 0.1318359375, 0.15521240234375, 0.1785888671875, 0.20196533203125, 0.225341796875, 0.24871826171875, 0.2720947265625, 0.29547119140625, 0.31884765625, 0.34222412109375, 0.3656005859375, 0.38897705078125, 0.412353515625, 0.43572998046875, 0.4591064453125, 0.48248291015625, 0.505859375, 0.52923583984375, 0.5526123046875, 0.57598876953125, 0.599365234375, 0.62274169921875, 0.6461181640625, 0.66949462890625, 0.69287109375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 6.0, 13.0, 18.0, 11.0, 16.0, 36.0, 34.0, 44.0, 59.0, 60.0, 83.0, 67.0, 75.0, 98.0, 72.0, 62.0, 52.0, 51.0, 47.0, 25.0, 18.0, 10.0, 8.0, 9.0, 6.0, 7.0, 4.0, 4.0, 0.0, 4.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69091796875, -0.6656951904296875, -0.640472412109375, -0.6152496337890625, -0.59002685546875, -0.5648040771484375, -0.539581298828125, -0.5143585205078125, -0.4891357421875, -0.4639129638671875, -0.438690185546875, -0.4134674072265625, -0.38824462890625, -0.3630218505859375, -0.337799072265625, -0.3125762939453125, -0.287353515625, -0.2621307373046875, -0.236907958984375, -0.2116851806640625, -0.18646240234375, -0.1612396240234375, -0.136016845703125, -0.1107940673828125, -0.0855712890625, -0.0603485107421875, -0.035125732421875, -0.0099029541015625, 0.01531982421875, 0.0405426025390625, 0.065765380859375, 0.0909881591796875, 0.1162109375, 0.1414337158203125, 0.166656494140625, 0.1918792724609375, 0.21710205078125, 0.2423248291015625, 0.267547607421875, 0.2927703857421875, 0.3179931640625, 0.3432159423828125, 0.368438720703125, 0.3936614990234375, 0.41888427734375, 0.4441070556640625, 0.469329833984375, 0.4945526123046875, 0.519775390625, 0.5449981689453125, 0.570220947265625, 0.5954437255859375, 0.62066650390625, 0.6458892822265625, 0.671112060546875, 0.6963348388671875, 0.7215576171875, 0.7467803955078125, 0.772003173828125, 0.7972259521484375, 0.82244873046875, 0.8476715087890625, 0.872894287109375, 0.8981170654296875, 0.92333984375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 4.0, 3.0, 5.0, 8.0, 5.0, 9.0, 30.0, 27.0, 48.0, 36.0, 85.0, 105.0, 146.0, 243.0, 302.0, 483.0, 683.0, 1062.0, 1571.0, 2768.0, 4494.0, 7555.0, 13204.0, 24203.0, 45387.0, 96741.0, 238390.0, 317924.0, 152713.0, 64741.0, 32830.0, 17728.0, 9871.0, 5642.0, 3491.0, 2044.0, 1318.0, 836.0, 591.0, 364.0, 270.0, 187.0, 140.0, 64.0, 62.0, 52.0, 25.0, 18.0, 19.0, 16.0, 4.0, 5.0, 7.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1778564453125, -0.1721649169921875, -0.166473388671875, -0.1607818603515625, -0.15509033203125, -0.1493988037109375, -0.143707275390625, -0.1380157470703125, -0.13232421875, -0.1266326904296875, -0.120941162109375, -0.1152496337890625, -0.10955810546875, -0.1038665771484375, -0.098175048828125, -0.0924835205078125, -0.0867919921875, -0.0811004638671875, -0.075408935546875, -0.0697174072265625, -0.06402587890625, -0.0583343505859375, -0.052642822265625, -0.0469512939453125, -0.041259765625, -0.0355682373046875, -0.029876708984375, -0.0241851806640625, -0.01849365234375, -0.0128021240234375, -0.007110595703125, -0.0014190673828125, 0.0042724609375, 0.0099639892578125, 0.015655517578125, 0.0213470458984375, 0.02703857421875, 0.0327301025390625, 0.038421630859375, 0.0441131591796875, 0.0498046875, 0.0554962158203125, 0.061187744140625, 0.0668792724609375, 0.07257080078125, 0.0782623291015625, 0.083953857421875, 0.0896453857421875, 0.0953369140625, 0.1010284423828125, 0.106719970703125, 0.1124114990234375, 0.11810302734375, 0.1237945556640625, 0.129486083984375, 0.1351776123046875, 0.140869140625, 0.1465606689453125, 0.152252197265625, 0.1579437255859375, 0.16363525390625, 0.1693267822265625, 0.175018310546875, 0.1807098388671875, 0.1864013671875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 6.0, 9.0, 8.0, 10.0, 18.0, 20.0, 29.0, 36.0, 67.0, 128.0, 175.0, 176.0, 101.0, 63.0, 41.0, 18.0, 18.0, 13.0, 16.0, 12.0, 7.0, 7.0, 5.0, 6.0, 2.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.657838821411133e-05, -6.434973329305649e-05, -6.212107837200165e-05, -5.989242345094681e-05, -5.766376852989197e-05, -5.543511360883713e-05, -5.320645868778229e-05, -5.097780376672745e-05, -4.874914884567261e-05, -4.652049392461777e-05, -4.429183900356293e-05, -4.206318408250809e-05, -3.983452916145325e-05, -3.760587424039841e-05, -3.537721931934357e-05, -3.314856439828873e-05, -3.091990947723389e-05, -2.8691254556179047e-05, -2.6462599635124207e-05, -2.4233944714069366e-05, -2.2005289793014526e-05, -1.9776634871959686e-05, -1.7547979950904846e-05, -1.5319325029850006e-05, -1.3090670108795166e-05, -1.0862015187740326e-05, -8.633360266685486e-06, -6.404705345630646e-06, -4.176050424575806e-06, -1.9473955035209656e-06, 2.812594175338745e-07, 2.5099143385887146e-06, 4.738569259643555e-06, 6.967224180698395e-06, 9.195879101753235e-06, 1.1424534022808075e-05, 1.3653188943862915e-05, 1.5881843864917755e-05, 1.8110498785972595e-05, 2.0339153707027435e-05, 2.2567808628082275e-05, 2.4796463549137115e-05, 2.7025118470191956e-05, 2.9253773391246796e-05, 3.1482428312301636e-05, 3.3711083233356476e-05, 3.5939738154411316e-05, 3.8168393075466156e-05, 4.0397047996520996e-05, 4.2625702917575836e-05, 4.4854357838630676e-05, 4.7083012759685516e-05, 4.9311667680740356e-05, 5.1540322601795197e-05, 5.376897752285004e-05, 5.599763244390488e-05, 5.822628736495972e-05, 6.045494228601456e-05, 6.26835972070694e-05, 6.491225212812424e-05, 6.714090704917908e-05, 6.936956197023392e-05, 7.159821689128876e-05, 7.38268718123436e-05, 7.605552673339844e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 7.0, 8.0, 8.0, 19.0, 21.0, 29.0, 63.0, 80.0, 116.0, 172.0, 290.0, 423.0, 728.0, 1129.0, 1814.0, 3220.0, 5554.0, 10036.0, 17689.0, 30983.0, 57606.0, 121538.0, 263619.0, 271364.0, 127415.0, 59866.0, 32061.0, 18078.0, 10203.0, 5815.0, 3348.0, 1992.0, 1221.0, 704.0, 504.0, 296.0, 189.0, 126.0, 85.0, 45.0, 39.0, 18.0, 14.0, 8.0, 10.0, 4.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0], "bins": [-0.1763916015625, -0.171356201171875, -0.16632080078125, -0.161285400390625, -0.15625, -0.151214599609375, -0.14617919921875, -0.141143798828125, -0.1361083984375, -0.131072998046875, -0.12603759765625, -0.121002197265625, -0.115966796875, -0.110931396484375, -0.10589599609375, -0.100860595703125, -0.0958251953125, -0.090789794921875, -0.08575439453125, -0.080718994140625, -0.07568359375, -0.070648193359375, -0.06561279296875, -0.060577392578125, -0.0555419921875, -0.050506591796875, -0.04547119140625, -0.040435791015625, -0.035400390625, -0.030364990234375, -0.02532958984375, -0.020294189453125, -0.0152587890625, -0.010223388671875, -0.00518798828125, -0.000152587890625, 0.0048828125, 0.009918212890625, 0.01495361328125, 0.019989013671875, 0.0250244140625, 0.030059814453125, 0.03509521484375, 0.040130615234375, 0.045166015625, 0.050201416015625, 0.05523681640625, 0.060272216796875, 0.0653076171875, 0.070343017578125, 0.07537841796875, 0.080413818359375, 0.08544921875, 0.090484619140625, 0.09552001953125, 0.100555419921875, 0.1055908203125, 0.110626220703125, 0.11566162109375, 0.120697021484375, 0.125732421875, 0.130767822265625, 0.13580322265625, 0.140838623046875, 0.1458740234375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 4.0, 10.0, 8.0, 21.0, 17.0, 16.0, 17.0, 40.0, 33.0, 51.0, 65.0, 68.0, 89.0, 87.0, 105.0, 73.0, 60.0, 44.0, 41.0, 28.0, 20.0, 16.0, 17.0, 10.0, 10.0, 11.0, 6.0, 2.0, 8.0, 6.0, 0.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1787109375, -0.17258262634277344, -0.16645431518554688, -0.1603260040283203, -0.15419769287109375, -0.1480693817138672, -0.14194107055664062, -0.13581275939941406, -0.1296844482421875, -0.12355613708496094, -0.11742782592773438, -0.11129951477050781, -0.10517120361328125, -0.09904289245605469, -0.09291458129882812, -0.08678627014160156, -0.080657958984375, -0.07452964782714844, -0.06840133666992188, -0.06227302551269531, -0.05614471435546875, -0.05001640319824219, -0.043888092041015625, -0.03775978088378906, -0.0316314697265625, -0.025503158569335938, -0.019374847412109375, -0.013246536254882812, -0.00711822509765625, -0.0009899139404296875, 0.005138397216796875, 0.011266708374023438, 0.01739501953125, 0.023523330688476562, 0.029651641845703125, 0.03577995300292969, 0.04190826416015625, 0.04803657531738281, 0.054164886474609375, 0.06029319763183594, 0.0664215087890625, 0.07254981994628906, 0.07867813110351562, 0.08480644226074219, 0.09093475341796875, 0.09706306457519531, 0.10319137573242188, 0.10931968688964844, 0.115447998046875, 0.12157630920410156, 0.12770462036132812, 0.1338329315185547, 0.13996124267578125, 0.1460895538330078, 0.15221786499023438, 0.15834617614746094, 0.1644744873046875, 0.17060279846191406, 0.17673110961914062, 0.1828594207763672, 0.18898773193359375, 0.1951160430908203, 0.20124435424804688, 0.20737266540527344, 0.2135009765625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 21.0, 30.0, 71.0, 102.0, 146.0, 196.0, 150.0, 118.0, 83.0, 48.0, 21.0, 14.0, 6.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-6.404479026794434, -6.280799865722656, -6.157121181488037, -6.03344202041626, -5.909763336181641, -5.786084175109863, -5.662405490875244, -5.538726329803467, -5.415047645568848, -5.29136848449707, -5.167689800262451, -5.044010639190674, -4.920331954956055, -4.796652793884277, -4.672974109649658, -4.549294948577881, -4.425616264343262, -4.301937103271484, -4.178258419036865, -4.054579257965088, -3.9309005737304688, -3.8072216510772705, -3.6835427284240723, -3.559863567352295, -3.4361844062805176, -3.3125054836273193, -3.188826560974121, -3.065147638320923, -2.9414687156677246, -2.8177897930145264, -2.694110870361328, -2.570431709289551, -2.4467530250549316, -2.3230741024017334, -2.199395179748535, -2.075716257095337, -1.9520373344421387, -1.8283584117889404, -1.7046793699264526, -1.5810004472732544, -1.4573214054107666, -1.3336424827575684, -1.2099635601043701, -1.0862846374511719, -0.9626056551933289, -0.8389267325401306, -0.7152477502822876, -0.5915688276290894, -0.4678899049758911, -0.34421098232269287, -0.22053202986717224, -0.09685307741165161, 0.02682584524154663, 0.15050476789474487, 0.2741837501525879, 0.39786267280578613, 0.5215415954589844, 0.6452205181121826, 0.7688994407653809, 0.8925784230232239, 1.0162572860717773, 1.1399362087249756, 1.2636152505874634, 1.3872941732406616, 1.5109730958938599]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 6.0, 4.0, 7.0, 8.0, 7.0, 6.0, 7.0, 8.0, 13.0, 15.0, 15.0, 14.0, 19.0, 19.0, 19.0, 31.0, 38.0, 41.0, 43.0, 33.0, 35.0, 50.0, 48.0, 36.0, 44.0, 36.0, 39.0, 48.0, 43.0, 31.0, 29.0, 33.0, 23.0, 26.0, 12.0, 13.0, 16.0, 16.0, 11.0, 7.0, 13.0, 6.0, 10.0, 9.0, 4.0, 7.0, 4.0, 3.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0], "bins": [-1.4028453826904297, -1.36062753200531, -1.3184096813201904, -1.2761918306350708, -1.2339739799499512, -1.191756010055542, -1.1495381593704224, -1.1073203086853027, -1.065102458000183, -1.0228846073150635, -0.9806667566299438, -0.9384488463401794, -0.8962309956550598, -0.8540131449699402, -0.8117952346801758, -0.7695773839950562, -0.7273595333099365, -0.6851416826248169, -0.6429238319396973, -0.6007059216499329, -0.5584880709648132, -0.5162702202796936, -0.4740523397922516, -0.43183445930480957, -0.38961660861968994, -0.3473987579345703, -0.3051808774471283, -0.2629629969596863, -0.22074514627456665, -0.17852728068828583, -0.136309415102005, -0.09409153461456299, -0.05187356472015381, -0.009655699133872986, 0.03256216645240784, 0.07478003203868866, 0.11699789762496948, 0.1592157632112503, 0.20143362879753113, 0.24365150928497314, 0.2858693599700928, 0.3280872106552124, 0.3703050911426544, 0.41252297163009644, 0.45474082231521606, 0.4969586730003357, 0.5391765832901001, 0.5813944339752197, 0.6236122846603394, 0.665830135345459, 0.7080479860305786, 0.750265896320343, 0.7924837470054626, 0.8347015976905823, 0.8769195079803467, 0.9191373586654663, 0.9613552093505859, 1.0035730600357056, 1.0457909107208252, 1.0880087614059448, 1.1302266120910645, 1.1724445819854736, 1.2146624326705933, 1.256880283355713, 1.2990981340408325]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 6.0, 8.0, 11.0, 12.0, 25.0, 23.0, 32.0, 64.0, 87.0, 155.0, 277.0, 485.0, 1064.0, 2343.0, 5935.0, 17285.0, 63526.0, 321044.0, 2534987.0, 1042016.0, 153089.0, 35066.0, 10212.0, 3642.0, 1448.0, 681.0, 343.0, 149.0, 92.0, 55.0, 47.0, 25.0, 13.0, 7.0, 11.0, 9.0, 5.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.45703125, -0.4442596435546875, -0.431488037109375, -0.4187164306640625, -0.40594482421875, -0.3931732177734375, -0.380401611328125, -0.3676300048828125, -0.3548583984375, -0.3420867919921875, -0.329315185546875, -0.3165435791015625, -0.30377197265625, -0.2910003662109375, -0.278228759765625, -0.2654571533203125, -0.252685546875, -0.2399139404296875, -0.227142333984375, -0.2143707275390625, -0.20159912109375, -0.1888275146484375, -0.176055908203125, -0.1632843017578125, -0.1505126953125, -0.1377410888671875, -0.124969482421875, -0.1121978759765625, -0.09942626953125, -0.0866546630859375, -0.073883056640625, -0.0611114501953125, -0.04833984375, -0.0355682373046875, -0.022796630859375, -0.0100250244140625, 0.00274658203125, 0.0155181884765625, 0.028289794921875, 0.0410614013671875, 0.0538330078125, 0.0666046142578125, 0.079376220703125, 0.0921478271484375, 0.10491943359375, 0.1176910400390625, 0.130462646484375, 0.1432342529296875, 0.156005859375, 0.1687774658203125, 0.181549072265625, 0.1943206787109375, 0.20709228515625, 0.2198638916015625, 0.232635498046875, 0.2454071044921875, 0.2581787109375, 0.2709503173828125, 0.283721923828125, 0.2964935302734375, 0.30926513671875, 0.3220367431640625, 0.334808349609375, 0.3475799560546875, 0.3603515625]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 6.0, 10.0, 18.0, 19.0, 12.0, 30.0, 24.0, 33.0, 40.0, 44.0, 38.0, 34.0, 53.0, 59.0, 49.0, 48.0, 58.0, 51.0, 49.0, 49.0, 54.0, 37.0, 32.0, 26.0, 31.0, 21.0, 18.0, 15.0, 10.0, 3.0, 7.0, 8.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2235107421875, -0.21714401245117188, -0.21077728271484375, -0.20441055297851562, -0.1980438232421875, -0.19167709350585938, -0.18531036376953125, -0.17894363403320312, -0.172576904296875, -0.16621017456054688, -0.15984344482421875, -0.15347671508789062, -0.1471099853515625, -0.14074325561523438, -0.13437652587890625, -0.12800979614257812, -0.12164306640625, -0.11527633666992188, -0.10890960693359375, -0.10254287719726562, -0.0961761474609375, -0.08980941772460938, -0.08344268798828125, -0.07707595825195312, -0.070709228515625, -0.06434249877929688, -0.05797576904296875, -0.051609039306640625, -0.0452423095703125, -0.038875579833984375, -0.03250885009765625, -0.026142120361328125, -0.019775390625, -0.013408660888671875, -0.00704193115234375, -0.000675201416015625, 0.0056915283203125, 0.012058258056640625, 0.01842498779296875, 0.024791717529296875, 0.031158447265625, 0.037525177001953125, 0.04389190673828125, 0.050258636474609375, 0.0566253662109375, 0.06299209594726562, 0.06935882568359375, 0.07572555541992188, 0.08209228515625, 0.08845901489257812, 0.09482574462890625, 0.10119247436523438, 0.1075592041015625, 0.11392593383789062, 0.12029266357421875, 0.12665939331054688, 0.133026123046875, 0.13939285278320312, 0.14575958251953125, 0.15212631225585938, 0.1584930419921875, 0.16485977172851562, 0.17122650146484375, 0.17759323120117188, 0.1839599609375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 6.0, 6.0, 11.0, 17.0, 30.0, 28.0, 60.0, 81.0, 116.0, 192.0, 327.0, 619.0, 998.0, 2108.0, 4574.0, 10491.0, 27769.0, 87014.0, 337535.0, 1770782.0, 1534245.0, 296156.0, 77510.0, 25475.0, 9544.0, 4175.0, 1953.0, 1003.0, 516.0, 360.0, 222.0, 119.0, 78.0, 58.0, 30.0, 24.0, 13.0, 17.0, 9.0, 5.0, 4.0, 4.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53466796875, -0.5179367065429688, -0.5012054443359375, -0.48447418212890625, -0.467742919921875, -0.45101165771484375, -0.4342803955078125, -0.41754913330078125, -0.40081787109375, -0.38408660888671875, -0.3673553466796875, -0.35062408447265625, -0.333892822265625, -0.31716156005859375, -0.3004302978515625, -0.28369903564453125, -0.2669677734375, -0.25023651123046875, -0.2335052490234375, -0.21677398681640625, -0.200042724609375, -0.18331146240234375, -0.1665802001953125, -0.14984893798828125, -0.13311767578125, -0.11638641357421875, -0.0996551513671875, -0.08292388916015625, -0.066192626953125, -0.04946136474609375, -0.0327301025390625, -0.01599884033203125, 0.000732421875, 0.01746368408203125, 0.0341949462890625, 0.05092620849609375, 0.067657470703125, 0.08438873291015625, 0.1011199951171875, 0.11785125732421875, 0.13458251953125, 0.15131378173828125, 0.1680450439453125, 0.18477630615234375, 0.201507568359375, 0.21823883056640625, 0.2349700927734375, 0.25170135498046875, 0.2684326171875, 0.28516387939453125, 0.3018951416015625, 0.31862640380859375, 0.335357666015625, 0.35208892822265625, 0.3688201904296875, 0.38555145263671875, 0.40228271484375, 0.41901397705078125, 0.4357452392578125, 0.45247650146484375, 0.469207763671875, 0.48593902587890625, 0.5026702880859375, 0.5194015502929688, 0.5361328125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 5.0, 4.0, 5.0, 12.0, 15.0, 22.0, 24.0, 44.0, 64.0, 98.0, 130.0, 169.0, 274.0, 337.0, 591.0, 746.0, 535.0, 318.0, 211.0, 130.0, 100.0, 75.0, 50.0, 44.0, 21.0, 12.0, 15.0, 7.0, 4.0, 7.0, 5.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3505859375, -0.3372802734375, -0.323974609375, -0.3106689453125, -0.29736328125, -0.2840576171875, -0.270751953125, -0.2574462890625, -0.244140625, -0.2308349609375, -0.217529296875, -0.2042236328125, -0.19091796875, -0.1776123046875, -0.164306640625, -0.1510009765625, -0.1376953125, -0.1243896484375, -0.111083984375, -0.0977783203125, -0.08447265625, -0.0711669921875, -0.057861328125, -0.0445556640625, -0.03125, -0.0179443359375, -0.004638671875, 0.0086669921875, 0.02197265625, 0.0352783203125, 0.048583984375, 0.0618896484375, 0.0751953125, 0.0885009765625, 0.101806640625, 0.1151123046875, 0.12841796875, 0.1417236328125, 0.155029296875, 0.1683349609375, 0.181640625, 0.1949462890625, 0.208251953125, 0.2215576171875, 0.23486328125, 0.2481689453125, 0.261474609375, 0.2747802734375, 0.2880859375, 0.3013916015625, 0.314697265625, 0.3280029296875, 0.34130859375, 0.3546142578125, 0.367919921875, 0.3812255859375, 0.39453125, 0.4078369140625, 0.421142578125, 0.4344482421875, 0.44775390625, 0.4610595703125, 0.474365234375, 0.4876708984375, 0.5009765625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 6.0, 11.0, 16.0, 25.0, 33.0, 53.0, 65.0, 74.0, 101.0, 100.0, 108.0, 82.0, 73.0, 87.0, 48.0, 47.0, 30.0, 19.0, 7.0, 7.0, 5.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.878289222717285, -2.811162233352661, -2.744035243988037, -2.676908493041992, -2.609781503677368, -2.542654514312744, -2.47552752494812, -2.408400535583496, -2.341273784637451, -2.274146795272827, -2.207019805908203, -2.139893054962158, -2.072766065597534, -2.00563907623291, -1.9385120868682861, -1.8713852167129517, -1.8042582273483276, -1.7371312379837036, -1.6700043678283691, -1.6028773784637451, -1.5357505083084106, -1.4686235189437866, -1.4014966487884521, -1.3343696594238281, -1.267242670059204, -1.20011568069458, -1.1329888105392456, -1.0658618211746216, -0.9987349510192871, -0.9316079616546631, -0.8644810318946838, -0.7973541021347046, -0.7302272319793701, -0.6631003022193909, -0.5959733724594116, -0.5288463830947876, -0.46171948313713074, -0.3945925533771515, -0.32746559381484985, -0.2603386640548706, -0.19321173429489136, -0.1260848045349121, -0.05895785987377167, 0.008169084787368774, 0.07529601454734802, 0.14242294430732727, 0.2095499038696289, 0.27667683362960815, 0.3438037633895874, 0.41093069314956665, 0.4780576229095459, 0.5451846122741699, 0.6123114824295044, 0.6794384717941284, 0.7465654015541077, 0.8136923313140869, 0.8808192610740662, 0.9479461908340454, 1.0150731801986694, 1.082200050354004, 1.149327039718628, 1.2164539098739624, 1.2835808992385864, 1.350707769393921, 1.417834758758545]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 6.0, 7.0, 2.0, 5.0, 9.0, 12.0, 14.0, 18.0, 14.0, 21.0, 18.0, 32.0, 20.0, 35.0, 39.0, 39.0, 34.0, 32.0, 41.0, 36.0, 49.0, 55.0, 35.0, 33.0, 37.0, 42.0, 38.0, 30.0, 33.0, 33.0, 32.0, 31.0, 22.0, 17.0, 17.0, 14.0, 10.0, 10.0, 5.0, 4.0, 4.0, 3.0, 6.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.1168349981307983, -1.0817713737487793, -1.0467077493667603, -1.0116441249847412, -0.9765805006027222, -0.9415168762207031, -0.9064532518386841, -0.871389627456665, -0.836326003074646, -0.801262378692627, -0.7661987543106079, -0.7311351299285889, -0.6960715055465698, -0.6610078811645508, -0.6259442567825317, -0.5908806324005127, -0.5558170080184937, -0.5207533836364746, -0.48568975925445557, -0.4506261348724365, -0.4155625104904175, -0.38049888610839844, -0.3454352617263794, -0.31037163734436035, -0.2753080129623413, -0.24024438858032227, -0.20518076419830322, -0.17011713981628418, -0.13505351543426514, -0.0999898910522461, -0.06492626667022705, -0.029862642288208008, 0.005201101303100586, 0.04026472568511963, 0.07532835006713867, 0.11039197444915771, 0.14545559883117676, 0.1805192232131958, 0.21558284759521484, 0.2506464719772339, 0.28571009635925293, 0.320773720741272, 0.355837345123291, 0.39090096950531006, 0.4259645938873291, 0.46102821826934814, 0.4960918426513672, 0.5311554670333862, 0.5662190914154053, 0.6012827157974243, 0.6363463401794434, 0.6714099645614624, 0.7064735889434814, 0.7415372133255005, 0.7766008377075195, 0.8116644620895386, 0.8467280864715576, 0.8817917108535767, 0.9168553352355957, 0.9519189596176147, 0.9869825839996338, 1.0220462083816528, 1.0571098327636719, 1.092173457145691, 1.12723708152771]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 5.0, 4.0, 4.0, 7.0, 20.0, 31.0, 38.0, 49.0, 86.0, 113.0, 223.0, 310.0, 546.0, 893.0, 1494.0, 2537.0, 4335.0, 7391.0, 12485.0, 21617.0, 38652.0, 78932.0, 205701.0, 341840.0, 177327.0, 70314.0, 35582.0, 19844.0, 11574.0, 6808.0, 3869.0, 2352.0, 1365.0, 874.0, 488.0, 330.0, 188.0, 116.0, 62.0, 58.0, 31.0, 28.0, 9.0, 9.0, 5.0, 5.0, 1.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32568359375, -0.31497955322265625, -0.3042755126953125, -0.29357147216796875, -0.282867431640625, -0.27216339111328125, -0.2614593505859375, -0.25075531005859375, -0.24005126953125, -0.22934722900390625, -0.2186431884765625, -0.20793914794921875, -0.197235107421875, -0.18653106689453125, -0.1758270263671875, -0.16512298583984375, -0.1544189453125, -0.14371490478515625, -0.1330108642578125, -0.12230682373046875, -0.111602783203125, -0.10089874267578125, -0.0901947021484375, -0.07949066162109375, -0.06878662109375, -0.05808258056640625, -0.0473785400390625, -0.03667449951171875, -0.025970458984375, -0.01526641845703125, -0.0045623779296875, 0.00614166259765625, 0.016845703125, 0.02754974365234375, 0.0382537841796875, 0.04895782470703125, 0.059661865234375, 0.07036590576171875, 0.0810699462890625, 0.09177398681640625, 0.10247802734375, 0.11318206787109375, 0.1238861083984375, 0.13459014892578125, 0.145294189453125, 0.15599822998046875, 0.1667022705078125, 0.17740631103515625, 0.1881103515625, 0.19881439208984375, 0.2095184326171875, 0.22022247314453125, 0.230926513671875, 0.24163055419921875, 0.2523345947265625, 0.26303863525390625, 0.27374267578125, 0.28444671630859375, 0.2951507568359375, 0.30585479736328125, 0.316558837890625, 0.32726287841796875, 0.3379669189453125, 0.34867095947265625, 0.359375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 5.0, 4.0, 5.0, 4.0, 5.0, 12.0, 7.0, 14.0, 10.0, 18.0, 19.0, 23.0, 21.0, 26.0, 42.0, 42.0, 35.0, 43.0, 41.0, 48.0, 51.0, 53.0, 52.0, 46.0, 48.0, 45.0, 35.0, 50.0, 34.0, 28.0, 26.0, 21.0, 29.0, 15.0, 10.0, 10.0, 15.0, 6.0, 1.0, 5.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.216064453125, -0.2097797393798828, -0.20349502563476562, -0.19721031188964844, -0.19092559814453125, -0.18464088439941406, -0.17835617065429688, -0.1720714569091797, -0.1657867431640625, -0.1595020294189453, -0.15321731567382812, -0.14693260192871094, -0.14064788818359375, -0.13436317443847656, -0.12807846069335938, -0.12179374694824219, -0.115509033203125, -0.10922431945800781, -0.10293960571289062, -0.09665489196777344, -0.09037017822265625, -0.08408546447753906, -0.07780075073242188, -0.07151603698730469, -0.0652313232421875, -0.05894660949707031, -0.052661895751953125, -0.04637718200683594, -0.04009246826171875, -0.03380775451660156, -0.027523040771484375, -0.021238327026367188, -0.01495361328125, -0.008668899536132812, -0.002384185791015625, 0.0039005279541015625, 0.01018524169921875, 0.016469955444335938, 0.022754669189453125, 0.029039382934570312, 0.0353240966796875, 0.04160881042480469, 0.047893524169921875, 0.05417823791503906, 0.06046295166015625, 0.06674766540527344, 0.07303237915039062, 0.07931709289550781, 0.085601806640625, 0.09188652038574219, 0.09817123413085938, 0.10445594787597656, 0.11074066162109375, 0.11702537536621094, 0.12331008911132812, 0.1295948028564453, 0.1358795166015625, 0.1421642303466797, 0.14844894409179688, 0.15473365783691406, 0.16101837158203125, 0.16730308532714844, 0.17358779907226562, 0.1798725128173828, 0.1861572265625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 1.0, 2.0, 6.0, 3.0, 4.0, 8.0, 6.0, 9.0, 8.0, 15.0, 15.0, 16.0, 36.0, 32.0, 73.0, 108.0, 283.0, 676.0, 1760.0, 5417.0, 15781.0, 46315.0, 172590.0, 559133.0, 174371.0, 47328.0, 16087.0, 5376.0, 1829.0, 649.0, 297.0, 91.0, 75.0, 37.0, 20.0, 27.0, 13.0, 12.0, 11.0, 9.0, 7.0, 5.0, 3.0, 2.0, 9.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.68603515625, -0.6661529541015625, -0.646270751953125, -0.6263885498046875, -0.60650634765625, -0.5866241455078125, -0.566741943359375, -0.5468597412109375, -0.5269775390625, -0.5070953369140625, -0.487213134765625, -0.4673309326171875, -0.44744873046875, -0.4275665283203125, -0.407684326171875, -0.3878021240234375, -0.367919921875, -0.3480377197265625, -0.328155517578125, -0.3082733154296875, -0.28839111328125, -0.2685089111328125, -0.248626708984375, -0.2287445068359375, -0.2088623046875, -0.1889801025390625, -0.169097900390625, -0.1492156982421875, -0.12933349609375, -0.1094512939453125, -0.089569091796875, -0.0696868896484375, -0.0498046875, -0.0299224853515625, -0.010040283203125, 0.0098419189453125, 0.02972412109375, 0.0496063232421875, 0.069488525390625, 0.0893707275390625, 0.1092529296875, 0.1291351318359375, 0.149017333984375, 0.1688995361328125, 0.18878173828125, 0.2086639404296875, 0.228546142578125, 0.2484283447265625, 0.268310546875, 0.2881927490234375, 0.308074951171875, 0.3279571533203125, 0.34783935546875, 0.3677215576171875, 0.387603759765625, 0.4074859619140625, 0.4273681640625, 0.4472503662109375, 0.467132568359375, 0.4870147705078125, 0.50689697265625, 0.5267791748046875, 0.546661376953125, 0.5665435791015625, 0.58642578125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 8.0, 5.0, 7.0, 8.0, 9.0, 12.0, 18.0, 12.0, 14.0, 25.0, 21.0, 28.0, 38.0, 31.0, 35.0, 39.0, 37.0, 36.0, 51.0, 44.0, 53.0, 44.0, 41.0, 42.0, 51.0, 35.0, 35.0, 32.0, 29.0, 26.0, 25.0, 20.0, 17.0, 15.0, 10.0, 9.0, 11.0, 9.0, 8.0, 6.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.52294921875, -0.5044784545898438, -0.4860076904296875, -0.46753692626953125, -0.449066162109375, -0.43059539794921875, -0.4121246337890625, -0.39365386962890625, -0.37518310546875, -0.35671234130859375, -0.3382415771484375, -0.31977081298828125, -0.301300048828125, -0.28282928466796875, -0.2643585205078125, -0.24588775634765625, -0.2274169921875, -0.20894622802734375, -0.1904754638671875, -0.17200469970703125, -0.153533935546875, -0.13506317138671875, -0.1165924072265625, -0.09812164306640625, -0.07965087890625, -0.06118011474609375, -0.0427093505859375, -0.02423858642578125, -0.005767822265625, 0.01270294189453125, 0.0311737060546875, 0.04964447021484375, 0.068115234375, 0.08658599853515625, 0.1050567626953125, 0.12352752685546875, 0.141998291015625, 0.16046905517578125, 0.1789398193359375, 0.19741058349609375, 0.21588134765625, 0.23435211181640625, 0.2528228759765625, 0.27129364013671875, 0.289764404296875, 0.30823516845703125, 0.3267059326171875, 0.34517669677734375, 0.3636474609375, 0.38211822509765625, 0.4005889892578125, 0.41905975341796875, 0.437530517578125, 0.45600128173828125, 0.4744720458984375, 0.49294281005859375, 0.51141357421875, 0.5298843383789062, 0.5483551025390625, 0.5668258666992188, 0.585296630859375, 0.6037673950195312, 0.6222381591796875, 0.6407089233398438, 0.6591796875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 6.0, 6.0, 15.0, 17.0, 27.0, 36.0, 56.0, 75.0, 126.0, 143.0, 303.0, 425.0, 663.0, 1083.0, 1671.0, 2679.0, 4325.0, 6823.0, 10800.0, 17509.0, 29131.0, 56901.0, 136812.0, 295869.0, 259326.0, 108693.0, 48014.0, 25722.0, 15472.0, 9442.0, 6042.0, 3776.0, 2408.0, 1475.0, 983.0, 567.0, 407.0, 255.0, 156.0, 113.0, 66.0, 44.0, 28.0, 20.0, 15.0, 20.0, 5.0, 2.0, 2.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0], "bins": [-0.1529541015625, -0.1483020782470703, -0.14365005493164062, -0.13899803161621094, -0.13434600830078125, -0.12969398498535156, -0.12504196166992188, -0.12038993835449219, -0.1157379150390625, -0.11108589172363281, -0.10643386840820312, -0.10178184509277344, -0.09712982177734375, -0.09247779846191406, -0.08782577514648438, -0.08317375183105469, -0.078521728515625, -0.07386970520019531, -0.06921768188476562, -0.06456565856933594, -0.05991363525390625, -0.05526161193847656, -0.050609588623046875, -0.04595756530761719, -0.0413055419921875, -0.03665351867675781, -0.032001495361328125, -0.027349472045898438, -0.02269744873046875, -0.018045425415039062, -0.013393402099609375, -0.008741378784179688, -0.00408935546875, 0.0005626678466796875, 0.005214691162109375, 0.009866714477539062, 0.01451873779296875, 0.019170761108398438, 0.023822784423828125, 0.028474807739257812, 0.0331268310546875, 0.03777885437011719, 0.042430877685546875, 0.04708290100097656, 0.05173492431640625, 0.05638694763183594, 0.061038970947265625, 0.06569099426269531, 0.070343017578125, 0.07499504089355469, 0.07964706420898438, 0.08429908752441406, 0.08895111083984375, 0.09360313415527344, 0.09825515747070312, 0.10290718078613281, 0.1075592041015625, 0.11221122741699219, 0.11686325073242188, 0.12151527404785156, 0.12616729736328125, 0.13081932067871094, 0.13547134399414062, 0.1401233673095703, 0.144775390625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 3.0, 4.0, 5.0, 17.0, 10.0, 16.0, 16.0, 28.0, 33.0, 52.0, 82.0, 101.0, 138.0, 123.0, 109.0, 65.0, 43.0, 27.0, 21.0, 18.0, 11.0, 8.0, 15.0, 9.0, 6.0, 4.0, 9.0, 6.0, 3.0, 6.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-4.929304122924805e-05, -4.7693029046058655e-05, -4.609301686286926e-05, -4.449300467967987e-05, -4.289299249649048e-05, -4.1292980313301086e-05, -3.9692968130111694e-05, -3.80929559469223e-05, -3.649294376373291e-05, -3.489293158054352e-05, -3.3292919397354126e-05, -3.1692907214164734e-05, -3.0092895030975342e-05, -2.849288284778595e-05, -2.6892870664596558e-05, -2.5292858481407166e-05, -2.3692846298217773e-05, -2.209283411502838e-05, -2.049282193183899e-05, -1.8892809748649597e-05, -1.7292797565460205e-05, -1.5692785382270813e-05, -1.4092773199081421e-05, -1.2492761015892029e-05, -1.0892748832702637e-05, -9.292736649513245e-06, -7.692724466323853e-06, -6.0927122831344604e-06, -4.492700099945068e-06, -2.8926879167556763e-06, -1.2926757335662842e-06, 3.073364496231079e-07, 1.9073486328125e-06, 3.507360816001892e-06, 5.107372999191284e-06, 6.707385182380676e-06, 8.307397365570068e-06, 9.90740954875946e-06, 1.1507421731948853e-05, 1.3107433915138245e-05, 1.4707446098327637e-05, 1.630745828151703e-05, 1.790747046470642e-05, 1.9507482647895813e-05, 2.1107494831085205e-05, 2.2707507014274597e-05, 2.430751919746399e-05, 2.590753138065338e-05, 2.7507543563842773e-05, 2.9107555747032166e-05, 3.070756793022156e-05, 3.230758011341095e-05, 3.390759229660034e-05, 3.5507604479789734e-05, 3.7107616662979126e-05, 3.870762884616852e-05, 4.030764102935791e-05, 4.19076532125473e-05, 4.3507665395736694e-05, 4.5107677578926086e-05, 4.670768976211548e-05, 4.830770194530487e-05, 4.990771412849426e-05, 5.1507726311683655e-05, 5.310773849487305e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 4.0, 4.0, 5.0, 4.0, 6.0, 15.0, 17.0, 31.0, 37.0, 55.0, 88.0, 107.0, 244.0, 400.0, 653.0, 1136.0, 2068.0, 3510.0, 6068.0, 10495.0, 18178.0, 33487.0, 70791.0, 189853.0, 349267.0, 206077.0, 75658.0, 35019.0, 19071.0, 11145.0, 6373.0, 3589.0, 2131.0, 1237.0, 635.0, 393.0, 251.0, 151.0, 94.0, 69.0, 35.0, 28.0, 26.0, 19.0, 13.0, 6.0, 4.0, 8.0, 6.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.1583251953125, -0.1534595489501953, -0.14859390258789062, -0.14372825622558594, -0.13886260986328125, -0.13399696350097656, -0.12913131713867188, -0.12426567077636719, -0.1194000244140625, -0.11453437805175781, -0.10966873168945312, -0.10480308532714844, -0.09993743896484375, -0.09507179260253906, -0.09020614624023438, -0.08534049987792969, -0.080474853515625, -0.07560920715332031, -0.07074356079101562, -0.06587791442871094, -0.06101226806640625, -0.05614662170410156, -0.051280975341796875, -0.04641532897949219, -0.0415496826171875, -0.03668403625488281, -0.031818389892578125, -0.026952743530273438, -0.02208709716796875, -0.017221450805664062, -0.012355804443359375, -0.0074901580810546875, -0.00262451171875, 0.0022411346435546875, 0.007106781005859375, 0.011972427368164062, 0.01683807373046875, 0.021703720092773438, 0.026569366455078125, 0.03143501281738281, 0.0363006591796875, 0.04116630554199219, 0.046031951904296875, 0.05089759826660156, 0.05576324462890625, 0.06062889099121094, 0.06549453735351562, 0.07036018371582031, 0.075225830078125, 0.08009147644042969, 0.08495712280273438, 0.08982276916503906, 0.09468841552734375, 0.09955406188964844, 0.10441970825195312, 0.10928535461425781, 0.1141510009765625, 0.11901664733886719, 0.12388229370117188, 0.12874794006347656, 0.13361358642578125, 0.13847923278808594, 0.14334487915039062, 0.1482105255126953, 0.153076171875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 7.0, 5.0, 6.0, 8.0, 14.0, 10.0, 8.0, 27.0, 28.0, 27.0, 41.0, 74.0, 110.0, 110.0, 135.0, 101.0, 92.0, 50.0, 32.0, 37.0, 13.0, 15.0, 14.0, 7.0, 9.0, 7.0, 4.0, 5.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.271484375, -0.26436805725097656, -0.2572517395019531, -0.2501354217529297, -0.24301910400390625, -0.2359027862548828, -0.22878646850585938, -0.22167015075683594, -0.2145538330078125, -0.20743751525878906, -0.20032119750976562, -0.1932048797607422, -0.18608856201171875, -0.1789722442626953, -0.17185592651367188, -0.16473960876464844, -0.157623291015625, -0.15050697326660156, -0.14339065551757812, -0.1362743377685547, -0.12915802001953125, -0.12204170227050781, -0.11492538452148438, -0.10780906677246094, -0.1006927490234375, -0.09357643127441406, -0.08646011352539062, -0.07934379577636719, -0.07222747802734375, -0.06511116027832031, -0.057994842529296875, -0.05087852478027344, -0.04376220703125, -0.03664588928222656, -0.029529571533203125, -0.022413253784179688, -0.01529693603515625, -0.008180618286132812, -0.001064300537109375, 0.0060520172119140625, 0.0131683349609375, 0.020284652709960938, 0.027400970458984375, 0.03451728820800781, 0.04163360595703125, 0.04874992370605469, 0.055866241455078125, 0.06298255920410156, 0.070098876953125, 0.07721519470214844, 0.08433151245117188, 0.09144783020019531, 0.09856414794921875, 0.10568046569824219, 0.11279678344726562, 0.11991310119628906, 0.1270294189453125, 0.13414573669433594, 0.14126205444335938, 0.1483783721923828, 0.15549468994140625, 0.1626110076904297, 0.16972732543945312, 0.17684364318847656, 0.1839599609375]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 24.0, 134.0, 348.0, 336.0, 139.0, 31.0, 6.0], "bins": [-15.124217987060547, -14.872754096984863, -14.62129020690918, -14.369826316833496, -14.118362426757812, -13.866898536682129, -13.615434646606445, -13.363970756530762, -13.112506866455078, -12.861042976379395, -12.609579086303711, -12.358115196228027, -12.106651306152344, -11.85518741607666, -11.603723526000977, -11.352259635925293, -11.10079574584961, -10.849331855773926, -10.597867965698242, -10.346404075622559, -10.094940185546875, -9.843476295471191, -9.592012405395508, -9.340548515319824, -9.08908462524414, -8.837620735168457, -8.586156845092773, -8.33469295501709, -8.083229064941406, -7.831765174865723, -7.580301284790039, -7.3288373947143555, -7.07737398147583, -6.8259100914001465, -6.574446201324463, -6.322982311248779, -6.071518421173096, -5.820054531097412, -5.5685906410217285, -5.317126750946045, -5.065662860870361, -4.814198970794678, -4.562735080718994, -4.3112711906433105, -4.059807300567627, -3.8083434104919434, -3.5568795204162598, -3.305415630340576, -3.0539519786834717, -2.802488088607788, -2.5510241985321045, -2.299560308456421, -2.0480964183807373, -1.7966325283050537, -1.5451686382293701, -1.2937047481536865, -1.042240858078003, -0.7907769680023193, -0.5393130779266357, -0.28784918785095215, -0.036385297775268555, 0.21507859230041504, 0.46654248237609863, 0.7180063724517822, 0.9694703221321106]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 3.0, 3.0, 5.0, 1.0, 6.0, 8.0, 8.0, 6.0, 13.0, 22.0, 23.0, 29.0, 24.0, 29.0, 27.0, 36.0, 30.0, 44.0, 31.0, 45.0, 41.0, 37.0, 60.0, 43.0, 32.0, 44.0, 46.0, 36.0, 31.0, 36.0, 27.0, 33.0, 30.0, 20.0, 20.0, 24.0, 11.0, 15.0, 12.0, 4.0, 3.0, 0.0, 4.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.715909481048584, -1.6594817638397217, -1.6030539274215698, -1.5466262102127075, -1.4901983737945557, -1.4337706565856934, -1.377342939376831, -1.3209151029586792, -1.2644872665405273, -1.208059549331665, -1.1516317129135132, -1.0952039957046509, -1.038776159286499, -0.9823484420776367, -0.9259206652641296, -0.8694928884506226, -0.8130651712417603, -0.7566373944282532, -0.7002096176147461, -0.6437819004058838, -0.5873540639877319, -0.5309263467788696, -0.47449856996536255, -0.41807079315185547, -0.3616430163383484, -0.3052152395248413, -0.24878747761249542, -0.19235971570014954, -0.13593193888664246, -0.07950416207313538, -0.023076415061950684, 0.033351361751556396, 0.08977925777435303, 0.1462070345878601, 0.202634796500206, 0.2590625584125519, 0.31549033522605896, 0.37191811203956604, 0.42834585905075073, 0.4847736358642578, 0.5412014126777649, 0.597629189491272, 0.654056966304779, 0.7104847431182861, 0.7669124603271484, 0.8233402967453003, 0.8797680139541626, 0.9361957907676697, 0.9926235675811768, 1.049051284790039, 1.105479121208191, 1.1619068384170532, 1.218334674835205, 1.2747623920440674, 1.3311901092529297, 1.3876179456710815, 1.4440457820892334, 1.5004734992980957, 1.5569013357162476, 1.6133290529251099, 1.6697568893432617, 1.726184606552124, 1.7826123237609863, 1.8390401601791382, 1.8954678773880005]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 10.0, 4.0, 4.0, 7.0, 15.0, 21.0, 21.0, 28.0, 33.0, 78.0, 84.0, 125.0, 206.0, 299.0, 489.0, 853.0, 1533.0, 2889.0, 5778.0, 13143.0, 33355.0, 99079.0, 378084.0, 2407276.0, 959262.0, 195555.0, 57427.0, 20892.0, 8749.0, 4122.0, 2124.0, 1075.0, 638.0, 364.0, 231.0, 143.0, 69.0, 72.0, 32.0, 40.0, 20.0, 17.0, 14.0, 10.0, 9.0, 7.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.394287109375, -0.3829460144042969, -0.37160491943359375, -0.3602638244628906, -0.3489227294921875, -0.3375816345214844, -0.32624053955078125, -0.3148994445800781, -0.303558349609375, -0.2922172546386719, -0.28087615966796875, -0.2695350646972656, -0.2581939697265625, -0.24685287475585938, -0.23551177978515625, -0.22417068481445312, -0.21282958984375, -0.20148849487304688, -0.19014739990234375, -0.17880630493164062, -0.1674652099609375, -0.15612411499023438, -0.14478302001953125, -0.13344192504882812, -0.122100830078125, -0.11075973510742188, -0.09941864013671875, -0.08807754516601562, -0.0767364501953125, -0.06539535522460938, -0.05405426025390625, -0.042713165283203125, -0.0313720703125, -0.020030975341796875, -0.00868988037109375, 0.002651214599609375, 0.0139923095703125, 0.025333404541015625, 0.03667449951171875, 0.048015594482421875, 0.059356689453125, 0.07069778442382812, 0.08203887939453125, 0.09337997436523438, 0.1047210693359375, 0.11606216430664062, 0.12740325927734375, 0.13874435424804688, 0.15008544921875, 0.16142654418945312, 0.17276763916015625, 0.18410873413085938, 0.1954498291015625, 0.20679092407226562, 0.21813201904296875, 0.22947311401367188, 0.240814208984375, 0.2521553039550781, 0.26349639892578125, 0.2748374938964844, 0.2861785888671875, 0.2975196838378906, 0.30886077880859375, 0.3202018737792969, 0.33154296875]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 4.0, 5.0, 5.0, 6.0, 5.0, 8.0, 13.0, 9.0, 18.0, 12.0, 17.0, 19.0, 18.0, 23.0, 19.0, 19.0, 35.0, 49.0, 33.0, 37.0, 27.0, 39.0, 36.0, 41.0, 49.0, 36.0, 37.0, 44.0, 34.0, 43.0, 33.0, 35.0, 30.0, 21.0, 22.0, 21.0, 23.0, 15.0, 17.0, 14.0, 12.0, 7.0, 7.0, 1.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1697998046875, -0.16424942016601562, -0.15869903564453125, -0.15314865112304688, -0.1475982666015625, -0.14204788208007812, -0.13649749755859375, -0.13094711303710938, -0.125396728515625, -0.11984634399414062, -0.11429595947265625, -0.10874557495117188, -0.1031951904296875, -0.09764480590820312, -0.09209442138671875, -0.08654403686523438, -0.08099365234375, -0.07544326782226562, -0.06989288330078125, -0.06434249877929688, -0.0587921142578125, -0.053241729736328125, -0.04769134521484375, -0.042140960693359375, -0.036590576171875, -0.031040191650390625, -0.02548980712890625, -0.019939422607421875, -0.0143890380859375, -0.008838653564453125, -0.00328826904296875, 0.002262115478515625, 0.0078125, 0.013362884521484375, 0.01891326904296875, 0.024463653564453125, 0.0300140380859375, 0.035564422607421875, 0.04111480712890625, 0.046665191650390625, 0.052215576171875, 0.057765960693359375, 0.06331634521484375, 0.06886672973632812, 0.0744171142578125, 0.07996749877929688, 0.08551788330078125, 0.09106826782226562, 0.09661865234375, 0.10216903686523438, 0.10771942138671875, 0.11326980590820312, 0.1188201904296875, 0.12437057495117188, 0.12992095947265625, 0.13547134399414062, 0.141021728515625, 0.14657211303710938, 0.15212249755859375, 0.15767288208007812, 0.1632232666015625, 0.16877365112304688, 0.17432403564453125, 0.17987442016601562, 0.1854248046875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 5.0, 11.0, 9.0, 23.0, 27.0, 54.0, 76.0, 73.0, 136.0, 185.0, 293.0, 459.0, 731.0, 1320.0, 2407.0, 4436.0, 9047.0, 20265.0, 49264.0, 135658.0, 437023.0, 1942298.0, 1142996.0, 287203.0, 94612.0, 35591.0, 14922.0, 7047.0, 3477.0, 1829.0, 1100.0, 580.0, 343.0, 253.0, 170.0, 111.0, 75.0, 43.0, 33.0, 31.0, 19.0, 14.0, 10.0, 9.0, 2.0, 5.0, 6.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.46923828125, -0.4549446105957031, -0.44065093994140625, -0.4263572692871094, -0.4120635986328125, -0.3977699279785156, -0.38347625732421875, -0.3691825866699219, -0.354888916015625, -0.3405952453613281, -0.32630157470703125, -0.3120079040527344, -0.2977142333984375, -0.2834205627441406, -0.26912689208984375, -0.2548332214355469, -0.24053955078125, -0.22624588012695312, -0.21195220947265625, -0.19765853881835938, -0.1833648681640625, -0.16907119750976562, -0.15477752685546875, -0.14048385620117188, -0.126190185546875, -0.11189651489257812, -0.09760284423828125, -0.08330917358398438, -0.0690155029296875, -0.054721832275390625, -0.04042816162109375, -0.026134490966796875, -0.0118408203125, 0.002452850341796875, 0.01674652099609375, 0.031040191650390625, 0.0453338623046875, 0.059627532958984375, 0.07392120361328125, 0.08821487426757812, 0.102508544921875, 0.11680221557617188, 0.13109588623046875, 0.14538955688476562, 0.1596832275390625, 0.17397689819335938, 0.18827056884765625, 0.20256423950195312, 0.21685791015625, 0.23115158081054688, 0.24544525146484375, 0.2597389221191406, 0.2740325927734375, 0.2883262634277344, 0.30261993408203125, 0.3169136047363281, 0.331207275390625, 0.3455009460449219, 0.35979461669921875, 0.3740882873535156, 0.3883819580078125, 0.4026756286621094, 0.41696929931640625, 0.4312629699707031, 0.445556640625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 1.0, 7.0, 3.0, 4.0, 7.0, 10.0, 8.0, 15.0, 14.0, 28.0, 30.0, 51.0, 84.0, 93.0, 100.0, 188.0, 287.0, 440.0, 665.0, 698.0, 393.0, 247.0, 189.0, 138.0, 83.0, 82.0, 61.0, 50.0, 29.0, 20.0, 13.0, 12.0, 9.0, 5.0, 4.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.4296875, -0.4177398681640625, -0.405792236328125, -0.3938446044921875, -0.38189697265625, -0.3699493408203125, -0.358001708984375, -0.3460540771484375, -0.3341064453125, -0.3221588134765625, -0.310211181640625, -0.2982635498046875, -0.28631591796875, -0.2743682861328125, -0.262420654296875, -0.2504730224609375, -0.238525390625, -0.2265777587890625, -0.214630126953125, -0.2026824951171875, -0.19073486328125, -0.1787872314453125, -0.166839599609375, -0.1548919677734375, -0.1429443359375, -0.1309967041015625, -0.119049072265625, -0.1071014404296875, -0.09515380859375, -0.0832061767578125, -0.071258544921875, -0.0593109130859375, -0.04736328125, -0.0354156494140625, -0.023468017578125, -0.0115203857421875, 0.00042724609375, 0.0123748779296875, 0.024322509765625, 0.0362701416015625, 0.0482177734375, 0.0601654052734375, 0.072113037109375, 0.0840606689453125, 0.09600830078125, 0.1079559326171875, 0.119903564453125, 0.1318511962890625, 0.143798828125, 0.1557464599609375, 0.167694091796875, 0.1796417236328125, 0.19158935546875, 0.2035369873046875, 0.215484619140625, 0.2274322509765625, 0.2393798828125, 0.2513275146484375, 0.263275146484375, 0.2752227783203125, 0.28717041015625, 0.2991180419921875, 0.311065673828125, 0.3230133056640625, 0.3349609375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 5.0, 4.0, 3.0, 9.0, 8.0, 11.0, 15.0, 20.0, 23.0, 39.0, 51.0, 57.0, 63.0, 69.0, 68.0, 81.0, 89.0, 63.0, 66.0, 53.0, 43.0, 43.0, 28.0, 26.0, 24.0, 15.0, 10.0, 3.0, 4.0, 7.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4491184949874878, -1.4029057025909424, -1.3566927909851074, -1.310479998588562, -1.264267086982727, -1.2180542945861816, -1.1718413829803467, -1.1256285905838013, -1.0794157981872559, -1.0332030057907104, -0.9869900941848755, -0.9407773017883301, -0.8945643901824951, -0.8483515977859497, -0.8021387457847595, -0.7559258937835693, -0.7097129821777344, -0.6635001301765442, -0.617287278175354, -0.5710744857788086, -0.5248615741729736, -0.47864875197410583, -0.43243592977523804, -0.38622307777404785, -0.34001022577285767, -0.2937973737716675, -0.2475845366716385, -0.2013716995716095, -0.1551588475704193, -0.10894599556922913, -0.06273317337036133, -0.016520321369171143, 0.029692411422729492, 0.07590525597333908, 0.12211810052394867, 0.16833093762397766, 0.21454378962516785, 0.26075664162635803, 0.30696946382522583, 0.353182315826416, 0.3993951678276062, 0.4456080198287964, 0.4918208718299866, 0.5380337238311768, 0.5842465162277222, 0.6304594278335571, 0.6766722202301025, 0.7228850722312927, 0.7690979242324829, 0.8153107762336731, 0.8615236282348633, 0.9077364206314087, 0.9539493322372437, 1.000162124633789, 1.046375036239624, 1.0925878286361694, 1.1388006210327148, 1.1850134134292603, 1.2312263250350952, 1.2774391174316406, 1.3236520290374756, 1.369864821434021, 1.4160776138305664, 1.4622905254364014, 1.5085034370422363]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 5.0, 2.0, 7.0, 5.0, 6.0, 11.0, 7.0, 15.0, 14.0, 13.0, 16.0, 13.0, 23.0, 26.0, 30.0, 17.0, 26.0, 33.0, 38.0, 32.0, 37.0, 34.0, 27.0, 33.0, 39.0, 34.0, 35.0, 36.0, 41.0, 30.0, 36.0, 32.0, 28.0, 28.0, 21.0, 33.0, 20.0, 21.0, 15.0, 13.0, 16.0, 16.0, 10.0, 11.0, 4.0, 1.0, 6.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0], "bins": [-1.1801522970199585, -1.1458258628845215, -1.111499547958374, -1.077173113822937, -1.0428466796875, -1.008520245552063, -0.9741938710212708, -0.9398674964904785, -0.9055410623550415, -0.8712146282196045, -0.8368882536888123, -0.80256187915802, -0.768235445022583, -0.733909010887146, -0.6995826363563538, -0.6652562618255615, -0.6309298276901245, -0.5966033935546875, -0.5622770190238953, -0.527950644493103, -0.493624210357666, -0.4592978060245514, -0.42497140169143677, -0.39064499735832214, -0.3563185930252075, -0.3219921886920929, -0.28766578435897827, -0.25333938002586365, -0.21901297569274902, -0.1846865713596344, -0.15036016702651978, -0.11603376269340515, -0.08170723915100098, -0.04738083481788635, -0.013054430484771729, 0.021271973848342896, 0.05559837818145752, 0.08992478251457214, 0.12425118684768677, 0.1585775911808014, 0.19290399551391602, 0.22723039984703064, 0.26155680418014526, 0.2958832085132599, 0.3302096128463745, 0.36453601717948914, 0.39886242151260376, 0.4331888258457184, 0.467515230178833, 0.50184166431427, 0.5361680388450623, 0.5704944133758545, 0.6048208475112915, 0.6391472816467285, 0.6734736561775208, 0.707800030708313, 0.74212646484375, 0.776452898979187, 0.8107792735099792, 0.8451056480407715, 0.8794320821762085, 0.9137585163116455, 0.9480848908424377, 0.98241126537323, 1.016737699508667]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 6.0, 8.0, 6.0, 11.0, 24.0, 23.0, 38.0, 60.0, 86.0, 163.0, 217.0, 300.0, 457.0, 629.0, 998.0, 1546.0, 2440.0, 3747.0, 5756.0, 8936.0, 14311.0, 22924.0, 38940.0, 69606.0, 128535.0, 216481.0, 221050.0, 133899.0, 71577.0, 40726.0, 24060.0, 14749.0, 9252.0, 5952.0, 3815.0, 2417.0, 1591.0, 1106.0, 709.0, 473.0, 292.0, 216.0, 134.0, 86.0, 69.0, 38.0, 19.0, 32.0, 12.0, 20.0, 9.0, 1.0, 4.0, 2.0, 1.0, 1.0, 3.0], "bins": [-0.253662109375, -0.24598312377929688, -0.23830413818359375, -0.23062515258789062, -0.2229461669921875, -0.21526718139648438, -0.20758819580078125, -0.19990921020507812, -0.192230224609375, -0.18455123901367188, -0.17687225341796875, -0.16919326782226562, -0.1615142822265625, -0.15383529663085938, -0.14615631103515625, -0.13847732543945312, -0.13079833984375, -0.12311935424804688, -0.11544036865234375, -0.10776138305664062, -0.1000823974609375, -0.09240341186523438, -0.08472442626953125, -0.07704544067382812, -0.069366455078125, -0.061687469482421875, -0.05400848388671875, -0.046329498291015625, -0.0386505126953125, -0.030971527099609375, -0.02329254150390625, -0.015613555908203125, -0.0079345703125, -0.000255584716796875, 0.00742340087890625, 0.015102386474609375, 0.0227813720703125, 0.030460357666015625, 0.03813934326171875, 0.045818328857421875, 0.053497314453125, 0.061176300048828125, 0.06885528564453125, 0.07653427124023438, 0.0842132568359375, 0.09189224243164062, 0.09957122802734375, 0.10725021362304688, 0.11492919921875, 0.12260818481445312, 0.13028717041015625, 0.13796615600585938, 0.1456451416015625, 0.15332412719726562, 0.16100311279296875, 0.16868209838867188, 0.176361083984375, 0.18404006958007812, 0.19171905517578125, 0.19939804077148438, 0.2070770263671875, 0.21475601196289062, 0.22243499755859375, 0.23011398315429688, 0.23779296875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 8.0, 3.0, 8.0, 15.0, 28.0, 17.0, 21.0, 25.0, 26.0, 25.0, 43.0, 44.0, 49.0, 61.0, 52.0, 48.0, 47.0, 55.0, 43.0, 44.0, 44.0, 57.0, 44.0, 29.0, 30.0, 31.0, 15.0, 27.0, 19.0, 11.0, 12.0, 11.0, 7.0, 4.0, 1.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2587890625, -0.2511253356933594, -0.24346160888671875, -0.23579788208007812, -0.2281341552734375, -0.22047042846679688, -0.21280670166015625, -0.20514297485351562, -0.197479248046875, -0.18981552124023438, -0.18215179443359375, -0.17448806762695312, -0.1668243408203125, -0.15916061401367188, -0.15149688720703125, -0.14383316040039062, -0.13616943359375, -0.12850570678710938, -0.12084197998046875, -0.11317825317382812, -0.1055145263671875, -0.09785079956054688, -0.09018707275390625, -0.08252334594726562, -0.074859619140625, -0.06719589233398438, -0.05953216552734375, -0.051868438720703125, -0.0442047119140625, -0.036540985107421875, -0.02887725830078125, -0.021213531494140625, -0.0135498046875, -0.005886077880859375, 0.00177764892578125, 0.009441375732421875, 0.0171051025390625, 0.024768829345703125, 0.03243255615234375, 0.040096282958984375, 0.047760009765625, 0.055423736572265625, 0.06308746337890625, 0.07075119018554688, 0.0784149169921875, 0.08607864379882812, 0.09374237060546875, 0.10140609741210938, 0.10906982421875, 0.11673355102539062, 0.12439727783203125, 0.13206100463867188, 0.1397247314453125, 0.14738845825195312, 0.15505218505859375, 0.16271591186523438, 0.170379638671875, 0.17804336547851562, 0.18570709228515625, 0.19337081909179688, 0.2010345458984375, 0.20869827270507812, 0.21636199951171875, 0.22402572631835938, 0.231689453125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 2.0, 5.0, 7.0, 6.0, 13.0, 11.0, 17.0, 31.0, 33.0, 59.0, 98.0, 236.0, 1198.0, 8968.0, 94532.0, 758657.0, 168006.0, 14232.0, 1781.0, 335.0, 113.0, 63.0, 35.0, 35.0, 25.0, 21.0, 11.0, 13.0, 3.0, 1.0, 9.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8642578125, -0.829132080078125, -0.79400634765625, -0.758880615234375, -0.7237548828125, -0.688629150390625, -0.65350341796875, -0.618377685546875, -0.583251953125, -0.548126220703125, -0.51300048828125, -0.477874755859375, -0.4427490234375, -0.407623291015625, -0.37249755859375, -0.337371826171875, -0.30224609375, -0.267120361328125, -0.23199462890625, -0.196868896484375, -0.1617431640625, -0.126617431640625, -0.09149169921875, -0.056365966796875, -0.021240234375, 0.013885498046875, 0.04901123046875, 0.084136962890625, 0.1192626953125, 0.154388427734375, 0.18951416015625, 0.224639892578125, 0.259765625, 0.294891357421875, 0.33001708984375, 0.365142822265625, 0.4002685546875, 0.435394287109375, 0.47052001953125, 0.505645751953125, 0.540771484375, 0.575897216796875, 0.61102294921875, 0.646148681640625, 0.6812744140625, 0.716400146484375, 0.75152587890625, 0.786651611328125, 0.82177734375, 0.856903076171875, 0.89202880859375, 0.927154541015625, 0.9622802734375, 0.997406005859375, 1.03253173828125, 1.067657470703125, 1.102783203125, 1.137908935546875, 1.17303466796875, 1.208160400390625, 1.2432861328125, 1.278411865234375, 1.31353759765625, 1.348663330078125, 1.3837890625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 6.0, 3.0, 6.0, 4.0, 13.0, 10.0, 18.0, 15.0, 17.0, 31.0, 29.0, 37.0, 39.0, 39.0, 51.0, 53.0, 39.0, 63.0, 46.0, 58.0, 46.0, 63.0, 43.0, 36.0, 40.0, 40.0, 34.0, 34.0, 19.0, 20.0, 15.0, 10.0, 7.0, 10.0, 10.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8466796875, -0.8231201171875, -0.799560546875, -0.7760009765625, -0.75244140625, -0.7288818359375, -0.705322265625, -0.6817626953125, -0.658203125, -0.6346435546875, -0.611083984375, -0.5875244140625, -0.56396484375, -0.5404052734375, -0.516845703125, -0.4932861328125, -0.4697265625, -0.4461669921875, -0.422607421875, -0.3990478515625, -0.37548828125, -0.3519287109375, -0.328369140625, -0.3048095703125, -0.28125, -0.2576904296875, -0.234130859375, -0.2105712890625, -0.18701171875, -0.1634521484375, -0.139892578125, -0.1163330078125, -0.0927734375, -0.0692138671875, -0.045654296875, -0.0220947265625, 0.00146484375, 0.0250244140625, 0.048583984375, 0.0721435546875, 0.095703125, 0.1192626953125, 0.142822265625, 0.1663818359375, 0.18994140625, 0.2135009765625, 0.237060546875, 0.2606201171875, 0.2841796875, 0.3077392578125, 0.331298828125, 0.3548583984375, 0.37841796875, 0.4019775390625, 0.425537109375, 0.4490966796875, 0.47265625, 0.4962158203125, 0.519775390625, 0.5433349609375, 0.56689453125, 0.5904541015625, 0.614013671875, 0.6375732421875, 0.6611328125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 3.0, 10.0, 15.0, 26.0, 34.0, 51.0, 102.0, 187.0, 350.0, 630.0, 1254.0, 3004.0, 7946.0, 24359.0, 78353.0, 337745.0, 445651.0, 101692.0, 30617.0, 9922.0, 3470.0, 1514.0, 736.0, 373.0, 224.0, 116.0, 68.0, 48.0, 25.0, 9.0, 9.0, 7.0, 4.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.429443359375, -0.4184608459472656, -0.40747833251953125, -0.3964958190917969, -0.3855133056640625, -0.3745307922363281, -0.36354827880859375, -0.3525657653808594, -0.341583251953125, -0.3306007385253906, -0.31961822509765625, -0.3086357116699219, -0.2976531982421875, -0.2866706848144531, -0.27568817138671875, -0.2647056579589844, -0.25372314453125, -0.24274063110351562, -0.23175811767578125, -0.22077560424804688, -0.2097930908203125, -0.19881057739257812, -0.18782806396484375, -0.17684555053710938, -0.165863037109375, -0.15488052368164062, -0.14389801025390625, -0.13291549682617188, -0.1219329833984375, -0.11095046997070312, -0.09996795654296875, -0.08898544311523438, -0.0780029296875, -0.06702041625976562, -0.05603790283203125, -0.045055389404296875, -0.0340728759765625, -0.023090362548828125, -0.01210784912109375, -0.001125335693359375, 0.009857177734375, 0.020839691162109375, 0.03182220458984375, 0.042804718017578125, 0.0537872314453125, 0.06476974487304688, 0.07575225830078125, 0.08673477172851562, 0.09771728515625, 0.10869979858398438, 0.11968231201171875, 0.13066482543945312, 0.1416473388671875, 0.15262985229492188, 0.16361236572265625, 0.17459487915039062, 0.185577392578125, 0.19655990600585938, 0.20754241943359375, 0.21852493286132812, 0.2295074462890625, 0.24048995971679688, 0.25147247314453125, 0.2624549865722656, 0.2734375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 7.0, 2.0, 6.0, 5.0, 11.0, 13.0, 19.0, 22.0, 34.0, 38.0, 54.0, 98.0, 120.0, 135.0, 108.0, 85.0, 57.0, 50.0, 32.0, 19.0, 25.0, 15.0, 16.0, 6.0, 2.0, 5.0, 2.0, 6.0, 3.0, 5.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5703182220458984e-05, -3.396812826395035e-05, -3.223307430744171e-05, -3.0498020350933075e-05, -2.876296639442444e-05, -2.7027912437915802e-05, -2.5292858481407166e-05, -2.355780452489853e-05, -2.1822750568389893e-05, -2.0087696611881256e-05, -1.835264265537262e-05, -1.6617588698863983e-05, -1.4882534742355347e-05, -1.314748078584671e-05, -1.1412426829338074e-05, -9.677372872829437e-06, -7.9423189163208e-06, -6.207264959812164e-06, -4.472211003303528e-06, -2.7371570467948914e-06, -1.0021030902862549e-06, 7.329508662223816e-07, 2.468004822731018e-06, 4.2030587792396545e-06, 5.938112735748291e-06, 7.673166692256927e-06, 9.408220648765564e-06, 1.11432746052742e-05, 1.2878328561782837e-05, 1.4613382518291473e-05, 1.634843647480011e-05, 1.8083490431308746e-05, 1.9818544387817383e-05, 2.155359834432602e-05, 2.3288652300834656e-05, 2.5023706257343292e-05, 2.675876021385193e-05, 2.8493814170360565e-05, 3.02288681268692e-05, 3.196392208337784e-05, 3.3698976039886475e-05, 3.543402999639511e-05, 3.716908395290375e-05, 3.8904137909412384e-05, 4.063919186592102e-05, 4.237424582242966e-05, 4.4109299778938293e-05, 4.584435373544693e-05, 4.7579407691955566e-05, 4.93144616484642e-05, 5.104951560497284e-05, 5.2784569561481476e-05, 5.451962351799011e-05, 5.625467747449875e-05, 5.7989731431007385e-05, 5.972478538751602e-05, 6.145983934402466e-05, 6.31948933005333e-05, 6.492994725704193e-05, 6.666500121355057e-05, 6.84000551700592e-05, 7.013510912656784e-05, 7.187016308307648e-05, 7.360521703958511e-05, 7.534027099609375e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 2.0, 5.0, 8.0, 16.0, 17.0, 30.0, 41.0, 77.0, 162.0, 378.0, 1346.0, 8673.0, 100631.0, 830271.0, 96427.0, 8512.0, 1322.0, 345.0, 118.0, 46.0, 45.0, 36.0, 20.0, 13.0, 3.0, 7.0, 5.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8583984375, -0.8335113525390625, -0.808624267578125, -0.7837371826171875, -0.75885009765625, -0.7339630126953125, -0.709075927734375, -0.6841888427734375, -0.6593017578125, -0.6344146728515625, -0.609527587890625, -0.5846405029296875, -0.55975341796875, -0.5348663330078125, -0.509979248046875, -0.4850921630859375, -0.460205078125, -0.4353179931640625, -0.410430908203125, -0.3855438232421875, -0.36065673828125, -0.3357696533203125, -0.310882568359375, -0.2859954833984375, -0.2611083984375, -0.2362213134765625, -0.211334228515625, -0.1864471435546875, -0.16156005859375, -0.1366729736328125, -0.111785888671875, -0.0868988037109375, -0.06201171875, -0.0371246337890625, -0.012237548828125, 0.0126495361328125, 0.03753662109375, 0.0624237060546875, 0.087310791015625, 0.1121978759765625, 0.1370849609375, 0.1619720458984375, 0.186859130859375, 0.2117462158203125, 0.23663330078125, 0.2615203857421875, 0.286407470703125, 0.3112945556640625, 0.336181640625, 0.3610687255859375, 0.385955810546875, 0.4108428955078125, 0.43572998046875, 0.4606170654296875, 0.485504150390625, 0.5103912353515625, 0.5352783203125, 0.5601654052734375, 0.585052490234375, 0.6099395751953125, 0.63482666015625, 0.6597137451171875, 0.684600830078125, 0.7094879150390625, 0.734375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 12.0, 15.0, 25.0, 25.0, 66.0, 124.0, 244.0, 228.0, 114.0, 55.0, 41.0, 27.0, 15.0, 6.0, 8.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26611328125, -0.24570465087890625, -0.2252960205078125, -0.20488739013671875, -0.184478759765625, -0.16407012939453125, -0.1436614990234375, -0.12325286865234375, -0.10284423828125, -0.08243560791015625, -0.0620269775390625, -0.04161834716796875, -0.021209716796875, -0.00080108642578125, 0.0196075439453125, 0.04001617431640625, 0.0604248046875, 0.08083343505859375, 0.1012420654296875, 0.12165069580078125, 0.142059326171875, 0.16246795654296875, 0.1828765869140625, 0.20328521728515625, 0.22369384765625, 0.24410247802734375, 0.2645111083984375, 0.28491973876953125, 0.305328369140625, 0.32573699951171875, 0.3461456298828125, 0.36655426025390625, 0.386962890625, 0.40737152099609375, 0.4277801513671875, 0.44818878173828125, 0.468597412109375, 0.48900604248046875, 0.5094146728515625, 0.5298233032226562, 0.55023193359375, 0.5706405639648438, 0.5910491943359375, 0.6114578247070312, 0.631866455078125, 0.6522750854492188, 0.6726837158203125, 0.6930923461914062, 0.7135009765625, 0.7339096069335938, 0.7543182373046875, 0.7747268676757812, 0.795135498046875, 0.8155441284179688, 0.8359527587890625, 0.8563613891601562, 0.87677001953125, 0.8971786499023438, 0.9175872802734375, 0.9379959106445312, 0.958404541015625, 0.9788131713867188, 0.9992218017578125, 1.0196304321289062, 1.0400390625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 9.0, 76.0, 364.0, 448.0, 95.0, 20.0, 2.0, 1.0], "bins": [-22.437585830688477, -22.0572566986084, -21.67692756652832, -21.296598434448242, -20.916269302368164, -20.535940170288086, -20.155611038208008, -19.77528190612793, -19.39495277404785, -19.014623641967773, -18.634294509887695, -18.253965377807617, -17.87363624572754, -17.49330711364746, -17.112977981567383, -16.732648849487305, -16.352319717407227, -15.971990585327148, -15.59166145324707, -15.211332321166992, -14.831003189086914, -14.450674057006836, -14.070344924926758, -13.69001579284668, -13.309685707092285, -12.929356575012207, -12.549027442932129, -12.16869831085205, -11.788369178771973, -11.408040046691895, -11.027710914611816, -10.647381782531738, -10.267051696777344, -9.886722564697266, -9.506393432617188, -9.12606430053711, -8.745735168457031, -8.365406036376953, -7.985076904296875, -7.604747772216797, -7.224418640136719, -6.844089508056641, -6.4637603759765625, -6.083431243896484, -5.703102111816406, -5.322772979736328, -4.94244384765625, -4.562114715576172, -4.1817851066589355, -3.8014559745788574, -3.4211268424987793, -3.040797710418701, -2.660468578338623, -2.280139446258545, -1.8998100757598877, -1.5194809436798096, -1.139151930809021, -0.7588227987289429, -0.37849360704421997, 0.0018355846405029297, 0.38216471672058105, 0.7624938488006592, 1.1428231000900269, 1.523152232170105, 1.903481364250183]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 4.0, 5.0, 7.0, 12.0, 14.0, 14.0, 15.0, 17.0, 24.0, 17.0, 21.0, 24.0, 21.0, 29.0, 25.0, 48.0, 40.0, 50.0, 46.0, 61.0, 45.0, 42.0, 41.0, 46.0, 40.0, 43.0, 32.0, 31.0, 32.0, 37.0, 23.0, 21.0, 14.0, 13.0, 12.0, 10.0, 11.0, 4.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7485711574554443, -1.6887950897216797, -1.6290191411972046, -1.56924307346344, -1.5094671249389648, -1.4496910572052002, -1.3899149894714355, -1.330138921737671, -1.2703629732131958, -1.2105869054794312, -1.150810956954956, -1.0910348892211914, -1.0312588214874268, -0.9714828729629517, -0.911706805229187, -0.8519307971000671, -0.7921547889709473, -0.7323787808418274, -0.6726027727127075, -0.6128267049789429, -0.553050696849823, -0.4932746887207031, -0.43349865078926086, -0.3737226128578186, -0.31394660472869873, -0.25417059659957886, -0.1943945586681366, -0.13461853563785553, -0.07484251260757446, -0.01506650447845459, 0.04470953345298767, 0.10448557138442993, 0.1642615795135498, 0.22403760254383087, 0.28381362557411194, 0.3435896635055542, 0.4033656716346741, 0.46314167976379395, 0.5229177474975586, 0.5826937556266785, 0.6424697637557983, 0.7022457718849182, 0.7620217800140381, 0.8217978477478027, 0.8815738558769226, 0.9413498640060425, 1.0011259317398071, 1.0609018802642822, 1.1206779479980469, 1.1804540157318115, 1.2402299642562866, 1.3000060319900513, 1.3597819805145264, 1.419558048248291, 1.4793341159820557, 1.5391101837158203, 1.5988861322402954, 1.65866219997406, 1.7184381484985352, 1.7782142162322998, 1.8379902839660645, 1.8977662324905396, 1.9575423002243042, 2.0173182487487793, 2.077094316482544]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 7.0, 3.0, 3.0, 11.0, 7.0, 15.0, 12.0, 16.0, 19.0, 29.0, 34.0, 45.0, 85.0, 100.0, 204.0, 288.0, 516.0, 1071.0, 1971.0, 4448.0, 10876.0, 32033.0, 118574.0, 720557.0, 2809422.0, 382013.0, 75701.0, 22064.0, 7805.0, 3176.0, 1433.0, 715.0, 369.0, 210.0, 153.0, 89.0, 59.0, 37.0, 26.0, 23.0, 18.0, 16.0, 12.0, 8.0, 7.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.607421875, -0.5897369384765625, -0.572052001953125, -0.5543670654296875, -0.53668212890625, -0.5189971923828125, -0.501312255859375, -0.4836273193359375, -0.4659423828125, -0.4482574462890625, -0.430572509765625, -0.4128875732421875, -0.39520263671875, -0.3775177001953125, -0.359832763671875, -0.3421478271484375, -0.324462890625, -0.3067779541015625, -0.289093017578125, -0.2714080810546875, -0.25372314453125, -0.2360382080078125, -0.218353271484375, -0.2006683349609375, -0.1829833984375, -0.1652984619140625, -0.147613525390625, -0.1299285888671875, -0.11224365234375, -0.0945587158203125, -0.076873779296875, -0.0591888427734375, -0.04150390625, -0.0238189697265625, -0.006134033203125, 0.0115509033203125, 0.02923583984375, 0.0469207763671875, 0.064605712890625, 0.0822906494140625, 0.0999755859375, 0.1176605224609375, 0.135345458984375, 0.1530303955078125, 0.17071533203125, 0.1884002685546875, 0.206085205078125, 0.2237701416015625, 0.241455078125, 0.2591400146484375, 0.276824951171875, 0.2945098876953125, 0.31219482421875, 0.3298797607421875, 0.347564697265625, 0.3652496337890625, 0.3829345703125, 0.4006195068359375, 0.418304443359375, 0.4359893798828125, 0.45367431640625, 0.4713592529296875, 0.489044189453125, 0.5067291259765625, 0.5244140625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 3.0, 5.0, 11.0, 8.0, 6.0, 15.0, 13.0, 11.0, 18.0, 21.0, 24.0, 24.0, 23.0, 34.0, 25.0, 38.0, 31.0, 37.0, 43.0, 44.0, 50.0, 55.0, 46.0, 42.0, 38.0, 36.0, 24.0, 40.0, 34.0, 31.0, 32.0, 19.0, 19.0, 19.0, 17.0, 7.0, 11.0, 16.0, 5.0, 4.0, 6.0, 8.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.185302734375, -0.17938232421875, -0.1734619140625, -0.16754150390625, -0.16162109375, -0.15570068359375, -0.1497802734375, -0.14385986328125, -0.137939453125, -0.13201904296875, -0.1260986328125, -0.12017822265625, -0.1142578125, -0.10833740234375, -0.1024169921875, -0.09649658203125, -0.090576171875, -0.08465576171875, -0.0787353515625, -0.07281494140625, -0.06689453125, -0.06097412109375, -0.0550537109375, -0.04913330078125, -0.043212890625, -0.03729248046875, -0.0313720703125, -0.02545166015625, -0.01953125, -0.01361083984375, -0.0076904296875, -0.00177001953125, 0.004150390625, 0.01007080078125, 0.0159912109375, 0.02191162109375, 0.02783203125, 0.03375244140625, 0.0396728515625, 0.04559326171875, 0.051513671875, 0.05743408203125, 0.0633544921875, 0.06927490234375, 0.0751953125, 0.08111572265625, 0.0870361328125, 0.09295654296875, 0.098876953125, 0.10479736328125, 0.1107177734375, 0.11663818359375, 0.12255859375, 0.12847900390625, 0.1343994140625, 0.14031982421875, 0.146240234375, 0.15216064453125, 0.1580810546875, 0.16400146484375, 0.169921875, 0.17584228515625, 0.1817626953125, 0.18768310546875, 0.193603515625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 8.0, 5.0, 11.0, 17.0, 15.0, 16.0, 23.0, 39.0, 54.0, 110.0, 167.0, 252.0, 488.0, 845.0, 1674.0, 3468.0, 7543.0, 17850.0, 46198.0, 136530.0, 491279.0, 2121454.0, 1002984.0, 239745.0, 74749.0, 27627.0, 11076.0, 5095.0, 2325.0, 1155.0, 598.0, 355.0, 177.0, 125.0, 65.0, 55.0, 37.0, 20.0, 14.0, 11.0, 6.0, 10.0, 3.0, 3.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.469970703125, -0.4546775817871094, -0.43938446044921875, -0.4240913391113281, -0.4087982177734375, -0.3935050964355469, -0.37821197509765625, -0.3629188537597656, -0.347625732421875, -0.3323326110839844, -0.31703948974609375, -0.3017463684082031, -0.2864532470703125, -0.2711601257324219, -0.25586700439453125, -0.24057388305664062, -0.22528076171875, -0.20998764038085938, -0.19469451904296875, -0.17940139770507812, -0.1641082763671875, -0.14881515502929688, -0.13352203369140625, -0.11822891235351562, -0.102935791015625, -0.08764266967773438, -0.07234954833984375, -0.057056427001953125, -0.0417633056640625, -0.026470184326171875, -0.01117706298828125, 0.004116058349609375, 0.0194091796875, 0.034702301025390625, 0.04999542236328125, 0.06528854370117188, 0.0805816650390625, 0.09587478637695312, 0.11116790771484375, 0.12646102905273438, 0.141754150390625, 0.15704727172851562, 0.17234039306640625, 0.18763351440429688, 0.2029266357421875, 0.21821975708007812, 0.23351287841796875, 0.24880599975585938, 0.26409912109375, 0.2793922424316406, 0.29468536376953125, 0.3099784851074219, 0.3252716064453125, 0.3405647277832031, 0.35585784912109375, 0.3711509704589844, 0.386444091796875, 0.4017372131347656, 0.41703033447265625, 0.4323234558105469, 0.4476165771484375, 0.4629096984863281, 0.47820281982421875, 0.4934959411621094, 0.5087890625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 8.0, 11.0, 12.0, 15.0, 13.0, 22.0, 33.0, 54.0, 61.0, 91.0, 129.0, 225.0, 290.0, 508.0, 718.0, 581.0, 395.0, 277.0, 175.0, 124.0, 92.0, 69.0, 41.0, 28.0, 32.0, 17.0, 17.0, 10.0, 9.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.529296875, -0.5149040222167969, -0.5005111694335938, -0.4861183166503906, -0.4717254638671875, -0.4573326110839844, -0.44293975830078125, -0.4285469055175781, -0.414154052734375, -0.3997611999511719, -0.38536834716796875, -0.3709754943847656, -0.3565826416015625, -0.3421897888183594, -0.32779693603515625, -0.3134040832519531, -0.29901123046875, -0.2846183776855469, -0.27022552490234375, -0.2558326721191406, -0.2414398193359375, -0.22704696655273438, -0.21265411376953125, -0.19826126098632812, -0.183868408203125, -0.16947555541992188, -0.15508270263671875, -0.14068984985351562, -0.1262969970703125, -0.11190414428710938, -0.09751129150390625, -0.08311843872070312, -0.0687255859375, -0.054332733154296875, -0.03993988037109375, -0.025547027587890625, -0.0111541748046875, 0.003238677978515625, 0.01763153076171875, 0.032024383544921875, 0.046417236328125, 0.060810089111328125, 0.07520294189453125, 0.08959579467773438, 0.1039886474609375, 0.11838150024414062, 0.13277435302734375, 0.14716720581054688, 0.16156005859375, 0.17595291137695312, 0.19034576416015625, 0.20473861694335938, 0.2191314697265625, 0.23352432250976562, 0.24791717529296875, 0.2623100280761719, 0.276702880859375, 0.2910957336425781, 0.30548858642578125, 0.3198814392089844, 0.3342742919921875, 0.3486671447753906, 0.36305999755859375, 0.3774528503417969, 0.391845703125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 8.0, 8.0, 10.0, 23.0, 44.0, 66.0, 81.0, 111.0, 140.0, 145.0, 99.0, 81.0, 77.0, 43.0, 36.0, 11.0, 13.0, 2.0, 7.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8016376495361328, -1.7070591449737549, -1.6124807596206665, -1.5179022550582886, -1.4233238697052002, -1.3287453651428223, -1.2341668605804443, -1.139588475227356, -1.0450100898742676, -0.9504316449165344, -0.8558531999588013, -0.7612746953964233, -0.666696310043335, -0.572117805480957, -0.4775393605232239, -0.3829609155654907, -0.2883824110031128, -0.19380396604537964, -0.09922550618648529, -0.004647046327590942, 0.08993139863014221, 0.18450984358787537, 0.2790883183479309, 0.37366676330566406, 0.4682452082633972, 0.5628236532211304, 0.6574020981788635, 0.7519805431365967, 0.8465590476989746, 0.941137433052063, 1.035715937614441, 1.1302943229675293, 1.2248728275299072, 1.3194513320922852, 1.4140297174453735, 1.5086082220077515, 1.6031866073608398, 1.6977651119232178, 1.7923436164855957, 1.886922001838684, 1.9815003871917725, 2.0760788917541504, 2.1706573963165283, 2.265235662460327, 2.359814167022705, 2.454392671585083, 2.548971176147461, 2.6435494422912598, 2.738128185272217, 2.8327066898345947, 2.9272851943969727, 3.0218634605407715, 3.1164419651031494, 3.2110204696655273, 3.3055989742279053, 3.400177478790283, 3.494755744934082, 3.58933424949646, 3.683912754058838, 3.7784910202026367, 3.8730695247650146, 3.9676480293273926, 4.062226295471191, 4.156805038452148, 4.251383304595947]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 8.0, 4.0, 10.0, 5.0, 9.0, 15.0, 28.0, 18.0, 18.0, 23.0, 21.0, 23.0, 28.0, 23.0, 28.0, 44.0, 31.0, 39.0, 40.0, 49.0, 50.0, 39.0, 37.0, 40.0, 24.0, 29.0, 39.0, 38.0, 27.0, 33.0, 27.0, 22.0, 14.0, 18.0, 12.0, 16.0, 14.0, 15.0, 9.0, 9.0, 8.0, 4.0, 3.0, 2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0510163307189941, -1.0145249366760254, -0.9780335426330566, -0.9415421485900879, -0.9050507545471191, -0.8685593605041504, -0.8320680260658264, -0.7955766320228577, -0.7590852379798889, -0.7225938439369202, -0.6861024498939514, -0.6496110558509827, -0.6131197214126587, -0.5766283273696899, -0.5401369333267212, -0.5036455392837524, -0.4671541452407837, -0.43066275119781494, -0.3941713571548462, -0.35767999291419983, -0.3211885988712311, -0.28469720482826233, -0.24820582568645477, -0.21171444654464722, -0.17522305250167847, -0.13873165845870972, -0.10224027931690216, -0.06574889272451401, -0.029257506132125854, 0.0072338879108428955, 0.04372526705265045, 0.08021664619445801, 0.11670792102813721, 0.15319931507110596, 0.1896906942129135, 0.22618207335472107, 0.2626734673976898, 0.29916486144065857, 0.33565622568130493, 0.3721476197242737, 0.40863901376724243, 0.4451304078102112, 0.48162180185317993, 0.5181131958961487, 0.5546045303344727, 0.5910959243774414, 0.6275873184204102, 0.6640787124633789, 0.7005701065063477, 0.7370615005493164, 0.7735528945922852, 0.8100442886352539, 0.8465356826782227, 0.8830270767211914, 0.9195184111595154, 0.9560098052024841, 0.9925011992454529, 1.0289925336837769, 1.0654839277267456, 1.1019753217697144, 1.138466715812683, 1.1749581098556519, 1.2114495038986206, 1.2479408979415894, 1.284432291984558]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 8.0, 3.0, 12.0, 11.0, 16.0, 23.0, 36.0, 48.0, 82.0, 105.0, 178.0, 267.0, 375.0, 519.0, 808.0, 1177.0, 1754.0, 2795.0, 4270.0, 6477.0, 10321.0, 16287.0, 25567.0, 42864.0, 76126.0, 148711.0, 272409.0, 199694.0, 98087.0, 53657.0, 31548.0, 19659.0, 12328.0, 7844.0, 5031.0, 3235.0, 2083.0, 1344.0, 917.0, 590.0, 374.0, 308.0, 199.0, 128.0, 79.0, 72.0, 37.0, 30.0, 28.0, 16.0, 15.0, 3.0, 5.0, 1.0, 1.0, 3.0, 0.0, 4.0], "bins": [-0.393310546875, -0.3812828063964844, -0.36925506591796875, -0.3572273254394531, -0.3451995849609375, -0.3331718444824219, -0.32114410400390625, -0.3091163635253906, -0.297088623046875, -0.2850608825683594, -0.27303314208984375, -0.2610054016113281, -0.2489776611328125, -0.23694992065429688, -0.22492218017578125, -0.21289443969726562, -0.20086669921875, -0.18883895874023438, -0.17681121826171875, -0.16478347778320312, -0.1527557373046875, -0.14072799682617188, -0.12870025634765625, -0.11667251586914062, -0.104644775390625, -0.09261703491210938, -0.08058929443359375, -0.06856155395507812, -0.0565338134765625, -0.044506072998046875, -0.03247833251953125, -0.020450592041015625, -0.0084228515625, 0.003604888916015625, 0.01563262939453125, 0.027660369873046875, 0.0396881103515625, 0.051715850830078125, 0.06374359130859375, 0.07577133178710938, 0.087799072265625, 0.09982681274414062, 0.11185455322265625, 0.12388229370117188, 0.1359100341796875, 0.14793777465820312, 0.15996551513671875, 0.17199325561523438, 0.18402099609375, 0.19604873657226562, 0.20807647705078125, 0.22010421752929688, 0.2321319580078125, 0.24415969848632812, 0.25618743896484375, 0.2682151794433594, 0.280242919921875, 0.2922706604003906, 0.30429840087890625, 0.3163261413574219, 0.3283538818359375, 0.3403816223144531, 0.35240936279296875, 0.3644371032714844, 0.37646484375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 8.0, 7.0, 10.0, 14.0, 8.0, 14.0, 15.0, 19.0, 20.0, 23.0, 27.0, 18.0, 35.0, 38.0, 32.0, 37.0, 41.0, 35.0, 56.0, 40.0, 58.0, 43.0, 49.0, 32.0, 25.0, 35.0, 35.0, 30.0, 30.0, 15.0, 25.0, 18.0, 24.0, 11.0, 8.0, 11.0, 13.0, 9.0, 6.0, 8.0, 7.0, 3.0, 3.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2039794921875, -0.19777679443359375, -0.1915740966796875, -0.18537139892578125, -0.179168701171875, -0.17296600341796875, -0.1667633056640625, -0.16056060791015625, -0.15435791015625, -0.14815521240234375, -0.1419525146484375, -0.13574981689453125, -0.129547119140625, -0.12334442138671875, -0.1171417236328125, -0.11093902587890625, -0.104736328125, -0.09853363037109375, -0.0923309326171875, -0.08612823486328125, -0.079925537109375, -0.07372283935546875, -0.0675201416015625, -0.06131744384765625, -0.05511474609375, -0.04891204833984375, -0.0427093505859375, -0.03650665283203125, -0.030303955078125, -0.02410125732421875, -0.0178985595703125, -0.01169586181640625, -0.0054931640625, 0.00070953369140625, 0.0069122314453125, 0.01311492919921875, 0.019317626953125, 0.02552032470703125, 0.0317230224609375, 0.03792572021484375, 0.04412841796875, 0.05033111572265625, 0.0565338134765625, 0.06273651123046875, 0.068939208984375, 0.07514190673828125, 0.0813446044921875, 0.08754730224609375, 0.09375, 0.09995269775390625, 0.1061553955078125, 0.11235809326171875, 0.118560791015625, 0.12476348876953125, 0.1309661865234375, 0.13716888427734375, 0.14337158203125, 0.14957427978515625, 0.1557769775390625, 0.16197967529296875, 0.168182373046875, 0.17438507080078125, 0.1805877685546875, 0.18679046630859375, 0.1929931640625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 2.0, 1.0, 7.0, 7.0, 8.0, 16.0, 14.0, 24.0, 50.0, 45.0, 88.0, 145.0, 239.0, 363.0, 826.0, 1611.0, 3408.0, 7784.0, 16761.0, 37890.0, 86484.0, 227905.0, 376075.0, 168130.0, 66319.0, 29340.0, 13560.0, 5942.0, 2755.0, 1283.0, 634.0, 307.0, 203.0, 129.0, 58.0, 44.0, 31.0, 28.0, 20.0, 12.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.476806640625, -0.4605598449707031, -0.44431304931640625, -0.4280662536621094, -0.4118194580078125, -0.3955726623535156, -0.37932586669921875, -0.3630790710449219, -0.346832275390625, -0.3305854797363281, -0.31433868408203125, -0.2980918884277344, -0.2818450927734375, -0.2655982971191406, -0.24935150146484375, -0.23310470581054688, -0.21685791015625, -0.20061111450195312, -0.18436431884765625, -0.16811752319335938, -0.1518707275390625, -0.13562393188476562, -0.11937713623046875, -0.10313034057617188, -0.086883544921875, -0.07063674926757812, -0.05438995361328125, -0.038143157958984375, -0.0218963623046875, -0.005649566650390625, 0.01059722900390625, 0.026844024658203125, 0.0430908203125, 0.059337615966796875, 0.07558441162109375, 0.09183120727539062, 0.1080780029296875, 0.12432479858398438, 0.14057159423828125, 0.15681838989257812, 0.173065185546875, 0.18931198120117188, 0.20555877685546875, 0.22180557250976562, 0.2380523681640625, 0.2542991638183594, 0.27054595947265625, 0.2867927551269531, 0.30303955078125, 0.3192863464355469, 0.33553314208984375, 0.3517799377441406, 0.3680267333984375, 0.3842735290527344, 0.40052032470703125, 0.4167671203613281, 0.433013916015625, 0.4492607116699219, 0.46550750732421875, 0.4817543029785156, 0.4980010986328125, 0.5142478942871094, 0.5304946899414062, 0.5467414855957031, 0.56298828125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 5.0, 7.0, 7.0, 7.0, 8.0, 4.0, 22.0, 15.0, 23.0, 32.0, 24.0, 35.0, 26.0, 43.0, 41.0, 41.0, 40.0, 43.0, 47.0, 41.0, 55.0, 53.0, 58.0, 37.0, 39.0, 45.0, 31.0, 30.0, 25.0, 26.0, 15.0, 17.0, 12.0, 15.0, 7.0, 8.0, 7.0, 6.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.65087890625, -0.6277542114257812, -0.6046295166015625, -0.5815048217773438, -0.558380126953125, -0.5352554321289062, -0.5121307373046875, -0.48900604248046875, -0.46588134765625, -0.44275665283203125, -0.4196319580078125, -0.39650726318359375, -0.373382568359375, -0.35025787353515625, -0.3271331787109375, -0.30400848388671875, -0.2808837890625, -0.25775909423828125, -0.2346343994140625, -0.21150970458984375, -0.188385009765625, -0.16526031494140625, -0.1421356201171875, -0.11901092529296875, -0.09588623046875, -0.07276153564453125, -0.0496368408203125, -0.02651214599609375, -0.003387451171875, 0.01973724365234375, 0.0428619384765625, 0.06598663330078125, 0.089111328125, 0.11223602294921875, 0.1353607177734375, 0.15848541259765625, 0.181610107421875, 0.20473480224609375, 0.2278594970703125, 0.25098419189453125, 0.27410888671875, 0.29723358154296875, 0.3203582763671875, 0.34348297119140625, 0.366607666015625, 0.38973236083984375, 0.4128570556640625, 0.43598175048828125, 0.4591064453125, 0.48223114013671875, 0.5053558349609375, 0.5284805297851562, 0.551605224609375, 0.5747299194335938, 0.5978546142578125, 0.6209793090820312, 0.64410400390625, 0.6672286987304688, 0.6903533935546875, 0.7134780883789062, 0.736602783203125, 0.7597274780273438, 0.7828521728515625, 0.8059768676757812, 0.8291015625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 8.0, 17.0, 19.0, 26.0, 74.0, 99.0, 173.0, 347.0, 670.0, 1263.0, 2582.0, 5058.0, 10220.0, 20268.0, 41204.0, 91084.0, 223321.0, 352339.0, 165680.0, 69097.0, 32733.0, 15972.0, 8093.0, 3958.0, 2018.0, 982.0, 538.0, 297.0, 165.0, 101.0, 57.0, 40.0, 20.0, 15.0, 8.0, 6.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.27783203125, -0.2707691192626953, -0.2637062072753906, -0.25664329528808594, -0.24958038330078125, -0.24251747131347656, -0.23545455932617188, -0.2283916473388672, -0.2213287353515625, -0.2142658233642578, -0.20720291137695312, -0.20013999938964844, -0.19307708740234375, -0.18601417541503906, -0.17895126342773438, -0.1718883514404297, -0.164825439453125, -0.1577625274658203, -0.15069961547851562, -0.14363670349121094, -0.13657379150390625, -0.12951087951660156, -0.12244796752929688, -0.11538505554199219, -0.1083221435546875, -0.10125923156738281, -0.09419631958007812, -0.08713340759277344, -0.08007049560546875, -0.07300758361816406, -0.06594467163085938, -0.05888175964355469, -0.05181884765625, -0.04475593566894531, -0.037693023681640625, -0.030630111694335938, -0.02356719970703125, -0.016504287719726562, -0.009441375732421875, -0.0023784637451171875, 0.0046844482421875, 0.011747360229492188, 0.018810272216796875, 0.025873184204101562, 0.03293609619140625, 0.03999900817871094, 0.047061920166015625, 0.05412483215332031, 0.061187744140625, 0.06825065612792969, 0.07531356811523438, 0.08237648010253906, 0.08943939208984375, 0.09650230407714844, 0.10356521606445312, 0.11062812805175781, 0.1176910400390625, 0.12475395202636719, 0.13181686401367188, 0.13887977600097656, 0.14594268798828125, 0.15300559997558594, 0.16006851196289062, 0.1671314239501953, 0.1741943359375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 4.0, 1.0, 0.0, 2.0, 3.0, 6.0, 4.0, 6.0, 16.0, 12.0, 21.0, 13.0, 24.0, 42.0, 54.0, 90.0, 94.0, 148.0, 131.0, 83.0, 66.0, 43.0, 37.0, 28.0, 11.0, 17.0, 12.0, 4.0, 5.0, 5.0, 3.0, 6.0, 7.0, 1.0, 2.0, 1.0, 3.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.37905502319336e-05, -7.166899740695953e-05, -6.954744458198547e-05, -6.742589175701141e-05, -6.530433893203735e-05, -6.31827861070633e-05, -6.106123328208923e-05, -5.893968045711517e-05, -5.681812763214111e-05, -5.469657480716705e-05, -5.257502198219299e-05, -5.045346915721893e-05, -4.833191633224487e-05, -4.621036350727081e-05, -4.408881068229675e-05, -4.196725785732269e-05, -3.984570503234863e-05, -3.772415220737457e-05, -3.560259938240051e-05, -3.348104655742645e-05, -3.135949373245239e-05, -2.9237940907478333e-05, -2.7116388082504272e-05, -2.4994835257530212e-05, -2.2873282432556152e-05, -2.0751729607582092e-05, -1.8630176782608032e-05, -1.6508623957633972e-05, -1.4387071132659912e-05, -1.2265518307685852e-05, -1.0143965482711792e-05, -8.022412657737732e-06, -5.900859832763672e-06, -3.779307007789612e-06, -1.6577541828155518e-06, 4.637986421585083e-07, 2.5853514671325684e-06, 4.706904292106628e-06, 6.8284571170806885e-06, 8.950009942054749e-06, 1.1071562767028809e-05, 1.3193115592002869e-05, 1.531466841697693e-05, 1.743622124195099e-05, 1.955777406692505e-05, 2.167932689189911e-05, 2.380087971687317e-05, 2.592243254184723e-05, 2.804398536682129e-05, 3.016553819179535e-05, 3.228709101676941e-05, 3.440864384174347e-05, 3.653019666671753e-05, 3.865174949169159e-05, 4.077330231666565e-05, 4.289485514163971e-05, 4.501640796661377e-05, 4.713796079158783e-05, 4.925951361656189e-05, 5.138106644153595e-05, 5.350261926651001e-05, 5.562417209148407e-05, 5.774572491645813e-05, 5.986727774143219e-05, 6.198883056640625e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 7.0, 11.0, 7.0, 14.0, 19.0, 29.0, 50.0, 56.0, 117.0, 220.0, 374.0, 746.0, 1714.0, 3965.0, 9409.0, 23229.0, 58685.0, 156462.0, 377758.0, 259360.0, 93652.0, 36610.0, 15011.0, 6100.0, 2509.0, 1160.0, 556.0, 298.0, 162.0, 113.0, 62.0, 39.0, 10.0, 16.0, 12.0, 5.0, 1.0, 7.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2259521484375, -0.2180919647216797, -0.21023178100585938, -0.20237159729003906, -0.19451141357421875, -0.18665122985839844, -0.17879104614257812, -0.1709308624267578, -0.1630706787109375, -0.1552104949951172, -0.14735031127929688, -0.13949012756347656, -0.13162994384765625, -0.12376976013183594, -0.11590957641601562, -0.10804939270019531, -0.100189208984375, -0.09232902526855469, -0.08446884155273438, -0.07660865783691406, -0.06874847412109375, -0.06088829040527344, -0.053028106689453125, -0.04516792297363281, -0.0373077392578125, -0.029447555541992188, -0.021587371826171875, -0.013727188110351562, -0.00586700439453125, 0.0019931793212890625, 0.009853363037109375, 0.017713546752929688, 0.02557373046875, 0.03343391418457031, 0.041294097900390625, 0.04915428161621094, 0.05701446533203125, 0.06487464904785156, 0.07273483276367188, 0.08059501647949219, 0.0884552001953125, 0.09631538391113281, 0.10417556762695312, 0.11203575134277344, 0.11989593505859375, 0.12775611877441406, 0.13561630249023438, 0.1434764862060547, 0.151336669921875, 0.1591968536376953, 0.16705703735351562, 0.17491722106933594, 0.18277740478515625, 0.19063758850097656, 0.19849777221679688, 0.2063579559326172, 0.2142181396484375, 0.2220783233642578, 0.22993850708007812, 0.23779869079589844, 0.24565887451171875, 0.25351905822753906, 0.2613792419433594, 0.2692394256591797, 0.277099609375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 9.0, 8.0, 7.0, 8.0, 13.0, 28.0, 32.0, 29.0, 42.0, 40.0, 70.0, 74.0, 100.0, 122.0, 101.0, 86.0, 68.0, 37.0, 30.0, 22.0, 14.0, 13.0, 11.0, 9.0, 5.0, 10.0, 4.0, 3.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.310302734375, -0.3000450134277344, -0.28978729248046875, -0.2795295715332031, -0.2692718505859375, -0.2590141296386719, -0.24875640869140625, -0.23849868774414062, -0.228240966796875, -0.21798324584960938, -0.20772552490234375, -0.19746780395507812, -0.1872100830078125, -0.17695236206054688, -0.16669464111328125, -0.15643692016601562, -0.14617919921875, -0.13592147827148438, -0.12566375732421875, -0.11540603637695312, -0.1051483154296875, -0.09489059448242188, -0.08463287353515625, -0.07437515258789062, -0.064117431640625, -0.053859710693359375, -0.04360198974609375, -0.033344268798828125, -0.0230865478515625, -0.012828826904296875, -0.00257110595703125, 0.007686614990234375, 0.0179443359375, 0.028202056884765625, 0.03845977783203125, 0.048717498779296875, 0.0589752197265625, 0.06923294067382812, 0.07949066162109375, 0.08974838256835938, 0.100006103515625, 0.11026382446289062, 0.12052154541015625, 0.13077926635742188, 0.1410369873046875, 0.15129470825195312, 0.16155242919921875, 0.17181015014648438, 0.18206787109375, 0.19232559204101562, 0.20258331298828125, 0.21284103393554688, 0.2230987548828125, 0.23335647583007812, 0.24361419677734375, 0.2538719177246094, 0.264129638671875, 0.2743873596191406, 0.28464508056640625, 0.2949028015136719, 0.3051605224609375, 0.3154182434082031, 0.32567596435546875, 0.3359336853027344, 0.34619140625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 14.0, 47.0, 119.0, 167.0, 208.0, 204.0, 124.0, 87.0, 26.0, 7.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.07356071472168, -8.874980926513672, -8.676401138305664, -8.477821350097656, -8.279240608215332, -8.080660820007324, -7.882081031799316, -7.683501243591309, -7.484921455383301, -7.286341667175293, -7.087761402130127, -6.889181613922119, -6.690601825714111, -6.492021560668945, -6.2934417724609375, -6.09486198425293, -5.896281719207764, -5.697701930999756, -5.49912166595459, -5.300541877746582, -5.101962089538574, -4.903382301330566, -4.7048020362854, -4.506222248077393, -4.307641983032227, -4.109062194824219, -3.910482168197632, -3.711902141571045, -3.513322353363037, -3.31474232673645, -3.1161623001098633, -2.9175825119018555, -2.719003200531006, -2.520423173904419, -2.321843385696411, -2.123263359069824, -1.9246834516525269, -1.7261035442352295, -1.5275235176086426, -1.3289436101913452, -1.1303637027740479, -0.9317837953567505, -0.7332038283348083, -0.5346238613128662, -0.33604395389556885, -0.13746404647827148, 0.06111598014831543, 0.2596958875656128, 0.45827579498291016, 0.6568557024002075, 0.8554356694221497, 1.0540156364440918, 1.2525955438613892, 1.4511754512786865, 1.6497554779052734, 1.8483353853225708, 2.046915292739868, 2.245495319366455, 2.444075107574463, 2.64265513420105, 2.8412351608276367, 3.0398149490356445, 3.2383949756622314, 3.4369750022888184, 3.635554790496826]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 1.0, 6.0, 4.0, 6.0, 7.0, 4.0, 9.0, 10.0, 15.0, 20.0, 21.0, 18.0, 25.0, 26.0, 28.0, 25.0, 34.0, 25.0, 33.0, 48.0, 48.0, 42.0, 41.0, 32.0, 45.0, 38.0, 43.0, 36.0, 30.0, 36.0, 27.0, 32.0, 33.0, 25.0, 26.0, 21.0, 17.0, 16.0, 14.0, 9.0, 6.0, 6.0, 4.0, 11.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.166565179824829, -2.099540948867798, -2.0325167179107666, -1.9654924869537354, -1.898468255996704, -1.8314440250396729, -1.7644199132919312, -1.6973956823349, -1.6303714513778687, -1.5633472204208374, -1.4963229894638062, -1.429298758506775, -1.3622746467590332, -1.295250415802002, -1.2282261848449707, -1.1612019538879395, -1.0941777229309082, -1.027153491973877, -0.9601292610168457, -0.8931050896644592, -0.826080858707428, -0.7590566277503967, -0.6920324563980103, -0.625008225440979, -0.5579839944839478, -0.4909597635269165, -0.42393556237220764, -0.3569113612174988, -0.28988713026046753, -0.22286289930343628, -0.15583869814872742, -0.08881449699401855, -0.021790504455566406, 0.04523371160030365, 0.1122579276561737, 0.17928214371204376, 0.24630635976791382, 0.31333059072494507, 0.38035479187965393, 0.4473789930343628, 0.514403223991394, 0.5814274549484253, 0.6484516859054565, 0.715475857257843, 0.7825000882148743, 0.8495243191719055, 0.916548490524292, 0.9835727214813232, 1.0505969524383545, 1.1176211833953857, 1.184645414352417, 1.2516696453094482, 1.3186938762664795, 1.3857181072235107, 1.4527422189712524, 1.5197664499282837, 1.586790680885315, 1.6538149118423462, 1.7208391427993774, 1.7878633737564087, 1.8548874855041504, 1.9219117164611816, 1.988935947418213, 2.055960178375244, 2.1229844093322754]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 3.0, 13.0, 7.0, 15.0, 37.0, 49.0, 80.0, 132.0, 210.0, 382.0, 612.0, 1138.0, 2177.0, 4459.0, 9399.0, 21635.0, 54972.0, 154641.0, 521880.0, 2146561.0, 910241.0, 233283.0, 79068.0, 29812.0, 12274.0, 5467.0, 2698.0, 1385.0, 715.0, 371.0, 241.0, 141.0, 71.0, 50.0, 21.0, 10.0, 10.0, 8.0, 6.0, 7.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.4208984375, -0.409423828125, -0.39794921875, -0.386474609375, -0.375, -0.363525390625, -0.35205078125, -0.340576171875, -0.3291015625, -0.317626953125, -0.30615234375, -0.294677734375, -0.283203125, -0.271728515625, -0.26025390625, -0.248779296875, -0.2373046875, -0.225830078125, -0.21435546875, -0.202880859375, -0.19140625, -0.179931640625, -0.16845703125, -0.156982421875, -0.1455078125, -0.134033203125, -0.12255859375, -0.111083984375, -0.099609375, -0.088134765625, -0.07666015625, -0.065185546875, -0.0537109375, -0.042236328125, -0.03076171875, -0.019287109375, -0.0078125, 0.003662109375, 0.01513671875, 0.026611328125, 0.0380859375, 0.049560546875, 0.06103515625, 0.072509765625, 0.083984375, 0.095458984375, 0.10693359375, 0.118408203125, 0.1298828125, 0.141357421875, 0.15283203125, 0.164306640625, 0.17578125, 0.187255859375, 0.19873046875, 0.210205078125, 0.2216796875, 0.233154296875, 0.24462890625, 0.256103515625, 0.267578125, 0.279052734375, 0.29052734375, 0.302001953125, 0.3134765625]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 4.0, 8.0, 5.0, 5.0, 10.0, 14.0, 13.0, 17.0, 16.0, 20.0, 39.0, 31.0, 28.0, 24.0, 50.0, 39.0, 42.0, 43.0, 46.0, 34.0, 47.0, 37.0, 52.0, 43.0, 48.0, 41.0, 30.0, 27.0, 35.0, 24.0, 19.0, 20.0, 12.0, 18.0, 11.0, 10.0, 8.0, 11.0, 6.0, 6.0, 4.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.257080078125, -0.24976730346679688, -0.24245452880859375, -0.23514175415039062, -0.2278289794921875, -0.22051620483398438, -0.21320343017578125, -0.20589065551757812, -0.198577880859375, -0.19126510620117188, -0.18395233154296875, -0.17663955688476562, -0.1693267822265625, -0.16201400756835938, -0.15470123291015625, -0.14738845825195312, -0.14007568359375, -0.13276290893554688, -0.12545013427734375, -0.11813735961914062, -0.1108245849609375, -0.10351181030273438, -0.09619903564453125, -0.08888626098632812, -0.081573486328125, -0.07426071166992188, -0.06694793701171875, -0.059635162353515625, -0.0523223876953125, -0.045009613037109375, -0.03769683837890625, -0.030384063720703125, -0.0230712890625, -0.015758514404296875, -0.00844573974609375, -0.001132965087890625, 0.0061798095703125, 0.013492584228515625, 0.02080535888671875, 0.028118133544921875, 0.035430908203125, 0.042743682861328125, 0.05005645751953125, 0.057369232177734375, 0.0646820068359375, 0.07199478149414062, 0.07930755615234375, 0.08662033081054688, 0.09393310546875, 0.10124588012695312, 0.10855865478515625, 0.11587142944335938, 0.1231842041015625, 0.13049697875976562, 0.13780975341796875, 0.14512252807617188, 0.152435302734375, 0.15974807739257812, 0.16706085205078125, 0.17437362670898438, 0.1816864013671875, 0.18899917602539062, 0.19631195068359375, 0.20362472534179688, 0.2109375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 6.0, 4.0, 4.0, 11.0, 15.0, 12.0, 19.0, 36.0, 46.0, 46.0, 75.0, 88.0, 116.0, 203.0, 329.0, 585.0, 990.0, 2125.0, 5523.0, 15612.0, 50368.0, 192464.0, 1000947.0, 2354136.0, 426765.0, 99388.0, 28147.0, 9138.0, 3568.0, 1530.0, 758.0, 476.0, 237.0, 160.0, 97.0, 73.0, 59.0, 46.0, 22.0, 22.0, 9.0, 9.0, 12.0, 7.0, 4.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.63134765625, -0.6117782592773438, -0.5922088623046875, -0.5726394653320312, -0.553070068359375, -0.5335006713867188, -0.5139312744140625, -0.49436187744140625, -0.47479248046875, -0.45522308349609375, -0.4356536865234375, -0.41608428955078125, -0.396514892578125, -0.37694549560546875, -0.3573760986328125, -0.33780670166015625, -0.3182373046875, -0.29866790771484375, -0.2790985107421875, -0.25952911376953125, -0.239959716796875, -0.22039031982421875, -0.2008209228515625, -0.18125152587890625, -0.16168212890625, -0.14211273193359375, -0.1225433349609375, -0.10297393798828125, -0.083404541015625, -0.06383514404296875, -0.0442657470703125, -0.02469635009765625, -0.005126953125, 0.01444244384765625, 0.0340118408203125, 0.05358123779296875, 0.073150634765625, 0.09272003173828125, 0.1122894287109375, 0.13185882568359375, 0.15142822265625, 0.17099761962890625, 0.1905670166015625, 0.21013641357421875, 0.229705810546875, 0.24927520751953125, 0.2688446044921875, 0.28841400146484375, 0.3079833984375, 0.32755279541015625, 0.3471221923828125, 0.36669158935546875, 0.386260986328125, 0.40583038330078125, 0.4253997802734375, 0.44496917724609375, 0.46453857421875, 0.48410797119140625, 0.5036773681640625, 0.5232467651367188, 0.542816162109375, 0.5623855590820312, 0.5819549560546875, 0.6015243530273438, 0.62109375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 9.0, 3.0, 9.0, 8.0, 17.0, 19.0, 27.0, 49.0, 74.0, 88.0, 128.0, 194.0, 315.0, 563.0, 808.0, 708.0, 377.0, 221.0, 155.0, 79.0, 78.0, 54.0, 31.0, 18.0, 10.0, 12.0, 9.0, 5.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.6728515625, -0.6534271240234375, -0.634002685546875, -0.6145782470703125, -0.59515380859375, -0.5757293701171875, -0.556304931640625, -0.5368804931640625, -0.5174560546875, -0.4980316162109375, -0.478607177734375, -0.4591827392578125, -0.43975830078125, -0.4203338623046875, -0.400909423828125, -0.3814849853515625, -0.362060546875, -0.3426361083984375, -0.323211669921875, -0.3037872314453125, -0.28436279296875, -0.2649383544921875, -0.245513916015625, -0.2260894775390625, -0.2066650390625, -0.1872406005859375, -0.167816162109375, -0.1483917236328125, -0.12896728515625, -0.1095428466796875, -0.090118408203125, -0.0706939697265625, -0.05126953125, -0.0318450927734375, -0.012420654296875, 0.0070037841796875, 0.02642822265625, 0.0458526611328125, 0.065277099609375, 0.0847015380859375, 0.1041259765625, 0.1235504150390625, 0.142974853515625, 0.1623992919921875, 0.18182373046875, 0.2012481689453125, 0.220672607421875, 0.2400970458984375, 0.259521484375, 0.2789459228515625, 0.298370361328125, 0.3177947998046875, 0.33721923828125, 0.3566436767578125, 0.376068115234375, 0.3954925537109375, 0.4149169921875, 0.4343414306640625, 0.453765869140625, 0.4731903076171875, 0.49261474609375, 0.5120391845703125, 0.531463623046875, 0.5508880615234375, 0.5703125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 8.0, 9.0, 9.0, 14.0, 23.0, 35.0, 39.0, 61.0, 72.0, 92.0, 90.0, 91.0, 88.0, 73.0, 60.0, 56.0, 55.0, 36.0, 30.0, 20.0, 13.0, 9.0, 13.0, 3.0, 2.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.892702341079712, -1.8221635818481445, -1.7516249418258667, -1.6810861825942993, -1.6105475425720215, -1.540008783340454, -1.4694700241088867, -1.3989312648773193, -1.3283926248550415, -1.2578538656234741, -1.1873152256011963, -1.116776466369629, -1.0462377071380615, -0.9756990671157837, -0.9051603078842163, -0.8346216082572937, -0.7640829086303711, -0.6935442090034485, -0.6230055093765259, -0.5524667501449585, -0.4819280505180359, -0.4113893508911133, -0.3408506214618683, -0.2703118920326233, -0.19977319240570068, -0.12923447787761688, -0.05869576334953308, 0.01184295117855072, 0.08238166570663452, 0.15292036533355713, 0.22345909476280212, 0.2939978241920471, 0.3645362854003906, 0.43507498502731323, 0.5056136846542358, 0.5761524438858032, 0.6466911435127258, 0.7172298431396484, 0.7877686023712158, 0.8583073019981384, 0.928846001625061, 0.9993847012519836, 1.0699234008789062, 1.1404621601104736, 1.211000919342041, 1.2815395593643188, 1.3520783185958862, 1.422616958618164, 1.4931557178497314, 1.5636944770812988, 1.6342331171035767, 1.704771876335144, 1.7753105163574219, 1.8458492755889893, 1.9163880348205566, 1.986926794052124, 2.0574655532836914, 2.128004312515259, 2.198543071746826, 2.2690815925598145, 2.339620351791382, 2.410159111022949, 2.4806978702545166, 2.551236629486084, 2.6217751502990723]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 4.0, 3.0, 1.0, 3.0, 3.0, 9.0, 1.0, 13.0, 5.0, 9.0, 15.0, 10.0, 22.0, 13.0, 36.0, 30.0, 28.0, 34.0, 39.0, 44.0, 39.0, 40.0, 54.0, 33.0, 40.0, 38.0, 44.0, 45.0, 33.0, 24.0, 32.0, 22.0, 36.0, 33.0, 22.0, 20.0, 26.0, 29.0, 13.0, 12.0, 13.0, 14.0, 10.0, 10.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.375525951385498, -1.3259044885635376, -1.2762830257415771, -1.2266616821289062, -1.1770402193069458, -1.1274187564849854, -1.077797293663025, -1.0281758308410645, -0.9785544276237488, -0.9289329648017883, -0.8793115615844727, -0.8296900987625122, -0.7800686359405518, -0.7304472327232361, -0.6808257699012756, -0.63120436668396, -0.5815829038619995, -0.5319614410400391, -0.4823400378227234, -0.43271857500076294, -0.3830971419811249, -0.3334757089614868, -0.28385424613952637, -0.2342328131198883, -0.18461138010025024, -0.13498994708061218, -0.08536849915981293, -0.03574705123901367, 0.01387438178062439, 0.06349581480026245, 0.1131172776222229, 0.16273871064186096, 0.21236026287078857, 0.26198169589042664, 0.3116031289100647, 0.36122459173202515, 0.4108460247516632, 0.46046745777130127, 0.5100889205932617, 0.5597103834152222, 0.6093317866325378, 0.6589532494544983, 0.708574652671814, 0.7581961154937744, 0.8078175783157349, 0.8574389815330505, 0.907060444355011, 0.9566818475723267, 1.006303310394287, 1.0559247732162476, 1.105546236038208, 1.155167579650879, 1.2047890424728394, 1.2544105052947998, 1.3040319681167603, 1.3536534309387207, 1.4032747745513916, 1.452896237373352, 1.5025177001953125, 1.5521390438079834, 1.6017605066299438, 1.6513819694519043, 1.7010034322738647, 1.7506248950958252, 1.8002463579177856]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 4.0, 6.0, 19.0, 19.0, 21.0, 29.0, 51.0, 72.0, 82.0, 143.0, 215.0, 296.0, 460.0, 655.0, 885.0, 1413.0, 2122.0, 3297.0, 5046.0, 8171.0, 13835.0, 24750.0, 49086.0, 125618.0, 353733.0, 275504.0, 91294.0, 39394.0, 20573.0, 11717.0, 7207.0, 4486.0, 2789.0, 1805.0, 1211.0, 780.0, 556.0, 357.0, 264.0, 182.0, 125.0, 77.0, 72.0, 49.0, 42.0, 16.0, 6.0, 8.0, 9.0, 6.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.3955078125, -0.3826866149902344, -0.36986541748046875, -0.3570442199707031, -0.3442230224609375, -0.3314018249511719, -0.31858062744140625, -0.3057594299316406, -0.292938232421875, -0.2801170349121094, -0.26729583740234375, -0.2544746398925781, -0.2416534423828125, -0.22883224487304688, -0.21601104736328125, -0.20318984985351562, -0.19036865234375, -0.17754745483398438, -0.16472625732421875, -0.15190505981445312, -0.1390838623046875, -0.12626266479492188, -0.11344146728515625, -0.10062026977539062, -0.087799072265625, -0.07497787475585938, -0.06215667724609375, -0.049335479736328125, -0.0365142822265625, -0.023693084716796875, -0.01087188720703125, 0.001949310302734375, 0.0147705078125, 0.027591705322265625, 0.04041290283203125, 0.053234100341796875, 0.0660552978515625, 0.07887649536132812, 0.09169769287109375, 0.10451889038085938, 0.117340087890625, 0.13016128540039062, 0.14298248291015625, 0.15580368041992188, 0.1686248779296875, 0.18144607543945312, 0.19426727294921875, 0.20708847045898438, 0.21990966796875, 0.23273086547851562, 0.24555206298828125, 0.2583732604980469, 0.2711944580078125, 0.2840156555175781, 0.29683685302734375, 0.3096580505371094, 0.322479248046875, 0.3353004455566406, 0.34812164306640625, 0.3609428405761719, 0.3737640380859375, 0.3865852355957031, 0.39940643310546875, 0.4122276306152344, 0.425048828125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 5.0, 6.0, 4.0, 9.0, 2.0, 10.0, 9.0, 11.0, 11.0, 12.0, 13.0, 17.0, 16.0, 21.0, 20.0, 23.0, 27.0, 34.0, 27.0, 32.0, 30.0, 27.0, 29.0, 36.0, 44.0, 49.0, 47.0, 31.0, 31.0, 39.0, 38.0, 39.0, 25.0, 31.0, 30.0, 20.0, 15.0, 17.0, 23.0, 14.0, 14.0, 10.0, 10.0, 5.0, 10.0, 6.0, 7.0, 4.0, 6.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 4.0, 1.0], "bins": [-0.19580078125, -0.18956947326660156, -0.18333816528320312, -0.1771068572998047, -0.17087554931640625, -0.1646442413330078, -0.15841293334960938, -0.15218162536621094, -0.1459503173828125, -0.13971900939941406, -0.13348770141601562, -0.1272563934326172, -0.12102508544921875, -0.11479377746582031, -0.10856246948242188, -0.10233116149902344, -0.096099853515625, -0.08986854553222656, -0.08363723754882812, -0.07740592956542969, -0.07117462158203125, -0.06494331359863281, -0.058712005615234375, -0.05248069763183594, -0.0462493896484375, -0.04001808166503906, -0.033786773681640625, -0.027555465698242188, -0.02132415771484375, -0.015092849731445312, -0.008861541748046875, -0.0026302337646484375, 0.00360107421875, 0.009832382202148438, 0.016063690185546875, 0.022294998168945312, 0.02852630615234375, 0.03475761413574219, 0.040988922119140625, 0.04722023010253906, 0.0534515380859375, 0.05968284606933594, 0.06591415405273438, 0.07214546203613281, 0.07837677001953125, 0.08460807800292969, 0.09083938598632812, 0.09707069396972656, 0.103302001953125, 0.10953330993652344, 0.11576461791992188, 0.12199592590332031, 0.12822723388671875, 0.1344585418701172, 0.14068984985351562, 0.14692115783691406, 0.1531524658203125, 0.15938377380371094, 0.16561508178710938, 0.1718463897705078, 0.17807769775390625, 0.1843090057373047, 0.19054031372070312, 0.19677162170410156, 0.2030029296875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 6.0, 4.0, 9.0, 12.0, 12.0, 16.0, 16.0, 32.0, 61.0, 81.0, 145.0, 326.0, 633.0, 1410.0, 3353.0, 8200.0, 20595.0, 55168.0, 227072.0, 534039.0, 131582.0, 39674.0, 15496.0, 5961.0, 2464.0, 1137.0, 515.0, 233.0, 115.0, 69.0, 44.0, 25.0, 17.0, 12.0, 9.0, 7.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.7158203125, -0.6955642700195312, -0.6753082275390625, -0.6550521850585938, -0.634796142578125, -0.6145401000976562, -0.5942840576171875, -0.5740280151367188, -0.55377197265625, -0.5335159301757812, -0.5132598876953125, -0.49300384521484375, -0.472747802734375, -0.45249176025390625, -0.4322357177734375, -0.41197967529296875, -0.3917236328125, -0.37146759033203125, -0.3512115478515625, -0.33095550537109375, -0.310699462890625, -0.29044342041015625, -0.2701873779296875, -0.24993133544921875, -0.22967529296875, -0.20941925048828125, -0.1891632080078125, -0.16890716552734375, -0.148651123046875, -0.12839508056640625, -0.1081390380859375, -0.08788299560546875, -0.067626953125, -0.04737091064453125, -0.0271148681640625, -0.00685882568359375, 0.013397216796875, 0.03365325927734375, 0.0539093017578125, 0.07416534423828125, 0.09442138671875, 0.11467742919921875, 0.1349334716796875, 0.15518951416015625, 0.175445556640625, 0.19570159912109375, 0.2159576416015625, 0.23621368408203125, 0.2564697265625, 0.27672576904296875, 0.2969818115234375, 0.31723785400390625, 0.337493896484375, 0.35774993896484375, 0.3780059814453125, 0.39826202392578125, 0.41851806640625, 0.43877410888671875, 0.4590301513671875, 0.47928619384765625, 0.499542236328125, 0.5197982788085938, 0.5400543212890625, 0.5603103637695312, 0.58056640625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 6.0, 5.0, 7.0, 3.0, 9.0, 11.0, 16.0, 12.0, 12.0, 22.0, 23.0, 20.0, 30.0, 33.0, 36.0, 44.0, 45.0, 40.0, 36.0, 45.0, 47.0, 49.0, 53.0, 45.0, 40.0, 41.0, 44.0, 42.0, 32.0, 18.0, 15.0, 20.0, 15.0, 18.0, 17.0, 9.0, 5.0, 8.0, 12.0, 5.0, 5.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.76171875, -0.7367935180664062, -0.7118682861328125, -0.6869430541992188, -0.662017822265625, -0.6370925903320312, -0.6121673583984375, -0.5872421264648438, -0.56231689453125, -0.5373916625976562, -0.5124664306640625, -0.48754119873046875, -0.462615966796875, -0.43769073486328125, -0.4127655029296875, -0.38784027099609375, -0.3629150390625, -0.33798980712890625, -0.3130645751953125, -0.28813934326171875, -0.263214111328125, -0.23828887939453125, -0.2133636474609375, -0.18843841552734375, -0.16351318359375, -0.13858795166015625, -0.1136627197265625, -0.08873748779296875, -0.063812255859375, -0.03888702392578125, -0.0139617919921875, 0.01096343994140625, 0.035888671875, 0.06081390380859375, 0.0857391357421875, 0.11066436767578125, 0.135589599609375, 0.16051483154296875, 0.1854400634765625, 0.21036529541015625, 0.23529052734375, 0.26021575927734375, 0.2851409912109375, 0.31006622314453125, 0.334991455078125, 0.35991668701171875, 0.3848419189453125, 0.40976715087890625, 0.4346923828125, 0.45961761474609375, 0.4845428466796875, 0.5094680786132812, 0.534393310546875, 0.5593185424804688, 0.5842437744140625, 0.6091690063476562, 0.63409423828125, 0.6590194702148438, 0.6839447021484375, 0.7088699340820312, 0.733795166015625, 0.7587203979492188, 0.7836456298828125, 0.8085708618164062, 0.83349609375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 5.0, 16.0, 19.0, 18.0, 42.0, 40.0, 80.0, 120.0, 216.0, 352.0, 605.0, 1099.0, 2114.0, 4982.0, 12635.0, 35039.0, 96278.0, 354402.0, 378659.0, 101707.0, 36587.0, 13345.0, 5200.0, 2288.0, 1103.0, 626.0, 369.0, 237.0, 135.0, 78.0, 63.0, 40.0, 24.0, 10.0, 11.0, 5.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.347412109375, -0.3377685546875, -0.328125, -0.3184814453125, -0.308837890625, -0.2991943359375, -0.28955078125, -0.2799072265625, -0.270263671875, -0.2606201171875, -0.2509765625, -0.2413330078125, -0.231689453125, -0.2220458984375, -0.21240234375, -0.2027587890625, -0.193115234375, -0.1834716796875, -0.173828125, -0.1641845703125, -0.154541015625, -0.1448974609375, -0.13525390625, -0.1256103515625, -0.115966796875, -0.1063232421875, -0.0966796875, -0.0870361328125, -0.077392578125, -0.0677490234375, -0.05810546875, -0.0484619140625, -0.038818359375, -0.0291748046875, -0.01953125, -0.0098876953125, -0.000244140625, 0.0093994140625, 0.01904296875, 0.0286865234375, 0.038330078125, 0.0479736328125, 0.0576171875, 0.0672607421875, 0.076904296875, 0.0865478515625, 0.09619140625, 0.1058349609375, 0.115478515625, 0.1251220703125, 0.134765625, 0.1444091796875, 0.154052734375, 0.1636962890625, 0.17333984375, 0.1829833984375, 0.192626953125, 0.2022705078125, 0.2119140625, 0.2215576171875, 0.231201171875, 0.2408447265625, 0.25048828125, 0.2601318359375, 0.269775390625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 5.0, 8.0, 6.0, 9.0, 7.0, 11.0, 17.0, 9.0, 16.0, 19.0, 31.0, 39.0, 71.0, 147.0, 199.0, 151.0, 66.0, 48.0, 31.0, 25.0, 18.0, 19.0, 12.0, 11.0, 7.0, 3.0, 8.0, 3.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.845329284667969e-05, -8.588097989559174e-05, -8.330866694450378e-05, -8.073635399341583e-05, -7.816404104232788e-05, -7.559172809123993e-05, -7.301941514015198e-05, -7.044710218906403e-05, -6.787478923797607e-05, -6.530247628688812e-05, -6.273016333580017e-05, -6.015785038471222e-05, -5.758553743362427e-05, -5.5013224482536316e-05, -5.2440911531448364e-05, -4.986859858036041e-05, -4.729628562927246e-05, -4.472397267818451e-05, -4.215165972709656e-05, -3.9579346776008606e-05, -3.7007033824920654e-05, -3.44347208738327e-05, -3.186240792274475e-05, -2.92900949716568e-05, -2.6717782020568848e-05, -2.4145469069480896e-05, -2.1573156118392944e-05, -1.9000843167304993e-05, -1.642853021621704e-05, -1.385621726512909e-05, -1.1283904314041138e-05, -8.711591362953186e-06, -6.139278411865234e-06, -3.5669654607772827e-06, -9.94652509689331e-07, 1.5776604413986206e-06, 4.149973392486572e-06, 6.722286343574524e-06, 9.294599294662476e-06, 1.1866912245750427e-05, 1.4439225196838379e-05, 1.701153814792633e-05, 1.9583851099014282e-05, 2.2156164050102234e-05, 2.4728477001190186e-05, 2.7300789952278137e-05, 2.987310290336609e-05, 3.244541585445404e-05, 3.501772880554199e-05, 3.7590041756629944e-05, 4.0162354707717896e-05, 4.273466765880585e-05, 4.53069806098938e-05, 4.787929356098175e-05, 5.04516065120697e-05, 5.3023919463157654e-05, 5.5596232414245605e-05, 5.816854536533356e-05, 6.074085831642151e-05, 6.331317126750946e-05, 6.588548421859741e-05, 6.845779716968536e-05, 7.103011012077332e-05, 7.360242307186127e-05, 7.617473602294922e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 3.0, 2.0, 4.0, 7.0, 20.0, 20.0, 29.0, 33.0, 70.0, 78.0, 149.0, 276.0, 453.0, 765.0, 1515.0, 3383.0, 8080.0, 22888.0, 68272.0, 223633.0, 474395.0, 162107.0, 52775.0, 17800.0, 6283.0, 2643.0, 1226.0, 638.0, 393.0, 230.0, 139.0, 74.0, 51.0, 38.0, 28.0, 21.0, 12.0, 9.0, 5.0, 7.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.317138671875, -0.30817413330078125, -0.2992095947265625, -0.29024505615234375, -0.281280517578125, -0.27231597900390625, -0.2633514404296875, -0.25438690185546875, -0.24542236328125, -0.23645782470703125, -0.2274932861328125, -0.21852874755859375, -0.209564208984375, -0.20059967041015625, -0.1916351318359375, -0.18267059326171875, -0.1737060546875, -0.16474151611328125, -0.1557769775390625, -0.14681243896484375, -0.137847900390625, -0.12888336181640625, -0.1199188232421875, -0.11095428466796875, -0.10198974609375, -0.09302520751953125, -0.0840606689453125, -0.07509613037109375, -0.066131591796875, -0.05716705322265625, -0.0482025146484375, -0.03923797607421875, -0.0302734375, -0.02130889892578125, -0.0123443603515625, -0.00337982177734375, 0.005584716796875, 0.01454925537109375, 0.0235137939453125, 0.03247833251953125, 0.04144287109375, 0.05040740966796875, 0.0593719482421875, 0.06833648681640625, 0.077301025390625, 0.08626556396484375, 0.0952301025390625, 0.10419464111328125, 0.1131591796875, 0.12212371826171875, 0.1310882568359375, 0.14005279541015625, 0.149017333984375, 0.15798187255859375, 0.1669464111328125, 0.17591094970703125, 0.18487548828125, 0.19384002685546875, 0.2028045654296875, 0.21176910400390625, 0.220733642578125, 0.22969818115234375, 0.2386627197265625, 0.24762725830078125, 0.256591796875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 4.0, 12.0, 4.0, 21.0, 18.0, 19.0, 26.0, 50.0, 55.0, 64.0, 103.0, 146.0, 127.0, 100.0, 62.0, 39.0, 42.0, 25.0, 23.0, 19.0, 7.0, 12.0, 3.0, 5.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.40869140625, -0.397613525390625, -0.38653564453125, -0.375457763671875, -0.3643798828125, -0.353302001953125, -0.34222412109375, -0.331146240234375, -0.320068359375, -0.308990478515625, -0.29791259765625, -0.286834716796875, -0.2757568359375, -0.264678955078125, -0.25360107421875, -0.242523193359375, -0.2314453125, -0.220367431640625, -0.20928955078125, -0.198211669921875, -0.1871337890625, -0.176055908203125, -0.16497802734375, -0.153900146484375, -0.142822265625, -0.131744384765625, -0.12066650390625, -0.109588623046875, -0.0985107421875, -0.087432861328125, -0.07635498046875, -0.065277099609375, -0.05419921875, -0.043121337890625, -0.03204345703125, -0.020965576171875, -0.0098876953125, 0.001190185546875, 0.01226806640625, 0.023345947265625, 0.034423828125, 0.045501708984375, 0.05657958984375, 0.067657470703125, 0.0787353515625, 0.089813232421875, 0.10089111328125, 0.111968994140625, 0.123046875, 0.134124755859375, 0.14520263671875, 0.156280517578125, 0.1673583984375, 0.178436279296875, 0.18951416015625, 0.200592041015625, 0.211669921875, 0.222747802734375, 0.23382568359375, 0.244903564453125, 0.2559814453125, 0.267059326171875, 0.27813720703125, 0.289215087890625, 0.30029296875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 3.0, 2.0, 16.0, 85.0, 332.0, 409.0, 136.0, 24.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-19.707050323486328, -19.349416732788086, -18.991783142089844, -18.634151458740234, -18.276517868041992, -17.91888427734375, -17.56125259399414, -17.2036190032959, -16.845985412597656, -16.488351821899414, -16.130718231201172, -15.773086547851562, -15.41545295715332, -15.057819366455078, -14.700186729431152, -14.342554092407227, -13.984920501708984, -13.627286911010742, -13.269654273986816, -12.91202163696289, -12.554388046264648, -12.196754455566406, -11.83912181854248, -11.481489181518555, -11.123855590820312, -10.76622200012207, -10.408589363098145, -10.050956726074219, -9.693323135375977, -9.335689544677734, -8.978056907653809, -8.620424270629883, -8.262789726257324, -7.90515661239624, -7.547523498535156, -7.189890384674072, -6.832257270812988, -6.474624156951904, -6.11699104309082, -5.759357929229736, -5.401724815368652, -5.044091701507568, -4.686458587646484, -4.3288254737854, -3.9711923599243164, -3.6135592460632324, -3.2559261322021484, -2.8982930183410645, -2.5406601428985596, -2.1830270290374756, -1.8253939151763916, -1.4677608013153076, -1.1101276874542236, -0.7524945735931396, -0.39486145973205566, -0.03722834587097168, 0.3204047679901123, 0.6780378818511963, 1.0356709957122803, 1.3933041095733643, 1.7509372234344482, 2.1085703372955322, 2.466203451156616, 2.8238365650177, 3.181469678878784]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 6.0, 6.0, 6.0, 7.0, 9.0, 15.0, 9.0, 8.0, 20.0, 21.0, 28.0, 23.0, 26.0, 31.0, 22.0, 29.0, 31.0, 30.0, 29.0, 36.0, 42.0, 49.0, 48.0, 42.0, 49.0, 39.0, 45.0, 38.0, 24.0, 28.0, 33.0, 22.0, 33.0, 22.0, 18.0, 14.0, 15.0, 7.0, 9.0, 9.0, 4.0, 5.0, 9.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-2.024390697479248, -1.9669029712677002, -1.909415364265442, -1.851927638053894, -1.7944400310516357, -1.736952304840088, -1.67946457862854, -1.6219769716262817, -1.5644893646240234, -1.5070016384124756, -1.4495140314102173, -1.3920263051986694, -1.3345386981964111, -1.2770509719848633, -1.2195632457733154, -1.1620756387710571, -1.1045879125595093, -1.0471001863479614, -0.9896125793457031, -0.9321248531341553, -0.874637246131897, -0.8171495199203491, -0.759661853313446, -0.702174186706543, -0.6446865200996399, -0.5871988534927368, -0.5297111868858337, -0.4722234904766083, -0.4147358238697052, -0.3572481572628021, -0.29976046085357666, -0.24227279424667358, -0.18478500843048096, -0.12729734182357788, -0.06980966031551361, -0.01232197880744934, 0.045165687799453735, 0.10265335440635681, 0.16014105081558228, 0.21762871742248535, 0.2751163840293884, 0.3326040506362915, 0.3900917172431946, 0.44757941365242004, 0.5050671100616455, 0.5625547170639038, 0.6200424432754517, 0.6775301098823547, 0.7350177764892578, 0.7925054430961609, 0.849993109703064, 0.9074808359146118, 0.9649684429168701, 1.022456169128418, 1.0799438953399658, 1.1374315023422241, 1.1949191093444824, 1.2524068355560303, 1.3098944425582886, 1.3673821687698364, 1.4248697757720947, 1.4823575019836426, 1.5398452281951904, 1.5973328351974487, 1.6548205614089966]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 10.0, 10.0, 9.0, 16.0, 15.0, 34.0, 32.0, 56.0, 97.0, 144.0, 211.0, 338.0, 491.0, 794.0, 1273.0, 1947.0, 3284.0, 5563.0, 9169.0, 16052.0, 29042.0, 52991.0, 100606.0, 206275.0, 514659.0, 1584197.0, 1010919.0, 338196.0, 150112.0, 75248.0, 40017.0, 22252.0, 12327.0, 6967.0, 4149.0, 2512.0, 1484.0, 968.0, 635.0, 396.0, 252.0, 173.0, 134.0, 82.0, 47.0, 29.0, 28.0, 18.0, 14.0, 3.0, 3.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.251220703125, -0.243316650390625, -0.23541259765625, -0.227508544921875, -0.2196044921875, -0.211700439453125, -0.20379638671875, -0.195892333984375, -0.18798828125, -0.180084228515625, -0.17218017578125, -0.164276123046875, -0.1563720703125, -0.148468017578125, -0.14056396484375, -0.132659912109375, -0.124755859375, -0.116851806640625, -0.10894775390625, -0.101043701171875, -0.0931396484375, -0.085235595703125, -0.07733154296875, -0.069427490234375, -0.0615234375, -0.053619384765625, -0.04571533203125, -0.037811279296875, -0.0299072265625, -0.022003173828125, -0.01409912109375, -0.006195068359375, 0.001708984375, 0.009613037109375, 0.01751708984375, 0.025421142578125, 0.0333251953125, 0.041229248046875, 0.04913330078125, 0.057037353515625, 0.06494140625, 0.072845458984375, 0.08074951171875, 0.088653564453125, 0.0965576171875, 0.104461669921875, 0.11236572265625, 0.120269775390625, 0.128173828125, 0.136077880859375, 0.14398193359375, 0.151885986328125, 0.1597900390625, 0.167694091796875, 0.17559814453125, 0.183502197265625, 0.19140625, 0.199310302734375, 0.20721435546875, 0.215118408203125, 0.2230224609375, 0.230926513671875, 0.23883056640625, 0.246734619140625, 0.254638671875]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 7.0, 6.0, 6.0, 12.0, 13.0, 12.0, 14.0, 17.0, 22.0, 22.0, 31.0, 42.0, 31.0, 42.0, 40.0, 42.0, 39.0, 39.0, 36.0, 45.0, 42.0, 48.0, 52.0, 49.0, 40.0, 27.0, 38.0, 24.0, 24.0, 19.0, 26.0, 15.0, 14.0, 18.0, 9.0, 18.0, 3.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 2.0], "bins": [-0.25244140625, -0.24508094787597656, -0.23772048950195312, -0.2303600311279297, -0.22299957275390625, -0.2156391143798828, -0.20827865600585938, -0.20091819763183594, -0.1935577392578125, -0.18619728088378906, -0.17883682250976562, -0.1714763641357422, -0.16411590576171875, -0.1567554473876953, -0.14939498901367188, -0.14203453063964844, -0.134674072265625, -0.12731361389160156, -0.11995315551757812, -0.11259269714355469, -0.10523223876953125, -0.09787178039550781, -0.09051132202148438, -0.08315086364746094, -0.0757904052734375, -0.06842994689941406, -0.061069488525390625, -0.05370903015136719, -0.04634857177734375, -0.03898811340332031, -0.031627655029296875, -0.024267196655273438, -0.01690673828125, -0.009546279907226562, -0.002185821533203125, 0.0051746368408203125, 0.01253509521484375, 0.019895553588867188, 0.027256011962890625, 0.03461647033691406, 0.0419769287109375, 0.04933738708496094, 0.056697845458984375, 0.06405830383300781, 0.07141876220703125, 0.07877922058105469, 0.08613967895507812, 0.09350013732910156, 0.100860595703125, 0.10822105407714844, 0.11558151245117188, 0.12294197082519531, 0.13030242919921875, 0.1376628875732422, 0.14502334594726562, 0.15238380432128906, 0.1597442626953125, 0.16710472106933594, 0.17446517944335938, 0.1818256378173828, 0.18918609619140625, 0.1965465545654297, 0.20390701293945312, 0.21126747131347656, 0.2186279296875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 6.0, 5.0, 4.0, 9.0, 17.0, 25.0, 30.0, 41.0, 42.0, 63.0, 99.0, 152.0, 238.0, 472.0, 888.0, 2352.0, 6870.0, 24890.0, 108856.0, 646891.0, 2838895.0, 452417.0, 82461.0, 19200.0, 5523.0, 1933.0, 812.0, 394.0, 208.0, 152.0, 88.0, 67.0, 53.0, 31.0, 25.0, 24.0, 16.0, 10.0, 6.0, 6.0, 3.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.83203125, -0.80712890625, -0.7822265625, -0.75732421875, -0.732421875, -0.70751953125, -0.6826171875, -0.65771484375, -0.6328125, -0.60791015625, -0.5830078125, -0.55810546875, -0.533203125, -0.50830078125, -0.4833984375, -0.45849609375, -0.43359375, -0.40869140625, -0.3837890625, -0.35888671875, -0.333984375, -0.30908203125, -0.2841796875, -0.25927734375, -0.234375, -0.20947265625, -0.1845703125, -0.15966796875, -0.134765625, -0.10986328125, -0.0849609375, -0.06005859375, -0.03515625, -0.01025390625, 0.0146484375, 0.03955078125, 0.064453125, 0.08935546875, 0.1142578125, 0.13916015625, 0.1640625, 0.18896484375, 0.2138671875, 0.23876953125, 0.263671875, 0.28857421875, 0.3134765625, 0.33837890625, 0.36328125, 0.38818359375, 0.4130859375, 0.43798828125, 0.462890625, 0.48779296875, 0.5126953125, 0.53759765625, 0.5625, 0.58740234375, 0.6123046875, 0.63720703125, 0.662109375, 0.68701171875, 0.7119140625, 0.73681640625, 0.76171875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 8.0, 10.0, 11.0, 21.0, 29.0, 53.0, 74.0, 90.0, 148.0, 258.0, 431.0, 849.0, 882.0, 525.0, 248.0, 152.0, 111.0, 63.0, 46.0, 25.0, 13.0, 9.0, 3.0, 8.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.828125, -0.804443359375, -0.78076171875, -0.757080078125, -0.7333984375, -0.709716796875, -0.68603515625, -0.662353515625, -0.638671875, -0.614990234375, -0.59130859375, -0.567626953125, -0.5439453125, -0.520263671875, -0.49658203125, -0.472900390625, -0.44921875, -0.425537109375, -0.40185546875, -0.378173828125, -0.3544921875, -0.330810546875, -0.30712890625, -0.283447265625, -0.259765625, -0.236083984375, -0.21240234375, -0.188720703125, -0.1650390625, -0.141357421875, -0.11767578125, -0.093994140625, -0.0703125, -0.046630859375, -0.02294921875, 0.000732421875, 0.0244140625, 0.048095703125, 0.07177734375, 0.095458984375, 0.119140625, 0.142822265625, 0.16650390625, 0.190185546875, 0.2138671875, 0.237548828125, 0.26123046875, 0.284912109375, 0.30859375, 0.332275390625, 0.35595703125, 0.379638671875, 0.4033203125, 0.427001953125, 0.45068359375, 0.474365234375, 0.498046875, 0.521728515625, 0.54541015625, 0.569091796875, 0.5927734375, 0.616455078125, 0.64013671875, 0.663818359375, 0.6875]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 7.0, 17.0, 27.0, 54.0, 124.0, 146.0, 181.0, 169.0, 130.0, 74.0, 44.0, 12.0, 11.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-7.515244007110596, -7.367010116577148, -7.218776226043701, -7.070542335510254, -6.922307968139648, -6.774074077606201, -6.625840187072754, -6.477606296539307, -6.329372406005859, -6.181138515472412, -6.032904624938965, -5.884670734405518, -5.73643684387207, -5.588202476501465, -5.439968585968018, -5.29173469543457, -5.143500804901123, -4.995266914367676, -4.8470330238342285, -4.698799133300781, -4.550564765930176, -4.4023308753967285, -4.254096984863281, -4.105863094329834, -3.9576292037963867, -3.8093953132629395, -3.661161422729492, -3.512927293777466, -3.3646934032440186, -3.2164595127105713, -3.068225383758545, -2.9199914932250977, -2.7717576026916504, -2.623523712158203, -2.475289821624756, -2.3270556926727295, -2.1788218021392822, -2.030587911605835, -1.8823539018630981, -1.7341198921203613, -1.585886001586914, -1.4376521110534668, -1.28941810131073, -1.1411840915679932, -0.9929502010345459, -0.8447162508964539, -0.6964823007583618, -0.548248291015625, -0.40001440048217773, -0.2517804503440857, -0.10354650020599365, 0.04468744993209839, 0.19292140007019043, 0.34115535020828247, 0.4893893003463745, 0.6376233100891113, 0.7858572006225586, 0.9340911507606506, 1.0823251008987427, 1.2305591106414795, 1.3787930011749268, 1.527026891708374, 1.6752609014511108, 1.8234949111938477, 1.971728801727295]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 3.0, 2.0, 4.0, 2.0, 8.0, 9.0, 11.0, 10.0, 9.0, 18.0, 18.0, 21.0, 23.0, 26.0, 23.0, 29.0, 29.0, 36.0, 39.0, 38.0, 39.0, 51.0, 42.0, 36.0, 37.0, 32.0, 37.0, 37.0, 45.0, 46.0, 27.0, 26.0, 26.0, 25.0, 27.0, 17.0, 20.0, 17.0, 19.0, 6.0, 10.0, 7.0, 1.0, 6.0, 5.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.6356372833251953, -1.5867552757263184, -1.5378732681274414, -1.488991379737854, -1.440109372138977, -1.3912273645401, -1.3423454761505127, -1.2934634685516357, -1.2445814609527588, -1.1956994533538818, -1.1468174457550049, -1.0979355573654175, -1.0490535497665405, -1.0001715421676636, -0.9512895941734314, -0.9024076461791992, -0.8535256385803223, -0.8046436309814453, -0.7557616829872131, -0.706879734992981, -0.657997727394104, -0.609115719795227, -0.5602337718009949, -0.5113518238067627, -0.46246981620788574, -0.4135878384113312, -0.3647058606147766, -0.31582388281822205, -0.2669419050216675, -0.21805992722511292, -0.16917794942855835, -0.12029597163200378, -0.07141399383544922, -0.022532016038894653, 0.026349961757659912, 0.07523193955421448, 0.12411391735076904, 0.1729958951473236, 0.22187787294387817, 0.27075985074043274, 0.3196418285369873, 0.36852380633354187, 0.41740578413009644, 0.466287761926651, 0.5151697397232056, 0.5640517473220825, 0.6129336953163147, 0.6618156433105469, 0.7106976509094238, 0.7595796585083008, 0.808461606502533, 0.8573435544967651, 0.9062255620956421, 0.955107569694519, 1.0039894580841064, 1.0528714656829834, 1.1017534732818604, 1.1506354808807373, 1.1995174884796143, 1.2483993768692017, 1.2972813844680786, 1.3461633920669556, 1.395045280456543, 1.44392728805542, 1.4928092956542969]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 13.0, 15.0, 23.0, 49.0, 73.0, 107.0, 145.0, 206.0, 348.0, 469.0, 743.0, 1147.0, 1594.0, 2318.0, 3511.0, 5295.0, 8120.0, 12739.0, 21782.0, 40686.0, 93219.0, 224828.0, 307244.0, 171955.0, 69463.0, 32594.0, 17906.0, 11024.0, 7006.0, 4692.0, 3058.0, 2017.0, 1394.0, 908.0, 615.0, 429.0, 270.0, 176.0, 144.0, 90.0, 45.0, 36.0, 26.0, 10.0, 8.0, 8.0, 3.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3310546875, -0.3208160400390625, -0.310577392578125, -0.3003387451171875, -0.29010009765625, -0.2798614501953125, -0.269622802734375, -0.2593841552734375, -0.2491455078125, -0.2389068603515625, -0.228668212890625, -0.2184295654296875, -0.20819091796875, -0.1979522705078125, -0.187713623046875, -0.1774749755859375, -0.167236328125, -0.1569976806640625, -0.146759033203125, -0.1365203857421875, -0.12628173828125, -0.1160430908203125, -0.105804443359375, -0.0955657958984375, -0.0853271484375, -0.0750885009765625, -0.064849853515625, -0.0546112060546875, -0.04437255859375, -0.0341339111328125, -0.023895263671875, -0.0136566162109375, -0.00341796875, 0.0068206787109375, 0.017059326171875, 0.0272979736328125, 0.03753662109375, 0.0477752685546875, 0.058013916015625, 0.0682525634765625, 0.0784912109375, 0.0887298583984375, 0.098968505859375, 0.1092071533203125, 0.11944580078125, 0.1296844482421875, 0.139923095703125, 0.1501617431640625, 0.160400390625, 0.1706390380859375, 0.180877685546875, 0.1911163330078125, 0.20135498046875, 0.2115936279296875, 0.221832275390625, 0.2320709228515625, 0.2423095703125, 0.2525482177734375, 0.262786865234375, 0.2730255126953125, 0.28326416015625, 0.2935028076171875, 0.303741455078125, 0.3139801025390625, 0.32421875]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 8.0, 6.0, 9.0, 7.0, 10.0, 10.0, 12.0, 18.0, 32.0, 20.0, 18.0, 38.0, 30.0, 28.0, 43.0, 46.0, 47.0, 47.0, 47.0, 52.0, 41.0, 47.0, 41.0, 46.0, 44.0, 28.0, 35.0, 19.0, 28.0, 23.0, 18.0, 22.0, 14.0, 20.0, 20.0, 10.0, 7.0, 3.0, 7.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.259765625, -0.2515106201171875, -0.243255615234375, -0.2350006103515625, -0.22674560546875, -0.2184906005859375, -0.210235595703125, -0.2019805908203125, -0.1937255859375, -0.1854705810546875, -0.177215576171875, -0.1689605712890625, -0.16070556640625, -0.1524505615234375, -0.144195556640625, -0.1359405517578125, -0.127685546875, -0.1194305419921875, -0.111175537109375, -0.1029205322265625, -0.09466552734375, -0.0864105224609375, -0.078155517578125, -0.0699005126953125, -0.0616455078125, -0.0533905029296875, -0.045135498046875, -0.0368804931640625, -0.02862548828125, -0.0203704833984375, -0.012115478515625, -0.0038604736328125, 0.00439453125, 0.0126495361328125, 0.020904541015625, 0.0291595458984375, 0.03741455078125, 0.0456695556640625, 0.053924560546875, 0.0621795654296875, 0.0704345703125, 0.0786895751953125, 0.086944580078125, 0.0951995849609375, 0.10345458984375, 0.1117095947265625, 0.119964599609375, 0.1282196044921875, 0.136474609375, 0.1447296142578125, 0.152984619140625, 0.1612396240234375, 0.16949462890625, 0.1777496337890625, 0.186004638671875, 0.1942596435546875, 0.2025146484375, 0.2107696533203125, 0.219024658203125, 0.2272796630859375, 0.23553466796875, 0.2437896728515625, 0.252044677734375, 0.2602996826171875, 0.2685546875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 7.0, 13.0, 18.0, 33.0, 69.0, 98.0, 202.0, 428.0, 1051.0, 2536.0, 6592.0, 17710.0, 60737.0, 344772.0, 484674.0, 91842.0, 23582.0, 8518.0, 3227.0, 1281.0, 584.0, 276.0, 121.0, 73.0, 39.0, 20.0, 13.0, 13.0, 6.0, 10.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7421875, -0.722198486328125, -0.70220947265625, -0.682220458984375, -0.6622314453125, -0.642242431640625, -0.62225341796875, -0.602264404296875, -0.582275390625, -0.562286376953125, -0.54229736328125, -0.522308349609375, -0.5023193359375, -0.482330322265625, -0.46234130859375, -0.442352294921875, -0.42236328125, -0.402374267578125, -0.38238525390625, -0.362396240234375, -0.3424072265625, -0.322418212890625, -0.30242919921875, -0.282440185546875, -0.262451171875, -0.242462158203125, -0.22247314453125, -0.202484130859375, -0.1824951171875, -0.162506103515625, -0.14251708984375, -0.122528076171875, -0.1025390625, -0.082550048828125, -0.06256103515625, -0.042572021484375, -0.0225830078125, -0.002593994140625, 0.01739501953125, 0.037384033203125, 0.057373046875, 0.077362060546875, 0.09735107421875, 0.117340087890625, 0.1373291015625, 0.157318115234375, 0.17730712890625, 0.197296142578125, 0.21728515625, 0.237274169921875, 0.25726318359375, 0.277252197265625, 0.2972412109375, 0.317230224609375, 0.33721923828125, 0.357208251953125, 0.377197265625, 0.397186279296875, 0.41717529296875, 0.437164306640625, 0.4571533203125, 0.477142333984375, 0.49713134765625, 0.517120361328125, 0.537109375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 1.0, 2.0, 5.0, 6.0, 7.0, 6.0, 7.0, 14.0, 10.0, 9.0, 15.0, 9.0, 19.0, 25.0, 25.0, 35.0, 22.0, 37.0, 32.0, 37.0, 34.0, 49.0, 34.0, 43.0, 51.0, 29.0, 35.0, 51.0, 44.0, 41.0, 40.0, 22.0, 25.0, 25.0, 18.0, 22.0, 18.0, 20.0, 12.0, 17.0, 11.0, 7.0, 6.0, 7.0, 4.0, 7.0, 2.0, 4.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.638671875, -0.6173782348632812, -0.5960845947265625, -0.5747909545898438, -0.553497314453125, -0.5322036743164062, -0.5109100341796875, -0.48961639404296875, -0.46832275390625, -0.44702911376953125, -0.4257354736328125, -0.40444183349609375, -0.383148193359375, -0.36185455322265625, -0.3405609130859375, -0.31926727294921875, -0.2979736328125, -0.27667999267578125, -0.2553863525390625, -0.23409271240234375, -0.212799072265625, -0.19150543212890625, -0.1702117919921875, -0.14891815185546875, -0.12762451171875, -0.10633087158203125, -0.0850372314453125, -0.06374359130859375, -0.042449951171875, -0.02115631103515625, 0.0001373291015625, 0.02143096923828125, 0.042724609375, 0.06401824951171875, 0.0853118896484375, 0.10660552978515625, 0.127899169921875, 0.14919281005859375, 0.1704864501953125, 0.19178009033203125, 0.21307373046875, 0.23436737060546875, 0.2556610107421875, 0.27695465087890625, 0.298248291015625, 0.31954193115234375, 0.3408355712890625, 0.36212921142578125, 0.3834228515625, 0.40471649169921875, 0.4260101318359375, 0.44730377197265625, 0.468597412109375, 0.48989105224609375, 0.5111846923828125, 0.5324783325195312, 0.55377197265625, 0.5750656127929688, 0.5963592529296875, 0.6176528930664062, 0.638946533203125, 0.6602401733398438, 0.6815338134765625, 0.7028274536132812, 0.72412109375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 6.0, 7.0, 11.0, 13.0, 22.0, 41.0, 59.0, 105.0, 198.0, 387.0, 749.0, 1419.0, 2765.0, 5584.0, 11307.0, 22746.0, 46614.0, 101500.0, 227657.0, 307230.0, 172898.0, 76349.0, 35623.0, 17667.0, 8609.0, 4394.0, 2198.0, 1145.0, 540.0, 317.0, 145.0, 110.0, 52.0, 31.0, 20.0, 14.0, 13.0, 8.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1600341796875, -0.15523147583007812, -0.15042877197265625, -0.14562606811523438, -0.1408233642578125, -0.13602066040039062, -0.13121795654296875, -0.12641525268554688, -0.121612548828125, -0.11680984497070312, -0.11200714111328125, -0.10720443725585938, -0.1024017333984375, -0.09759902954101562, -0.09279632568359375, -0.08799362182617188, -0.08319091796875, -0.07838821411132812, -0.07358551025390625, -0.06878280639648438, -0.0639801025390625, -0.059177398681640625, -0.05437469482421875, -0.049571990966796875, -0.044769287109375, -0.039966583251953125, -0.03516387939453125, -0.030361175537109375, -0.0255584716796875, -0.020755767822265625, -0.01595306396484375, -0.011150360107421875, -0.00634765625, -0.001544952392578125, 0.00325775146484375, 0.008060455322265625, 0.0128631591796875, 0.017665863037109375, 0.02246856689453125, 0.027271270751953125, 0.032073974609375, 0.036876678466796875, 0.04167938232421875, 0.046482086181640625, 0.0512847900390625, 0.056087493896484375, 0.06089019775390625, 0.06569290161132812, 0.07049560546875, 0.07529830932617188, 0.08010101318359375, 0.08490371704101562, 0.0897064208984375, 0.09450912475585938, 0.09931182861328125, 0.10411453247070312, 0.108917236328125, 0.11371994018554688, 0.11852264404296875, 0.12332534790039062, 0.1281280517578125, 0.13293075561523438, 0.13773345947265625, 0.14253616333007812, 0.1473388671875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 7.0, 17.0, 19.0, 22.0, 32.0, 44.0, 68.0, 109.0, 149.0, 166.0, 141.0, 82.0, 44.0, 24.0, 26.0, 9.0, 13.0, 5.0, 4.0, 4.0, 10.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.73532485961914e-05, -6.511248648166656e-05, -6.287172436714172e-05, -6.063096225261688e-05, -5.839020013809204e-05, -5.61494380235672e-05, -5.390867590904236e-05, -5.166791379451752e-05, -4.9427151679992676e-05, -4.7186389565467834e-05, -4.494562745094299e-05, -4.270486533641815e-05, -4.046410322189331e-05, -3.822334110736847e-05, -3.598257899284363e-05, -3.374181687831879e-05, -3.1501054763793945e-05, -2.9260292649269104e-05, -2.7019530534744263e-05, -2.477876842021942e-05, -2.253800630569458e-05, -2.029724419116974e-05, -1.8056482076644897e-05, -1.5815719962120056e-05, -1.3574957847595215e-05, -1.1334195733070374e-05, -9.093433618545532e-06, -6.852671504020691e-06, -4.61190938949585e-06, -2.3711472749710083e-06, -1.30385160446167e-07, 2.1103769540786743e-06, 4.351139068603516e-06, 6.591901183128357e-06, 8.832663297653198e-06, 1.107342541217804e-05, 1.3314187526702881e-05, 1.5554949641227722e-05, 1.7795711755752563e-05, 2.0036473870277405e-05, 2.2277235984802246e-05, 2.4517998099327087e-05, 2.675876021385193e-05, 2.899952232837677e-05, 3.124028444290161e-05, 3.348104655742645e-05, 3.5721808671951294e-05, 3.7962570786476135e-05, 4.0203332901000977e-05, 4.244409501552582e-05, 4.468485713005066e-05, 4.69256192445755e-05, 4.916638135910034e-05, 5.140714347362518e-05, 5.3647905588150024e-05, 5.5888667702674866e-05, 5.812942981719971e-05, 6.037019193172455e-05, 6.261095404624939e-05, 6.485171616077423e-05, 6.709247827529907e-05, 6.933324038982391e-05, 7.157400250434875e-05, 7.38147646188736e-05, 7.605552673339844e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 2.0, 3.0, 3.0, 6.0, 3.0, 9.0, 13.0, 14.0, 18.0, 24.0, 48.0, 58.0, 104.0, 157.0, 250.0, 424.0, 600.0, 1180.0, 1982.0, 3632.0, 6664.0, 12445.0, 23045.0, 44826.0, 86362.0, 162565.0, 238759.0, 209137.0, 122099.0, 63308.0, 32945.0, 17339.0, 9085.0, 4943.0, 2674.0, 1533.0, 840.0, 528.0, 304.0, 207.0, 136.0, 87.0, 61.0, 51.0, 28.0, 22.0, 12.0, 16.0, 7.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1185302734375, -0.1145477294921875, -0.110565185546875, -0.1065826416015625, -0.10260009765625, -0.0986175537109375, -0.094635009765625, -0.0906524658203125, -0.086669921875, -0.0826873779296875, -0.078704833984375, -0.0747222900390625, -0.07073974609375, -0.0667572021484375, -0.062774658203125, -0.0587921142578125, -0.0548095703125, -0.0508270263671875, -0.046844482421875, -0.0428619384765625, -0.03887939453125, -0.0348968505859375, -0.030914306640625, -0.0269317626953125, -0.02294921875, -0.0189666748046875, -0.014984130859375, -0.0110015869140625, -0.00701904296875, -0.0030364990234375, 0.000946044921875, 0.0049285888671875, 0.0089111328125, 0.0128936767578125, 0.016876220703125, 0.0208587646484375, 0.02484130859375, 0.0288238525390625, 0.032806396484375, 0.0367889404296875, 0.040771484375, 0.0447540283203125, 0.048736572265625, 0.0527191162109375, 0.05670166015625, 0.0606842041015625, 0.064666748046875, 0.0686492919921875, 0.0726318359375, 0.0766143798828125, 0.080596923828125, 0.0845794677734375, 0.08856201171875, 0.0925445556640625, 0.096527099609375, 0.1005096435546875, 0.1044921875, 0.1084747314453125, 0.112457275390625, 0.1164398193359375, 0.12042236328125, 0.1244049072265625, 0.128387451171875, 0.1323699951171875, 0.1363525390625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 4.0, 4.0, 3.0, 7.0, 6.0, 5.0, 8.0, 8.0, 7.0, 9.0, 17.0, 18.0, 29.0, 26.0, 29.0, 42.0, 40.0, 51.0, 65.0, 66.0, 71.0, 63.0, 57.0, 59.0, 36.0, 43.0, 41.0, 32.0, 37.0, 31.0, 23.0, 14.0, 15.0, 8.0, 7.0, 7.0, 4.0, 3.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1748046875, -0.1694049835205078, -0.16400527954101562, -0.15860557556152344, -0.15320587158203125, -0.14780616760253906, -0.14240646362304688, -0.1370067596435547, -0.1316070556640625, -0.1262073516845703, -0.12080764770507812, -0.11540794372558594, -0.11000823974609375, -0.10460853576660156, -0.09920883178710938, -0.09380912780761719, -0.088409423828125, -0.08300971984863281, -0.07761001586914062, -0.07221031188964844, -0.06681060791015625, -0.06141090393066406, -0.056011199951171875, -0.05061149597167969, -0.0452117919921875, -0.03981208801269531, -0.034412384033203125, -0.029012680053710938, -0.02361297607421875, -0.018213272094726562, -0.012813568115234375, -0.0074138641357421875, -0.00201416015625, 0.0033855438232421875, 0.008785247802734375, 0.014184951782226562, 0.01958465576171875, 0.024984359741210938, 0.030384063720703125, 0.03578376770019531, 0.0411834716796875, 0.04658317565917969, 0.051982879638671875, 0.05738258361816406, 0.06278228759765625, 0.06818199157714844, 0.07358169555664062, 0.07898139953613281, 0.084381103515625, 0.08978080749511719, 0.09518051147460938, 0.10058021545410156, 0.10597991943359375, 0.11137962341308594, 0.11677932739257812, 0.12217903137207031, 0.1275787353515625, 0.1329784393310547, 0.13837814331054688, 0.14377784729003906, 0.14917755126953125, 0.15457725524902344, 0.15997695922851562, 0.1653766632080078, 0.1707763671875]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 5.0, 19.0, 63.0, 140.0, 273.0, 274.0, 170.0, 43.0, 15.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.786008834838867, -4.586511611938477, -4.387014389038086, -4.187517166137695, -3.9880199432373047, -3.788522720336914, -3.5890254974365234, -3.389528274536133, -3.190031051635742, -2.9905338287353516, -2.791036605834961, -2.5915393829345703, -2.3920421600341797, -2.192544937133789, -1.9930477142333984, -1.7935504913330078, -1.5940532684326172, -1.3945560455322266, -1.195058822631836, -0.9955615997314453, -0.7960643768310547, -0.5965671539306641, -0.39706993103027344, -0.1975727081298828, 0.0019245147705078125, 0.20142173767089844, 0.40091896057128906, 0.6004161834716797, 0.7999134063720703, 0.9994106292724609, 1.1989078521728516, 1.3984050750732422, 1.5979022979736328, 1.7973995208740234, 1.996896743774414, 2.1963939666748047, 2.3958911895751953, 2.595388412475586, 2.7948856353759766, 2.994382858276367, 3.193880081176758, 3.3933773040771484, 3.592874526977539, 3.7923717498779297, 3.9918689727783203, 4.191366195678711, 4.390863418579102, 4.590360641479492, 4.789857864379883, 4.989355087280273, 5.188852310180664, 5.388349533081055, 5.587846755981445, 5.787343978881836, 5.986841201782227, 6.186338424682617, 6.385835647583008, 6.585332870483398, 6.784830093383789, 6.98432731628418, 7.18382453918457, 7.383321762084961, 7.582818984985352, 7.782316207885742, 7.981813430786133]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 0.0, 4.0, 1.0, 9.0, 5.0, 5.0, 8.0, 13.0, 14.0, 14.0, 15.0, 24.0, 18.0, 24.0, 24.0, 21.0, 42.0, 31.0, 39.0, 36.0, 49.0, 52.0, 50.0, 60.0, 44.0, 48.0, 38.0, 45.0, 42.0, 33.0, 29.0, 30.0, 18.0, 17.0, 21.0, 13.0, 11.0, 21.0, 7.0, 8.0, 4.0, 3.0, 4.0, 3.0, 3.0, 5.0, 1.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.073650598526001, -2.0085251331329346, -1.9433997869491577, -1.8782743215560913, -1.8131489753723145, -1.748023509979248, -1.6828980445861816, -1.6177725791931152, -1.5526472330093384, -1.487521767616272, -1.4223964214324951, -1.3572709560394287, -1.2921454906463623, -1.2270201444625854, -1.161894679069519, -1.0967693328857422, -1.0316438674926758, -0.9665184617042542, -0.9013930559158325, -0.8362675905227661, -0.7711421847343445, -0.7060167789459229, -0.6408913135528564, -0.5757659077644348, -0.5106405019760132, -0.44551509618759155, -0.38038966059684753, -0.3152642250061035, -0.2501388192176819, -0.18501341342926025, -0.11988797783851624, -0.05476254224777222, 0.010362625122070312, 0.07548804581165314, 0.14061346650123596, 0.2057388871908188, 0.2708643078804016, 0.33598971366882324, 0.40111514925956726, 0.4662405848503113, 0.5313659906387329, 0.5964913964271545, 0.6616168022155762, 0.7267422676086426, 0.7918676733970642, 0.8569930791854858, 0.9221185445785522, 0.9872439503669739, 1.0523693561553955, 1.117494821548462, 1.1826201677322388, 1.2477456331253052, 1.312870979309082, 1.3779964447021484, 1.4431219100952148, 1.5082473754882812, 1.573372721672058, 1.6384981870651245, 1.7036235332489014, 1.7687489986419678, 1.8338744640350342, 1.898999810218811, 1.9641252756118774, 2.0292506217956543, 2.0943760871887207]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 6.0, 3.0, 8.0, 16.0, 17.0, 18.0, 38.0, 44.0, 73.0, 113.0, 167.0, 300.0, 467.0, 876.0, 1690.0, 3048.0, 6626.0, 14970.0, 37665.0, 104567.0, 335407.0, 1400967.0, 1683687.0, 404421.0, 123648.0, 43762.0, 16959.0, 7340.0, 3363.0, 1751.0, 912.0, 506.0, 288.0, 198.0, 127.0, 82.0, 48.0, 37.0, 22.0, 19.0, 12.0, 12.0, 4.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.413330078125, -0.3995857238769531, -0.38584136962890625, -0.3720970153808594, -0.3583526611328125, -0.3446083068847656, -0.33086395263671875, -0.3171195983886719, -0.303375244140625, -0.2896308898925781, -0.27588653564453125, -0.2621421813964844, -0.2483978271484375, -0.23465347290039062, -0.22090911865234375, -0.20716476440429688, -0.19342041015625, -0.17967605590820312, -0.16593170166015625, -0.15218734741210938, -0.1384429931640625, -0.12469863891601562, -0.11095428466796875, -0.09720993041992188, -0.083465576171875, -0.06972122192382812, -0.05597686767578125, -0.042232513427734375, -0.0284881591796875, -0.014743804931640625, -0.00099945068359375, 0.012744903564453125, 0.0264892578125, 0.040233612060546875, 0.05397796630859375, 0.06772232055664062, 0.0814666748046875, 0.09521102905273438, 0.10895538330078125, 0.12269973754882812, 0.136444091796875, 0.15018844604492188, 0.16393280029296875, 0.17767715454101562, 0.1914215087890625, 0.20516586303710938, 0.21891021728515625, 0.23265457153320312, 0.24639892578125, 0.2601432800292969, 0.27388763427734375, 0.2876319885253906, 0.3013763427734375, 0.3151206970214844, 0.32886505126953125, 0.3426094055175781, 0.356353759765625, 0.3700981140136719, 0.38384246826171875, 0.3975868225097656, 0.4113311767578125, 0.4250755310058594, 0.43881988525390625, 0.4525642395019531, 0.46630859375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 8.0, 10.0, 16.0, 16.0, 13.0, 28.0, 28.0, 34.0, 33.0, 41.0, 32.0, 62.0, 64.0, 55.0, 49.0, 62.0, 40.0, 59.0, 56.0, 46.0, 33.0, 28.0, 37.0, 32.0, 27.0, 18.0, 26.0, 15.0, 9.0, 9.0, 5.0, 3.0, 4.0, 4.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0], "bins": [-0.399169921875, -0.3889884948730469, -0.37880706787109375, -0.3686256408691406, -0.3584442138671875, -0.3482627868652344, -0.33808135986328125, -0.3278999328613281, -0.317718505859375, -0.3075370788574219, -0.29735565185546875, -0.2871742248535156, -0.2769927978515625, -0.2668113708496094, -0.25662994384765625, -0.24644851684570312, -0.23626708984375, -0.22608566284179688, -0.21590423583984375, -0.20572280883789062, -0.1955413818359375, -0.18535995483398438, -0.17517852783203125, -0.16499710083007812, -0.154815673828125, -0.14463424682617188, -0.13445281982421875, -0.12427139282226562, -0.1140899658203125, -0.10390853881835938, -0.09372711181640625, -0.08354568481445312, -0.0733642578125, -0.06318283081054688, -0.05300140380859375, -0.042819976806640625, -0.0326385498046875, -0.022457122802734375, -0.01227569580078125, -0.002094268798828125, 0.008087158203125, 0.018268585205078125, 0.02845001220703125, 0.038631439208984375, 0.0488128662109375, 0.058994293212890625, 0.06917572021484375, 0.07935714721679688, 0.08953857421875, 0.09972000122070312, 0.10990142822265625, 0.12008285522460938, 0.1302642822265625, 0.14044570922851562, 0.15062713623046875, 0.16080856323242188, 0.170989990234375, 0.18117141723632812, 0.19135284423828125, 0.20153427124023438, 0.2117156982421875, 0.22189712524414062, 0.23207855224609375, 0.24225997924804688, 0.25244140625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 7.0, 2.0, 10.0, 17.0, 14.0, 20.0, 33.0, 53.0, 78.0, 102.0, 193.0, 272.0, 453.0, 805.0, 1630.0, 3521.0, 8442.0, 23058.0, 70967.0, 257349.0, 1424638.0, 1940932.0, 329531.0, 87087.0, 27497.0, 9654.0, 3902.0, 1770.0, 921.0, 455.0, 285.0, 199.0, 120.0, 76.0, 62.0, 42.0, 27.0, 20.0, 19.0, 2.0, 4.0, 3.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.63916015625, -0.619842529296875, -0.60052490234375, -0.581207275390625, -0.5618896484375, -0.542572021484375, -0.52325439453125, -0.503936767578125, -0.484619140625, -0.465301513671875, -0.44598388671875, -0.426666259765625, -0.4073486328125, -0.388031005859375, -0.36871337890625, -0.349395751953125, -0.330078125, -0.310760498046875, -0.29144287109375, -0.272125244140625, -0.2528076171875, -0.233489990234375, -0.21417236328125, -0.194854736328125, -0.175537109375, -0.156219482421875, -0.13690185546875, -0.117584228515625, -0.0982666015625, -0.078948974609375, -0.05963134765625, -0.040313720703125, -0.02099609375, -0.001678466796875, 0.01763916015625, 0.036956787109375, 0.0562744140625, 0.075592041015625, 0.09490966796875, 0.114227294921875, 0.133544921875, 0.152862548828125, 0.17218017578125, 0.191497802734375, 0.2108154296875, 0.230133056640625, 0.24945068359375, 0.268768310546875, 0.2880859375, 0.307403564453125, 0.32672119140625, 0.346038818359375, 0.3653564453125, 0.384674072265625, 0.40399169921875, 0.423309326171875, 0.442626953125, 0.461944580078125, 0.48126220703125, 0.500579833984375, 0.5198974609375, 0.539215087890625, 0.55853271484375, 0.577850341796875, 0.59716796875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 2.0, 6.0, 8.0, 4.0, 10.0, 10.0, 14.0, 22.0, 36.0, 31.0, 38.0, 63.0, 75.0, 96.0, 151.0, 178.0, 316.0, 486.0, 737.0, 601.0, 393.0, 222.0, 166.0, 106.0, 70.0, 67.0, 40.0, 36.0, 27.0, 18.0, 13.0, 11.0, 6.0, 3.0, 7.0, 4.0, 5.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.67333984375, -0.65338134765625, -0.6334228515625, -0.61346435546875, -0.593505859375, -0.57354736328125, -0.5535888671875, -0.53363037109375, -0.513671875, -0.49371337890625, -0.4737548828125, -0.45379638671875, -0.433837890625, -0.41387939453125, -0.3939208984375, -0.37396240234375, -0.35400390625, -0.33404541015625, -0.3140869140625, -0.29412841796875, -0.274169921875, -0.25421142578125, -0.2342529296875, -0.21429443359375, -0.1943359375, -0.17437744140625, -0.1544189453125, -0.13446044921875, -0.114501953125, -0.09454345703125, -0.0745849609375, -0.05462646484375, -0.03466796875, -0.01470947265625, 0.0052490234375, 0.02520751953125, 0.045166015625, 0.06512451171875, 0.0850830078125, 0.10504150390625, 0.125, 0.14495849609375, 0.1649169921875, 0.18487548828125, 0.204833984375, 0.22479248046875, 0.2447509765625, 0.26470947265625, 0.28466796875, 0.30462646484375, 0.3245849609375, 0.34454345703125, 0.364501953125, 0.38446044921875, 0.4044189453125, 0.42437744140625, 0.4443359375, 0.46429443359375, 0.4842529296875, 0.50421142578125, 0.524169921875, 0.54412841796875, 0.5640869140625, 0.58404541015625, 0.60400390625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 12.0, 28.0, 85.0, 141.0, 233.0, 224.0, 165.0, 63.0, 32.0, 8.0, 8.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.920873641967773, -8.698906898498535, -8.476940155029297, -8.254973411560059, -8.03300666809082, -7.811039924621582, -7.589073657989502, -7.367106914520264, -7.145140171051025, -6.923173427581787, -6.701206684112549, -6.4792399406433105, -6.2572736740112305, -6.035306930541992, -5.813340187072754, -5.591373443603516, -5.369406700134277, -5.147439956665039, -4.925473213195801, -4.7035064697265625, -4.481539726257324, -4.259572982788086, -4.037606716156006, -3.8156399726867676, -3.5936732292175293, -3.371706485748291, -3.1497397422790527, -2.9277732372283936, -2.7058064937591553, -2.483839750289917, -2.261873245239258, -2.0399065017700195, -1.8179397583007812, -1.595973014831543, -1.3740063905715942, -1.1520397663116455, -0.9300730228424072, -0.708106279373169, -0.4861396551132202, -0.2641730308532715, -0.0422062873840332, 0.1797603964805603, 0.4017270803451538, 0.6236937642097473, 0.8456604480743408, 1.067627191543579, 1.2895938158035278, 1.5115604400634766, 1.7335271835327148, 1.9554939270019531, 2.1774606704711914, 2.3994271755218506, 2.621393918991089, 2.843360662460327, 3.0653271675109863, 3.2872939109802246, 3.509260654449463, 3.731227397918701, 3.9531941413879395, 4.175160884857178, 4.397127151489258, 4.619093894958496, 4.841060638427734, 5.063027381896973, 5.284994125366211]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 2.0, 4.0, 2.0, 6.0, 8.0, 5.0, 8.0, 10.0, 12.0, 12.0, 4.0, 10.0, 15.0, 12.0, 21.0, 16.0, 21.0, 27.0, 28.0, 31.0, 37.0, 32.0, 31.0, 36.0, 29.0, 39.0, 42.0, 46.0, 41.0, 39.0, 37.0, 31.0, 30.0, 37.0, 28.0, 26.0, 26.0, 27.0, 27.0, 5.0, 15.0, 22.0, 9.0, 9.0, 10.0, 9.0, 8.0, 9.0, 5.0, 4.0, 5.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.7942206859588623, -1.7366327047348022, -1.6790448427200317, -1.6214568614959717, -1.5638688802719116, -1.5062808990478516, -1.448693037033081, -1.391105055809021, -1.333517074584961, -1.2759290933609009, -1.2183412313461304, -1.1607532501220703, -1.1031652688980103, -1.0455772876739502, -0.9879894256591797, -0.9304014444351196, -0.8728135228157043, -0.8152256011962891, -0.757637619972229, -0.7000496983528137, -0.6424617171287537, -0.5848737955093384, -0.5272858142852783, -0.46969789266586304, -0.41210994124412537, -0.3545219898223877, -0.29693403840065, -0.23934610188007355, -0.18175815045833588, -0.1241702139377594, -0.06658226251602173, -0.008994311094284058, 0.04859364032745361, 0.10618159174919128, 0.16376954317092896, 0.22135747969150543, 0.2789454460144043, 0.3365333676338196, 0.39412131905555725, 0.4517092704772949, 0.509297251701355, 0.5668851733207703, 0.6244731545448303, 0.6820610761642456, 0.7396490573883057, 0.797236979007721, 0.8548249006271362, 0.9124128818511963, 0.9700008034706116, 1.0275887250900269, 1.085176706314087, 1.142764687538147, 1.2003525495529175, 1.2579405307769775, 1.3155285120010376, 1.3731164932250977, 1.4307043552398682, 1.4882923364639282, 1.5458801984786987, 1.6034681797027588, 1.6610561609268188, 1.718644142150879, 1.7762320041656494, 1.8338199853897095, 1.8914079666137695]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 11.0, 12.0, 22.0, 31.0, 45.0, 72.0, 113.0, 160.0, 241.0, 335.0, 474.0, 687.0, 988.0, 1466.0, 2009.0, 2829.0, 4086.0, 5643.0, 8380.0, 13329.0, 22726.0, 51948.0, 198332.0, 445899.0, 178917.0, 48310.0, 21725.0, 12728.0, 8051.0, 5714.0, 3958.0, 2807.0, 2017.0, 1421.0, 941.0, 675.0, 466.0, 291.0, 244.0, 166.0, 106.0, 54.0, 41.0, 34.0, 26.0, 11.0, 6.0, 5.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.469482421875, -0.4535484313964844, -0.43761444091796875, -0.4216804504394531, -0.4057464599609375, -0.3898124694824219, -0.37387847900390625, -0.3579444885253906, -0.342010498046875, -0.3260765075683594, -0.31014251708984375, -0.2942085266113281, -0.2782745361328125, -0.2623405456542969, -0.24640655517578125, -0.23047256469726562, -0.21453857421875, -0.19860458374023438, -0.18267059326171875, -0.16673660278320312, -0.1508026123046875, -0.13486862182617188, -0.11893463134765625, -0.10300064086914062, -0.087066650390625, -0.07113265991210938, -0.05519866943359375, -0.039264678955078125, -0.0233306884765625, -0.007396697998046875, 0.00853729248046875, 0.024471282958984375, 0.0404052734375, 0.056339263916015625, 0.07227325439453125, 0.08820724487304688, 0.1041412353515625, 0.12007522583007812, 0.13600921630859375, 0.15194320678710938, 0.167877197265625, 0.18381118774414062, 0.19974517822265625, 0.21567916870117188, 0.2316131591796875, 0.24754714965820312, 0.26348114013671875, 0.2794151306152344, 0.29534912109375, 0.3112831115722656, 0.32721710205078125, 0.3431510925292969, 0.3590850830078125, 0.3750190734863281, 0.39095306396484375, 0.4068870544433594, 0.422821044921875, 0.4387550354003906, 0.45468902587890625, 0.4706230163574219, 0.4865570068359375, 0.5024909973144531, 0.5184249877929688, 0.5343589782714844, 0.55029296875]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 6.0, 5.0, 6.0, 9.0, 5.0, 15.0, 12.0, 18.0, 18.0, 18.0, 29.0, 22.0, 30.0, 40.0, 41.0, 44.0, 38.0, 47.0, 44.0, 46.0, 39.0, 44.0, 34.0, 58.0, 36.0, 36.0, 42.0, 28.0, 29.0, 28.0, 29.0, 16.0, 18.0, 14.0, 15.0, 12.0, 11.0, 5.0, 8.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.295166015625, -0.2868518829345703, -0.2785377502441406, -0.27022361755371094, -0.26190948486328125, -0.25359535217285156, -0.24528121948242188, -0.2369670867919922, -0.2286529541015625, -0.2203388214111328, -0.21202468872070312, -0.20371055603027344, -0.19539642333984375, -0.18708229064941406, -0.17876815795898438, -0.1704540252685547, -0.162139892578125, -0.1538257598876953, -0.14551162719726562, -0.13719749450683594, -0.12888336181640625, -0.12056922912597656, -0.11225509643554688, -0.10394096374511719, -0.0956268310546875, -0.08731269836425781, -0.07899856567382812, -0.07068443298339844, -0.06237030029296875, -0.05405616760253906, -0.045742034912109375, -0.03742790222167969, -0.02911376953125, -0.020799636840820312, -0.012485504150390625, -0.0041713714599609375, 0.00414276123046875, 0.012456893920898438, 0.020771026611328125, 0.029085159301757812, 0.0373992919921875, 0.04571342468261719, 0.054027557373046875, 0.06234169006347656, 0.07065582275390625, 0.07896995544433594, 0.08728408813476562, 0.09559822082519531, 0.103912353515625, 0.11222648620605469, 0.12054061889648438, 0.12885475158691406, 0.13716888427734375, 0.14548301696777344, 0.15379714965820312, 0.1621112823486328, 0.1704254150390625, 0.1787395477294922, 0.18705368041992188, 0.19536781311035156, 0.20368194580078125, 0.21199607849121094, 0.22031021118164062, 0.2286243438720703, 0.2369384765625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 1.0, 4.0, 11.0, 4.0, 11.0, 9.0, 17.0, 27.0, 23.0, 44.0, 54.0, 90.0, 118.0, 167.0, 273.0, 435.0, 652.0, 1093.0, 1845.0, 3678.0, 7677.0, 16825.0, 39830.0, 196243.0, 625807.0, 97633.0, 30056.0, 13005.0, 5855.0, 2905.0, 1547.0, 939.0, 515.0, 397.0, 240.0, 171.0, 108.0, 76.0, 52.0, 29.0, 26.0, 21.0, 8.0, 9.0, 4.0, 5.0, 1.0, 6.0, 4.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.77880859375, -0.7539596557617188, -0.7291107177734375, -0.7042617797851562, -0.679412841796875, -0.6545639038085938, -0.6297149658203125, -0.6048660278320312, -0.58001708984375, -0.5551681518554688, -0.5303192138671875, -0.5054702758789062, -0.480621337890625, -0.45577239990234375, -0.4309234619140625, -0.40607452392578125, -0.3812255859375, -0.35637664794921875, -0.3315277099609375, -0.30667877197265625, -0.281829833984375, -0.25698089599609375, -0.2321319580078125, -0.20728302001953125, -0.18243408203125, -0.15758514404296875, -0.1327362060546875, -0.10788726806640625, -0.083038330078125, -0.05818939208984375, -0.0333404541015625, -0.00849151611328125, 0.016357421875, 0.04120635986328125, 0.0660552978515625, 0.09090423583984375, 0.115753173828125, 0.14060211181640625, 0.1654510498046875, 0.19029998779296875, 0.21514892578125, 0.23999786376953125, 0.2648468017578125, 0.28969573974609375, 0.314544677734375, 0.33939361572265625, 0.3642425537109375, 0.38909149169921875, 0.4139404296875, 0.43878936767578125, 0.4636383056640625, 0.48848724365234375, 0.513336181640625, 0.5381851196289062, 0.5630340576171875, 0.5878829956054688, 0.61273193359375, 0.6375808715820312, 0.6624298095703125, 0.6872787475585938, 0.712127685546875, 0.7369766235351562, 0.7618255615234375, 0.7866744995117188, 0.8115234375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 5.0, 1.0, 4.0, 4.0, 6.0, 6.0, 7.0, 8.0, 14.0, 13.0, 14.0, 19.0, 33.0, 27.0, 40.0, 50.0, 36.0, 60.0, 56.0, 59.0, 60.0, 41.0, 64.0, 64.0, 51.0, 57.0, 31.0, 33.0, 26.0, 25.0, 20.0, 19.0, 16.0, 10.0, 7.0, 3.0, 3.0, 4.0, 1.0, 4.0, 1.0, 6.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.0029296875, -0.973663330078125, -0.94439697265625, -0.915130615234375, -0.8858642578125, -0.856597900390625, -0.82733154296875, -0.798065185546875, -0.768798828125, -0.739532470703125, -0.71026611328125, -0.680999755859375, -0.6517333984375, -0.622467041015625, -0.59320068359375, -0.563934326171875, -0.53466796875, -0.505401611328125, -0.47613525390625, -0.446868896484375, -0.4176025390625, -0.388336181640625, -0.35906982421875, -0.329803466796875, -0.300537109375, -0.271270751953125, -0.24200439453125, -0.212738037109375, -0.1834716796875, -0.154205322265625, -0.12493896484375, -0.095672607421875, -0.06640625, -0.037139892578125, -0.00787353515625, 0.021392822265625, 0.0506591796875, 0.079925537109375, 0.10919189453125, 0.138458251953125, 0.167724609375, 0.196990966796875, 0.22625732421875, 0.255523681640625, 0.2847900390625, 0.314056396484375, 0.34332275390625, 0.372589111328125, 0.40185546875, 0.431121826171875, 0.46038818359375, 0.489654541015625, 0.5189208984375, 0.548187255859375, 0.57745361328125, 0.606719970703125, 0.635986328125, 0.665252685546875, 0.69451904296875, 0.723785400390625, 0.7530517578125, 0.782318115234375, 0.81158447265625, 0.840850830078125, 0.8701171875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 6.0, 7.0, 10.0, 9.0, 19.0, 14.0, 35.0, 45.0, 56.0, 63.0, 81.0, 126.0, 162.0, 222.0, 324.0, 384.0, 568.0, 831.0, 1231.0, 1799.0, 3125.0, 6320.0, 14823.0, 52582.0, 392690.0, 477351.0, 62623.0, 16707.0, 6690.0, 3361.0, 1950.0, 1209.0, 881.0, 586.0, 445.0, 323.0, 225.0, 182.0, 135.0, 88.0, 73.0, 61.0, 42.0, 25.0, 26.0, 11.0, 8.0, 9.0, 12.0, 3.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0], "bins": [-0.386474609375, -0.3747825622558594, -0.36309051513671875, -0.3513984680175781, -0.3397064208984375, -0.3280143737792969, -0.31632232666015625, -0.3046302795410156, -0.292938232421875, -0.2812461853027344, -0.26955413818359375, -0.2578620910644531, -0.2461700439453125, -0.23447799682617188, -0.22278594970703125, -0.21109390258789062, -0.19940185546875, -0.18770980834960938, -0.17601776123046875, -0.16432571411132812, -0.1526336669921875, -0.14094161987304688, -0.12924957275390625, -0.11755752563476562, -0.105865478515625, -0.09417343139648438, -0.08248138427734375, -0.07078933715820312, -0.0590972900390625, -0.047405242919921875, -0.03571319580078125, -0.024021148681640625, -0.0123291015625, -0.000637054443359375, 0.01105499267578125, 0.022747039794921875, 0.0344390869140625, 0.046131134033203125, 0.05782318115234375, 0.06951522827148438, 0.081207275390625, 0.09289932250976562, 0.10459136962890625, 0.11628341674804688, 0.1279754638671875, 0.13966751098632812, 0.15135955810546875, 0.16305160522460938, 0.17474365234375, 0.18643569946289062, 0.19812774658203125, 0.20981979370117188, 0.2215118408203125, 0.23320388793945312, 0.24489593505859375, 0.2565879821777344, 0.268280029296875, 0.2799720764160156, 0.29166412353515625, 0.3033561706542969, 0.3150482177734375, 0.3267402648925781, 0.33843231201171875, 0.3501243591308594, 0.36181640625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 1.0, 3.0, 4.0, 3.0, 6.0, 15.0, 21.0, 43.0, 182.0, 425.0, 182.0, 40.0, 29.0, 15.0, 14.0, 4.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00023829936981201172, -0.0002319440245628357, -0.00022558867931365967, -0.00021923333406448364, -0.00021287798881530762, -0.0002065226435661316, -0.00020016729831695557, -0.00019381195306777954, -0.00018745660781860352, -0.0001811012625694275, -0.00017474591732025146, -0.00016839057207107544, -0.00016203522682189941, -0.0001556798815727234, -0.00014932453632354736, -0.00014296919107437134, -0.0001366138458251953, -0.0001302585005760193, -0.00012390315532684326, -0.00011754781007766724, -0.00011119246482849121, -0.00010483711957931519, -9.848177433013916e-05, -9.212642908096313e-05, -8.577108383178711e-05, -7.941573858261108e-05, -7.306039333343506e-05, -6.670504808425903e-05, -6.034970283508301e-05, -5.399435758590698e-05, -4.763901233673096e-05, -4.128366708755493e-05, -3.4928321838378906e-05, -2.857297658920288e-05, -2.2217631340026855e-05, -1.586228609085083e-05, -9.506940841674805e-06, -3.1515955924987793e-06, 3.203749656677246e-06, 9.559094905853271e-06, 1.5914440155029297e-05, 2.2269785404205322e-05, 2.8625130653381348e-05, 3.498047590255737e-05, 4.13358211517334e-05, 4.7691166400909424e-05, 5.404651165008545e-05, 6.0401856899261475e-05, 6.67572021484375e-05, 7.311254739761353e-05, 7.946789264678955e-05, 8.582323789596558e-05, 9.21785831451416e-05, 9.853392839431763e-05, 0.00010488927364349365, 0.00011124461889266968, 0.0001175999641418457, 0.00012395530939102173, 0.00013031065464019775, 0.00013666599988937378, 0.0001430213451385498, 0.00014937669038772583, 0.00015573203563690186, 0.00016208738088607788, 0.0001684427261352539]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 2.0, 11.0, 7.0, 19.0, 18.0, 23.0, 40.0, 72.0, 112.0, 171.0, 268.0, 479.0, 933.0, 1782.0, 3984.0, 12018.0, 57291.0, 447387.0, 446995.0, 57248.0, 11961.0, 3914.0, 1748.0, 846.0, 472.0, 276.0, 151.0, 110.0, 65.0, 50.0, 30.0, 20.0, 15.0, 9.0, 4.0, 5.0, 8.0, 4.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28564453125, -0.27374267578125, -0.2618408203125, -0.24993896484375, -0.238037109375, -0.22613525390625, -0.2142333984375, -0.20233154296875, -0.1904296875, -0.17852783203125, -0.1666259765625, -0.15472412109375, -0.142822265625, -0.13092041015625, -0.1190185546875, -0.10711669921875, -0.09521484375, -0.08331298828125, -0.0714111328125, -0.05950927734375, -0.047607421875, -0.03570556640625, -0.0238037109375, -0.01190185546875, 0.0, 0.01190185546875, 0.0238037109375, 0.03570556640625, 0.047607421875, 0.05950927734375, 0.0714111328125, 0.08331298828125, 0.09521484375, 0.10711669921875, 0.1190185546875, 0.13092041015625, 0.142822265625, 0.15472412109375, 0.1666259765625, 0.17852783203125, 0.1904296875, 0.20233154296875, 0.2142333984375, 0.22613525390625, 0.238037109375, 0.24993896484375, 0.2618408203125, 0.27374267578125, 0.28564453125, 0.29754638671875, 0.3094482421875, 0.32135009765625, 0.333251953125, 0.34515380859375, 0.3570556640625, 0.36895751953125, 0.380859375, 0.39276123046875, 0.4046630859375, 0.41656494140625, 0.428466796875, 0.44036865234375, 0.4522705078125, 0.46417236328125, 0.47607421875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 10.0, 12.0, 19.0, 31.0, 60.0, 90.0, 174.0, 170.0, 160.0, 99.0, 61.0, 41.0, 26.0, 13.0, 5.0, 7.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.309326171875, -0.2961540222167969, -0.28298187255859375, -0.2698097229003906, -0.2566375732421875, -0.24346542358398438, -0.23029327392578125, -0.21712112426757812, -0.203948974609375, -0.19077682495117188, -0.17760467529296875, -0.16443252563476562, -0.1512603759765625, -0.13808822631835938, -0.12491607666015625, -0.11174392700195312, -0.09857177734375, -0.08539962768554688, -0.07222747802734375, -0.059055328369140625, -0.0458831787109375, -0.032711029052734375, -0.01953887939453125, -0.006366729736328125, 0.006805419921875, 0.019977569580078125, 0.03314971923828125, 0.046321868896484375, 0.0594940185546875, 0.07266616821289062, 0.08583831787109375, 0.09901046752929688, 0.1121826171875, 0.12535476684570312, 0.13852691650390625, 0.15169906616210938, 0.1648712158203125, 0.17804336547851562, 0.19121551513671875, 0.20438766479492188, 0.217559814453125, 0.23073196411132812, 0.24390411376953125, 0.2570762634277344, 0.2702484130859375, 0.2834205627441406, 0.29659271240234375, 0.3097648620605469, 0.32293701171875, 0.3361091613769531, 0.34928131103515625, 0.3624534606933594, 0.3756256103515625, 0.3887977600097656, 0.40196990966796875, 0.4151420593261719, 0.428314208984375, 0.4414863586425781, 0.45465850830078125, 0.4678306579589844, 0.4810028076171875, 0.4941749572753906, 0.5073471069335938, 0.5205192565917969, 0.53369140625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 1.0, 14.0, 12.0, 26.0, 39.0, 63.0, 60.0, 106.0, 116.0, 108.0, 118.0, 91.0, 65.0, 59.0, 38.0, 36.0, 14.0, 8.0, 5.0, 7.0, 2.0, 7.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2200071811676025, -2.1144423484802246, -2.0088772773742676, -1.9033124446868896, -1.7977473735809326, -1.6921825408935547, -1.5866175889968872, -1.4810526371002197, -1.3754876852035522, -1.2699227333068848, -1.1643577814102173, -1.0587928295135498, -0.9532279372215271, -0.8476629853248596, -0.7420980930328369, -0.6365331411361694, -0.530968189239502, -0.4254032373428345, -0.3198383152484894, -0.2142733931541443, -0.1087084412574768, -0.003143489360809326, 0.10242140293121338, 0.20798635482788086, 0.31355130672454834, 0.4191162586212158, 0.5246812105178833, 0.630246102809906, 0.7358110547065735, 0.841376006603241, 0.9469408988952637, 1.0525058507919312, 1.1580710411071777, 1.2636359930038452, 1.3692009449005127, 1.4747657775878906, 1.5803308486938477, 1.6858956813812256, 1.791460633277893, 1.8970255851745605, 2.0025906562805176, 2.1081554889678955, 2.2137205600738525, 2.3192853927612305, 2.4248504638671875, 2.5304152965545654, 2.6359801292419434, 2.7415452003479004, 2.8471100330352783, 2.9526748657226562, 3.0582399368286133, 3.163804769515991, 3.2693698406219482, 3.374934673309326, 3.480499744415283, 3.586064577102661, 3.691629409790039, 3.797194242477417, 3.902759313583374, 4.008324146270752, 4.113889217376709, 4.219454288482666, 4.325018882751465, 4.430583953857422, 4.536149024963379]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 6.0, 9.0, 4.0, 5.0, 11.0, 7.0, 11.0, 12.0, 12.0, 22.0, 23.0, 21.0, 29.0, 27.0, 35.0, 18.0, 36.0, 28.0, 31.0, 32.0, 45.0, 43.0, 43.0, 37.0, 37.0, 42.0, 36.0, 26.0, 34.0, 31.0, 34.0, 28.0, 25.0, 26.0, 22.0, 16.0, 16.0, 19.0, 11.0, 8.0, 8.0, 6.0, 10.0, 3.0, 6.0, 4.0, 5.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-2.161407709121704, -2.0957603454589844, -2.0301132202148438, -1.9644659757614136, -1.8988187313079834, -1.8331713676452637, -1.7675241231918335, -1.7018768787384033, -1.6362296342849731, -1.570582389831543, -1.5049351453781128, -1.4392879009246826, -1.373640537261963, -1.3079934120178223, -1.2423460483551025, -1.1766988039016724, -1.1110515594482422, -1.045404314994812, -0.9797570705413818, -0.9141097664833069, -0.8484625220298767, -0.7828152775764465, -0.7171679735183716, -0.6515207290649414, -0.5858734846115112, -0.520226240158081, -0.4545789659023285, -0.3889316916465759, -0.32328444719314575, -0.2576372027397156, -0.191989928483963, -0.12634265422821045, -0.060695648193359375, 0.004951611161231995, 0.07059887051582336, 0.13624612987041473, 0.2018933892250061, 0.2675406336784363, 0.33318790793418884, 0.3988351821899414, 0.4644824266433716, 0.5301296710968018, 0.5957769155502319, 0.6614242196083069, 0.7270714640617371, 0.7927187085151672, 0.8583660125732422, 0.9240132570266724, 0.9896605014801025, 1.0553077459335327, 1.120954990386963, 1.186602234840393, 1.2522494792938232, 1.317896842956543, 1.3835440874099731, 1.4491913318634033, 1.5148385763168335, 1.5804858207702637, 1.6461330652236938, 1.711780309677124, 1.7774276733398438, 1.8430747985839844, 1.908722162246704, 1.9743694067001343, 2.0400166511535645]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 3.0, 2.0, 5.0, 11.0, 14.0, 20.0, 21.0, 21.0, 41.0, 58.0, 83.0, 121.0, 145.0, 246.0, 392.0, 528.0, 932.0, 1496.0, 2541.0, 4566.0, 8613.0, 16819.0, 34669.0, 76473.0, 183164.0, 520157.0, 1533693.0, 1175696.0, 372673.0, 140654.0, 60898.0, 28664.0, 13926.0, 7402.0, 3783.0, 2253.0, 1291.0, 763.0, 475.0, 322.0, 214.0, 116.0, 92.0, 72.0, 42.0, 25.0, 32.0, 19.0, 10.0, 5.0, 8.0, 5.0, 5.0, 4.0, 2.0, 1.0, 5.0], "bins": [-0.363525390625, -0.3527870178222656, -0.34204864501953125, -0.3313102722167969, -0.3205718994140625, -0.3098335266113281, -0.29909515380859375, -0.2883567810058594, -0.277618408203125, -0.2668800354003906, -0.25614166259765625, -0.24540328979492188, -0.2346649169921875, -0.22392654418945312, -0.21318817138671875, -0.20244979858398438, -0.19171142578125, -0.18097305297851562, -0.17023468017578125, -0.15949630737304688, -0.1487579345703125, -0.13801956176757812, -0.12728118896484375, -0.11654281616210938, -0.105804443359375, -0.09506607055664062, -0.08432769775390625, -0.07358932495117188, -0.0628509521484375, -0.052112579345703125, -0.04137420654296875, -0.030635833740234375, -0.0198974609375, -0.009159088134765625, 0.00157928466796875, 0.012317657470703125, 0.0230560302734375, 0.033794403076171875, 0.04453277587890625, 0.055271148681640625, 0.066009521484375, 0.07674789428710938, 0.08748626708984375, 0.09822463989257812, 0.1089630126953125, 0.11970138549804688, 0.13043975830078125, 0.14117813110351562, 0.15191650390625, 0.16265487670898438, 0.17339324951171875, 0.18413162231445312, 0.1948699951171875, 0.20560836791992188, 0.21634674072265625, 0.22708511352539062, 0.237823486328125, 0.24856185913085938, 0.25930023193359375, 0.2700386047363281, 0.2807769775390625, 0.2915153503417969, 0.30225372314453125, 0.3129920959472656, 0.32373046875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 5.0, 11.0, 10.0, 17.0, 12.0, 21.0, 22.0, 27.0, 32.0, 36.0, 38.0, 40.0, 41.0, 43.0, 47.0, 54.0, 54.0, 46.0, 52.0, 56.0, 39.0, 32.0, 43.0, 36.0, 24.0, 26.0, 15.0, 26.0, 17.0, 15.0, 11.0, 12.0, 8.0, 5.0, 3.0, 6.0, 5.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.31787109375, -0.3083915710449219, -0.29891204833984375, -0.2894325256347656, -0.2799530029296875, -0.2704734802246094, -0.26099395751953125, -0.2515144348144531, -0.242034912109375, -0.23255538940429688, -0.22307586669921875, -0.21359634399414062, -0.2041168212890625, -0.19463729858398438, -0.18515777587890625, -0.17567825317382812, -0.16619873046875, -0.15671920776367188, -0.14723968505859375, -0.13776016235351562, -0.1282806396484375, -0.11880111694335938, -0.10932159423828125, -0.09984207153320312, -0.090362548828125, -0.08088302612304688, -0.07140350341796875, -0.061923980712890625, -0.0524444580078125, -0.042964935302734375, -0.03348541259765625, -0.024005889892578125, -0.0145263671875, -0.005046844482421875, 0.00443267822265625, 0.013912200927734375, 0.0233917236328125, 0.032871246337890625, 0.04235076904296875, 0.051830291748046875, 0.061309814453125, 0.07078933715820312, 0.08026885986328125, 0.08974838256835938, 0.0992279052734375, 0.10870742797851562, 0.11818695068359375, 0.12766647338867188, 0.13714599609375, 0.14662551879882812, 0.15610504150390625, 0.16558456420898438, 0.1750640869140625, 0.18454360961914062, 0.19402313232421875, 0.20350265502929688, 0.212982177734375, 0.22246170043945312, 0.23194122314453125, 0.24142074584960938, 0.2509002685546875, 0.2603797912597656, 0.26985931396484375, 0.2793388366699219, 0.288818359375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 9.0, 10.0, 7.0, 16.0, 17.0, 22.0, 33.0, 72.0, 83.0, 127.0, 183.0, 283.0, 495.0, 842.0, 1653.0, 3791.0, 12944.0, 70616.0, 600743.0, 3112098.0, 330262.0, 44472.0, 9287.0, 2946.0, 1353.0, 740.0, 353.0, 281.0, 174.0, 123.0, 76.0, 55.0, 49.0, 21.0, 18.0, 10.0, 6.0, 5.0, 5.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0419921875, -1.0076904296875, -0.973388671875, -0.9390869140625, -0.90478515625, -0.8704833984375, -0.836181640625, -0.8018798828125, -0.767578125, -0.7332763671875, -0.698974609375, -0.6646728515625, -0.63037109375, -0.5960693359375, -0.561767578125, -0.5274658203125, -0.4931640625, -0.4588623046875, -0.424560546875, -0.3902587890625, -0.35595703125, -0.3216552734375, -0.287353515625, -0.2530517578125, -0.21875, -0.1844482421875, -0.150146484375, -0.1158447265625, -0.08154296875, -0.0472412109375, -0.012939453125, 0.0213623046875, 0.0556640625, 0.0899658203125, 0.124267578125, 0.1585693359375, 0.19287109375, 0.2271728515625, 0.261474609375, 0.2957763671875, 0.330078125, 0.3643798828125, 0.398681640625, 0.4329833984375, 0.46728515625, 0.5015869140625, 0.535888671875, 0.5701904296875, 0.6044921875, 0.6387939453125, 0.673095703125, 0.7073974609375, 0.74169921875, 0.7760009765625, 0.810302734375, 0.8446044921875, 0.87890625, 0.9132080078125, 0.947509765625, 0.9818115234375, 1.01611328125, 1.0504150390625, 1.084716796875, 1.1190185546875, 1.1533203125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 6.0, 2.0, 10.0, 15.0, 19.0, 34.0, 54.0, 100.0, 149.0, 219.0, 452.0, 943.0, 1005.0, 447.0, 261.0, 147.0, 73.0, 62.0, 31.0, 20.0, 9.0, 9.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.130859375, -1.09442138671875, -1.0579833984375, -1.02154541015625, -0.985107421875, -0.94866943359375, -0.9122314453125, -0.87579345703125, -0.83935546875, -0.80291748046875, -0.7664794921875, -0.73004150390625, -0.693603515625, -0.65716552734375, -0.6207275390625, -0.58428955078125, -0.5478515625, -0.51141357421875, -0.4749755859375, -0.43853759765625, -0.402099609375, -0.36566162109375, -0.3292236328125, -0.29278564453125, -0.25634765625, -0.21990966796875, -0.1834716796875, -0.14703369140625, -0.110595703125, -0.07415771484375, -0.0377197265625, -0.00128173828125, 0.03515625, 0.07159423828125, 0.1080322265625, 0.14447021484375, 0.180908203125, 0.21734619140625, 0.2537841796875, 0.29022216796875, 0.32666015625, 0.36309814453125, 0.3995361328125, 0.43597412109375, 0.472412109375, 0.50885009765625, 0.5452880859375, 0.58172607421875, 0.6181640625, 0.65460205078125, 0.6910400390625, 0.72747802734375, 0.763916015625, 0.80035400390625, 0.8367919921875, 0.87322998046875, 0.90966796875, 0.94610595703125, 0.9825439453125, 1.01898193359375, 1.055419921875, 1.09185791015625, 1.1282958984375, 1.16473388671875, 1.201171875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 3.0, 2.0, 6.0, 13.0, 20.0, 50.0, 47.0, 101.0, 122.0, 131.0, 163.0, 119.0, 80.0, 66.0, 36.0, 14.0, 12.0, 7.0, 6.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.914224624633789, -4.7564802169799805, -4.59873628616333, -4.4409918785095215, -4.283247947692871, -4.1255035400390625, -3.967759370803833, -3.8100152015686035, -3.652271032333374, -3.4945268630981445, -3.336782693862915, -3.1790385246276855, -3.021294116973877, -2.8635501861572266, -2.705805778503418, -2.5480616092681885, -2.390317440032959, -2.2325732707977295, -2.0748291015625, -1.917084813117981, -1.7593406438827515, -1.601596474647522, -1.443852186203003, -1.2861080169677734, -1.128363847732544, -0.9706196784973145, -0.8128754496574402, -0.6551312208175659, -0.4973870515823364, -0.33964288234710693, -0.18189865350723267, -0.0241544246673584, 0.1335892677307129, 0.29133346676826477, 0.44907766580581665, 0.6068218946456909, 0.7645660638809204, 0.9223102331161499, 1.080054521560669, 1.2377986907958984, 1.395542860031128, 1.5532870292663574, 1.711031198501587, 1.868775486946106, 2.026519775390625, 2.1842637062072754, 2.342008113861084, 2.4997522830963135, 2.657496452331543, 2.8152406215667725, 2.972984790802002, 3.1307289600372314, 3.288473129272461, 3.4462175369262695, 3.603961706161499, 3.7617058753967285, 3.919450044631958, 4.0771942138671875, 4.234938621520996, 4.3926825523376465, 4.550426959991455, 4.7081708908081055, 4.865915298461914, 5.023659706115723, 5.181403636932373]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 8.0, 3.0, 5.0, 8.0, 7.0, 8.0, 14.0, 15.0, 20.0, 27.0, 15.0, 24.0, 26.0, 24.0, 31.0, 32.0, 34.0, 37.0, 38.0, 33.0, 42.0, 35.0, 32.0, 31.0, 40.0, 40.0, 29.0, 42.0, 43.0, 22.0, 29.0, 25.0, 29.0, 24.0, 25.0, 24.0, 17.0, 10.0, 17.0, 13.0, 6.0, 5.0, 4.0, 5.0, 3.0, 3.0, 1.0, 2.0, 2.0, 3.0], "bins": [-2.5704305171966553, -2.4997072219848633, -2.4289839267730713, -2.3582606315612793, -2.2875373363494873, -2.2168140411376953, -2.1460907459259033, -2.0753674507141113, -2.0046443939208984, -1.9339210987091064, -1.8631978034973145, -1.7924745082855225, -1.7217512130737305, -1.6510279178619385, -1.580304741859436, -1.509581446647644, -1.4388580322265625, -1.3681347370147705, -1.2974114418029785, -1.2266881465911865, -1.1559648513793945, -1.0852415561676025, -1.0145183801651, -0.9437950849533081, -0.8730717897415161, -0.8023484945297241, -0.7316251993179321, -0.6609019637107849, -0.5901786684989929, -0.5194553732872009, -0.4487321078777313, -0.3780088424682617, -0.3072856664657593, -0.23656238615512848, -0.16583910584449768, -0.09511582553386688, -0.024392545223236084, 0.04633074998855591, 0.11705401539802551, 0.18777728080749512, 0.2585005760192871, 0.3292238712310791, 0.3999471366405487, 0.4706704020500183, 0.5413936972618103, 0.6121169924736023, 0.6828402280807495, 0.7535635232925415, 0.8242868185043335, 0.8950101137161255, 0.9657334089279175, 1.0364567041397095, 1.107179880142212, 1.177903175354004, 1.248626470565796, 1.319349765777588, 1.3900730609893799, 1.4607963562011719, 1.5315196514129639, 1.6022429466247559, 1.6729662418365479, 1.7436895370483398, 1.8144127130508423, 1.8851360082626343, 1.9558593034744263]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 6.0, 0.0, 1.0, 6.0, 5.0, 6.0, 7.0, 14.0, 19.0, 33.0, 31.0, 57.0, 90.0, 131.0, 177.0, 264.0, 437.0, 572.0, 963.0, 1447.0, 2188.0, 3273.0, 4991.0, 7489.0, 11428.0, 18199.0, 31785.0, 81146.0, 286734.0, 373161.0, 123547.0, 40368.0, 21050.0, 13318.0, 8647.0, 5801.0, 3680.0, 2488.0, 1728.0, 1112.0, 746.0, 472.0, 290.0, 218.0, 160.0, 96.0, 60.0, 36.0, 27.0, 25.0, 20.0, 6.0, 7.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.47705078125, -0.46123504638671875, -0.4454193115234375, -0.42960357666015625, -0.413787841796875, -0.39797210693359375, -0.3821563720703125, -0.36634063720703125, -0.35052490234375, -0.33470916748046875, -0.3188934326171875, -0.30307769775390625, -0.287261962890625, -0.27144622802734375, -0.2556304931640625, -0.23981475830078125, -0.2239990234375, -0.20818328857421875, -0.1923675537109375, -0.17655181884765625, -0.160736083984375, -0.14492034912109375, -0.1291046142578125, -0.11328887939453125, -0.09747314453125, -0.08165740966796875, -0.0658416748046875, -0.05002593994140625, -0.034210205078125, -0.01839447021484375, -0.0025787353515625, 0.01323699951171875, 0.029052734375, 0.04486846923828125, 0.0606842041015625, 0.07649993896484375, 0.092315673828125, 0.10813140869140625, 0.1239471435546875, 0.13976287841796875, 0.15557861328125, 0.17139434814453125, 0.1872100830078125, 0.20302581787109375, 0.218841552734375, 0.23465728759765625, 0.2504730224609375, 0.26628875732421875, 0.2821044921875, 0.29792022705078125, 0.3137359619140625, 0.32955169677734375, 0.345367431640625, 0.36118316650390625, 0.3769989013671875, 0.39281463623046875, 0.40863037109375, 0.42444610595703125, 0.4402618408203125, 0.45607757568359375, 0.471893310546875, 0.48770904541015625, 0.5035247802734375, 0.5193405151367188, 0.53515625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 9.0, 6.0, 8.0, 10.0, 11.0, 8.0, 15.0, 19.0, 25.0, 13.0, 23.0, 33.0, 26.0, 34.0, 25.0, 38.0, 35.0, 40.0, 58.0, 45.0, 37.0, 45.0, 44.0, 42.0, 32.0, 41.0, 40.0, 27.0, 30.0, 29.0, 31.0, 30.0, 24.0, 8.0, 18.0, 13.0, 7.0, 6.0, 5.0, 3.0, 4.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.297119140625, -0.2884674072265625, -0.279815673828125, -0.2711639404296875, -0.26251220703125, -0.2538604736328125, -0.245208740234375, -0.2365570068359375, -0.2279052734375, -0.2192535400390625, -0.210601806640625, -0.2019500732421875, -0.19329833984375, -0.1846466064453125, -0.175994873046875, -0.1673431396484375, -0.15869140625, -0.1500396728515625, -0.141387939453125, -0.1327362060546875, -0.12408447265625, -0.1154327392578125, -0.106781005859375, -0.0981292724609375, -0.0894775390625, -0.0808258056640625, -0.072174072265625, -0.0635223388671875, -0.05487060546875, -0.0462188720703125, -0.037567138671875, -0.0289154052734375, -0.020263671875, -0.0116119384765625, -0.002960205078125, 0.0056915283203125, 0.01434326171875, 0.0229949951171875, 0.031646728515625, 0.0402984619140625, 0.0489501953125, 0.0576019287109375, 0.066253662109375, 0.0749053955078125, 0.08355712890625, 0.0922088623046875, 0.100860595703125, 0.1095123291015625, 0.1181640625, 0.1268157958984375, 0.135467529296875, 0.1441192626953125, 0.15277099609375, 0.1614227294921875, 0.170074462890625, 0.1787261962890625, 0.1873779296875, 0.1960296630859375, 0.204681396484375, 0.2133331298828125, 0.22198486328125, 0.2306365966796875, 0.239288330078125, 0.2479400634765625, 0.256591796875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 3.0, 6.0, 11.0, 5.0, 14.0, 16.0, 29.0, 26.0, 28.0, 58.0, 113.0, 163.0, 296.0, 539.0, 996.0, 1944.0, 4334.0, 9959.0, 24405.0, 87215.0, 672260.0, 188262.0, 33755.0, 13158.0, 5616.0, 2565.0, 1235.0, 637.0, 348.0, 188.0, 111.0, 85.0, 64.0, 29.0, 21.0, 14.0, 9.0, 11.0, 8.0, 9.0, 4.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0087890625, -0.9769287109375, -0.945068359375, -0.9132080078125, -0.88134765625, -0.8494873046875, -0.817626953125, -0.7857666015625, -0.75390625, -0.7220458984375, -0.690185546875, -0.6583251953125, -0.62646484375, -0.5946044921875, -0.562744140625, -0.5308837890625, -0.4990234375, -0.4671630859375, -0.435302734375, -0.4034423828125, -0.37158203125, -0.3397216796875, -0.307861328125, -0.2760009765625, -0.244140625, -0.2122802734375, -0.180419921875, -0.1485595703125, -0.11669921875, -0.0848388671875, -0.052978515625, -0.0211181640625, 0.0107421875, 0.0426025390625, 0.074462890625, 0.1063232421875, 0.13818359375, 0.1700439453125, 0.201904296875, 0.2337646484375, 0.265625, 0.2974853515625, 0.329345703125, 0.3612060546875, 0.39306640625, 0.4249267578125, 0.456787109375, 0.4886474609375, 0.5205078125, 0.5523681640625, 0.584228515625, 0.6160888671875, 0.64794921875, 0.6798095703125, 0.711669921875, 0.7435302734375, 0.775390625, 0.8072509765625, 0.839111328125, 0.8709716796875, 0.90283203125, 0.9346923828125, 0.966552734375, 0.9984130859375, 1.0302734375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 6.0, 3.0, 7.0, 8.0, 13.0, 13.0, 18.0, 24.0, 27.0, 28.0, 33.0, 40.0, 40.0, 49.0, 39.0, 41.0, 40.0, 43.0, 51.0, 31.0, 45.0, 45.0, 46.0, 38.0, 37.0, 28.0, 39.0, 34.0, 20.0, 21.0, 14.0, 16.0, 12.0, 8.0, 8.0, 10.0, 4.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.94970703125, -0.92108154296875, -0.8924560546875, -0.86383056640625, -0.835205078125, -0.80657958984375, -0.7779541015625, -0.74932861328125, -0.720703125, -0.69207763671875, -0.6634521484375, -0.63482666015625, -0.606201171875, -0.57757568359375, -0.5489501953125, -0.52032470703125, -0.49169921875, -0.46307373046875, -0.4344482421875, -0.40582275390625, -0.377197265625, -0.34857177734375, -0.3199462890625, -0.29132080078125, -0.2626953125, -0.23406982421875, -0.2054443359375, -0.17681884765625, -0.148193359375, -0.11956787109375, -0.0909423828125, -0.06231689453125, -0.03369140625, -0.00506591796875, 0.0235595703125, 0.05218505859375, 0.080810546875, 0.10943603515625, 0.1380615234375, 0.16668701171875, 0.1953125, 0.22393798828125, 0.2525634765625, 0.28118896484375, 0.309814453125, 0.33843994140625, 0.3670654296875, 0.39569091796875, 0.42431640625, 0.45294189453125, 0.4815673828125, 0.51019287109375, 0.538818359375, 0.56744384765625, 0.5960693359375, 0.62469482421875, 0.6533203125, 0.68194580078125, 0.7105712890625, 0.73919677734375, 0.767822265625, 0.79644775390625, 0.8250732421875, 0.85369873046875, 0.88232421875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 5.0, 5.0, 11.0, 9.0, 9.0, 16.0, 29.0, 58.0, 57.0, 129.0, 209.0, 337.0, 537.0, 1018.0, 1764.0, 3157.0, 5580.0, 9981.0, 18624.0, 38521.0, 98754.0, 373761.0, 332494.0, 88629.0, 35526.0, 17613.0, 9427.0, 5233.0, 2969.0, 1732.0, 989.0, 571.0, 332.0, 187.0, 105.0, 60.0, 45.0, 25.0, 19.0, 11.0, 6.0, 6.0, 3.0, 8.0, 4.0, 2.0, 1.0], "bins": [-0.3037109375, -0.2959136962890625, -0.288116455078125, -0.2803192138671875, -0.27252197265625, -0.2647247314453125, -0.256927490234375, -0.2491302490234375, -0.2413330078125, -0.2335357666015625, -0.225738525390625, -0.2179412841796875, -0.21014404296875, -0.2023468017578125, -0.194549560546875, -0.1867523193359375, -0.178955078125, -0.1711578369140625, -0.163360595703125, -0.1555633544921875, -0.14776611328125, -0.1399688720703125, -0.132171630859375, -0.1243743896484375, -0.1165771484375, -0.1087799072265625, -0.100982666015625, -0.0931854248046875, -0.08538818359375, -0.0775909423828125, -0.069793701171875, -0.0619964599609375, -0.05419921875, -0.0464019775390625, -0.038604736328125, -0.0308074951171875, -0.02301025390625, -0.0152130126953125, -0.007415771484375, 0.0003814697265625, 0.0081787109375, 0.0159759521484375, 0.023773193359375, 0.0315704345703125, 0.03936767578125, 0.0471649169921875, 0.054962158203125, 0.0627593994140625, 0.070556640625, 0.0783538818359375, 0.086151123046875, 0.0939483642578125, 0.10174560546875, 0.1095428466796875, 0.117340087890625, 0.1251373291015625, 0.1329345703125, 0.1407318115234375, 0.148529052734375, 0.1563262939453125, 0.16412353515625, 0.1719207763671875, 0.179718017578125, 0.1875152587890625, 0.1953125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 0.0, 2.0, 2.0, 7.0, 1.0, 4.0, 3.0, 11.0, 17.0, 10.0, 16.0, 18.0, 30.0, 63.0, 99.0, 184.0, 162.0, 138.0, 64.0, 40.0, 34.0, 16.0, 15.0, 7.0, 17.0, 8.0, 6.0, 7.0, 4.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 5.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.179115295410156e-05, -8.88630747795105e-05, -8.593499660491943e-05, -8.300691843032837e-05, -8.00788402557373e-05, -7.715076208114624e-05, -7.422268390655518e-05, -7.129460573196411e-05, -6.836652755737305e-05, -6.543844938278198e-05, -6.251037120819092e-05, -5.9582293033599854e-05, -5.665421485900879e-05, -5.3726136684417725e-05, -5.079805850982666e-05, -4.7869980335235596e-05, -4.494190216064453e-05, -4.201382398605347e-05, -3.90857458114624e-05, -3.615766763687134e-05, -3.3229589462280273e-05, -3.030151128768921e-05, -2.7373433113098145e-05, -2.444535493850708e-05, -2.1517276763916016e-05, -1.858919858932495e-05, -1.5661120414733887e-05, -1.2733042240142822e-05, -9.804964065551758e-06, -6.876885890960693e-06, -3.948807716369629e-06, -1.0207295417785645e-06, 1.9073486328125e-06, 4.8354268074035645e-06, 7.763504981994629e-06, 1.0691583156585693e-05, 1.3619661331176758e-05, 1.6547739505767822e-05, 1.9475817680358887e-05, 2.240389585494995e-05, 2.5331974029541016e-05, 2.826005220413208e-05, 3.1188130378723145e-05, 3.411620855331421e-05, 3.7044286727905273e-05, 3.997236490249634e-05, 4.29004430770874e-05, 4.582852125167847e-05, 4.875659942626953e-05, 5.1684677600860596e-05, 5.461275577545166e-05, 5.7540833950042725e-05, 6.046891212463379e-05, 6.339699029922485e-05, 6.632506847381592e-05, 6.925314664840698e-05, 7.218122482299805e-05, 7.510930299758911e-05, 7.803738117218018e-05, 8.096545934677124e-05, 8.38935375213623e-05, 8.682161569595337e-05, 8.974969387054443e-05, 9.26777720451355e-05, 9.560585021972656e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 2.0, 9.0, 7.0, 16.0, 15.0, 28.0, 42.0, 75.0, 95.0, 155.0, 265.0, 482.0, 889.0, 1871.0, 4164.0, 9768.0, 23799.0, 63714.0, 227406.0, 472475.0, 160512.0, 49231.0, 18956.0, 7996.0, 3362.0, 1491.0, 702.0, 380.0, 238.0, 127.0, 94.0, 74.0, 38.0, 15.0, 25.0, 13.0, 4.0, 7.0, 6.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.287841796875, -0.2797050476074219, -0.27156829833984375, -0.2634315490722656, -0.2552947998046875, -0.24715805053710938, -0.23902130126953125, -0.23088455200195312, -0.222747802734375, -0.21461105346679688, -0.20647430419921875, -0.19833755493164062, -0.1902008056640625, -0.18206405639648438, -0.17392730712890625, -0.16579055786132812, -0.15765380859375, -0.14951705932617188, -0.14138031005859375, -0.13324356079101562, -0.1251068115234375, -0.11697006225585938, -0.10883331298828125, -0.10069656372070312, -0.092559814453125, -0.08442306518554688, -0.07628631591796875, -0.06814956665039062, -0.0600128173828125, -0.051876068115234375, -0.04373931884765625, -0.035602569580078125, -0.0274658203125, -0.019329071044921875, -0.01119232177734375, -0.003055572509765625, 0.0050811767578125, 0.013217926025390625, 0.02135467529296875, 0.029491424560546875, 0.037628173828125, 0.045764923095703125, 0.05390167236328125, 0.062038421630859375, 0.0701751708984375, 0.07831192016601562, 0.08644866943359375, 0.09458541870117188, 0.10272216796875, 0.11085891723632812, 0.11899566650390625, 0.12713241577148438, 0.1352691650390625, 0.14340591430664062, 0.15154266357421875, 0.15967941284179688, 0.167816162109375, 0.17595291137695312, 0.18408966064453125, 0.19222640991210938, 0.2003631591796875, 0.20849990844726562, 0.21663665771484375, 0.22477340698242188, 0.23291015625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 2.0, 1.0, 7.0, 4.0, 4.0, 5.0, 19.0, 10.0, 19.0, 18.0, 31.0, 41.0, 47.0, 49.0, 93.0, 98.0, 123.0, 91.0, 73.0, 63.0, 39.0, 44.0, 19.0, 22.0, 21.0, 12.0, 12.0, 6.0, 9.0, 3.0, 5.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.257080078125, -0.24859237670898438, -0.24010467529296875, -0.23161697387695312, -0.2231292724609375, -0.21464157104492188, -0.20615386962890625, -0.19766616821289062, -0.189178466796875, -0.18069076538085938, -0.17220306396484375, -0.16371536254882812, -0.1552276611328125, -0.14673995971679688, -0.13825225830078125, -0.12976455688476562, -0.12127685546875, -0.11278915405273438, -0.10430145263671875, -0.09581375122070312, -0.0873260498046875, -0.07883834838867188, -0.07035064697265625, -0.061862945556640625, -0.053375244140625, -0.044887542724609375, -0.03639984130859375, -0.027912139892578125, -0.0194244384765625, -0.010936737060546875, -0.00244903564453125, 0.006038665771484375, 0.0145263671875, 0.023014068603515625, 0.03150177001953125, 0.039989471435546875, 0.0484771728515625, 0.056964874267578125, 0.06545257568359375, 0.07394027709960938, 0.082427978515625, 0.09091567993164062, 0.09940338134765625, 0.10789108276367188, 0.1163787841796875, 0.12486648559570312, 0.13335418701171875, 0.14184188842773438, 0.15032958984375, 0.15881729125976562, 0.16730499267578125, 0.17579269409179688, 0.1842803955078125, 0.19276809692382812, 0.20125579833984375, 0.20974349975585938, 0.218231201171875, 0.22671890258789062, 0.23520660400390625, 0.24369430541992188, 0.2521820068359375, 0.2606697082519531, 0.26915740966796875, 0.2776451110839844, 0.2861328125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 13.0, 26.0, 53.0, 116.0, 164.0, 230.0, 186.0, 106.0, 57.0, 19.0, 10.0, 7.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.969951629638672, -8.759028434753418, -8.548105239868164, -8.337182998657227, -8.126259803771973, -7.915336608886719, -7.704413890838623, -7.493491172790527, -7.282567977905273, -7.0716447830200195, -6.860722064971924, -6.649799346923828, -6.438876152038574, -6.22795295715332, -6.017030239105225, -5.806107521057129, -5.595184326171875, -5.384261131286621, -5.173338413238525, -4.96241569519043, -4.751492500305176, -4.540569305419922, -4.329646587371826, -4.1187238693237305, -3.9078006744384766, -3.6968777179718018, -3.485954761505127, -3.275031805038452, -3.0641088485717773, -2.8531858921051025, -2.6422629356384277, -2.431339979171753, -2.220417022705078, -2.0094940662384033, -1.7985711097717285, -1.5876481533050537, -1.376725196838379, -1.165802240371704, -0.9548792839050293, -0.7439563274383545, -0.5330333709716797, -0.3221104145050049, -0.11118745803833008, 0.09973549842834473, 0.31065845489501953, 0.5215814113616943, 0.7325043678283691, 0.943427324295044, 1.1543502807617188, 1.3652732372283936, 1.5761961936950684, 1.7871191501617432, 1.998042106628418, 2.2089650630950928, 2.4198880195617676, 2.6308109760284424, 2.841733932495117, 3.052656888961792, 3.263579845428467, 3.4745028018951416, 3.6854257583618164, 3.896348714828491, 4.107271671295166, 4.318194389343262, 4.529117584228516]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 7.0, 5.0, 9.0, 12.0, 17.0, 12.0, 15.0, 26.0, 30.0, 27.0, 33.0, 27.0, 47.0, 33.0, 47.0, 55.0, 54.0, 45.0, 44.0, 40.0, 44.0, 50.0, 37.0, 36.0, 34.0, 35.0, 25.0, 29.0, 21.0, 26.0, 21.0, 16.0, 14.0, 13.0, 6.0, 9.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.495077133178711, -2.41534423828125, -2.335611581802368, -2.2558786869049072, -2.1761457920074463, -2.0964131355285645, -2.0166802406311035, -1.9369473457336426, -1.8572145700454712, -1.7774817943572998, -1.6977488994598389, -1.6180161237716675, -1.538283348083496, -1.4585504531860352, -1.3788176774978638, -1.2990849018096924, -1.2193520069122314, -1.13961923122406, -1.0598863363265991, -0.9801535606384277, -0.9004207253456116, -0.8206878900527954, -0.740955114364624, -0.6612222790718079, -0.5814894437789917, -0.5017566084861755, -0.42202380299568176, -0.342290997505188, -0.2625581622123718, -0.18282532691955566, -0.10309252142906189, -0.023359715938568115, 0.05637335777282715, 0.13610617816448212, 0.21583899855613708, 0.29557180404663086, 0.375304639339447, 0.4550374746322632, 0.5347702503204346, 0.6145030856132507, 0.6942359209060669, 0.7739687561988831, 0.8537015914916992, 0.9334343671798706, 1.013167142868042, 1.092900037765503, 1.1726328134536743, 1.2523655891418457, 1.3320984840393066, 1.411831259727478, 1.491564154624939, 1.5712969303131104, 1.6510298252105713, 1.7307626008987427, 1.810495376586914, 1.890228271484375, 1.9699610471725464, 2.0496938228607178, 2.1294267177581787, 2.2091596126556396, 2.2888922691345215, 2.3686251640319824, 2.4483580589294434, 2.528090715408325, 2.607823610305786]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 3.0, 9.0, 9.0, 10.0, 17.0, 24.0, 25.0, 49.0, 81.0, 104.0, 151.0, 218.0, 354.0, 561.0, 896.0, 1340.0, 2303.0, 3968.0, 7128.0, 13173.0, 26757.0, 56269.0, 126052.0, 317089.0, 886374.0, 1512754.0, 755886.0, 272695.0, 110375.0, 49118.0, 23488.0, 11685.0, 6139.0, 3543.0, 2117.0, 1259.0, 775.0, 480.0, 304.0, 222.0, 162.0, 97.0, 73.0, 45.0, 31.0, 23.0, 15.0, 9.0, 10.0, 8.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0], "bins": [-0.3564453125, -0.3457794189453125, -0.335113525390625, -0.3244476318359375, -0.31378173828125, -0.3031158447265625, -0.292449951171875, -0.2817840576171875, -0.2711181640625, -0.2604522705078125, -0.249786376953125, -0.2391204833984375, -0.22845458984375, -0.2177886962890625, -0.207122802734375, -0.1964569091796875, -0.185791015625, -0.1751251220703125, -0.164459228515625, -0.1537933349609375, -0.14312744140625, -0.1324615478515625, -0.121795654296875, -0.1111297607421875, -0.1004638671875, -0.0897979736328125, -0.079132080078125, -0.0684661865234375, -0.05780029296875, -0.0471343994140625, -0.036468505859375, -0.0258026123046875, -0.01513671875, -0.0044708251953125, 0.006195068359375, 0.0168609619140625, 0.02752685546875, 0.0381927490234375, 0.048858642578125, 0.0595245361328125, 0.0701904296875, 0.0808563232421875, 0.091522216796875, 0.1021881103515625, 0.11285400390625, 0.1235198974609375, 0.134185791015625, 0.1448516845703125, 0.155517578125, 0.1661834716796875, 0.176849365234375, 0.1875152587890625, 0.19818115234375, 0.2088470458984375, 0.219512939453125, 0.2301788330078125, 0.2408447265625, 0.2515106201171875, 0.262176513671875, 0.2728424072265625, 0.28350830078125, 0.2941741943359375, 0.304840087890625, 0.3155059814453125, 0.326171875]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 3.0, 3.0, 5.0, 3.0, 2.0, 7.0, 9.0, 9.0, 16.0, 21.0, 22.0, 14.0, 20.0, 28.0, 19.0, 29.0, 30.0, 33.0, 38.0, 31.0, 48.0, 42.0, 35.0, 41.0, 33.0, 37.0, 44.0, 37.0, 37.0, 43.0, 38.0, 31.0, 20.0, 23.0, 32.0, 23.0, 10.0, 14.0, 9.0, 15.0, 14.0, 6.0, 9.0, 8.0, 3.0, 3.0, 1.0, 7.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.258056640625, -0.24997711181640625, -0.2418975830078125, -0.23381805419921875, -0.225738525390625, -0.21765899658203125, -0.2095794677734375, -0.20149993896484375, -0.19342041015625, -0.18534088134765625, -0.1772613525390625, -0.16918182373046875, -0.161102294921875, -0.15302276611328125, -0.1449432373046875, -0.13686370849609375, -0.1287841796875, -0.12070465087890625, -0.1126251220703125, -0.10454559326171875, -0.096466064453125, -0.08838653564453125, -0.0803070068359375, -0.07222747802734375, -0.06414794921875, -0.05606842041015625, -0.0479888916015625, -0.03990936279296875, -0.031829833984375, -0.02375030517578125, -0.0156707763671875, -0.00759124755859375, 0.00048828125, 0.00856781005859375, 0.0166473388671875, 0.02472686767578125, 0.032806396484375, 0.04088592529296875, 0.0489654541015625, 0.05704498291015625, 0.06512451171875, 0.07320404052734375, 0.0812835693359375, 0.08936309814453125, 0.097442626953125, 0.10552215576171875, 0.1136016845703125, 0.12168121337890625, 0.1297607421875, 0.13784027099609375, 0.1459197998046875, 0.15399932861328125, 0.162078857421875, 0.17015838623046875, 0.1782379150390625, 0.18631744384765625, 0.19439697265625, 0.20247650146484375, 0.2105560302734375, 0.21863555908203125, 0.226715087890625, 0.23479461669921875, 0.2428741455078125, 0.25095367431640625, 0.259033203125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 7.0, 9.0, 11.0, 20.0, 33.0, 41.0, 79.0, 143.0, 252.0, 527.0, 1160.0, 2645.0, 7002.0, 27249.0, 186815.0, 2501102.0, 1327537.0, 111028.0, 18836.0, 5588.0, 2195.0, 1022.0, 434.0, 223.0, 140.0, 70.0, 43.0, 29.0, 16.0, 12.0, 10.0, 3.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.27734375, -1.238494873046875, -1.19964599609375, -1.160797119140625, -1.1219482421875, -1.083099365234375, -1.04425048828125, -1.005401611328125, -0.966552734375, -0.927703857421875, -0.88885498046875, -0.850006103515625, -0.8111572265625, -0.772308349609375, -0.73345947265625, -0.694610595703125, -0.65576171875, -0.616912841796875, -0.57806396484375, -0.539215087890625, -0.5003662109375, -0.461517333984375, -0.42266845703125, -0.383819580078125, -0.344970703125, -0.306121826171875, -0.26727294921875, -0.228424072265625, -0.1895751953125, -0.150726318359375, -0.11187744140625, -0.073028564453125, -0.0341796875, 0.004669189453125, 0.04351806640625, 0.082366943359375, 0.1212158203125, 0.160064697265625, 0.19891357421875, 0.237762451171875, 0.276611328125, 0.315460205078125, 0.35430908203125, 0.393157958984375, 0.4320068359375, 0.470855712890625, 0.50970458984375, 0.548553466796875, 0.58740234375, 0.626251220703125, 0.66510009765625, 0.703948974609375, 0.7427978515625, 0.781646728515625, 0.82049560546875, 0.859344482421875, 0.898193359375, 0.937042236328125, 0.97589111328125, 1.014739990234375, 1.0535888671875, 1.092437744140625, 1.13128662109375, 1.170135498046875, 1.208984375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 8.0, 4.0, 6.0, 12.0, 14.0, 28.0, 39.0, 88.0, 94.0, 153.0, 252.0, 460.0, 751.0, 824.0, 495.0, 298.0, 206.0, 116.0, 62.0, 54.0, 38.0, 26.0, 18.0, 9.0, 9.0, 1.0, 3.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0625, -1.0283966064453125, -0.994293212890625, -0.9601898193359375, -0.92608642578125, -0.8919830322265625, -0.857879638671875, -0.8237762451171875, -0.7896728515625, -0.7555694580078125, -0.721466064453125, -0.6873626708984375, -0.65325927734375, -0.6191558837890625, -0.585052490234375, -0.5509490966796875, -0.516845703125, -0.4827423095703125, -0.448638916015625, -0.4145355224609375, -0.38043212890625, -0.3463287353515625, -0.312225341796875, -0.2781219482421875, -0.2440185546875, -0.2099151611328125, -0.175811767578125, -0.1417083740234375, -0.10760498046875, -0.0735015869140625, -0.039398193359375, -0.0052947998046875, 0.02880859375, 0.0629119873046875, 0.097015380859375, 0.1311187744140625, 0.16522216796875, 0.1993255615234375, 0.233428955078125, 0.2675323486328125, 0.3016357421875, 0.3357391357421875, 0.369842529296875, 0.4039459228515625, 0.43804931640625, 0.4721527099609375, 0.506256103515625, 0.5403594970703125, 0.574462890625, 0.6085662841796875, 0.642669677734375, 0.6767730712890625, 0.71087646484375, 0.7449798583984375, 0.779083251953125, 0.8131866455078125, 0.8472900390625, 0.8813934326171875, 0.915496826171875, 0.9496002197265625, 0.98370361328125, 1.0178070068359375, 1.051910400390625, 1.0860137939453125, 1.1201171875]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 11.0, 26.0, 96.0, 242.0, 355.0, 183.0, 68.0, 17.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.080930709838867, -14.666093826293945, -14.25125789642334, -13.836421012878418, -13.421585083007812, -13.00674819946289, -12.591911315917969, -12.177074432373047, -11.762238502502441, -11.34740161895752, -10.932565689086914, -10.517728805541992, -10.10289192199707, -9.688055992126465, -9.273219108581543, -8.858383178710938, -8.443546295166016, -8.028709411621094, -7.613873481750488, -7.199036598205566, -6.784200191497803, -6.369363784790039, -5.954526901245117, -5.5396904945373535, -5.12485408782959, -4.710017681121826, -4.2951812744140625, -3.8803443908691406, -3.465507984161377, -3.0506715774536133, -2.6358349323272705, -2.2209982872009277, -1.8061609268188477, -1.3913244009017944, -0.9764878749847412, -0.561651349067688, -0.14681482315063477, 0.2680215835571289, 0.6828582286834717, 1.0976948738098145, 1.5125312805175781, 1.9273678064346313, 2.3422043323516846, 2.7570409774780273, 3.171877384185791, 3.5867137908935547, 4.001550674438477, 4.41638708114624, 4.831223487854004, 5.246059894561768, 5.660896301269531, 6.075733184814453, 6.490569591522217, 6.9054059982299805, 7.320242881774902, 7.735079288482666, 8.14991569519043, 8.564752578735352, 8.979588508605957, 9.394425392150879, 9.809261322021484, 10.224098205566406, 10.638935089111328, 11.05377197265625, 11.468607902526855]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 1.0, 5.0, 6.0, 15.0, 9.0, 8.0, 9.0, 11.0, 17.0, 17.0, 16.0, 18.0, 21.0, 30.0, 36.0, 22.0, 37.0, 31.0, 28.0, 34.0, 24.0, 37.0, 38.0, 44.0, 35.0, 39.0, 38.0, 32.0, 34.0, 34.0, 38.0, 30.0, 29.0, 33.0, 20.0, 19.0, 19.0, 23.0, 17.0, 9.0, 14.0, 6.0, 4.0, 3.0, 4.0, 6.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.105996608734131, -2.0334300994873047, -1.9608635902404785, -1.8882970809936523, -1.8157304525375366, -1.7431639432907104, -1.6705974340438843, -1.5980308055877686, -1.5254642963409424, -1.4528977870941162, -1.38033127784729, -1.3077647686004639, -1.2351981401443481, -1.162631630897522, -1.0900651216506958, -1.01749849319458, -0.9449321031570435, -0.8723655939102173, -0.7997990250587463, -0.7272325158119202, -0.6546659469604492, -0.582099437713623, -0.5095329284667969, -0.4369663596153259, -0.36439985036849976, -0.2918333113193512, -0.21926678717136383, -0.14670026302337646, -0.0741337239742279, -0.0015671849250793457, 0.07099932432174683, 0.14356589317321777, 0.21613240242004395, 0.2886989414691925, 0.36126548051834106, 0.43383198976516724, 0.5063985586166382, 0.5789650678634644, 0.6515315771102905, 0.7240981459617615, 0.7966646552085876, 0.8692311644554138, 0.9417977333068848, 1.014364242553711, 1.086930751800537, 1.1594972610473633, 1.2320637702941895, 1.3046303987503052, 1.3771969079971313, 1.4497634172439575, 1.5223299264907837, 1.5948965549468994, 1.6674630641937256, 1.7400295734405518, 1.812596082687378, 1.885162591934204, 1.9577291011810303, 2.0302956104278564, 2.1028621196746826, 2.175428628921509, 2.247995138168335, 2.3205618858337402, 2.3931283950805664, 2.4656949043273926, 2.5382614135742188]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 8.0, 9.0, 18.0, 19.0, 40.0, 51.0, 97.0, 150.0, 205.0, 318.0, 537.0, 869.0, 1410.0, 2531.0, 4453.0, 7993.0, 14975.0, 29693.0, 74102.0, 270939.0, 420494.0, 131391.0, 43431.0, 20263.0, 10639.0, 5749.0, 3301.0, 1896.0, 1152.0, 674.0, 429.0, 273.0, 132.0, 113.0, 73.0, 39.0, 33.0, 14.0, 17.0, 9.0, 5.0, 7.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.634765625, -0.61376953125, -0.5927734375, -0.57177734375, -0.55078125, -0.52978515625, -0.5087890625, -0.48779296875, -0.466796875, -0.44580078125, -0.4248046875, -0.40380859375, -0.3828125, -0.36181640625, -0.3408203125, -0.31982421875, -0.298828125, -0.27783203125, -0.2568359375, -0.23583984375, -0.21484375, -0.19384765625, -0.1728515625, -0.15185546875, -0.130859375, -0.10986328125, -0.0888671875, -0.06787109375, -0.046875, -0.02587890625, -0.0048828125, 0.01611328125, 0.037109375, 0.05810546875, 0.0791015625, 0.10009765625, 0.12109375, 0.14208984375, 0.1630859375, 0.18408203125, 0.205078125, 0.22607421875, 0.2470703125, 0.26806640625, 0.2890625, 0.31005859375, 0.3310546875, 0.35205078125, 0.373046875, 0.39404296875, 0.4150390625, 0.43603515625, 0.45703125, 0.47802734375, 0.4990234375, 0.52001953125, 0.541015625, 0.56201171875, 0.5830078125, 0.60400390625, 0.625, 0.64599609375, 0.6669921875, 0.68798828125, 0.708984375]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 4.0, 6.0, 5.0, 8.0, 14.0, 11.0, 13.0, 17.0, 17.0, 21.0, 35.0, 45.0, 43.0, 46.0, 45.0, 46.0, 41.0, 50.0, 52.0, 47.0, 53.0, 47.0, 47.0, 50.0, 24.0, 35.0, 32.0, 24.0, 29.0, 20.0, 14.0, 11.0, 8.0, 13.0, 11.0, 7.0, 5.0, 7.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.356201171875, -0.34531402587890625, -0.3344268798828125, -0.32353973388671875, -0.312652587890625, -0.30176544189453125, -0.2908782958984375, -0.27999114990234375, -0.26910400390625, -0.25821685791015625, -0.2473297119140625, -0.23644256591796875, -0.225555419921875, -0.21466827392578125, -0.2037811279296875, -0.19289398193359375, -0.1820068359375, -0.17111968994140625, -0.1602325439453125, -0.14934539794921875, -0.138458251953125, -0.12757110595703125, -0.1166839599609375, -0.10579681396484375, -0.09490966796875, -0.08402252197265625, -0.0731353759765625, -0.06224822998046875, -0.051361083984375, -0.04047393798828125, -0.0295867919921875, -0.01869964599609375, -0.0078125, 0.00307464599609375, 0.0139617919921875, 0.02484893798828125, 0.035736083984375, 0.04662322998046875, 0.0575103759765625, 0.06839752197265625, 0.07928466796875, 0.09017181396484375, 0.1010589599609375, 0.11194610595703125, 0.122833251953125, 0.13372039794921875, 0.1446075439453125, 0.15549468994140625, 0.1663818359375, 0.17726898193359375, 0.1881561279296875, 0.19904327392578125, 0.209930419921875, 0.22081756591796875, 0.2317047119140625, 0.24259185791015625, 0.25347900390625, 0.26436614990234375, 0.2752532958984375, 0.28614044189453125, 0.297027587890625, 0.30791473388671875, 0.3188018798828125, 0.32968902587890625, 0.340576171875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 0.0, 2.0, 3.0, 1.0, 5.0, 3.0, 9.0, 14.0, 13.0, 18.0, 31.0, 32.0, 53.0, 85.0, 99.0, 130.0, 214.0, 330.0, 621.0, 955.0, 1756.0, 3215.0, 6698.0, 14665.0, 35471.0, 121090.0, 528199.0, 242124.0, 53660.0, 20470.0, 9072.0, 4177.0, 2187.0, 1191.0, 689.0, 407.0, 255.0, 193.0, 118.0, 78.0, 52.0, 35.0, 34.0, 22.0, 19.0, 13.0, 9.0, 9.0, 11.0, 7.0, 4.0, 3.0, 4.0, 2.0, 1.0, 2.0, 5.0], "bins": [-0.9638671875, -0.9352645874023438, -0.9066619873046875, -0.8780593872070312, -0.849456787109375, -0.8208541870117188, -0.7922515869140625, -0.7636489868164062, -0.73504638671875, -0.7064437866210938, -0.6778411865234375, -0.6492385864257812, -0.620635986328125, -0.5920333862304688, -0.5634307861328125, -0.5348281860351562, -0.5062255859375, -0.47762298583984375, -0.4490203857421875, -0.42041778564453125, -0.391815185546875, -0.36321258544921875, -0.3346099853515625, -0.30600738525390625, -0.27740478515625, -0.24880218505859375, -0.2201995849609375, -0.19159698486328125, -0.162994384765625, -0.13439178466796875, -0.1057891845703125, -0.07718658447265625, -0.048583984375, -0.01998138427734375, 0.0086212158203125, 0.03722381591796875, 0.065826416015625, 0.09442901611328125, 0.1230316162109375, 0.15163421630859375, 0.18023681640625, 0.20883941650390625, 0.2374420166015625, 0.26604461669921875, 0.294647216796875, 0.32324981689453125, 0.3518524169921875, 0.38045501708984375, 0.4090576171875, 0.43766021728515625, 0.4662628173828125, 0.49486541748046875, 0.523468017578125, 0.5520706176757812, 0.5806732177734375, 0.6092758178710938, 0.63787841796875, 0.6664810180664062, 0.6950836181640625, 0.7236862182617188, 0.752288818359375, 0.7808914184570312, 0.8094940185546875, 0.8380966186523438, 0.86669921875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 6.0, 1.0, 2.0, 8.0, 11.0, 9.0, 10.0, 15.0, 18.0, 14.0, 17.0, 18.0, 29.0, 23.0, 28.0, 36.0, 42.0, 33.0, 50.0, 38.0, 42.0, 51.0, 39.0, 39.0, 54.0, 39.0, 40.0, 33.0, 36.0, 32.0, 25.0, 25.0, 18.0, 22.0, 16.0, 7.0, 14.0, 19.0, 14.0, 4.0, 7.0, 6.0, 4.0, 5.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-1.0, -0.9704437255859375, -0.940887451171875, -0.9113311767578125, -0.88177490234375, -0.8522186279296875, -0.822662353515625, -0.7931060791015625, -0.7635498046875, -0.7339935302734375, -0.704437255859375, -0.6748809814453125, -0.64532470703125, -0.6157684326171875, -0.586212158203125, -0.5566558837890625, -0.527099609375, -0.4975433349609375, -0.467987060546875, -0.4384307861328125, -0.40887451171875, -0.3793182373046875, -0.349761962890625, -0.3202056884765625, -0.2906494140625, -0.2610931396484375, -0.231536865234375, -0.2019805908203125, -0.17242431640625, -0.1428680419921875, -0.113311767578125, -0.0837554931640625, -0.05419921875, -0.0246429443359375, 0.004913330078125, 0.0344696044921875, 0.06402587890625, 0.0935821533203125, 0.123138427734375, 0.1526947021484375, 0.1822509765625, 0.2118072509765625, 0.241363525390625, 0.2709197998046875, 0.30047607421875, 0.3300323486328125, 0.359588623046875, 0.3891448974609375, 0.418701171875, 0.4482574462890625, 0.477813720703125, 0.5073699951171875, 0.53692626953125, 0.5664825439453125, 0.596038818359375, 0.6255950927734375, 0.6551513671875, 0.6847076416015625, 0.714263916015625, 0.7438201904296875, 0.77337646484375, 0.8029327392578125, 0.832489013671875, 0.8620452880859375, 0.8916015625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 6.0, 2.0, 6.0, 3.0, 5.0, 13.0, 20.0, 26.0, 48.0, 67.0, 132.0, 251.0, 528.0, 1341.0, 3250.0, 8655.0, 22368.0, 70628.0, 442266.0, 399018.0, 65203.0, 21183.0, 8135.0, 3079.0, 1270.0, 510.0, 238.0, 118.0, 69.0, 35.0, 28.0, 19.0, 5.0, 15.0, 8.0, 4.0, 6.0, 3.0, 3.0, 3.0, 3.0], "bins": [-0.5498046875, -0.5367050170898438, -0.5236053466796875, -0.5105056762695312, -0.497406005859375, -0.48430633544921875, -0.4712066650390625, -0.45810699462890625, -0.44500732421875, -0.43190765380859375, -0.4188079833984375, -0.40570831298828125, -0.392608642578125, -0.37950897216796875, -0.3664093017578125, -0.35330963134765625, -0.3402099609375, -0.32711029052734375, -0.3140106201171875, -0.30091094970703125, -0.287811279296875, -0.27471160888671875, -0.2616119384765625, -0.24851226806640625, -0.23541259765625, -0.22231292724609375, -0.2092132568359375, -0.19611358642578125, -0.183013916015625, -0.16991424560546875, -0.1568145751953125, -0.14371490478515625, -0.130615234375, -0.11751556396484375, -0.1044158935546875, -0.09131622314453125, -0.078216552734375, -0.06511688232421875, -0.0520172119140625, -0.03891754150390625, -0.02581787109375, -0.01271820068359375, 0.0003814697265625, 0.01348114013671875, 0.026580810546875, 0.03968048095703125, 0.0527801513671875, 0.06587982177734375, 0.0789794921875, 0.09207916259765625, 0.1051788330078125, 0.11827850341796875, 0.131378173828125, 0.14447784423828125, 0.1575775146484375, 0.17067718505859375, 0.18377685546875, 0.19687652587890625, 0.2099761962890625, 0.22307586669921875, 0.236175537109375, 0.24927520751953125, 0.2623748779296875, 0.27547454833984375, 0.28857421875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 0.0, 3.0, 2.0, 4.0, 7.0, 7.0, 6.0, 8.0, 14.0, 18.0, 41.0, 39.0, 75.0, 116.0, 186.0, 157.0, 104.0, 55.0, 45.0, 27.0, 17.0, 11.0, 14.0, 8.0, 9.0, 4.0, 4.0, 5.0, 0.0, 5.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010156631469726562, -9.815767407417297e-05, -9.474903345108032e-05, -9.134039282798767e-05, -8.793175220489502e-05, -8.452311158180237e-05, -8.111447095870972e-05, -7.770583033561707e-05, -7.429718971252441e-05, -7.088854908943176e-05, -6.747990846633911e-05, -6.407126784324646e-05, -6.066262722015381e-05, -5.725398659706116e-05, -5.3845345973968506e-05, -5.0436705350875854e-05, -4.70280647277832e-05, -4.361942410469055e-05, -4.02107834815979e-05, -3.680214285850525e-05, -3.33935022354126e-05, -2.9984861612319946e-05, -2.6576220989227295e-05, -2.3167580366134644e-05, -1.9758939743041992e-05, -1.635029911994934e-05, -1.294165849685669e-05, -9.533017873764038e-06, -6.124377250671387e-06, -2.7157366275787354e-06, 6.92903995513916e-07, 4.101544618606567e-06, 7.510185241699219e-06, 1.091882586479187e-05, 1.4327466487884521e-05, 1.7736107110977173e-05, 2.1144747734069824e-05, 2.4553388357162476e-05, 2.7962028980255127e-05, 3.137066960334778e-05, 3.477931022644043e-05, 3.818795084953308e-05, 4.159659147262573e-05, 4.5005232095718384e-05, 4.8413872718811035e-05, 5.1822513341903687e-05, 5.523115396499634e-05, 5.863979458808899e-05, 6.204843521118164e-05, 6.545707583427429e-05, 6.886571645736694e-05, 7.22743570804596e-05, 7.568299770355225e-05, 7.90916383266449e-05, 8.250027894973755e-05, 8.59089195728302e-05, 8.931756019592285e-05, 9.27262008190155e-05, 9.613484144210815e-05, 9.95434820652008e-05, 0.00010295212268829346, 0.00010636076331138611, 0.00010976940393447876, 0.00011317804455757141, 0.00011658668518066406]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 8.0, 6.0, 6.0, 14.0, 9.0, 15.0, 32.0, 59.0, 77.0, 137.0, 211.0, 357.0, 655.0, 1201.0, 2534.0, 5759.0, 13489.0, 35712.0, 118894.0, 437680.0, 311724.0, 75811.0, 25238.0, 10198.0, 4456.0, 2012.0, 973.0, 512.0, 297.0, 163.0, 114.0, 62.0, 48.0, 25.0, 14.0, 16.0, 9.0, 6.0, 7.0, 8.0, 0.0, 5.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.28076171875, -0.2716560363769531, -0.26255035400390625, -0.2534446716308594, -0.2443389892578125, -0.23523330688476562, -0.22612762451171875, -0.21702194213867188, -0.207916259765625, -0.19881057739257812, -0.18970489501953125, -0.18059921264648438, -0.1714935302734375, -0.16238784790039062, -0.15328216552734375, -0.14417648315429688, -0.13507080078125, -0.12596511840820312, -0.11685943603515625, -0.10775375366210938, -0.0986480712890625, -0.08954238891601562, -0.08043670654296875, -0.07133102416992188, -0.062225341796875, -0.053119659423828125, -0.04401397705078125, -0.034908294677734375, -0.0258026123046875, -0.016696929931640625, -0.00759124755859375, 0.001514434814453125, 0.0106201171875, 0.019725799560546875, 0.02883148193359375, 0.037937164306640625, 0.0470428466796875, 0.056148529052734375, 0.06525421142578125, 0.07435989379882812, 0.083465576171875, 0.09257125854492188, 0.10167694091796875, 0.11078262329101562, 0.1198883056640625, 0.12899398803710938, 0.13809967041015625, 0.14720535278320312, 0.15631103515625, 0.16541671752929688, 0.17452239990234375, 0.18362808227539062, 0.1927337646484375, 0.20183944702148438, 0.21094512939453125, 0.22005081176757812, 0.229156494140625, 0.23826217651367188, 0.24736785888671875, 0.2564735412597656, 0.2655792236328125, 0.2746849060058594, 0.28379058837890625, 0.2928962707519531, 0.302001953125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 2.0, 6.0, 5.0, 14.0, 18.0, 18.0, 24.0, 27.0, 37.0, 59.0, 86.0, 101.0, 123.0, 116.0, 123.0, 70.0, 42.0, 24.0, 24.0, 20.0, 9.0, 15.0, 13.0, 4.0, 8.0, 2.0, 3.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.363037109375, -0.35199737548828125, -0.3409576416015625, -0.32991790771484375, -0.318878173828125, -0.30783843994140625, -0.2967987060546875, -0.28575897216796875, -0.27471923828125, -0.26367950439453125, -0.2526397705078125, -0.24160003662109375, -0.230560302734375, -0.21952056884765625, -0.2084808349609375, -0.19744110107421875, -0.1864013671875, -0.17536163330078125, -0.1643218994140625, -0.15328216552734375, -0.142242431640625, -0.13120269775390625, -0.1201629638671875, -0.10912322998046875, -0.09808349609375, -0.08704376220703125, -0.0760040283203125, -0.06496429443359375, -0.053924560546875, -0.04288482666015625, -0.0318450927734375, -0.02080535888671875, -0.009765625, 0.00127410888671875, 0.0123138427734375, 0.02335357666015625, 0.034393310546875, 0.04543304443359375, 0.0564727783203125, 0.06751251220703125, 0.07855224609375, 0.08959197998046875, 0.1006317138671875, 0.11167144775390625, 0.122711181640625, 0.13375091552734375, 0.1447906494140625, 0.15583038330078125, 0.1668701171875, 0.17790985107421875, 0.1889495849609375, 0.19998931884765625, 0.211029052734375, 0.22206878662109375, 0.2331085205078125, 0.24414825439453125, 0.25518798828125, 0.26622772216796875, 0.2772674560546875, 0.28830718994140625, 0.299346923828125, 0.31038665771484375, 0.3214263916015625, 0.33246612548828125, 0.343505859375]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 13.0, 55.0, 154.0, 259.0, 294.0, 155.0, 52.0, 11.0, 8.0, 4.0, 1.0, 2.0, 1.0], "bins": [-17.814624786376953, -17.491138458251953, -17.167652130126953, -16.844165802001953, -16.520679473876953, -16.197193145751953, -15.873706817626953, -15.550220489501953, -15.226734161376953, -14.903247833251953, -14.579761505126953, -14.256275177001953, -13.932788848876953, -13.609302520751953, -13.285816192626953, -12.962329864501953, -12.638843536376953, -12.315357208251953, -11.991870880126953, -11.668384552001953, -11.344898223876953, -11.021411895751953, -10.697925567626953, -10.374439239501953, -10.05095386505127, -9.72746753692627, -9.40398120880127, -9.08049488067627, -8.75700855255127, -8.43352222442627, -8.11003589630127, -7.7865495681762695, -7.463062286376953, -7.139575958251953, -6.816089630126953, -6.492603302001953, -6.169116973876953, -5.845630645751953, -5.522144317626953, -5.198657989501953, -4.875172138214111, -4.551685810089111, -4.228199481964111, -3.9047131538391113, -3.5812268257141113, -3.2577404975891113, -2.9342544078826904, -2.6107680797576904, -2.2872817516326904, -1.9637954235076904, -1.6403090953826904, -1.31682288646698, -0.99333655834198, -0.66985023021698, -0.34636402130126953, -0.02287769317626953, 0.30060863494873047, 0.6240949630737305, 0.9475812315940857, 1.271067500114441, 1.594553828239441, 1.918040156364441, 2.2415263652801514, 2.5650126934051514, 2.8884990215301514]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 4.0, 4.0, 4.0, 3.0, 7.0, 8.0, 14.0, 12.0, 18.0, 14.0, 22.0, 20.0, 21.0, 25.0, 26.0, 32.0, 35.0, 34.0, 35.0, 32.0, 30.0, 47.0, 50.0, 38.0, 36.0, 41.0, 47.0, 31.0, 38.0, 40.0, 28.0, 39.0, 25.0, 29.0, 18.0, 21.0, 17.0, 15.0, 11.0, 10.0, 7.0, 4.0, 2.0, 3.0, 8.0, 3.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5101425647735596, -2.429661273956299, -2.349179983139038, -2.2686984539031982, -2.1882171630859375, -2.1077358722686768, -2.027254581451416, -1.9467731714248657, -1.8662917613983154, -1.7858104705810547, -1.7053290605545044, -1.6248477697372437, -1.5443663597106934, -1.4638850688934326, -1.3834037780761719, -1.3029223680496216, -1.2224410772323608, -1.1419597864151, -1.0614783763885498, -0.9809970855712891, -0.9005156755447388, -0.820034384727478, -0.7395530343055725, -0.659071683883667, -0.5785903334617615, -0.49810898303985596, -0.41762763261795044, -0.3371463119983673, -0.2566649615764618, -0.17618361115455627, -0.09570229053497314, -0.015220940113067627, 0.06526041030883789, 0.1457417607307434, 0.22622309625148773, 0.30670443177223206, 0.3871857821941376, 0.4676671326160431, 0.5481484532356262, 0.6286298036575317, 0.7091111540794373, 0.7895925045013428, 0.8700738549232483, 0.9505552053451538, 1.0310364961624146, 1.1115179061889648, 1.1919991970062256, 1.2724804878234863, 1.3529618978500366, 1.4334431886672974, 1.5139245986938477, 1.5944058895111084, 1.6748872995376587, 1.7553685903549194, 1.8358500003814697, 1.9163312911987305, 1.9968125820159912, 2.077293872833252, 2.1577751636505127, 2.2382566928863525, 2.3187379837036133, 2.399219274520874, 2.4797005653381348, 2.5601820945739746, 2.6406633853912354]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 7.0, 5.0, 4.0, 7.0, 21.0, 16.0, 29.0, 37.0, 50.0, 84.0, 107.0, 164.0, 230.0, 318.0, 482.0, 839.0, 1364.0, 2286.0, 4011.0, 7582.0, 15325.0, 32369.0, 73955.0, 180299.0, 489557.0, 1270470.0, 1283333.0, 500445.0, 187319.0, 76514.0, 33496.0, 15627.0, 7869.0, 4172.0, 2229.0, 1365.0, 787.0, 526.0, 305.0, 218.0, 139.0, 113.0, 72.0, 47.0, 26.0, 23.0, 10.0, 11.0, 3.0, 8.0, 2.0, 5.0, 1.0, 3.0, 1.0, 1.0], "bins": [-0.3525390625, -0.3421745300292969, -0.33180999755859375, -0.3214454650878906, -0.3110809326171875, -0.3007164001464844, -0.29035186767578125, -0.2799873352050781, -0.269622802734375, -0.2592582702636719, -0.24889373779296875, -0.23852920532226562, -0.2281646728515625, -0.21780014038085938, -0.20743560791015625, -0.19707107543945312, -0.18670654296875, -0.17634201049804688, -0.16597747802734375, -0.15561294555664062, -0.1452484130859375, -0.13488388061523438, -0.12451934814453125, -0.11415481567382812, -0.103790283203125, -0.09342575073242188, -0.08306121826171875, -0.07269668579101562, -0.0623321533203125, -0.051967620849609375, -0.04160308837890625, -0.031238555908203125, -0.0208740234375, -0.010509490966796875, -0.00014495849609375, 0.010219573974609375, 0.0205841064453125, 0.030948638916015625, 0.04131317138671875, 0.051677703857421875, 0.062042236328125, 0.07240676879882812, 0.08277130126953125, 0.09313583374023438, 0.1035003662109375, 0.11386489868164062, 0.12422943115234375, 0.13459396362304688, 0.14495849609375, 0.15532302856445312, 0.16568756103515625, 0.17605209350585938, 0.1864166259765625, 0.19678115844726562, 0.20714569091796875, 0.21751022338867188, 0.227874755859375, 0.23823928833007812, 0.24860382080078125, 0.2589683532714844, 0.2693328857421875, 0.2796974182128906, 0.29006195068359375, 0.3004264831542969, 0.310791015625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 1.0, 5.0, 5.0, 3.0, 9.0, 9.0, 9.0, 16.0, 10.0, 11.0, 9.0, 23.0, 12.0, 34.0, 23.0, 39.0, 39.0, 31.0, 41.0, 36.0, 43.0, 55.0, 35.0, 52.0, 44.0, 41.0, 38.0, 31.0, 40.0, 38.0, 37.0, 31.0, 26.0, 26.0, 20.0, 17.0, 11.0, 8.0, 11.0, 9.0, 8.0, 6.0, 4.0, 3.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.322998046875, -0.3137054443359375, -0.304412841796875, -0.2951202392578125, -0.28582763671875, -0.2765350341796875, -0.267242431640625, -0.2579498291015625, -0.2486572265625, -0.2393646240234375, -0.230072021484375, -0.2207794189453125, -0.21148681640625, -0.2021942138671875, -0.192901611328125, -0.1836090087890625, -0.17431640625, -0.1650238037109375, -0.155731201171875, -0.1464385986328125, -0.13714599609375, -0.1278533935546875, -0.118560791015625, -0.1092681884765625, -0.0999755859375, -0.0906829833984375, -0.081390380859375, -0.0720977783203125, -0.06280517578125, -0.0535125732421875, -0.044219970703125, -0.0349273681640625, -0.025634765625, -0.0163421630859375, -0.007049560546875, 0.0022430419921875, 0.01153564453125, 0.0208282470703125, 0.030120849609375, 0.0394134521484375, 0.0487060546875, 0.0579986572265625, 0.067291259765625, 0.0765838623046875, 0.08587646484375, 0.0951690673828125, 0.104461669921875, 0.1137542724609375, 0.123046875, 0.1323394775390625, 0.141632080078125, 0.1509246826171875, 0.16021728515625, 0.1695098876953125, 0.178802490234375, 0.1880950927734375, 0.1973876953125, 0.2066802978515625, 0.215972900390625, 0.2252655029296875, 0.23455810546875, 0.2438507080078125, 0.253143310546875, 0.2624359130859375, 0.271728515625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 5.0, 4.0, 4.0, 8.0, 10.0, 23.0, 33.0, 42.0, 69.0, 108.0, 134.0, 259.0, 418.0, 647.0, 1130.0, 2077.0, 4080.0, 9009.0, 26838.0, 111511.0, 745387.0, 2785917.0, 401619.0, 71583.0, 19008.0, 7126.0, 3304.0, 1606.0, 912.0, 482.0, 303.0, 218.0, 121.0, 104.0, 60.0, 31.0, 22.0, 28.0, 12.0, 5.0, 13.0, 8.0, 4.0, 6.0, 3.0, 1.0, 0.0, 1.0, 4.0], "bins": [-1.12890625, -1.0978546142578125, -1.066802978515625, -1.0357513427734375, -1.00469970703125, -0.9736480712890625, -0.942596435546875, -0.9115447998046875, -0.8804931640625, -0.8494415283203125, -0.818389892578125, -0.7873382568359375, -0.75628662109375, -0.7252349853515625, -0.694183349609375, -0.6631317138671875, -0.632080078125, -0.6010284423828125, -0.569976806640625, -0.5389251708984375, -0.50787353515625, -0.4768218994140625, -0.445770263671875, -0.4147186279296875, -0.3836669921875, -0.3526153564453125, -0.321563720703125, -0.2905120849609375, -0.25946044921875, -0.2284088134765625, -0.197357177734375, -0.1663055419921875, -0.13525390625, -0.1042022705078125, -0.073150634765625, -0.0420989990234375, -0.01104736328125, 0.0200042724609375, 0.051055908203125, 0.0821075439453125, 0.1131591796875, 0.1442108154296875, 0.175262451171875, 0.2063140869140625, 0.23736572265625, 0.2684173583984375, 0.299468994140625, 0.3305206298828125, 0.361572265625, 0.3926239013671875, 0.423675537109375, 0.4547271728515625, 0.48577880859375, 0.5168304443359375, 0.547882080078125, 0.5789337158203125, 0.6099853515625, 0.6410369873046875, 0.672088623046875, 0.7031402587890625, 0.73419189453125, 0.7652435302734375, 0.796295166015625, 0.8273468017578125, 0.8583984375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 4.0, 4.0, 4.0, 5.0, 5.0, 19.0, 26.0, 14.0, 33.0, 40.0, 61.0, 108.0, 149.0, 261.0, 362.0, 638.0, 848.0, 541.0, 352.0, 186.0, 122.0, 112.0, 59.0, 46.0, 23.0, 16.0, 11.0, 6.0, 6.0, 6.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.81787109375, -0.7867202758789062, -0.7555694580078125, -0.7244186401367188, -0.693267822265625, -0.6621170043945312, -0.6309661865234375, -0.5998153686523438, -0.56866455078125, -0.5375137329101562, -0.5063629150390625, -0.47521209716796875, -0.444061279296875, -0.41291046142578125, -0.3817596435546875, -0.35060882568359375, -0.3194580078125, -0.28830718994140625, -0.2571563720703125, -0.22600555419921875, -0.194854736328125, -0.16370391845703125, -0.1325531005859375, -0.10140228271484375, -0.07025146484375, -0.03910064697265625, -0.0079498291015625, 0.02320098876953125, 0.054351806640625, 0.08550262451171875, 0.1166534423828125, 0.14780426025390625, 0.178955078125, 0.21010589599609375, 0.2412567138671875, 0.27240753173828125, 0.303558349609375, 0.33470916748046875, 0.3658599853515625, 0.39701080322265625, 0.42816162109375, 0.45931243896484375, 0.4904632568359375, 0.5216140747070312, 0.552764892578125, 0.5839157104492188, 0.6150665283203125, 0.6462173461914062, 0.6773681640625, 0.7085189819335938, 0.7396697998046875, 0.7708206176757812, 0.801971435546875, 0.8331222534179688, 0.8642730712890625, 0.8954238891601562, 0.92657470703125, 0.9577255249023438, 0.9888763427734375, 1.0200271606445312, 1.051177978515625, 1.0823287963867188, 1.1134796142578125, 1.1446304321289062, 1.17578125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 1.0, 2.0, 5.0, 3.0, 4.0, 18.0, 44.0, 110.0, 233.0, 311.0, 192.0, 57.0, 16.0, 1.0, 1.0, 6.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.26705551147461, -11.861639022827148, -11.456222534179688, -11.050806045532227, -10.645390510559082, -10.239974021911621, -9.83455753326416, -9.4291410446167, -9.023725509643555, -8.618309020996094, -8.212892532348633, -7.80747652053833, -7.402060508728027, -6.996644020080566, -6.5912275314331055, -6.1858110427856445, -5.780394554138184, -5.374978065490723, -4.96956205368042, -4.564145565032959, -4.158729553222656, -3.7533130645751953, -3.3478965759277344, -2.9424803256988525, -2.5370640754699707, -2.131647825241089, -1.7262314558029175, -1.320815086364746, -0.9153988361358643, -0.5099825859069824, -0.10456609725952148, 0.30085015296936035, 0.7062673568725586, 1.1116836071014404, 1.5170999765396118, 1.9225163459777832, 2.327932596206665, 2.733348846435547, 3.138765335083008, 3.5441815853118896, 3.9495978355407715, 4.355014324188232, 4.760430335998535, 5.165846824645996, 5.571263313293457, 5.97667932510376, 6.382095813751221, 6.787511825561523, 7.192928314208984, 7.598344802856445, 8.003761291503906, 8.409177780151367, 8.814593315124512, 9.220009803771973, 9.625426292419434, 10.030842781066895, 10.436258316040039, 10.8416748046875, 11.247091293334961, 11.652507781982422, 12.057923316955566, 12.463339805603027, 12.868756294250488, 13.27417278289795, 13.67958927154541]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 3.0, 5.0, 8.0, 5.0, 4.0, 12.0, 8.0, 10.0, 16.0, 23.0, 26.0, 31.0, 36.0, 24.0, 35.0, 29.0, 48.0, 40.0, 33.0, 45.0, 38.0, 53.0, 46.0, 58.0, 49.0, 42.0, 30.0, 37.0, 28.0, 32.0, 23.0, 25.0, 13.0, 13.0, 12.0, 17.0, 11.0, 7.0, 3.0, 5.0, 6.0, 3.0, 1.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.4894862174987793, -2.4036760330200195, -2.3178658485412598, -2.2320556640625, -2.1462454795837402, -2.0604350566864014, -1.9746248722076416, -1.8888146877288818, -1.803004503250122, -1.7171943187713623, -1.6313841342926025, -1.5455738306045532, -1.4597636461257935, -1.3739534616470337, -1.2881431579589844, -1.2023329734802246, -1.1165227890014648, -1.030712604522705, -0.9449023604393005, -0.859092116355896, -0.7732819318771362, -0.6874717473983765, -0.6016615033149719, -0.5158512592315674, -0.4300410747528076, -0.34423086047172546, -0.2584206461906433, -0.17261043190956116, -0.086800217628479, -0.0009900033473968506, 0.0848202109336853, 0.17063045501708984, 0.2564408779144287, 0.34225109219551086, 0.428061306476593, 0.5138715505599976, 0.5996817350387573, 0.6854919195175171, 0.7713021636009216, 0.8571124076843262, 0.9429225921630859, 1.0287327766418457, 1.1145429611206055, 1.2003532648086548, 1.2861634492874146, 1.3719736337661743, 1.4577839374542236, 1.5435941219329834, 1.6294043064117432, 1.715214490890503, 1.8010246753692627, 1.886834979057312, 1.9726451635360718, 2.058455467224121, 2.144265651702881, 2.2300758361816406, 2.3158860206604004, 2.40169620513916, 2.48750638961792, 2.5733165740966797, 2.6591267585754395, 2.7449371814727783, 2.830747365951538, 2.916557550430298, 3.0023677349090576]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 3.0, 11.0, 17.0, 17.0, 18.0, 24.0, 36.0, 75.0, 110.0, 165.0, 266.0, 449.0, 667.0, 1237.0, 2310.0, 4592.0, 10544.0, 29788.0, 98669.0, 281951.0, 366013.0, 169805.0, 51140.0, 16887.0, 6594.0, 3198.0, 1658.0, 893.0, 526.0, 294.0, 233.0, 128.0, 75.0, 60.0, 38.0, 25.0, 9.0, 18.0, 4.0, 4.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59326171875, -0.573638916015625, -0.55401611328125, -0.534393310546875, -0.5147705078125, -0.495147705078125, -0.47552490234375, -0.455902099609375, -0.436279296875, -0.416656494140625, -0.39703369140625, -0.377410888671875, -0.3577880859375, -0.338165283203125, -0.31854248046875, -0.298919677734375, -0.279296875, -0.259674072265625, -0.24005126953125, -0.220428466796875, -0.2008056640625, -0.181182861328125, -0.16156005859375, -0.141937255859375, -0.122314453125, -0.102691650390625, -0.08306884765625, -0.063446044921875, -0.0438232421875, -0.024200439453125, -0.00457763671875, 0.015045166015625, 0.03466796875, 0.054290771484375, 0.07391357421875, 0.093536376953125, 0.1131591796875, 0.132781982421875, 0.15240478515625, 0.172027587890625, 0.191650390625, 0.211273193359375, 0.23089599609375, 0.250518798828125, 0.2701416015625, 0.289764404296875, 0.30938720703125, 0.329010009765625, 0.3486328125, 0.368255615234375, 0.38787841796875, 0.407501220703125, 0.4271240234375, 0.446746826171875, 0.46636962890625, 0.485992431640625, 0.505615234375, 0.525238037109375, 0.54486083984375, 0.564483642578125, 0.5841064453125, 0.603729248046875, 0.62335205078125, 0.642974853515625, 0.66259765625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 1.0, 4.0, 4.0, 6.0, 9.0, 5.0, 11.0, 15.0, 15.0, 19.0, 28.0, 23.0, 28.0, 26.0, 31.0, 31.0, 31.0, 32.0, 45.0, 39.0, 43.0, 47.0, 49.0, 30.0, 44.0, 42.0, 36.0, 32.0, 30.0, 30.0, 31.0, 26.0, 29.0, 26.0, 20.0, 21.0, 14.0, 7.0, 13.0, 7.0, 11.0, 3.0, 4.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.320068359375, -0.3098030090332031, -0.29953765869140625, -0.2892723083496094, -0.2790069580078125, -0.2687416076660156, -0.25847625732421875, -0.24821090698242188, -0.237945556640625, -0.22768020629882812, -0.21741485595703125, -0.20714950561523438, -0.1968841552734375, -0.18661880493164062, -0.17635345458984375, -0.16608810424804688, -0.15582275390625, -0.14555740356445312, -0.13529205322265625, -0.12502670288085938, -0.1147613525390625, -0.10449600219726562, -0.09423065185546875, -0.08396530151367188, -0.073699951171875, -0.06343460083007812, -0.05316925048828125, -0.042903900146484375, -0.0326385498046875, -0.022373199462890625, -0.01210784912109375, -0.001842498779296875, 0.0084228515625, 0.018688201904296875, 0.02895355224609375, 0.039218902587890625, 0.0494842529296875, 0.059749603271484375, 0.07001495361328125, 0.08028030395507812, 0.090545654296875, 0.10081100463867188, 0.11107635498046875, 0.12134170532226562, 0.1316070556640625, 0.14187240600585938, 0.15213775634765625, 0.16240310668945312, 0.17266845703125, 0.18293380737304688, 0.19319915771484375, 0.20346450805664062, 0.2137298583984375, 0.22399520874023438, 0.23426055908203125, 0.24452590942382812, 0.254791259765625, 0.2650566101074219, 0.27532196044921875, 0.2855873107910156, 0.2958526611328125, 0.3061180114746094, 0.31638336181640625, 0.3266487121582031, 0.3369140625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 5.0, 1.0, 5.0, 8.0, 8.0, 6.0, 3.0, 14.0, 21.0, 36.0, 49.0, 73.0, 105.0, 150.0, 244.0, 376.0, 583.0, 1048.0, 1879.0, 3991.0, 8904.0, 23058.0, 70850.0, 224966.0, 392855.0, 213090.0, 66946.0, 22088.0, 8621.0, 3965.0, 1922.0, 962.0, 644.0, 366.0, 224.0, 163.0, 87.0, 56.0, 68.0, 37.0, 29.0, 16.0, 11.0, 10.0, 7.0, 5.0, 3.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.66259765625, -0.6439208984375, -0.625244140625, -0.6065673828125, -0.587890625, -0.5692138671875, -0.550537109375, -0.5318603515625, -0.51318359375, -0.4945068359375, -0.475830078125, -0.4571533203125, -0.4384765625, -0.4197998046875, -0.401123046875, -0.3824462890625, -0.36376953125, -0.3450927734375, -0.326416015625, -0.3077392578125, -0.2890625, -0.2703857421875, -0.251708984375, -0.2330322265625, -0.21435546875, -0.1956787109375, -0.177001953125, -0.1583251953125, -0.1396484375, -0.1209716796875, -0.102294921875, -0.0836181640625, -0.06494140625, -0.0462646484375, -0.027587890625, -0.0089111328125, 0.009765625, 0.0284423828125, 0.047119140625, 0.0657958984375, 0.08447265625, 0.1031494140625, 0.121826171875, 0.1405029296875, 0.1591796875, 0.1778564453125, 0.196533203125, 0.2152099609375, 0.23388671875, 0.2525634765625, 0.271240234375, 0.2899169921875, 0.30859375, 0.3272705078125, 0.345947265625, 0.3646240234375, 0.38330078125, 0.4019775390625, 0.420654296875, 0.4393310546875, 0.4580078125, 0.4766845703125, 0.495361328125, 0.5140380859375, 0.53271484375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 1.0, 3.0, 6.0, 6.0, 5.0, 7.0, 21.0, 16.0, 8.0, 20.0, 13.0, 28.0, 19.0, 28.0, 32.0, 29.0, 45.0, 43.0, 49.0, 43.0, 46.0, 50.0, 40.0, 48.0, 52.0, 40.0, 43.0, 42.0, 40.0, 43.0, 23.0, 20.0, 13.0, 19.0, 18.0, 7.0, 11.0, 8.0, 3.0, 7.0, 3.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.1181640625, -1.085968017578125, -1.05377197265625, -1.021575927734375, -0.9893798828125, -0.957183837890625, -0.92498779296875, -0.892791748046875, -0.860595703125, -0.828399658203125, -0.79620361328125, -0.764007568359375, -0.7318115234375, -0.699615478515625, -0.66741943359375, -0.635223388671875, -0.60302734375, -0.570831298828125, -0.53863525390625, -0.506439208984375, -0.4742431640625, -0.442047119140625, -0.40985107421875, -0.377655029296875, -0.345458984375, -0.313262939453125, -0.28106689453125, -0.248870849609375, -0.2166748046875, -0.184478759765625, -0.15228271484375, -0.120086669921875, -0.087890625, -0.055694580078125, -0.02349853515625, 0.008697509765625, 0.0408935546875, 0.073089599609375, 0.10528564453125, 0.137481689453125, 0.169677734375, 0.201873779296875, 0.23406982421875, 0.266265869140625, 0.2984619140625, 0.330657958984375, 0.36285400390625, 0.395050048828125, 0.42724609375, 0.459442138671875, 0.49163818359375, 0.523834228515625, 0.5560302734375, 0.588226318359375, 0.62042236328125, 0.652618408203125, 0.684814453125, 0.717010498046875, 0.74920654296875, 0.781402587890625, 0.8135986328125, 0.845794677734375, 0.87799072265625, 0.910186767578125, 0.9423828125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 9.0, 7.0, 11.0, 22.0, 34.0, 31.0, 59.0, 97.0, 144.0, 258.0, 394.0, 652.0, 1080.0, 1953.0, 3650.0, 7915.0, 19783.0, 59788.0, 208982.0, 427025.0, 217064.0, 61768.0, 20951.0, 8378.0, 3780.0, 1985.0, 1098.0, 651.0, 370.0, 212.0, 138.0, 85.0, 67.0, 38.0, 21.0, 19.0, 17.0, 9.0, 5.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.422119140625, -0.4111595153808594, -0.40019989013671875, -0.3892402648925781, -0.3782806396484375, -0.3673210144042969, -0.35636138916015625, -0.3454017639160156, -0.334442138671875, -0.3234825134277344, -0.31252288818359375, -0.3015632629394531, -0.2906036376953125, -0.2796440124511719, -0.26868438720703125, -0.2577247619628906, -0.24676513671875, -0.23580551147460938, -0.22484588623046875, -0.21388626098632812, -0.2029266357421875, -0.19196701049804688, -0.18100738525390625, -0.17004776000976562, -0.159088134765625, -0.14812850952148438, -0.13716888427734375, -0.12620925903320312, -0.1152496337890625, -0.10429000854492188, -0.09333038330078125, -0.08237075805664062, -0.0714111328125, -0.060451507568359375, -0.04949188232421875, -0.038532257080078125, -0.0275726318359375, -0.016613006591796875, -0.00565338134765625, 0.005306243896484375, 0.016265869140625, 0.027225494384765625, 0.03818511962890625, 0.049144744873046875, 0.0601043701171875, 0.07106399536132812, 0.08202362060546875, 0.09298324584960938, 0.10394287109375, 0.11490249633789062, 0.12586212158203125, 0.13682174682617188, 0.1477813720703125, 0.15874099731445312, 0.16970062255859375, 0.18066024780273438, 0.191619873046875, 0.20257949829101562, 0.21353912353515625, 0.22449874877929688, 0.2354583740234375, 0.24641799926757812, 0.25737762451171875, 0.2683372497558594, 0.279296875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 1.0, 6.0, 9.0, 2.0, 16.0, 12.0, 10.0, 14.0, 23.0, 31.0, 46.0, 59.0, 71.0, 80.0, 98.0, 101.0, 105.0, 83.0, 55.0, 38.0, 41.0, 25.0, 17.0, 9.0, 13.0, 8.0, 5.0, 11.0, 4.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.00011664628982543945, -0.00011366605758666992, -0.00011068582534790039, -0.00010770559310913086, -0.00010472536087036133, -0.0001017451286315918, -9.876489639282227e-05, -9.578466415405273e-05, -9.28044319152832e-05, -8.982419967651367e-05, -8.684396743774414e-05, -8.386373519897461e-05, -8.088350296020508e-05, -7.790327072143555e-05, -7.492303848266602e-05, -7.194280624389648e-05, -6.896257400512695e-05, -6.598234176635742e-05, -6.300210952758789e-05, -6.002187728881836e-05, -5.704164505004883e-05, -5.40614128112793e-05, -5.1081180572509766e-05, -4.8100948333740234e-05, -4.51207160949707e-05, -4.214048385620117e-05, -3.916025161743164e-05, -3.618001937866211e-05, -3.319978713989258e-05, -3.0219554901123047e-05, -2.7239322662353516e-05, -2.4259090423583984e-05, -2.1278858184814453e-05, -1.8298625946044922e-05, -1.531839370727539e-05, -1.233816146850586e-05, -9.357929229736328e-06, -6.377696990966797e-06, -3.3974647521972656e-06, -4.172325134277344e-07, 2.562999725341797e-06, 5.543231964111328e-06, 8.52346420288086e-06, 1.150369644165039e-05, 1.4483928680419922e-05, 1.7464160919189453e-05, 2.0444393157958984e-05, 2.3424625396728516e-05, 2.6404857635498047e-05, 2.9385089874267578e-05, 3.236532211303711e-05, 3.534555435180664e-05, 3.832578659057617e-05, 4.13060188293457e-05, 4.4286251068115234e-05, 4.7266483306884766e-05, 5.02467155456543e-05, 5.322694778442383e-05, 5.620718002319336e-05, 5.918741226196289e-05, 6.216764450073242e-05, 6.514787673950195e-05, 6.812810897827148e-05, 7.110834121704102e-05, 7.408857345581055e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 12.0, 6.0, 12.0, 15.0, 22.0, 23.0, 50.0, 76.0, 97.0, 139.0, 208.0, 300.0, 562.0, 963.0, 1739.0, 3456.0, 7608.0, 19050.0, 57945.0, 199834.0, 404910.0, 240036.0, 71271.0, 22670.0, 8843.0, 4016.0, 1990.0, 1093.0, 596.0, 323.0, 238.0, 133.0, 92.0, 61.0, 42.0, 28.0, 26.0, 23.0, 12.0, 9.0, 7.0, 2.0, 6.0, 1.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.343017578125, -0.333099365234375, -0.32318115234375, -0.313262939453125, -0.3033447265625, -0.293426513671875, -0.28350830078125, -0.273590087890625, -0.263671875, -0.253753662109375, -0.24383544921875, -0.233917236328125, -0.2239990234375, -0.214080810546875, -0.20416259765625, -0.194244384765625, -0.184326171875, -0.174407958984375, -0.16448974609375, -0.154571533203125, -0.1446533203125, -0.134735107421875, -0.12481689453125, -0.114898681640625, -0.10498046875, -0.095062255859375, -0.08514404296875, -0.075225830078125, -0.0653076171875, -0.055389404296875, -0.04547119140625, -0.035552978515625, -0.025634765625, -0.015716552734375, -0.00579833984375, 0.004119873046875, 0.0140380859375, 0.023956298828125, 0.03387451171875, 0.043792724609375, 0.0537109375, 0.063629150390625, 0.07354736328125, 0.083465576171875, 0.0933837890625, 0.103302001953125, 0.11322021484375, 0.123138427734375, 0.133056640625, 0.142974853515625, 0.15289306640625, 0.162811279296875, 0.1727294921875, 0.182647705078125, 0.19256591796875, 0.202484130859375, 0.21240234375, 0.222320556640625, 0.23223876953125, 0.242156982421875, 0.2520751953125, 0.261993408203125, 0.27191162109375, 0.281829833984375, 0.291748046875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 6.0, 2.0, 2.0, 1.0, 4.0, 7.0, 6.0, 6.0, 5.0, 3.0, 8.0, 20.0, 18.0, 14.0, 34.0, 32.0, 35.0, 52.0, 50.0, 62.0, 56.0, 64.0, 61.0, 59.0, 63.0, 57.0, 44.0, 48.0, 27.0, 26.0, 20.0, 15.0, 21.0, 10.0, 16.0, 11.0, 10.0, 7.0, 5.0, 4.0, 9.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.228515625, -0.2214374542236328, -0.21435928344726562, -0.20728111267089844, -0.20020294189453125, -0.19312477111816406, -0.18604660034179688, -0.1789684295654297, -0.1718902587890625, -0.1648120880126953, -0.15773391723632812, -0.15065574645996094, -0.14357757568359375, -0.13649940490722656, -0.12942123413085938, -0.12234306335449219, -0.115264892578125, -0.10818672180175781, -0.10110855102539062, -0.09403038024902344, -0.08695220947265625, -0.07987403869628906, -0.07279586791992188, -0.06571769714355469, -0.0586395263671875, -0.05156135559082031, -0.044483184814453125, -0.03740501403808594, -0.03032684326171875, -0.023248672485351562, -0.016170501708984375, -0.009092330932617188, -0.00201416015625, 0.0050640106201171875, 0.012142181396484375, 0.019220352172851562, 0.02629852294921875, 0.03337669372558594, 0.040454864501953125, 0.04753303527832031, 0.0546112060546875, 0.06168937683105469, 0.06876754760742188, 0.07584571838378906, 0.08292388916015625, 0.09000205993652344, 0.09708023071289062, 0.10415840148925781, 0.111236572265625, 0.11831474304199219, 0.12539291381835938, 0.13247108459472656, 0.13954925537109375, 0.14662742614746094, 0.15370559692382812, 0.1607837677001953, 0.1678619384765625, 0.1749401092529297, 0.18201828002929688, 0.18909645080566406, 0.19617462158203125, 0.20325279235839844, 0.21033096313476562, 0.2174091339111328, 0.2244873046875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 7.0, 5.0, 4.0, 13.0, 8.0, 22.0, 37.0, 60.0, 84.0, 116.0, 137.0, 134.0, 116.0, 95.0, 61.0, 46.0, 25.0, 10.0, 9.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.291975021362305, -4.170666217803955, -4.049356937408447, -3.9280478954315186, -3.80673885345459, -3.6854300498962402, -3.5641207695007324, -3.442811965942383, -3.321502923965454, -3.2001938819885254, -3.0788848400115967, -2.957575798034668, -2.8362667560577393, -2.7149577140808105, -2.593648910522461, -2.4723398685455322, -2.3510308265686035, -2.229721784591675, -2.108412742614746, -1.9871037006378174, -1.8657947778701782, -1.7444857358932495, -1.6231766939163208, -1.5018677711486816, -1.3805584907531738, -1.2592494487762451, -1.1379404067993164, -1.0166313648223877, -0.8953224420547485, -0.7740134000778198, -0.6527043581008911, -0.5313953757286072, -0.41008639335632324, -0.2887773811817169, -0.1674683541059494, -0.046159327030181885, 0.07514968514442444, 0.19645869731903076, 0.3177677392959595, 0.4390767216682434, 0.5603857636451721, 0.6816948056221008, 0.8030037879943848, 0.9243128299713135, 1.0456218719482422, 1.166930913925171, 1.2882399559020996, 1.4095488786697388, 1.5308579206466675, 1.6521669626235962, 1.773476004600525, 1.894784927368164, 2.0160939693450928, 2.1374030113220215, 2.25871205329895, 2.380021095275879, 2.5013301372528076, 2.6226391792297363, 2.743948221206665, 2.8652572631835938, 2.9865663051605225, 3.107875347137451, 3.229184150695801, 3.3504931926727295, 3.471802234649658]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 4.0, 4.0, 7.0, 15.0, 8.0, 14.0, 13.0, 12.0, 12.0, 17.0, 19.0, 30.0, 17.0, 30.0, 32.0, 35.0, 38.0, 42.0, 35.0, 43.0, 41.0, 32.0, 50.0, 43.0, 41.0, 47.0, 33.0, 43.0, 32.0, 35.0, 39.0, 24.0, 17.0, 17.0, 23.0, 15.0, 9.0, 7.0, 12.0, 3.0, 3.0, 7.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.6569857597351074, -2.5691003799438477, -2.481215238571167, -2.3933298587799072, -2.3054444789886475, -2.217559337615967, -2.129673957824707, -2.0417885780334473, -1.953903317451477, -1.8660180568695068, -1.778132677078247, -1.6902474164962769, -1.6023621559143066, -1.5144767761230469, -1.4265915155410767, -1.3387062549591064, -1.2508208751678467, -1.1629356145858765, -1.0750502347946167, -0.9871649742126465, -0.8992796540260315, -0.8113943338394165, -0.7235090732574463, -0.6356237530708313, -0.5477384328842163, -0.4598531126976013, -0.3719678223133087, -0.2840825319290161, -0.19619721174240112, -0.10831189155578613, -0.020426630973815918, 0.06745868921279907, 0.15534377098083496, 0.24322907626628876, 0.33111438155174255, 0.41899967193603516, 0.5068849921226501, 0.5947703123092651, 0.6826555728912354, 0.7705408930778503, 0.8584262132644653, 0.9463115334510803, 1.0341968536376953, 1.1220821142196655, 1.2099673748016357, 1.2978527545928955, 1.3857380151748657, 1.473623275756836, 1.5615086555480957, 1.649393916130066, 1.7372792959213257, 1.825164556503296, 1.9130499362945557, 2.0009350776672363, 2.088820457458496, 2.176705837249756, 2.2645912170410156, 2.3524765968322754, 2.440361738204956, 2.528247117996216, 2.6161324977874756, 2.7040176391601562, 2.791903018951416, 2.879788398742676, 2.9676735401153564]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 6.0, 1.0, 15.0, 13.0, 15.0, 30.0, 31.0, 59.0, 61.0, 95.0, 125.0, 153.0, 218.0, 387.0, 541.0, 779.0, 1245.0, 2136.0, 3630.0, 7273.0, 15762.0, 40201.0, 119700.0, 409202.0, 1420070.0, 1512589.0, 450835.0, 130534.0, 43189.0, 17190.0, 7925.0, 4010.0, 2327.0, 1368.0, 901.0, 540.0, 369.0, 224.0, 160.0, 106.0, 78.0, 62.0, 41.0, 30.0, 24.0, 14.0, 8.0, 6.0, 8.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.47119140625, -0.4573478698730469, -0.44350433349609375, -0.4296607971191406, -0.4158172607421875, -0.4019737243652344, -0.38813018798828125, -0.3742866516113281, -0.360443115234375, -0.3465995788574219, -0.33275604248046875, -0.3189125061035156, -0.3050689697265625, -0.2912254333496094, -0.27738189697265625, -0.2635383605957031, -0.24969482421875, -0.23585128784179688, -0.22200775146484375, -0.20816421508789062, -0.1943206787109375, -0.18047714233398438, -0.16663360595703125, -0.15279006958007812, -0.138946533203125, -0.12510299682617188, -0.11125946044921875, -0.09741592407226562, -0.0835723876953125, -0.06972885131835938, -0.05588531494140625, -0.042041778564453125, -0.0281982421875, -0.014354705810546875, -0.00051116943359375, 0.013332366943359375, 0.0271759033203125, 0.041019439697265625, 0.05486297607421875, 0.06870651245117188, 0.082550048828125, 0.09639358520507812, 0.11023712158203125, 0.12408065795898438, 0.1379241943359375, 0.15176773071289062, 0.16561126708984375, 0.17945480346679688, 0.19329833984375, 0.20714187622070312, 0.22098541259765625, 0.23482894897460938, 0.2486724853515625, 0.2625160217285156, 0.27635955810546875, 0.2902030944824219, 0.304046630859375, 0.3178901672363281, 0.33173370361328125, 0.3455772399902344, 0.3594207763671875, 0.3732643127441406, 0.38710784912109375, 0.4009513854980469, 0.414794921875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 2.0, 3.0, 8.0, 4.0, 5.0, 7.0, 10.0, 10.0, 12.0, 12.0, 9.0, 11.0, 23.0, 17.0, 12.0, 24.0, 36.0, 33.0, 28.0, 40.0, 27.0, 32.0, 33.0, 38.0, 25.0, 39.0, 35.0, 46.0, 28.0, 32.0, 42.0, 50.0, 29.0, 28.0, 31.0, 22.0, 19.0, 21.0, 13.0, 17.0, 18.0, 13.0, 13.0, 4.0, 8.0, 9.0, 10.0, 5.0, 5.0, 2.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.283447265625, -0.27394866943359375, -0.2644500732421875, -0.25495147705078125, -0.245452880859375, -0.23595428466796875, -0.2264556884765625, -0.21695709228515625, -0.20745849609375, -0.19795989990234375, -0.1884613037109375, -0.17896270751953125, -0.169464111328125, -0.15996551513671875, -0.1504669189453125, -0.14096832275390625, -0.1314697265625, -0.12197113037109375, -0.1124725341796875, -0.10297393798828125, -0.093475341796875, -0.08397674560546875, -0.0744781494140625, -0.06497955322265625, -0.05548095703125, -0.04598236083984375, -0.0364837646484375, -0.02698516845703125, -0.017486572265625, -0.00798797607421875, 0.0015106201171875, 0.01100921630859375, 0.0205078125, 0.03000640869140625, 0.0395050048828125, 0.04900360107421875, 0.058502197265625, 0.06800079345703125, 0.0774993896484375, 0.08699798583984375, 0.09649658203125, 0.10599517822265625, 0.1154937744140625, 0.12499237060546875, 0.134490966796875, 0.14398956298828125, 0.1534881591796875, 0.16298675537109375, 0.1724853515625, 0.18198394775390625, 0.1914825439453125, 0.20098114013671875, 0.210479736328125, 0.21997833251953125, 0.2294769287109375, 0.23897552490234375, 0.24847412109375, 0.25797271728515625, 0.2674713134765625, 0.27696990966796875, 0.286468505859375, 0.29596710205078125, 0.3054656982421875, 0.31496429443359375, 0.324462890625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 6.0, 5.0, 5.0, 8.0, 17.0, 37.0, 48.0, 54.0, 68.0, 118.0, 209.0, 310.0, 549.0, 1177.0, 2639.0, 7249.0, 25967.0, 146883.0, 2264373.0, 1594513.0, 116240.0, 22376.0, 6531.0, 2435.0, 1112.0, 581.0, 293.0, 174.0, 96.0, 65.0, 49.0, 40.0, 21.0, 4.0, 11.0, 6.0, 7.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9541015625, -0.9158477783203125, -0.877593994140625, -0.8393402099609375, -0.80108642578125, -0.7628326416015625, -0.724578857421875, -0.6863250732421875, -0.6480712890625, -0.6098175048828125, -0.571563720703125, -0.5333099365234375, -0.49505615234375, -0.4568023681640625, -0.418548583984375, -0.3802947998046875, -0.342041015625, -0.3037872314453125, -0.265533447265625, -0.2272796630859375, -0.18902587890625, -0.1507720947265625, -0.112518310546875, -0.0742645263671875, -0.0360107421875, 0.0022430419921875, 0.040496826171875, 0.0787506103515625, 0.11700439453125, 0.1552581787109375, 0.193511962890625, 0.2317657470703125, 0.27001953125, 0.3082733154296875, 0.346527099609375, 0.3847808837890625, 0.42303466796875, 0.4612884521484375, 0.499542236328125, 0.5377960205078125, 0.5760498046875, 0.6143035888671875, 0.652557373046875, 0.6908111572265625, 0.72906494140625, 0.7673187255859375, 0.805572509765625, 0.8438262939453125, 0.882080078125, 0.9203338623046875, 0.958587646484375, 0.9968414306640625, 1.03509521484375, 1.0733489990234375, 1.111602783203125, 1.1498565673828125, 1.1881103515625, 1.2263641357421875, 1.264617919921875, 1.3028717041015625, 1.34112548828125, 1.3793792724609375, 1.417633056640625, 1.4558868408203125, 1.494140625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 8.0, 4.0, 19.0, 17.0, 41.0, 48.0, 86.0, 131.0, 260.0, 437.0, 906.0, 918.0, 491.0, 271.0, 155.0, 88.0, 68.0, 32.0, 26.0, 23.0, 9.0, 12.0, 3.0, 6.0, 6.0, 4.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.482421875, -1.4471664428710938, -1.4119110107421875, -1.3766555786132812, -1.341400146484375, -1.3061447143554688, -1.2708892822265625, -1.2356338500976562, -1.20037841796875, -1.1651229858398438, -1.1298675537109375, -1.0946121215820312, -1.059356689453125, -1.0241012573242188, -0.9888458251953125, -0.9535903930664062, -0.9183349609375, -0.8830795288085938, -0.8478240966796875, -0.8125686645507812, -0.777313232421875, -0.7420578002929688, -0.7068023681640625, -0.6715469360351562, -0.63629150390625, -0.6010360717773438, -0.5657806396484375, -0.5305252075195312, -0.495269775390625, -0.46001434326171875, -0.4247589111328125, -0.38950347900390625, -0.354248046875, -0.31899261474609375, -0.2837371826171875, -0.24848175048828125, -0.213226318359375, -0.17797088623046875, -0.1427154541015625, -0.10746002197265625, -0.07220458984375, -0.03694915771484375, -0.0016937255859375, 0.03356170654296875, 0.068817138671875, 0.10407257080078125, 0.1393280029296875, 0.17458343505859375, 0.2098388671875, 0.24509429931640625, 0.2803497314453125, 0.31560516357421875, 0.350860595703125, 0.38611602783203125, 0.4213714599609375, 0.45662689208984375, 0.49188232421875, 0.5271377563476562, 0.5623931884765625, 0.5976486206054688, 0.632904052734375, 0.6681594848632812, 0.7034149169921875, 0.7386703491210938, 0.77392578125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 17.0, 42.0, 90.0, 155.0, 213.0, 245.0, 125.0, 58.0, 32.0, 11.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.1748504638671875, -6.914915084838867, -6.654979705810547, -6.395044326782227, -6.135108947753906, -5.875173568725586, -5.615238189697266, -5.355302810668945, -5.095367431640625, -4.835432052612305, -4.575496673583984, -4.315561294555664, -4.055625915527344, -3.7956905364990234, -3.5357553958892822, -3.275820016860962, -3.0158848762512207, -2.7559494972229004, -2.49601411819458, -2.2360787391662598, -1.976143479347229, -1.7162081003189087, -1.456272840499878, -1.1963374614715576, -0.9364020824432373, -0.676466703414917, -0.41653138399124146, -0.15659606456756592, 0.1033393144607544, 0.3632746934890747, 0.6232099533081055, 0.8831453323364258, 1.143080711364746, 1.4030160903930664, 1.6629514694213867, 1.9228867292404175, 2.1828222274780273, 2.4427576065063477, 2.702692747116089, 2.962628126144409, 3.2225635051727295, 3.48249888420105, 3.74243426322937, 4.002369403839111, 4.262304782867432, 4.522240161895752, 4.782175540924072, 5.042110919952393, 5.302046298980713, 5.561981678009033, 5.8219170570373535, 6.081852436065674, 6.341787815093994, 6.6017231941223145, 6.861658096313477, 7.121593475341797, 7.381528854370117, 7.6414642333984375, 7.901399612426758, 8.161334991455078, 8.421270370483398, 8.681205749511719, 8.941141128540039, 9.20107650756836, 9.46101188659668]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [4.0, 2.0, 0.0, 0.0, 3.0, 2.0, 4.0, 6.0, 4.0, 7.0, 15.0, 7.0, 11.0, 15.0, 22.0, 16.0, 16.0, 24.0, 26.0, 19.0, 23.0, 35.0, 41.0, 38.0, 25.0, 23.0, 26.0, 42.0, 27.0, 37.0, 43.0, 29.0, 30.0, 31.0, 37.0, 28.0, 38.0, 26.0, 33.0, 26.0, 27.0, 18.0, 20.0, 13.0, 14.0, 15.0, 13.0, 11.0, 7.0, 10.0, 6.0, 7.0, 3.0, 4.0, 2.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.0035922527313232, -1.9376325607299805, -1.8716728687286377, -1.805713176727295, -1.7397534847259521, -1.6737937927246094, -1.6078341007232666, -1.5418744087219238, -1.475914716720581, -1.4099550247192383, -1.3439953327178955, -1.2780356407165527, -1.21207594871521, -1.1461162567138672, -1.0801565647125244, -1.0141968727111816, -0.9482372999191284, -0.8822776079177856, -0.8163179159164429, -0.7503582239151001, -0.6843985319137573, -0.6184388399124146, -0.5524792075157166, -0.4865195155143738, -0.420559823513031, -0.35460013151168823, -0.28864043951034546, -0.22268077731132507, -0.1567210853099823, -0.09076139330863953, -0.02480173110961914, 0.04115796089172363, 0.1071176528930664, 0.17307734489440918, 0.23903702199459076, 0.30499669909477234, 0.3709563910961151, 0.4369160830974579, 0.5028757452964783, 0.568835437297821, 0.6347951292991638, 0.7007548213005066, 0.7667145133018494, 0.8326741456985474, 0.8986338376998901, 0.9645935297012329, 1.0305532217025757, 1.0965129137039185, 1.1624726057052612, 1.228432297706604, 1.2943919897079468, 1.3603516817092896, 1.4263113737106323, 1.492271065711975, 1.5582306385040283, 1.624190330505371, 1.6901500225067139, 1.7561097145080566, 1.8220694065093994, 1.8880290985107422, 1.953988790512085, 2.0199484825134277, 2.0859081745147705, 2.1518678665161133, 2.217827558517456]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 9.0, 8.0, 15.0, 8.0, 15.0, 19.0, 27.0, 31.0, 37.0, 66.0, 102.0, 128.0, 183.0, 315.0, 426.0, 693.0, 1092.0, 1778.0, 3090.0, 5581.0, 10612.0, 23137.0, 63841.0, 209476.0, 410602.0, 207394.0, 62842.0, 23107.0, 10348.0, 5465.0, 3056.0, 1759.0, 1102.0, 747.0, 435.0, 315.0, 182.0, 127.0, 114.0, 62.0, 54.0, 37.0, 31.0, 20.0, 14.0, 9.0, 19.0, 4.0, 7.0, 5.0, 5.0, 3.0, 3.0, 2.0, 3.0], "bins": [-0.765625, -0.742767333984375, -0.71990966796875, -0.697052001953125, -0.6741943359375, -0.651336669921875, -0.62847900390625, -0.605621337890625, -0.582763671875, -0.559906005859375, -0.53704833984375, -0.514190673828125, -0.4913330078125, -0.468475341796875, -0.44561767578125, -0.422760009765625, -0.39990234375, -0.377044677734375, -0.35418701171875, -0.331329345703125, -0.3084716796875, -0.285614013671875, -0.26275634765625, -0.239898681640625, -0.217041015625, -0.194183349609375, -0.17132568359375, -0.148468017578125, -0.1256103515625, -0.102752685546875, -0.07989501953125, -0.057037353515625, -0.0341796875, -0.011322021484375, 0.01153564453125, 0.034393310546875, 0.0572509765625, 0.080108642578125, 0.10296630859375, 0.125823974609375, 0.148681640625, 0.171539306640625, 0.19439697265625, 0.217254638671875, 0.2401123046875, 0.262969970703125, 0.28582763671875, 0.308685302734375, 0.33154296875, 0.354400634765625, 0.37725830078125, 0.400115966796875, 0.4229736328125, 0.445831298828125, 0.46868896484375, 0.491546630859375, 0.514404296875, 0.537261962890625, 0.56011962890625, 0.582977294921875, 0.6058349609375, 0.628692626953125, 0.65155029296875, 0.674407958984375, 0.697265625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 6.0, 2.0, 2.0, 6.0, 6.0, 12.0, 6.0, 12.0, 14.0, 12.0, 9.0, 26.0, 15.0, 18.0, 21.0, 37.0, 37.0, 39.0, 26.0, 34.0, 29.0, 36.0, 33.0, 36.0, 37.0, 35.0, 40.0, 34.0, 46.0, 37.0, 36.0, 35.0, 32.0, 29.0, 36.0, 20.0, 19.0, 15.0, 15.0, 15.0, 13.0, 9.0, 8.0, 4.0, 5.0, 6.0, 2.0, 5.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.37158203125, -0.36042022705078125, -0.3492584228515625, -0.33809661865234375, -0.326934814453125, -0.31577301025390625, -0.3046112060546875, -0.29344940185546875, -0.28228759765625, -0.27112579345703125, -0.2599639892578125, -0.24880218505859375, -0.237640380859375, -0.22647857666015625, -0.2153167724609375, -0.20415496826171875, -0.1929931640625, -0.18183135986328125, -0.1706695556640625, -0.15950775146484375, -0.148345947265625, -0.13718414306640625, -0.1260223388671875, -0.11486053466796875, -0.10369873046875, -0.09253692626953125, -0.0813751220703125, -0.07021331787109375, -0.059051513671875, -0.04788970947265625, -0.0367279052734375, -0.02556610107421875, -0.014404296875, -0.00324249267578125, 0.0079193115234375, 0.01908111572265625, 0.030242919921875, 0.04140472412109375, 0.0525665283203125, 0.06372833251953125, 0.07489013671875, 0.08605194091796875, 0.0972137451171875, 0.10837554931640625, 0.119537353515625, 0.13069915771484375, 0.1418609619140625, 0.15302276611328125, 0.1641845703125, 0.17534637451171875, 0.1865081787109375, 0.19766998291015625, 0.208831787109375, 0.21999359130859375, 0.2311553955078125, 0.24231719970703125, 0.25347900390625, 0.26464080810546875, 0.2758026123046875, 0.28696441650390625, 0.298126220703125, 0.30928802490234375, 0.3204498291015625, 0.33161163330078125, 0.3427734375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 2.0, 2.0, 10.0, 5.0, 7.0, 12.0, 11.0, 17.0, 18.0, 41.0, 57.0, 106.0, 142.0, 212.0, 331.0, 604.0, 959.0, 1779.0, 3128.0, 5900.0, 12390.0, 30793.0, 100807.0, 362002.0, 367351.0, 103596.0, 31891.0, 12730.0, 6062.0, 3204.0, 1789.0, 1043.0, 601.0, 364.0, 207.0, 125.0, 86.0, 46.0, 30.0, 25.0, 21.0, 15.0, 6.0, 9.0, 4.0, 7.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.8837890625, -0.8578033447265625, -0.831817626953125, -0.8058319091796875, -0.77984619140625, -0.7538604736328125, -0.727874755859375, -0.7018890380859375, -0.6759033203125, -0.6499176025390625, -0.623931884765625, -0.5979461669921875, -0.57196044921875, -0.5459747314453125, -0.519989013671875, -0.4940032958984375, -0.468017578125, -0.4420318603515625, -0.416046142578125, -0.3900604248046875, -0.36407470703125, -0.3380889892578125, -0.312103271484375, -0.2861175537109375, -0.2601318359375, -0.2341461181640625, -0.208160400390625, -0.1821746826171875, -0.15618896484375, -0.1302032470703125, -0.104217529296875, -0.0782318115234375, -0.05224609375, -0.0262603759765625, -0.000274658203125, 0.0257110595703125, 0.05169677734375, 0.0776824951171875, 0.103668212890625, 0.1296539306640625, 0.1556396484375, 0.1816253662109375, 0.207611083984375, 0.2335968017578125, 0.25958251953125, 0.2855682373046875, 0.311553955078125, 0.3375396728515625, 0.363525390625, 0.3895111083984375, 0.415496826171875, 0.4414825439453125, 0.46746826171875, 0.4934539794921875, 0.519439697265625, 0.5454254150390625, 0.5714111328125, 0.5973968505859375, 0.623382568359375, 0.6493682861328125, 0.67535400390625, 0.7013397216796875, 0.727325439453125, 0.7533111572265625, 0.779296875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 4.0, 5.0, 4.0, 7.0, 10.0, 6.0, 7.0, 13.0, 21.0, 24.0, 21.0, 25.0, 25.0, 32.0, 23.0, 31.0, 38.0, 42.0, 49.0, 38.0, 34.0, 40.0, 38.0, 39.0, 39.0, 48.0, 30.0, 33.0, 35.0, 29.0, 20.0, 26.0, 22.0, 20.0, 14.0, 12.0, 18.0, 12.0, 11.0, 11.0, 9.0, 4.0, 9.0, 2.0, 4.0, 8.0, 7.0, 4.0, 0.0, 2.0, 1.0], "bins": [-1.275390625, -1.2389678955078125, -1.202545166015625, -1.1661224365234375, -1.12969970703125, -1.0932769775390625, -1.056854248046875, -1.0204315185546875, -0.9840087890625, -0.9475860595703125, -0.911163330078125, -0.8747406005859375, -0.83831787109375, -0.8018951416015625, -0.765472412109375, -0.7290496826171875, -0.692626953125, -0.6562042236328125, -0.619781494140625, -0.5833587646484375, -0.54693603515625, -0.5105133056640625, -0.474090576171875, -0.4376678466796875, -0.4012451171875, -0.3648223876953125, -0.328399658203125, -0.2919769287109375, -0.25555419921875, -0.2191314697265625, -0.182708740234375, -0.1462860107421875, -0.10986328125, -0.0734405517578125, -0.037017822265625, -0.0005950927734375, 0.03582763671875, 0.0722503662109375, 0.108673095703125, 0.1450958251953125, 0.1815185546875, 0.2179412841796875, 0.254364013671875, 0.2907867431640625, 0.32720947265625, 0.3636322021484375, 0.400054931640625, 0.4364776611328125, 0.472900390625, 0.5093231201171875, 0.545745849609375, 0.5821685791015625, 0.61859130859375, 0.6550140380859375, 0.691436767578125, 0.7278594970703125, 0.7642822265625, 0.8007049560546875, 0.837127685546875, 0.8735504150390625, 0.90997314453125, 0.9463958740234375, 0.982818603515625, 1.0192413330078125, 1.0556640625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 5.0, 4.0, 4.0, 6.0, 19.0, 20.0, 21.0, 47.0, 62.0, 88.0, 133.0, 205.0, 310.0, 497.0, 712.0, 1142.0, 1729.0, 2839.0, 4490.0, 7304.0, 12751.0, 22953.0, 45389.0, 99797.0, 227305.0, 306159.0, 164388.0, 72423.0, 33918.0, 17618.0, 10040.0, 5921.0, 3725.0, 2223.0, 1509.0, 962.0, 650.0, 388.0, 260.0, 194.0, 111.0, 77.0, 55.0, 34.0, 27.0, 20.0, 7.0, 8.0, 6.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.2332763671875, -0.2262706756591797, -0.21926498413085938, -0.21225929260253906, -0.20525360107421875, -0.19824790954589844, -0.19124221801757812, -0.1842365264892578, -0.1772308349609375, -0.1702251434326172, -0.16321945190429688, -0.15621376037597656, -0.14920806884765625, -0.14220237731933594, -0.13519668579101562, -0.1281909942626953, -0.121185302734375, -0.11417961120605469, -0.10717391967773438, -0.10016822814941406, -0.09316253662109375, -0.08615684509277344, -0.07915115356445312, -0.07214546203613281, -0.0651397705078125, -0.05813407897949219, -0.051128387451171875, -0.04412269592285156, -0.03711700439453125, -0.030111312866210938, -0.023105621337890625, -0.016099929809570312, -0.00909423828125, -0.0020885467529296875, 0.004917144775390625, 0.011922836303710938, 0.01892852783203125, 0.025934219360351562, 0.032939910888671875, 0.03994560241699219, 0.0469512939453125, 0.05395698547363281, 0.060962677001953125, 0.06796836853027344, 0.07497406005859375, 0.08197975158691406, 0.08898544311523438, 0.09599113464355469, 0.102996826171875, 0.11000251770019531, 0.11700820922851562, 0.12401390075683594, 0.13101959228515625, 0.13802528381347656, 0.14503097534179688, 0.1520366668701172, 0.1590423583984375, 0.1660480499267578, 0.17305374145507812, 0.18005943298339844, 0.18706512451171875, 0.19407081604003906, 0.20107650756835938, 0.2080821990966797, 0.215087890625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 5.0, 13.0, 8.0, 16.0, 21.0, 31.0, 50.0, 82.0, 112.0, 140.0, 137.0, 130.0, 82.0, 49.0, 29.0, 14.0, 19.0, 14.0, 8.0, 8.0, 7.0, 2.0, 3.0, 3.0, 3.0, 1.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.475780487060547e-05, -8.10716301202774e-05, -7.738545536994934e-05, -7.369928061962128e-05, -7.001310586929321e-05, -6.632693111896515e-05, -6.264075636863708e-05, -5.895458161830902e-05, -5.526840686798096e-05, -5.158223211765289e-05, -4.789605736732483e-05, -4.4209882616996765e-05, -4.05237078666687e-05, -3.683753311634064e-05, -3.315135836601257e-05, -2.946518361568451e-05, -2.5779008865356445e-05, -2.209283411502838e-05, -1.8406659364700317e-05, -1.4720484614372253e-05, -1.103430986404419e-05, -7.3481351137161255e-06, -3.6619603633880615e-06, 2.421438694000244e-08, 3.7103891372680664e-06, 7.39656388759613e-06, 1.1082738637924194e-05, 1.4768913388252258e-05, 1.8455088138580322e-05, 2.2141262888908386e-05, 2.582743763923645e-05, 2.9513612389564514e-05, 3.319978713989258e-05, 3.688596189022064e-05, 4.0572136640548706e-05, 4.425831139087677e-05, 4.7944486141204834e-05, 5.16306608915329e-05, 5.531683564186096e-05, 5.9003010392189026e-05, 6.268918514251709e-05, 6.637535989284515e-05, 7.006153464317322e-05, 7.374770939350128e-05, 7.743388414382935e-05, 8.112005889415741e-05, 8.480623364448547e-05, 8.849240839481354e-05, 9.21785831451416e-05, 9.586475789546967e-05, 9.955093264579773e-05, 0.0001032371073961258, 0.00010692328214645386, 0.00011060945689678192, 0.00011429563164710999, 0.00011798180639743805, 0.00012166798114776611, 0.00012535415589809418, 0.00012904033064842224, 0.0001327265053987503, 0.00013641268014907837, 0.00014009885489940643, 0.0001437850296497345, 0.00014747120440006256, 0.00015115737915039062]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 10.0, 9.0, 14.0, 15.0, 16.0, 42.0, 45.0, 84.0, 121.0, 214.0, 278.0, 520.0, 833.0, 1325.0, 2280.0, 4044.0, 7118.0, 12736.0, 23680.0, 45294.0, 91559.0, 182605.0, 267004.0, 199403.0, 100691.0, 50280.0, 25810.0, 13821.0, 7793.0, 4547.0, 2524.0, 1456.0, 902.0, 545.0, 326.0, 211.0, 147.0, 87.0, 49.0, 46.0, 22.0, 17.0, 11.0, 8.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.2120361328125, -0.2057209014892578, -0.19940567016601562, -0.19309043884277344, -0.18677520751953125, -0.18045997619628906, -0.17414474487304688, -0.1678295135498047, -0.1615142822265625, -0.1551990509033203, -0.14888381958007812, -0.14256858825683594, -0.13625335693359375, -0.12993812561035156, -0.12362289428710938, -0.11730766296386719, -0.110992431640625, -0.10467720031738281, -0.09836196899414062, -0.09204673767089844, -0.08573150634765625, -0.07941627502441406, -0.07310104370117188, -0.06678581237792969, -0.0604705810546875, -0.05415534973144531, -0.047840118408203125, -0.04152488708496094, -0.03520965576171875, -0.028894424438476562, -0.022579193115234375, -0.016263961791992188, -0.00994873046875, -0.0036334991455078125, 0.002681732177734375, 0.008996963500976562, 0.01531219482421875, 0.021627426147460938, 0.027942657470703125, 0.03425788879394531, 0.0405731201171875, 0.04688835144042969, 0.053203582763671875, 0.05951881408691406, 0.06583404541015625, 0.07214927673339844, 0.07846450805664062, 0.08477973937988281, 0.091094970703125, 0.09741020202636719, 0.10372543334960938, 0.11004066467285156, 0.11635589599609375, 0.12267112731933594, 0.12898635864257812, 0.1353015899658203, 0.1416168212890625, 0.1479320526123047, 0.15424728393554688, 0.16056251525878906, 0.16687774658203125, 0.17319297790527344, 0.17950820922851562, 0.1858234405517578, 0.192138671875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 4.0, 5.0, 9.0, 8.0, 8.0, 8.0, 10.0, 18.0, 17.0, 25.0, 33.0, 33.0, 31.0, 51.0, 85.0, 73.0, 81.0, 70.0, 71.0, 60.0, 43.0, 47.0, 36.0, 38.0, 25.0, 25.0, 18.0, 14.0, 16.0, 9.0, 11.0, 6.0, 6.0, 6.0, 2.0, 6.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1783447265625, -0.1695690155029297, -0.16079330444335938, -0.15201759338378906, -0.14324188232421875, -0.13446617126464844, -0.12569046020507812, -0.11691474914550781, -0.1081390380859375, -0.09936332702636719, -0.09058761596679688, -0.08181190490722656, -0.07303619384765625, -0.06426048278808594, -0.055484771728515625, -0.04670906066894531, -0.037933349609375, -0.029157638549804688, -0.020381927490234375, -0.011606216430664062, -0.00283050537109375, 0.0059452056884765625, 0.014720916748046875, 0.023496627807617188, 0.0322723388671875, 0.04104804992675781, 0.049823760986328125, 0.05859947204589844, 0.06737518310546875, 0.07615089416503906, 0.08492660522460938, 0.09370231628417969, 0.10247802734375, 0.11125373840332031, 0.12002944946289062, 0.12880516052246094, 0.13758087158203125, 0.14635658264160156, 0.15513229370117188, 0.1639080047607422, 0.1726837158203125, 0.1814594268798828, 0.19023513793945312, 0.19901084899902344, 0.20778656005859375, 0.21656227111816406, 0.22533798217773438, 0.2341136932373047, 0.242889404296875, 0.2516651153564453, 0.2604408264160156, 0.26921653747558594, 0.27799224853515625, 0.28676795959472656, 0.2955436706542969, 0.3043193817138672, 0.3130950927734375, 0.3218708038330078, 0.3306465148925781, 0.33942222595214844, 0.34819793701171875, 0.35697364807128906, 0.3657493591308594, 0.3745250701904297, 0.38330078125]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 5.0, 9.0, 15.0, 56.0, 92.0, 124.0, 162.0, 200.0, 145.0, 87.0, 51.0, 31.0, 8.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.79995584487915, -4.600244045257568, -4.4005327224731445, -4.2008209228515625, -4.001109600067139, -3.8013978004455566, -3.6016862392425537, -3.401974678039551, -3.202263116836548, -3.002551555633545, -2.802839994430542, -2.603128433227539, -2.403416633605957, -2.203705310821533, -2.003993511199951, -1.8042819499969482, -1.6045703887939453, -1.4048588275909424, -1.2051472663879395, -1.005435585975647, -0.805724024772644, -0.6060124635696411, -0.40630078315734863, -0.2065892219543457, -0.0068776607513427734, 0.19283393025398254, 0.39254552125930786, 0.5922571420669556, 0.7919687032699585, 0.9916802644729614, 1.191391944885254, 1.3911035060882568, 1.590815544128418, 1.790527105331421, 1.9902386665344238, 2.189950466156006, 2.3896617889404297, 2.5893735885620117, 2.7890851497650146, 2.9887967109680176, 3.1885082721710205, 3.3882198333740234, 3.5879313945770264, 3.7876429557800293, 3.9873547554016113, 4.187066078186035, 4.386777877807617, 4.586489677429199, 4.786201000213623, 4.985912799835205, 5.185624122619629, 5.385335922241211, 5.585047245025635, 5.784759044647217, 5.984470367431641, 6.184182167053223, 6.383893966674805, 6.583605766296387, 6.7833170890808105, 6.983028888702393, 7.182740211486816, 7.382452011108398, 7.5821638107299805, 7.781875133514404, 7.981586456298828]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 1.0, 6.0, 5.0, 7.0, 8.0, 8.0, 12.0, 13.0, 14.0, 16.0, 18.0, 21.0, 29.0, 29.0, 28.0, 49.0, 34.0, 31.0, 37.0, 39.0, 33.0, 38.0, 42.0, 27.0, 36.0, 47.0, 42.0, 51.0, 22.0, 37.0, 28.0, 31.0, 28.0, 23.0, 18.0, 18.0, 14.0, 21.0, 12.0, 6.0, 8.0, 4.0, 7.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1429152488708496, -3.042776107788086, -2.9426369667053223, -2.8424978256225586, -2.742358684539795, -2.6422195434570312, -2.5420804023742676, -2.441941261291504, -2.3418021202087402, -2.2416629791259766, -2.141523838043213, -2.041384696960449, -1.9412455558776855, -1.8411064147949219, -1.7409672737121582, -1.6408281326293945, -1.5406888723373413, -1.4405497312545776, -1.340410590171814, -1.2402714490890503, -1.1401323080062866, -1.0399930477142334, -0.9398539662361145, -0.8397148251533508, -0.7395756840705872, -0.6394365429878235, -0.5392974019050598, -0.43915823101997375, -0.3390190899372101, -0.23887991905212402, -0.13874077796936035, -0.03860163688659668, 0.06153750419616699, 0.16167664527893066, 0.26181578636169434, 0.3619549572467804, 0.46209409832954407, 0.5622332692146301, 0.6623724102973938, 0.7625115513801575, 0.8626506924629211, 0.9627898335456848, 1.0629290342330933, 1.163068175315857, 1.2632073163986206, 1.3633464574813843, 1.463485598564148, 1.5636247396469116, 1.6637638807296753, 1.763903021812439, 1.8640421628952026, 1.9641813039779663, 2.0643205642700195, 2.164459705352783, 2.264598846435547, 2.3647379875183105, 2.464877128601074, 2.565016269683838, 2.6651554107666016, 2.7652945518493652, 2.865433692932129, 2.9655728340148926, 3.0657119750976562, 3.16585111618042, 3.2659902572631836]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 2.0, 6.0, 4.0, 5.0, 11.0, 19.0, 17.0, 40.0, 36.0, 61.0, 68.0, 111.0, 148.0, 218.0, 295.0, 504.0, 765.0, 1358.0, 2288.0, 4292.0, 8491.0, 20299.0, 63010.0, 282745.0, 1336232.0, 1854100.0, 469977.0, 97807.0, 28269.0, 11234.0, 5149.0, 2736.0, 1524.0, 851.0, 550.0, 325.0, 216.0, 156.0, 121.0, 62.0, 61.0, 37.0, 28.0, 21.0, 15.0, 10.0, 5.0, 7.0, 0.0, 1.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.65087890625, -0.6306381225585938, -0.6103973388671875, -0.5901565551757812, -0.569915771484375, -0.5496749877929688, -0.5294342041015625, -0.5091934204101562, -0.48895263671875, -0.46871185302734375, -0.4484710693359375, -0.42823028564453125, -0.407989501953125, -0.38774871826171875, -0.3675079345703125, -0.34726715087890625, -0.3270263671875, -0.30678558349609375, -0.2865447998046875, -0.26630401611328125, -0.246063232421875, -0.22582244873046875, -0.2055816650390625, -0.18534088134765625, -0.16510009765625, -0.14485931396484375, -0.1246185302734375, -0.10437774658203125, -0.084136962890625, -0.06389617919921875, -0.0436553955078125, -0.02341461181640625, -0.003173828125, 0.01706695556640625, 0.0373077392578125, 0.05754852294921875, 0.077789306640625, 0.09803009033203125, 0.1182708740234375, 0.13851165771484375, 0.15875244140625, 0.17899322509765625, 0.1992340087890625, 0.21947479248046875, 0.239715576171875, 0.25995635986328125, 0.2801971435546875, 0.30043792724609375, 0.3206787109375, 0.34091949462890625, 0.3611602783203125, 0.38140106201171875, 0.401641845703125, 0.42188262939453125, 0.4421234130859375, 0.46236419677734375, 0.48260498046875, 0.5028457641601562, 0.5230865478515625, 0.5433273315429688, 0.563568115234375, 0.5838088989257812, 0.6040496826171875, 0.6242904663085938, 0.64453125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 4.0, 6.0, 6.0, 8.0, 5.0, 11.0, 10.0, 10.0, 16.0, 21.0, 17.0, 25.0, 26.0, 24.0, 36.0, 32.0, 37.0, 45.0, 43.0, 34.0, 51.0, 48.0, 47.0, 55.0, 42.0, 37.0, 35.0, 22.0, 33.0, 35.0, 34.0, 26.0, 22.0, 22.0, 10.0, 17.0, 13.0, 8.0, 12.0, 7.0, 3.0, 3.0, 2.0, 3.0, 2.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.411376953125, -0.3979759216308594, -0.38457489013671875, -0.3711738586425781, -0.3577728271484375, -0.3443717956542969, -0.33097076416015625, -0.3175697326660156, -0.304168701171875, -0.2907676696777344, -0.27736663818359375, -0.2639656066894531, -0.2505645751953125, -0.23716354370117188, -0.22376251220703125, -0.21036148071289062, -0.19696044921875, -0.18355941772460938, -0.17015838623046875, -0.15675735473632812, -0.1433563232421875, -0.12995529174804688, -0.11655426025390625, -0.10315322875976562, -0.089752197265625, -0.07635116577148438, -0.06295013427734375, -0.049549102783203125, -0.0361480712890625, -0.022747039794921875, -0.00934600830078125, 0.004055023193359375, 0.0174560546875, 0.030857086181640625, 0.04425811767578125, 0.057659149169921875, 0.0710601806640625, 0.08446121215820312, 0.09786224365234375, 0.11126327514648438, 0.124664306640625, 0.13806533813476562, 0.15146636962890625, 0.16486740112304688, 0.1782684326171875, 0.19166946411132812, 0.20507049560546875, 0.21847152709960938, 0.23187255859375, 0.24527359008789062, 0.25867462158203125, 0.2720756530761719, 0.2854766845703125, 0.2988777160644531, 0.31227874755859375, 0.3256797790527344, 0.339080810546875, 0.3524818420410156, 0.36588287353515625, 0.3792839050292969, 0.3926849365234375, 0.4060859680175781, 0.41948699951171875, 0.4328880310058594, 0.4462890625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 8.0, 6.0, 5.0, 7.0, 18.0, 17.0, 29.0, 44.0, 58.0, 82.0, 111.0, 196.0, 308.0, 448.0, 787.0, 1299.0, 2387.0, 5163.0, 14259.0, 57324.0, 490683.0, 3203316.0, 348913.0, 46690.0, 12310.0, 4558.0, 2169.0, 1153.0, 658.0, 378.0, 304.0, 180.0, 124.0, 74.0, 59.0, 59.0, 35.0, 17.0, 18.0, 9.0, 12.0, 6.0, 7.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3642578125, -1.32086181640625, -1.2774658203125, -1.23406982421875, -1.190673828125, -1.14727783203125, -1.1038818359375, -1.06048583984375, -1.01708984375, -0.97369384765625, -0.9302978515625, -0.88690185546875, -0.843505859375, -0.80010986328125, -0.7567138671875, -0.71331787109375, -0.669921875, -0.62652587890625, -0.5831298828125, -0.53973388671875, -0.496337890625, -0.45294189453125, -0.4095458984375, -0.36614990234375, -0.32275390625, -0.27935791015625, -0.2359619140625, -0.19256591796875, -0.149169921875, -0.10577392578125, -0.0623779296875, -0.01898193359375, 0.0244140625, 0.06781005859375, 0.1112060546875, 0.15460205078125, 0.197998046875, 0.24139404296875, 0.2847900390625, 0.32818603515625, 0.37158203125, 0.41497802734375, 0.4583740234375, 0.50177001953125, 0.545166015625, 0.58856201171875, 0.6319580078125, 0.67535400390625, 0.71875, 0.76214599609375, 0.8055419921875, 0.84893798828125, 0.892333984375, 0.93572998046875, 0.9791259765625, 1.02252197265625, 1.06591796875, 1.10931396484375, 1.1527099609375, 1.19610595703125, 1.239501953125, 1.28289794921875, 1.3262939453125, 1.36968994140625, 1.4130859375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 5.0, 3.0, 4.0, 7.0, 7.0, 8.0, 11.0, 22.0, 26.0, 52.0, 83.0, 120.0, 257.0, 469.0, 844.0, 940.0, 540.0, 278.0, 151.0, 96.0, 57.0, 40.0, 21.0, 12.0, 8.0, 5.0, 2.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.3447265625, -1.3015289306640625, -1.258331298828125, -1.2151336669921875, -1.17193603515625, -1.1287384033203125, -1.085540771484375, -1.0423431396484375, -0.9991455078125, -0.9559478759765625, -0.912750244140625, -0.8695526123046875, -0.82635498046875, -0.7831573486328125, -0.739959716796875, -0.6967620849609375, -0.653564453125, -0.6103668212890625, -0.567169189453125, -0.5239715576171875, -0.48077392578125, -0.4375762939453125, -0.394378662109375, -0.3511810302734375, -0.3079833984375, -0.2647857666015625, -0.221588134765625, -0.1783905029296875, -0.13519287109375, -0.0919952392578125, -0.048797607421875, -0.0055999755859375, 0.03759765625, 0.0807952880859375, 0.123992919921875, 0.1671905517578125, 0.21038818359375, 0.2535858154296875, 0.296783447265625, 0.3399810791015625, 0.3831787109375, 0.4263763427734375, 0.469573974609375, 0.5127716064453125, 0.55596923828125, 0.5991668701171875, 0.642364501953125, 0.6855621337890625, 0.728759765625, 0.7719573974609375, 0.815155029296875, 0.8583526611328125, 0.90155029296875, 0.9447479248046875, 0.987945556640625, 1.0311431884765625, 1.0743408203125, 1.1175384521484375, 1.160736083984375, 1.2039337158203125, 1.24713134765625, 1.2903289794921875, 1.333526611328125, 1.3767242431640625, 1.419921875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 8.0, 2.0, 7.0, 9.0, 19.0, 40.0, 62.0, 96.0, 186.0, 177.0, 159.0, 115.0, 69.0, 32.0, 12.0, 7.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.671438217163086, -11.385149002075195, -11.098858833312988, -10.812569618225098, -10.52627944946289, -10.239990234375, -9.95370101928711, -9.667411804199219, -9.381121635437012, -9.094832420349121, -8.808542251586914, -8.522253036499023, -8.235963821411133, -7.949673652648926, -7.663384437561035, -7.377094745635986, -7.0908050537109375, -6.804515361785889, -6.51822566986084, -6.231936454772949, -5.9456467628479, -5.659357070922852, -5.373067855834961, -5.086778163909912, -4.800488471984863, -4.5141987800598145, -4.227909088134766, -3.941619873046875, -3.655330181121826, -3.3690404891967773, -3.0827510356903076, -2.796461582183838, -2.5101728439331055, -2.2238831520080566, -1.937593698501587, -1.6513041257858276, -1.3650145530700684, -1.078724980354309, -0.7924354076385498, -0.5061459541320801, -0.21985626220703125, 0.06643331050872803, 0.3527228832244873, 0.6390124559402466, 0.9253020286560059, 1.2115916013717651, 1.4978811740875244, 1.7841706275939941, 2.070460319519043, 2.356750011444092, 2.6430394649505615, 2.9293289184570312, 3.21561861038208, 3.501908302307129, 3.7881977558135986, 4.074487209320068, 4.360776901245117, 4.647066593170166, 4.933356285095215, 5.2196455001831055, 5.505935192108154, 5.792224884033203, 6.078514099121094, 6.364803791046143, 6.651093482971191]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 4.0, 5.0, 4.0, 6.0, 10.0, 13.0, 19.0, 14.0, 23.0, 23.0, 28.0, 20.0, 31.0, 25.0, 32.0, 37.0, 43.0, 43.0, 39.0, 36.0, 49.0, 36.0, 47.0, 48.0, 47.0, 34.0, 37.0, 34.0, 24.0, 27.0, 27.0, 27.0, 23.0, 14.0, 11.0, 18.0, 13.0, 7.0, 10.0, 5.0, 4.0, 2.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.3810982704162598, -3.2837817668914795, -3.18646502494812, -3.08914852142334, -2.9918320178985596, -2.8945155143737793, -2.79719877243042, -2.6998822689056396, -2.6025657653808594, -2.505249261856079, -2.4079325199127197, -2.3106160163879395, -2.213299512863159, -2.115983009338379, -2.0186662673950195, -1.9213497638702393, -1.8240331411361694, -1.7267165184020996, -1.6294000148773193, -1.5320833921432495, -1.4347668886184692, -1.3374502658843994, -1.2401337623596191, -1.1428171396255493, -1.0455005168914795, -0.9481839537620544, -0.8508673906326294, -0.7535507678985596, -0.6562342643737793, -0.5589176416397095, -0.4616010785102844, -0.3642845153808594, -0.2669680118560791, -0.16965144872665405, -0.07233487069606781, 0.024981707334518433, 0.12229827046394348, 0.21961483359336853, 0.31693142652511597, 0.414247989654541, 0.5115645527839661, 0.6088811159133911, 0.7061976790428162, 0.8035142421722412, 0.900830864906311, 0.9981473684310913, 1.0954639911651611, 1.1927804946899414, 1.2900971174240112, 1.387413740158081, 1.4847302436828613, 1.5820468664169312, 1.6793633699417114, 1.7766799926757812, 1.8739964962005615, 1.9713131189346313, 2.068629741668701, 2.1659462451934814, 2.263262987136841, 2.360579490661621, 2.4578959941864014, 2.5552124977111816, 2.652529239654541, 2.7498457431793213, 2.8471622467041016]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 4.0, 15.0, 18.0, 20.0, 39.0, 77.0, 114.0, 137.0, 217.0, 365.0, 529.0, 833.0, 1384.0, 2381.0, 4192.0, 7563.0, 15969.0, 41895.0, 172165.0, 473347.0, 233880.0, 54125.0, 18830.0, 8729.0, 4815.0, 2697.0, 1597.0, 894.0, 650.0, 392.0, 238.0, 147.0, 101.0, 73.0, 33.0, 24.0, 26.0, 12.0, 8.0, 3.0, 6.0, 6.0, 2.0, 2.0, 3.0, 3.0], "bins": [-1.3251953125, -1.2899551391601562, -1.2547149658203125, -1.2194747924804688, -1.184234619140625, -1.1489944458007812, -1.1137542724609375, -1.0785140991210938, -1.04327392578125, -1.0080337524414062, -0.9727935791015625, -0.9375534057617188, -0.902313232421875, -0.8670730590820312, -0.8318328857421875, -0.7965927124023438, -0.7613525390625, -0.7261123657226562, -0.6908721923828125, -0.6556320190429688, -0.620391845703125, -0.5851516723632812, -0.5499114990234375, -0.5146713256835938, -0.47943115234375, -0.44419097900390625, -0.4089508056640625, -0.37371063232421875, -0.338470458984375, -0.30323028564453125, -0.2679901123046875, -0.23274993896484375, -0.197509765625, -0.16226959228515625, -0.1270294189453125, -0.09178924560546875, -0.056549072265625, -0.02130889892578125, 0.0139312744140625, 0.04917144775390625, 0.08441162109375, 0.11965179443359375, 0.1548919677734375, 0.19013214111328125, 0.225372314453125, 0.26061248779296875, 0.2958526611328125, 0.33109283447265625, 0.3663330078125, 0.40157318115234375, 0.4368133544921875, 0.47205352783203125, 0.507293701171875, 0.5425338745117188, 0.5777740478515625, 0.6130142211914062, 0.64825439453125, 0.6834945678710938, 0.7187347412109375, 0.7539749145507812, 0.789215087890625, 0.8244552612304688, 0.8596954345703125, 0.8949356079101562, 0.93017578125]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 6.0, 3.0, 7.0, 4.0, 7.0, 5.0, 6.0, 17.0, 15.0, 28.0, 13.0, 17.0, 21.0, 23.0, 22.0, 28.0, 31.0, 29.0, 31.0, 29.0, 34.0, 42.0, 48.0, 55.0, 36.0, 55.0, 45.0, 41.0, 35.0, 33.0, 27.0, 28.0, 30.0, 15.0, 27.0, 18.0, 19.0, 13.0, 16.0, 11.0, 11.0, 7.0, 8.0, 4.0, 1.0, 2.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.436279296875, -0.4224052429199219, -0.40853118896484375, -0.3946571350097656, -0.3807830810546875, -0.3669090270996094, -0.35303497314453125, -0.3391609191894531, -0.325286865234375, -0.3114128112792969, -0.29753875732421875, -0.2836647033691406, -0.2697906494140625, -0.2559165954589844, -0.24204254150390625, -0.22816848754882812, -0.21429443359375, -0.20042037963867188, -0.18654632568359375, -0.17267227172851562, -0.1587982177734375, -0.14492416381835938, -0.13105010986328125, -0.11717605590820312, -0.103302001953125, -0.08942794799804688, -0.07555389404296875, -0.061679840087890625, -0.0478057861328125, -0.033931732177734375, -0.02005767822265625, -0.006183624267578125, 0.0076904296875, 0.021564483642578125, 0.03543853759765625, 0.049312591552734375, 0.0631866455078125, 0.07706069946289062, 0.09093475341796875, 0.10480880737304688, 0.118682861328125, 0.13255691528320312, 0.14643096923828125, 0.16030502319335938, 0.1741790771484375, 0.18805313110351562, 0.20192718505859375, 0.21580123901367188, 0.22967529296875, 0.24354934692382812, 0.25742340087890625, 0.2712974548339844, 0.2851715087890625, 0.2990455627441406, 0.31291961669921875, 0.3267936706542969, 0.340667724609375, 0.3545417785644531, 0.36841583251953125, 0.3822898864746094, 0.3961639404296875, 0.4100379943847656, 0.42391204833984375, 0.4377861022949219, 0.45166015625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 4.0, 4.0, 4.0, 9.0, 8.0, 17.0, 29.0, 33.0, 46.0, 72.0, 94.0, 151.0, 246.0, 412.0, 689.0, 1271.0, 2566.0, 5422.0, 13573.0, 44899.0, 260678.0, 557082.0, 117625.0, 26336.0, 9069.0, 3854.0, 1896.0, 1021.0, 552.0, 317.0, 172.0, 130.0, 84.0, 50.0, 45.0, 28.0, 16.0, 13.0, 11.0, 7.0, 6.0, 4.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.447265625, -1.4037933349609375, -1.360321044921875, -1.3168487548828125, -1.27337646484375, -1.2299041748046875, -1.186431884765625, -1.1429595947265625, -1.0994873046875, -1.0560150146484375, -1.012542724609375, -0.9690704345703125, -0.92559814453125, -0.8821258544921875, -0.838653564453125, -0.7951812744140625, -0.751708984375, -0.7082366943359375, -0.664764404296875, -0.6212921142578125, -0.57781982421875, -0.5343475341796875, -0.490875244140625, -0.4474029541015625, -0.4039306640625, -0.3604583740234375, -0.316986083984375, -0.2735137939453125, -0.23004150390625, -0.1865692138671875, -0.143096923828125, -0.0996246337890625, -0.05615234375, -0.0126800537109375, 0.030792236328125, 0.0742645263671875, 0.11773681640625, 0.1612091064453125, 0.204681396484375, 0.2481536865234375, 0.2916259765625, 0.3350982666015625, 0.378570556640625, 0.4220428466796875, 0.46551513671875, 0.5089874267578125, 0.552459716796875, 0.5959320068359375, 0.639404296875, 0.6828765869140625, 0.726348876953125, 0.7698211669921875, 0.81329345703125, 0.8567657470703125, 0.900238037109375, 0.9437103271484375, 0.9871826171875, 1.0306549072265625, 1.074127197265625, 1.1175994873046875, 1.16107177734375, 1.2045440673828125, 1.248016357421875, 1.2914886474609375, 1.3349609375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 0.0, 3.0, 1.0, 10.0, 4.0, 9.0, 10.0, 12.0, 10.0, 15.0, 12.0, 20.0, 25.0, 29.0, 30.0, 37.0, 31.0, 39.0, 37.0, 40.0, 32.0, 48.0, 47.0, 40.0, 47.0, 44.0, 54.0, 35.0, 37.0, 41.0, 41.0, 29.0, 24.0, 21.0, 21.0, 13.0, 12.0, 13.0, 8.0, 6.0, 5.0, 1.0, 3.0, 3.0, 2.0, 5.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.52734375, -1.4812164306640625, -1.435089111328125, -1.3889617919921875, -1.34283447265625, -1.2967071533203125, -1.250579833984375, -1.2044525146484375, -1.1583251953125, -1.1121978759765625, -1.066070556640625, -1.0199432373046875, -0.97381591796875, -0.9276885986328125, -0.881561279296875, -0.8354339599609375, -0.789306640625, -0.7431793212890625, -0.697052001953125, -0.6509246826171875, -0.60479736328125, -0.5586700439453125, -0.512542724609375, -0.4664154052734375, -0.4202880859375, -0.3741607666015625, -0.328033447265625, -0.2819061279296875, -0.23577880859375, -0.1896514892578125, -0.143524169921875, -0.0973968505859375, -0.05126953125, -0.0051422119140625, 0.040985107421875, 0.0871124267578125, 0.13323974609375, 0.1793670654296875, 0.225494384765625, 0.2716217041015625, 0.3177490234375, 0.3638763427734375, 0.410003662109375, 0.4561309814453125, 0.50225830078125, 0.5483856201171875, 0.594512939453125, 0.6406402587890625, 0.686767578125, 0.7328948974609375, 0.779022216796875, 0.8251495361328125, 0.87127685546875, 0.9174041748046875, 0.963531494140625, 1.0096588134765625, 1.0557861328125, 1.1019134521484375, 1.148040771484375, 1.1941680908203125, 1.24029541015625, 1.2864227294921875, 1.332550048828125, 1.3786773681640625, 1.4248046875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 4.0, 5.0, 8.0, 12.0, 13.0, 15.0, 33.0, 52.0, 100.0, 133.0, 250.0, 442.0, 765.0, 1592.0, 2999.0, 6166.0, 14495.0, 39836.0, 142475.0, 429294.0, 288939.0, 77353.0, 24481.0, 9733.0, 4472.0, 2202.0, 1120.0, 645.0, 380.0, 215.0, 102.0, 70.0, 59.0, 25.0, 19.0, 11.0, 13.0, 11.0, 6.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3916015625, -0.378448486328125, -0.36529541015625, -0.352142333984375, -0.3389892578125, -0.325836181640625, -0.31268310546875, -0.299530029296875, -0.286376953125, -0.273223876953125, -0.26007080078125, -0.246917724609375, -0.2337646484375, -0.220611572265625, -0.20745849609375, -0.194305419921875, -0.18115234375, -0.167999267578125, -0.15484619140625, -0.141693115234375, -0.1285400390625, -0.115386962890625, -0.10223388671875, -0.089080810546875, -0.075927734375, -0.062774658203125, -0.04962158203125, -0.036468505859375, -0.0233154296875, -0.010162353515625, 0.00299072265625, 0.016143798828125, 0.029296875, 0.042449951171875, 0.05560302734375, 0.068756103515625, 0.0819091796875, 0.095062255859375, 0.10821533203125, 0.121368408203125, 0.134521484375, 0.147674560546875, 0.16082763671875, 0.173980712890625, 0.1871337890625, 0.200286865234375, 0.21343994140625, 0.226593017578125, 0.23974609375, 0.252899169921875, 0.26605224609375, 0.279205322265625, 0.2923583984375, 0.305511474609375, 0.31866455078125, 0.331817626953125, 0.344970703125, 0.358123779296875, 0.37127685546875, 0.384429931640625, 0.3975830078125, 0.410736083984375, 0.42388916015625, 0.437042236328125, 0.4501953125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 5.0, 6.0, 3.0, 9.0, 11.0, 16.0, 16.0, 36.0, 31.0, 52.0, 67.0, 93.0, 116.0, 133.0, 126.0, 67.0, 64.0, 37.0, 25.0, 23.0, 11.0, 12.0, 9.0, 7.0, 5.0, 8.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014328956604003906, -0.0001389719545841217, -0.00013465434312820435, -0.000130336731672287, -0.00012601912021636963, -0.00012170150876045227, -0.00011738389730453491, -0.00011306628584861755, -0.0001087486743927002, -0.00010443106293678284, -0.00010011345148086548, -9.579584002494812e-05, -9.147822856903076e-05, -8.71606171131134e-05, -8.284300565719604e-05, -7.852539420127869e-05, -7.420778274536133e-05, -6.989017128944397e-05, -6.557255983352661e-05, -6.125494837760925e-05, -5.6937336921691895e-05, -5.2619725465774536e-05, -4.830211400985718e-05, -4.398450255393982e-05, -3.966689109802246e-05, -3.53492796421051e-05, -3.1031668186187744e-05, -2.6714056730270386e-05, -2.2396445274353027e-05, -1.807883381843567e-05, -1.376122236251831e-05, -9.443610906600952e-06, -5.125999450683594e-06, -8.083879947662354e-07, 3.509223461151123e-06, 7.826834917068481e-06, 1.214444637298584e-05, 1.6462057828903198e-05, 2.0779669284820557e-05, 2.5097280740737915e-05, 2.9414892196655273e-05, 3.373250365257263e-05, 3.805011510848999e-05, 4.236772656440735e-05, 4.668533802032471e-05, 5.1002949476242065e-05, 5.5320560932159424e-05, 5.963817238807678e-05, 6.395578384399414e-05, 6.82733952999115e-05, 7.259100675582886e-05, 7.690861821174622e-05, 8.122622966766357e-05, 8.554384112358093e-05, 8.986145257949829e-05, 9.417906403541565e-05, 9.849667549133301e-05, 0.00010281428694725037, 0.00010713189840316772, 0.00011144950985908508, 0.00011576712131500244, 0.0001200847327709198, 0.00012440234422683716, 0.00012871995568275452, 0.00013303756713867188]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 4.0, 6.0, 5.0, 9.0, 7.0, 20.0, 24.0, 23.0, 44.0, 63.0, 94.0, 138.0, 229.0, 356.0, 591.0, 1074.0, 1919.0, 3649.0, 8027.0, 19563.0, 55070.0, 169730.0, 372402.0, 268886.0, 92899.0, 30656.0, 11786.0, 5320.0, 2584.0, 1356.0, 744.0, 450.0, 289.0, 193.0, 92.0, 82.0, 60.0, 32.0, 23.0, 19.0, 13.0, 7.0, 12.0, 5.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0], "bins": [-0.396240234375, -0.3854522705078125, -0.374664306640625, -0.3638763427734375, -0.35308837890625, -0.3423004150390625, -0.331512451171875, -0.3207244873046875, -0.3099365234375, -0.2991485595703125, -0.288360595703125, -0.2775726318359375, -0.26678466796875, -0.2559967041015625, -0.245208740234375, -0.2344207763671875, -0.2236328125, -0.2128448486328125, -0.202056884765625, -0.1912689208984375, -0.18048095703125, -0.1696929931640625, -0.158905029296875, -0.1481170654296875, -0.1373291015625, -0.1265411376953125, -0.115753173828125, -0.1049652099609375, -0.09417724609375, -0.0833892822265625, -0.072601318359375, -0.0618133544921875, -0.051025390625, -0.0402374267578125, -0.029449462890625, -0.0186614990234375, -0.00787353515625, 0.0029144287109375, 0.013702392578125, 0.0244903564453125, 0.0352783203125, 0.0460662841796875, 0.056854248046875, 0.0676422119140625, 0.07843017578125, 0.0892181396484375, 0.100006103515625, 0.1107940673828125, 0.12158203125, 0.1323699951171875, 0.143157958984375, 0.1539459228515625, 0.16473388671875, 0.1755218505859375, 0.186309814453125, 0.1970977783203125, 0.2078857421875, 0.2186737060546875, 0.229461669921875, 0.2402496337890625, 0.25103759765625, 0.2618255615234375, 0.272613525390625, 0.2834014892578125, 0.294189453125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 4.0, 3.0, 4.0, 4.0, 5.0, 4.0, 6.0, 9.0, 4.0, 9.0, 11.0, 24.0, 32.0, 33.0, 46.0, 67.0, 78.0, 69.0, 86.0, 91.0, 80.0, 80.0, 66.0, 54.0, 27.0, 31.0, 19.0, 14.0, 10.0, 5.0, 3.0, 6.0, 4.0, 5.0, 3.0, 4.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.357177734375, -0.3443756103515625, -0.331573486328125, -0.3187713623046875, -0.30596923828125, -0.2931671142578125, -0.280364990234375, -0.2675628662109375, -0.2547607421875, -0.2419586181640625, -0.229156494140625, -0.2163543701171875, -0.20355224609375, -0.1907501220703125, -0.177947998046875, -0.1651458740234375, -0.15234375, -0.1395416259765625, -0.126739501953125, -0.1139373779296875, -0.10113525390625, -0.0883331298828125, -0.075531005859375, -0.0627288818359375, -0.0499267578125, -0.0371246337890625, -0.024322509765625, -0.0115203857421875, 0.00128173828125, 0.0140838623046875, 0.026885986328125, 0.0396881103515625, 0.052490234375, 0.0652923583984375, 0.078094482421875, 0.0908966064453125, 0.10369873046875, 0.1165008544921875, 0.129302978515625, 0.1421051025390625, 0.1549072265625, 0.1677093505859375, 0.180511474609375, 0.1933135986328125, 0.20611572265625, 0.2189178466796875, 0.231719970703125, 0.2445220947265625, 0.25732421875, 0.2701263427734375, 0.282928466796875, 0.2957305908203125, 0.30853271484375, 0.3213348388671875, 0.334136962890625, 0.3469390869140625, 0.3597412109375, 0.3725433349609375, 0.385345458984375, 0.3981475830078125, 0.41094970703125, 0.4237518310546875, 0.436553955078125, 0.4493560791015625, 0.462158203125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 10.0, 18.0, 30.0, 62.0, 104.0, 163.0, 177.0, 175.0, 128.0, 53.0, 29.0, 30.0, 6.0, 7.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-9.316065788269043, -9.081131935119629, -8.846198081970215, -8.6112642288208, -8.37632942199707, -8.141395568847656, -7.906461715698242, -7.671527862548828, -7.436594009399414, -7.20166015625, -6.966726303100586, -6.731791973114014, -6.4968581199646, -6.2619242668151855, -6.026989936828613, -5.792056083679199, -5.557122230529785, -5.322188377380371, -5.087254524230957, -4.852320194244385, -4.617386341094971, -4.382452487945557, -4.147518157958984, -3.9125843048095703, -3.6776504516601562, -3.442716598510742, -3.207782506942749, -2.972848415374756, -2.737914562225342, -2.5029807090759277, -2.2680466175079346, -2.0331125259399414, -1.7981786727905273, -1.5632447004318237, -1.3283107280731201, -1.0933767557144165, -0.8584427833557129, -0.6235088109970093, -0.38857483863830566, -0.15364086627960205, 0.08129310607910156, 0.3162270784378052, 0.5511610507965088, 0.7860950231552124, 1.021028995513916, 1.2559629678726196, 1.4908969402313232, 1.7258309125900269, 1.9607648849487305, 2.1956987380981445, 2.4306328296661377, 2.665566921234131, 2.900500774383545, 3.135434627532959, 3.370368719100952, 3.6053028106689453, 3.8402366638183594, 4.075170516967773, 4.3101043701171875, 4.54503870010376, 4.779972553253174, 5.014906406402588, 5.24984073638916, 5.484774589538574, 5.719708442687988]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 5.0, 8.0, 5.0, 6.0, 10.0, 13.0, 12.0, 14.0, 17.0, 20.0, 16.0, 32.0, 25.0, 25.0, 21.0, 47.0, 31.0, 41.0, 40.0, 45.0, 49.0, 39.0, 47.0, 28.0, 41.0, 43.0, 30.0, 39.0, 45.0, 23.0, 28.0, 20.0, 27.0, 16.0, 18.0, 16.0, 17.0, 9.0, 9.0, 9.0, 1.0, 7.0, 6.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4426169395446777, -3.328608989715576, -3.2146010398864746, -3.100593328475952, -2.9865853786468506, -2.872577428817749, -2.7585697174072266, -2.644561767578125, -2.5305538177490234, -2.416545867919922, -2.3025379180908203, -2.188530206680298, -2.0745222568511963, -1.9605143070220947, -1.8465064764022827, -1.7324986457824707, -1.6184906959533691, -1.5044827461242676, -1.3904749155044556, -1.2764670848846436, -1.162459135055542, -1.0484511852264404, -0.9344433546066284, -0.8204354643821716, -0.7064275741577148, -0.5924196839332581, -0.47841179370880127, -0.3644039034843445, -0.2503960132598877, -0.1363881230354309, -0.02238023281097412, 0.09162765741348267, 0.20563554763793945, 0.31964343786239624, 0.433651328086853, 0.5476592183113098, 0.6616671085357666, 0.7756749987602234, 0.8896828889846802, 1.0036907196044922, 1.1176986694335938, 1.2317066192626953, 1.3457144498825073, 1.4597222805023193, 1.573730230331421, 1.6877381801605225, 1.8017460107803345, 1.9157538414001465, 2.029761791229248, 2.1437697410583496, 2.257777690887451, 2.3717854022979736, 2.485793352127075, 2.5998013019561768, 2.713809013366699, 2.827816963195801, 2.9418249130249023, 3.055832862854004, 3.1698408126831055, 3.283848524093628, 3.3978564739227295, 3.511864423751831, 3.6258721351623535, 3.739880084991455, 3.8538880348205566]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 8.0, 6.0, 5.0, 9.0, 12.0, 24.0, 34.0, 45.0, 76.0, 81.0, 126.0, 179.0, 241.0, 350.0, 544.0, 793.0, 1293.0, 2176.0, 3984.0, 7970.0, 19924.0, 68324.0, 312141.0, 1305062.0, 1795376.0, 516386.0, 106256.0, 29116.0, 10917.0, 5274.0, 2927.0, 1560.0, 1039.0, 646.0, 416.0, 309.0, 199.0, 129.0, 100.0, 66.0, 51.0, 34.0, 31.0, 23.0, 11.0, 7.0, 5.0, 10.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7685546875, -0.7453842163085938, -0.7222137451171875, -0.6990432739257812, -0.675872802734375, -0.6527023315429688, -0.6295318603515625, -0.6063613891601562, -0.58319091796875, -0.5600204467773438, -0.5368499755859375, -0.5136795043945312, -0.490509033203125, -0.46733856201171875, -0.4441680908203125, -0.42099761962890625, -0.3978271484375, -0.37465667724609375, -0.3514862060546875, -0.32831573486328125, -0.305145263671875, -0.28197479248046875, -0.2588043212890625, -0.23563385009765625, -0.21246337890625, -0.18929290771484375, -0.1661224365234375, -0.14295196533203125, -0.119781494140625, -0.09661102294921875, -0.0734405517578125, -0.05027008056640625, -0.027099609375, -0.00392913818359375, 0.0192413330078125, 0.04241180419921875, 0.065582275390625, 0.08875274658203125, 0.1119232177734375, 0.13509368896484375, 0.15826416015625, 0.18143463134765625, 0.2046051025390625, 0.22777557373046875, 0.250946044921875, 0.27411651611328125, 0.2972869873046875, 0.32045745849609375, 0.3436279296875, 0.36679840087890625, 0.3899688720703125, 0.41313934326171875, 0.436309814453125, 0.45948028564453125, 0.4826507568359375, 0.5058212280273438, 0.52899169921875, 0.5521621704101562, 0.5753326416015625, 0.5985031127929688, 0.621673583984375, 0.6448440551757812, 0.6680145263671875, 0.6911849975585938, 0.71435546875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 3.0, 4.0, 5.0, 11.0, 16.0, 10.0, 15.0, 6.0, 27.0, 18.0, 16.0, 23.0, 22.0, 37.0, 30.0, 36.0, 42.0, 30.0, 38.0, 35.0, 44.0, 30.0, 38.0, 40.0, 47.0, 32.0, 38.0, 26.0, 29.0, 44.0, 24.0, 24.0, 18.0, 26.0, 11.0, 19.0, 20.0, 11.0, 4.0, 15.0, 6.0, 6.0, 9.0, 4.0, 7.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.46240234375, -0.4483451843261719, -0.43428802490234375, -0.4202308654785156, -0.4061737060546875, -0.3921165466308594, -0.37805938720703125, -0.3640022277832031, -0.349945068359375, -0.3358879089355469, -0.32183074951171875, -0.3077735900878906, -0.2937164306640625, -0.2796592712402344, -0.26560211181640625, -0.2515449523925781, -0.23748779296875, -0.22343063354492188, -0.20937347412109375, -0.19531631469726562, -0.1812591552734375, -0.16720199584960938, -0.15314483642578125, -0.13908767700195312, -0.125030517578125, -0.11097335815429688, -0.09691619873046875, -0.08285903930664062, -0.0688018798828125, -0.054744720458984375, -0.04068756103515625, -0.026630401611328125, -0.0125732421875, 0.001483917236328125, 0.01554107666015625, 0.029598236083984375, 0.0436553955078125, 0.057712554931640625, 0.07176971435546875, 0.08582687377929688, 0.099884033203125, 0.11394119262695312, 0.12799835205078125, 0.14205551147460938, 0.1561126708984375, 0.17016983032226562, 0.18422698974609375, 0.19828414916992188, 0.21234130859375, 0.22639846801757812, 0.24045562744140625, 0.2545127868652344, 0.2685699462890625, 0.2826271057128906, 0.29668426513671875, 0.3107414245605469, 0.324798583984375, 0.3388557434082031, 0.35291290283203125, 0.3669700622558594, 0.3810272216796875, 0.3950843811035156, 0.40914154052734375, 0.4231986999511719, 0.437255859375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 7.0, 7.0, 12.0, 14.0, 20.0, 37.0, 26.0, 46.0, 48.0, 78.0, 83.0, 119.0, 147.0, 199.0, 299.0, 446.0, 737.0, 1241.0, 2177.0, 4333.0, 10310.0, 29212.0, 116761.0, 856643.0, 2706801.0, 364130.0, 65789.0, 19114.0, 7425.0, 3405.0, 1674.0, 925.0, 642.0, 406.0, 259.0, 161.0, 132.0, 91.0, 86.0, 49.0, 37.0, 33.0, 19.0, 29.0, 22.0, 20.0, 16.0, 10.0, 5.0, 6.0, 1.0, 3.0, 3.0, 0.0, 1.0, 2.0], "bins": [-1.166015625, -1.1299285888671875, -1.093841552734375, -1.0577545166015625, -1.02166748046875, -0.9855804443359375, -0.949493408203125, -0.9134063720703125, -0.8773193359375, -0.8412322998046875, -0.805145263671875, -0.7690582275390625, -0.73297119140625, -0.6968841552734375, -0.660797119140625, -0.6247100830078125, -0.588623046875, -0.5525360107421875, -0.516448974609375, -0.4803619384765625, -0.44427490234375, -0.4081878662109375, -0.372100830078125, -0.3360137939453125, -0.2999267578125, -0.2638397216796875, -0.227752685546875, -0.1916656494140625, -0.15557861328125, -0.1194915771484375, -0.083404541015625, -0.0473175048828125, -0.01123046875, 0.0248565673828125, 0.060943603515625, 0.0970306396484375, 0.13311767578125, 0.1692047119140625, 0.205291748046875, 0.2413787841796875, 0.2774658203125, 0.3135528564453125, 0.349639892578125, 0.3857269287109375, 0.42181396484375, 0.4579010009765625, 0.493988037109375, 0.5300750732421875, 0.566162109375, 0.6022491455078125, 0.638336181640625, 0.6744232177734375, 0.71051025390625, 0.7465972900390625, 0.782684326171875, 0.8187713623046875, 0.8548583984375, 0.8909454345703125, 0.927032470703125, 0.9631195068359375, 0.99920654296875, 1.0352935791015625, 1.071380615234375, 1.1074676513671875, 1.1435546875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 5.0, 6.0, 8.0, 16.0, 16.0, 26.0, 32.0, 52.0, 113.0, 171.0, 370.0, 677.0, 936.0, 713.0, 395.0, 201.0, 135.0, 65.0, 54.0, 33.0, 15.0, 16.0, 8.0, 6.0, 4.0, 3.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5322265625, -1.4837188720703125, -1.435211181640625, -1.3867034912109375, -1.33819580078125, -1.2896881103515625, -1.241180419921875, -1.1926727294921875, -1.1441650390625, -1.0956573486328125, -1.047149658203125, -0.9986419677734375, -0.95013427734375, -0.9016265869140625, -0.853118896484375, -0.8046112060546875, -0.756103515625, -0.7075958251953125, -0.659088134765625, -0.6105804443359375, -0.56207275390625, -0.5135650634765625, -0.465057373046875, -0.4165496826171875, -0.3680419921875, -0.3195343017578125, -0.271026611328125, -0.2225189208984375, -0.17401123046875, -0.1255035400390625, -0.076995849609375, -0.0284881591796875, 0.02001953125, 0.0685272216796875, 0.117034912109375, 0.1655426025390625, 0.21405029296875, 0.2625579833984375, 0.311065673828125, 0.3595733642578125, 0.4080810546875, 0.4565887451171875, 0.505096435546875, 0.5536041259765625, 0.60211181640625, 0.6506195068359375, 0.699127197265625, 0.7476348876953125, 0.796142578125, 0.8446502685546875, 0.893157958984375, 0.9416656494140625, 0.99017333984375, 1.0386810302734375, 1.087188720703125, 1.1356964111328125, 1.1842041015625, 1.2327117919921875, 1.281219482421875, 1.3297271728515625, 1.37823486328125, 1.4267425537109375, 1.475250244140625, 1.5237579345703125, 1.572265625]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 9.0, 15.0, 25.0, 39.0, 94.0, 145.0, 183.0, 179.0, 116.0, 94.0, 41.0, 31.0, 9.0, 11.0, 7.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.126413345336914, -9.845429420471191, -9.564445495605469, -9.283462524414062, -9.00247859954834, -8.721494674682617, -8.440511703491211, -8.159527778625488, -7.878543853759766, -7.597559928894043, -7.3165764808654785, -7.035593032836914, -6.754609107971191, -6.473625183105469, -6.192641735076904, -5.91165828704834, -5.630674362182617, -5.3496904373168945, -5.06870698928833, -4.787723541259766, -4.506739616394043, -4.22575569152832, -3.944772243499756, -3.6637885570526123, -3.3828048706054688, -3.101821184158325, -2.8208374977111816, -2.539853811264038, -2.2588701248168945, -1.977886438369751, -1.6969027519226074, -1.4159190654754639, -1.1349363327026367, -0.8539526462554932, -0.5729689598083496, -0.29198527336120605, -0.0110015869140625, 0.26998209953308105, 0.5509657859802246, 0.8319494724273682, 1.1129331588745117, 1.3939168453216553, 1.6749005317687988, 1.9558842182159424, 2.236867904663086, 2.5178515911102295, 2.798835277557373, 3.0798189640045166, 3.36080265045166, 3.6417863368988037, 3.9227700233459473, 4.203753471374512, 4.484737396240234, 4.765721321105957, 5.0467047691345215, 5.327688217163086, 5.608672142028809, 5.889656066894531, 6.170639514923096, 6.45162296295166, 6.732606887817383, 7.0135908126831055, 7.29457426071167, 7.575557708740234, 7.856541633605957]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 1.0, 8.0, 4.0, 13.0, 12.0, 11.0, 8.0, 17.0, 21.0, 20.0, 19.0, 36.0, 33.0, 29.0, 35.0, 29.0, 39.0, 40.0, 48.0, 48.0, 43.0, 34.0, 40.0, 37.0, 52.0, 38.0, 46.0, 40.0, 29.0, 24.0, 21.0, 32.0, 28.0, 14.0, 13.0, 11.0, 11.0, 2.0, 4.0, 5.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4994616508483887, -3.3876075744628906, -3.2757534980773926, -3.1638994216918945, -3.0520451068878174, -2.9401910305023193, -2.8283369541168213, -2.7164828777313232, -2.604628562927246, -2.492774486541748, -2.38092041015625, -2.269066333770752, -2.157212018966675, -2.0453579425811768, -1.9335038661956787, -1.8216497898101807, -1.7097957134246826, -1.5979416370391846, -1.486087441444397, -1.374233365058899, -1.2623791694641113, -1.1505250930786133, -1.0386710166931152, -0.9268168807029724, -0.8149627447128296, -0.7031086087226868, -0.591254472732544, -0.4794003963470459, -0.3675462603569031, -0.25569212436676025, -0.1438380479812622, -0.031983911991119385, 0.07986998558044434, 0.19172410666942596, 0.3035782277584076, 0.415432333946228, 0.5272864699363708, 0.6391406059265137, 0.7509946823120117, 0.8628488183021545, 0.9747029542922974, 1.0865570306777954, 1.198411226272583, 1.310265302658081, 1.422119379043579, 1.5339735746383667, 1.6458276510238647, 1.7576818466186523, 1.8695359230041504, 1.9813899993896484, 2.0932440757751465, 2.2050981521606445, 2.3169524669647217, 2.4288065433502197, 2.5406606197357178, 2.652514696121216, 2.764369010925293, 2.876223087310791, 2.988077163696289, 3.099931240081787, 3.2117855548858643, 3.3236396312713623, 3.4354937076568604, 3.5473477840423584, 3.6592018604278564]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 2.0, 7.0, 2.0, 4.0, 11.0, 11.0, 17.0, 34.0, 34.0, 71.0, 84.0, 111.0, 195.0, 286.0, 468.0, 820.0, 1471.0, 2966.0, 6725.0, 17704.0, 65232.0, 302652.0, 468803.0, 131378.0, 30577.0, 9853.0, 4213.0, 1993.0, 1112.0, 614.0, 373.0, 239.0, 173.0, 100.0, 74.0, 46.0, 36.0, 21.0, 11.0, 10.0, 7.0, 10.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.203125, -1.1645965576171875, -1.126068115234375, -1.0875396728515625, -1.04901123046875, -1.0104827880859375, -0.971954345703125, -0.9334259033203125, -0.8948974609375, -0.8563690185546875, -0.817840576171875, -0.7793121337890625, -0.74078369140625, -0.7022552490234375, -0.663726806640625, -0.6251983642578125, -0.586669921875, -0.5481414794921875, -0.509613037109375, -0.4710845947265625, -0.43255615234375, -0.3940277099609375, -0.355499267578125, -0.3169708251953125, -0.2784423828125, -0.2399139404296875, -0.201385498046875, -0.1628570556640625, -0.12432861328125, -0.0858001708984375, -0.047271728515625, -0.0087432861328125, 0.02978515625, 0.0683135986328125, 0.106842041015625, 0.1453704833984375, 0.18389892578125, 0.2224273681640625, 0.260955810546875, 0.2994842529296875, 0.3380126953125, 0.3765411376953125, 0.415069580078125, 0.4535980224609375, 0.49212646484375, 0.5306549072265625, 0.569183349609375, 0.6077117919921875, 0.646240234375, 0.6847686767578125, 0.723297119140625, 0.7618255615234375, 0.80035400390625, 0.8388824462890625, 0.877410888671875, 0.9159393310546875, 0.9544677734375, 0.9929962158203125, 1.031524658203125, 1.0700531005859375, 1.10858154296875, 1.1471099853515625, 1.185638427734375, 1.2241668701171875, 1.2626953125]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 6.0, 6.0, 4.0, 8.0, 6.0, 8.0, 13.0, 12.0, 15.0, 13.0, 15.0, 27.0, 26.0, 26.0, 29.0, 43.0, 42.0, 32.0, 37.0, 48.0, 39.0, 34.0, 50.0, 54.0, 37.0, 35.0, 47.0, 32.0, 36.0, 35.0, 30.0, 19.0, 23.0, 22.0, 15.0, 17.0, 17.0, 8.0, 11.0, 7.0, 6.0, 2.0, 4.0, 1.0, 3.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.51953125, -0.5020523071289062, -0.4845733642578125, -0.46709442138671875, -0.449615478515625, -0.43213653564453125, -0.4146575927734375, -0.39717864990234375, -0.37969970703125, -0.36222076416015625, -0.3447418212890625, -0.32726287841796875, -0.309783935546875, -0.29230499267578125, -0.2748260498046875, -0.25734710693359375, -0.2398681640625, -0.22238922119140625, -0.2049102783203125, -0.18743133544921875, -0.169952392578125, -0.15247344970703125, -0.1349945068359375, -0.11751556396484375, -0.10003662109375, -0.08255767822265625, -0.0650787353515625, -0.04759979248046875, -0.030120849609375, -0.01264190673828125, 0.0048370361328125, 0.02231597900390625, 0.039794921875, 0.05727386474609375, 0.0747528076171875, 0.09223175048828125, 0.109710693359375, 0.12718963623046875, 0.1446685791015625, 0.16214752197265625, 0.17962646484375, 0.19710540771484375, 0.2145843505859375, 0.23206329345703125, 0.249542236328125, 0.26702117919921875, 0.2845001220703125, 0.30197906494140625, 0.3194580078125, 0.33693695068359375, 0.3544158935546875, 0.37189483642578125, 0.389373779296875, 0.40685272216796875, 0.4243316650390625, 0.44181060791015625, 0.45928955078125, 0.47676849365234375, 0.4942474365234375, 0.5117263793945312, 0.529205322265625, 0.5466842651367188, 0.5641632080078125, 0.5816421508789062, 0.59912109375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 3.0, 9.0, 13.0, 12.0, 21.0, 31.0, 52.0, 56.0, 85.0, 128.0, 178.0, 250.0, 404.0, 620.0, 931.0, 1562.0, 2577.0, 4434.0, 8823.0, 19866.0, 60960.0, 227463.0, 431856.0, 198845.0, 52803.0, 17971.0, 8000.0, 4164.0, 2339.0, 1417.0, 916.0, 587.0, 387.0, 235.0, 178.0, 118.0, 86.0, 53.0, 38.0, 20.0, 13.0, 19.0, 10.0, 10.0, 4.0, 3.0, 6.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8349609375, -0.8066024780273438, -0.7782440185546875, -0.7498855590820312, -0.721527099609375, -0.6931686401367188, -0.6648101806640625, -0.6364517211914062, -0.60809326171875, -0.5797348022460938, -0.5513763427734375, -0.5230178833007812, -0.494659423828125, -0.46630096435546875, -0.4379425048828125, -0.40958404541015625, -0.3812255859375, -0.35286712646484375, -0.3245086669921875, -0.29615020751953125, -0.267791748046875, -0.23943328857421875, -0.2110748291015625, -0.18271636962890625, -0.15435791015625, -0.12599945068359375, -0.0976409912109375, -0.06928253173828125, -0.040924072265625, -0.01256561279296875, 0.0157928466796875, 0.04415130615234375, 0.072509765625, 0.10086822509765625, 0.1292266845703125, 0.15758514404296875, 0.185943603515625, 0.21430206298828125, 0.2426605224609375, 0.27101898193359375, 0.29937744140625, 0.32773590087890625, 0.3560943603515625, 0.38445281982421875, 0.412811279296875, 0.44116973876953125, 0.4695281982421875, 0.49788665771484375, 0.5262451171875, 0.5546035766601562, 0.5829620361328125, 0.6113204956054688, 0.639678955078125, 0.6680374145507812, 0.6963958740234375, 0.7247543334960938, 0.75311279296875, 0.7814712524414062, 0.8098297119140625, 0.8381881713867188, 0.866546630859375, 0.8949050903320312, 0.9232635498046875, 0.9516220092773438, 0.97998046875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 7.0, 7.0, 11.0, 9.0, 18.0, 17.0, 19.0, 25.0, 23.0, 32.0, 42.0, 34.0, 43.0, 52.0, 41.0, 44.0, 54.0, 47.0, 42.0, 41.0, 56.0, 46.0, 38.0, 37.0, 39.0, 33.0, 22.0, 22.0, 25.0, 23.0, 21.0, 9.0, 7.0, 4.0, 4.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.95703125, -1.9011993408203125, -1.845367431640625, -1.7895355224609375, -1.73370361328125, -1.6778717041015625, -1.622039794921875, -1.5662078857421875, -1.5103759765625, -1.4545440673828125, -1.398712158203125, -1.3428802490234375, -1.28704833984375, -1.2312164306640625, -1.175384521484375, -1.1195526123046875, -1.063720703125, -1.0078887939453125, -0.952056884765625, -0.8962249755859375, -0.84039306640625, -0.7845611572265625, -0.728729248046875, -0.6728973388671875, -0.6170654296875, -0.5612335205078125, -0.505401611328125, -0.4495697021484375, -0.39373779296875, -0.3379058837890625, -0.282073974609375, -0.2262420654296875, -0.17041015625, -0.1145782470703125, -0.058746337890625, -0.0029144287109375, 0.05291748046875, 0.1087493896484375, 0.164581298828125, 0.2204132080078125, 0.2762451171875, 0.3320770263671875, 0.387908935546875, 0.4437408447265625, 0.49957275390625, 0.5554046630859375, 0.611236572265625, 0.6670684814453125, 0.722900390625, 0.7787322998046875, 0.834564208984375, 0.8903961181640625, 0.94622802734375, 1.0020599365234375, 1.057891845703125, 1.1137237548828125, 1.1695556640625, 1.2253875732421875, 1.281219482421875, 1.3370513916015625, 1.39288330078125, 1.4487152099609375, 1.504547119140625, 1.5603790283203125, 1.6162109375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 6.0, 7.0, 11.0, 18.0, 19.0, 33.0, 49.0, 82.0, 130.0, 187.0, 301.0, 480.0, 902.0, 1521.0, 2974.0, 6557.0, 16808.0, 61838.0, 314771.0, 485086.0, 112647.0, 26413.0, 9199.0, 3899.0, 1912.0, 1064.0, 585.0, 419.0, 212.0, 155.0, 88.0, 72.0, 32.0, 23.0, 26.0, 15.0, 6.0, 5.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.427734375, -0.4140205383300781, -0.40030670166015625, -0.3865928649902344, -0.3728790283203125, -0.3591651916503906, -0.34545135498046875, -0.3317375183105469, -0.318023681640625, -0.3043098449707031, -0.29059600830078125, -0.2768821716308594, -0.2631683349609375, -0.24945449829101562, -0.23574066162109375, -0.22202682495117188, -0.20831298828125, -0.19459915161132812, -0.18088531494140625, -0.16717147827148438, -0.1534576416015625, -0.13974380493164062, -0.12602996826171875, -0.11231613159179688, -0.098602294921875, -0.08488845825195312, -0.07117462158203125, -0.057460784912109375, -0.0437469482421875, -0.030033111572265625, -0.01631927490234375, -0.002605438232421875, 0.0111083984375, 0.024822235107421875, 0.03853607177734375, 0.052249908447265625, 0.0659637451171875, 0.07967758178710938, 0.09339141845703125, 0.10710525512695312, 0.120819091796875, 0.13453292846679688, 0.14824676513671875, 0.16196060180664062, 0.1756744384765625, 0.18938827514648438, 0.20310211181640625, 0.21681594848632812, 0.23052978515625, 0.24424362182617188, 0.25795745849609375, 0.2716712951660156, 0.2853851318359375, 0.2990989685058594, 0.31281280517578125, 0.3265266418457031, 0.340240478515625, 0.3539543151855469, 0.36766815185546875, 0.3813819885253906, 0.3950958251953125, 0.4088096618652344, 0.42252349853515625, 0.4362373352050781, 0.449951171875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 1.0, 2.0, 3.0, 8.0, 13.0, 17.0, 26.0, 88.0, 157.0, 267.0, 218.0, 91.0, 46.0, 22.0, 12.0, 7.0, 6.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.000244140625, -0.00023462623357772827, -0.00022511184215545654, -0.00021559745073318481, -0.00020608305931091309, -0.00019656866788864136, -0.00018705427646636963, -0.0001775398850440979, -0.00016802549362182617, -0.00015851110219955444, -0.00014899671077728271, -0.00013948231935501099, -0.00012996792793273926, -0.00012045353651046753, -0.0001109391450881958, -0.00010142475366592407, -9.191036224365234e-05, -8.239597082138062e-05, -7.288157939910889e-05, -6.336718797683716e-05, -5.385279655456543e-05, -4.43384051322937e-05, -3.482401371002197e-05, -2.5309622287750244e-05, -1.5795230865478516e-05, -6.280839443206787e-06, 3.2335519790649414e-06, 1.274794340133667e-05, 2.22623348236084e-05, 3.177672624588013e-05, 4.1291117668151855e-05, 5.0805509090423584e-05, 6.031990051269531e-05, 6.983429193496704e-05, 7.934868335723877e-05, 8.88630747795105e-05, 9.837746620178223e-05, 0.00010789185762405396, 0.00011740624904632568, 0.0001269206404685974, 0.00013643503189086914, 0.00014594942331314087, 0.0001554638147354126, 0.00016497820615768433, 0.00017449259757995605, 0.00018400698900222778, 0.0001935213804244995, 0.00020303577184677124, 0.00021255016326904297, 0.0002220645546913147, 0.00023157894611358643, 0.00024109333753585815, 0.0002506077289581299, 0.0002601221203804016, 0.00026963651180267334, 0.00027915090322494507, 0.0002886652946472168, 0.0002981796860694885, 0.00030769407749176025, 0.000317208468914032, 0.0003267228603363037, 0.00033623725175857544, 0.00034575164318084717, 0.0003552660346031189, 0.0003647804260253906]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 2.0, 7.0, 3.0, 8.0, 18.0, 23.0, 32.0, 51.0, 58.0, 80.0, 100.0, 169.0, 233.0, 372.0, 523.0, 832.0, 1232.0, 2123.0, 3604.0, 7033.0, 14659.0, 35165.0, 98566.0, 268566.0, 351169.0, 163705.0, 56258.0, 22012.0, 9721.0, 4836.0, 2704.0, 1635.0, 960.0, 671.0, 408.0, 322.0, 208.0, 138.0, 108.0, 62.0, 54.0, 35.0, 28.0, 11.0, 16.0, 12.0, 3.0, 6.0, 6.0, 7.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.284912109375, -0.2757911682128906, -0.26667022705078125, -0.2575492858886719, -0.2484283447265625, -0.23930740356445312, -0.23018646240234375, -0.22106552124023438, -0.211944580078125, -0.20282363891601562, -0.19370269775390625, -0.18458175659179688, -0.1754608154296875, -0.16633987426757812, -0.15721893310546875, -0.14809799194335938, -0.13897705078125, -0.12985610961914062, -0.12073516845703125, -0.11161422729492188, -0.1024932861328125, -0.09337234497070312, -0.08425140380859375, -0.07513046264648438, -0.066009521484375, -0.056888580322265625, -0.04776763916015625, -0.038646697998046875, -0.0295257568359375, -0.020404815673828125, -0.01128387451171875, -0.002162933349609375, 0.0069580078125, 0.016078948974609375, 0.02519989013671875, 0.034320831298828125, 0.0434417724609375, 0.052562713623046875, 0.06168365478515625, 0.07080459594726562, 0.079925537109375, 0.08904647827148438, 0.09816741943359375, 0.10728836059570312, 0.1164093017578125, 0.12553024291992188, 0.13465118408203125, 0.14377212524414062, 0.15289306640625, 0.16201400756835938, 0.17113494873046875, 0.18025588989257812, 0.1893768310546875, 0.19849777221679688, 0.20761871337890625, 0.21673965454101562, 0.225860595703125, 0.23498153686523438, 0.24410247802734375, 0.2532234191894531, 0.2623443603515625, 0.2714653015136719, 0.28058624267578125, 0.2897071838378906, 0.298828125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 5.0, 3.0, 10.0, 11.0, 13.0, 22.0, 35.0, 69.0, 88.0, 117.0, 135.0, 111.0, 143.0, 95.0, 51.0, 37.0, 12.0, 16.0, 10.0, 5.0, 4.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.59765625, -0.5805206298828125, -0.563385009765625, -0.5462493896484375, -0.52911376953125, -0.5119781494140625, -0.494842529296875, -0.4777069091796875, -0.4605712890625, -0.4434356689453125, -0.426300048828125, -0.4091644287109375, -0.39202880859375, -0.3748931884765625, -0.357757568359375, -0.3406219482421875, -0.323486328125, -0.3063507080078125, -0.289215087890625, -0.2720794677734375, -0.25494384765625, -0.2378082275390625, -0.220672607421875, -0.2035369873046875, -0.1864013671875, -0.1692657470703125, -0.152130126953125, -0.1349945068359375, -0.11785888671875, -0.1007232666015625, -0.083587646484375, -0.0664520263671875, -0.04931640625, -0.0321807861328125, -0.015045166015625, 0.0020904541015625, 0.01922607421875, 0.0363616943359375, 0.053497314453125, 0.0706329345703125, 0.0877685546875, 0.1049041748046875, 0.122039794921875, 0.1391754150390625, 0.15631103515625, 0.1734466552734375, 0.190582275390625, 0.2077178955078125, 0.224853515625, 0.2419891357421875, 0.259124755859375, 0.2762603759765625, 0.29339599609375, 0.3105316162109375, 0.327667236328125, 0.3448028564453125, 0.3619384765625, 0.3790740966796875, 0.396209716796875, 0.4133453369140625, 0.43048095703125, 0.4476165771484375, 0.464752197265625, 0.4818878173828125, 0.4990234375]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 6.0, 5.0, 11.0, 29.0, 44.0, 84.0, 166.0, 167.0, 187.0, 140.0, 75.0, 40.0, 15.0, 11.0, 7.0, 5.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.579278945922852, -9.319979667663574, -9.060680389404297, -8.801380157470703, -8.542080879211426, -8.282781600952148, -8.023482322692871, -7.7641825675964355, -7.5048828125, -7.245583534240723, -6.986283779144287, -6.72698450088501, -6.467684745788574, -6.208385467529297, -5.9490861892700195, -5.689786434173584, -5.430487155914307, -5.171187877655029, -4.911888122558594, -4.652588844299316, -4.393289089202881, -4.1339898109436035, -3.874690294265747, -3.6153907775878906, -3.356091260910034, -3.0967917442321777, -2.8374922275543213, -2.578192710876465, -2.3188934326171875, -2.059593677520752, -1.8002943992614746, -1.5409948825836182, -1.28169584274292, -1.0223963260650635, -0.7630968689918518, -0.5037974119186401, -0.2444978952407837, 0.014801621437072754, 0.27410101890563965, 0.5334005355834961, 0.7927000522613525, 1.051999568939209, 1.3112990856170654, 1.5705984830856323, 1.8298979997634888, 2.0891976356506348, 2.348496913909912, 2.6077964305877686, 2.867095947265625, 3.1263954639434814, 3.385694980621338, 3.6449942588806152, 3.904294013977051, 4.163593292236328, 4.4228925704956055, 4.682192325592041, 4.941492080688477, 5.200791358947754, 5.4600911140441895, 5.719390392303467, 5.978690147399902, 6.23798942565918, 6.497288703918457, 6.756588459014893, 7.01588773727417]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 3.0, 5.0, 13.0, 6.0, 10.0, 17.0, 14.0, 19.0, 17.0, 34.0, 25.0, 24.0, 29.0, 35.0, 37.0, 41.0, 42.0, 44.0, 48.0, 43.0, 41.0, 61.0, 45.0, 47.0, 40.0, 38.0, 27.0, 31.0, 23.0, 18.0, 19.0, 24.0, 14.0, 16.0, 10.0, 11.0, 5.0, 14.0, 2.0, 2.0, 6.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.521371364593506, -4.390708923339844, -4.26004695892334, -4.129384517669678, -3.9987223148345947, -3.8680601119995117, -3.7373976707458496, -3.6067354679107666, -3.4760732650756836, -3.3454110622406006, -3.2147488594055176, -3.0840864181518555, -2.9534242153167725, -2.8227620124816895, -2.6920995712280273, -2.5614373683929443, -2.4307751655578613, -2.3001129627227783, -2.1694507598876953, -2.038788318634033, -1.9081261157989502, -1.7774639129638672, -1.6468015909194946, -1.516139268875122, -1.385477066040039, -1.254814863204956, -1.1241525411605835, -0.9934902787208557, -0.8628280162811279, -0.7321657538414001, -0.6015034914016724, -0.4708412289619446, -0.3401784896850586, -0.2095162272453308, -0.07885396480560303, 0.051808297634124756, 0.18247056007385254, 0.3131328225135803, 0.4437950849533081, 0.5744573473930359, 0.7051196098327637, 0.8357818722724915, 0.9664441347122192, 1.0971064567565918, 1.2277686595916748, 1.3584308624267578, 1.4890931844711304, 1.619755506515503, 1.750417709350586, 1.881079912185669, 2.011742115020752, 2.142404556274414, 2.273066759109497, 2.40372896194458, 2.534391403198242, 2.665053606033325, 2.795715808868408, 2.926378011703491, 3.057040214538574, 3.1877026557922363, 3.3183648586273193, 3.4490270614624023, 3.5796895027160645, 3.7103517055511475, 3.8410139083862305]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 6.0, 6.0, 13.0, 5.0, 12.0, 16.0, 22.0, 31.0, 51.0, 54.0, 89.0, 118.0, 176.0, 250.0, 414.0, 532.0, 829.0, 1261.0, 2049.0, 3463.0, 6222.0, 12887.0, 34560.0, 135507.0, 617614.0, 1857383.0, 1135025.0, 279745.0, 67050.0, 20053.0, 8326.0, 4185.0, 2383.0, 1372.0, 897.0, 563.0, 376.0, 265.0, 146.0, 98.0, 74.0, 42.0, 44.0, 24.0, 12.0, 15.0, 6.0, 6.0, 10.0, 0.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0], "bins": [-0.78076171875, -0.7576141357421875, -0.734466552734375, -0.7113189697265625, -0.68817138671875, -0.6650238037109375, -0.641876220703125, -0.6187286376953125, -0.5955810546875, -0.5724334716796875, -0.549285888671875, -0.5261383056640625, -0.50299072265625, -0.4798431396484375, -0.456695556640625, -0.4335479736328125, -0.410400390625, -0.3872528076171875, -0.364105224609375, -0.3409576416015625, -0.31781005859375, -0.2946624755859375, -0.271514892578125, -0.2483673095703125, -0.2252197265625, -0.2020721435546875, -0.178924560546875, -0.1557769775390625, -0.13262939453125, -0.1094818115234375, -0.086334228515625, -0.0631866455078125, -0.0400390625, -0.0168914794921875, 0.006256103515625, 0.0294036865234375, 0.05255126953125, 0.0756988525390625, 0.098846435546875, 0.1219940185546875, 0.1451416015625, 0.1682891845703125, 0.191436767578125, 0.2145843505859375, 0.23773193359375, 0.2608795166015625, 0.284027099609375, 0.3071746826171875, 0.330322265625, 0.3534698486328125, 0.376617431640625, 0.3997650146484375, 0.42291259765625, 0.4460601806640625, 0.469207763671875, 0.4923553466796875, 0.5155029296875, 0.5386505126953125, 0.561798095703125, 0.5849456787109375, 0.60809326171875, 0.6312408447265625, 0.654388427734375, 0.6775360107421875, 0.70068359375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 7.0, 2.0, 5.0, 6.0, 6.0, 10.0, 6.0, 14.0, 12.0, 12.0, 16.0, 18.0, 21.0, 26.0, 30.0, 23.0, 26.0, 23.0, 43.0, 47.0, 36.0, 32.0, 43.0, 37.0, 37.0, 37.0, 34.0, 39.0, 30.0, 32.0, 27.0, 30.0, 28.0, 24.0, 28.0, 21.0, 22.0, 21.0, 18.0, 11.0, 14.0, 9.0, 6.0, 14.0, 2.0, 2.0, 3.0, 3.0, 8.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.46142578125, -0.447021484375, -0.4326171875, -0.418212890625, -0.40380859375, -0.389404296875, -0.375, -0.360595703125, -0.34619140625, -0.331787109375, -0.3173828125, -0.302978515625, -0.28857421875, -0.274169921875, -0.259765625, -0.245361328125, -0.23095703125, -0.216552734375, -0.2021484375, -0.187744140625, -0.17333984375, -0.158935546875, -0.14453125, -0.130126953125, -0.11572265625, -0.101318359375, -0.0869140625, -0.072509765625, -0.05810546875, -0.043701171875, -0.029296875, -0.014892578125, -0.00048828125, 0.013916015625, 0.0283203125, 0.042724609375, 0.05712890625, 0.071533203125, 0.0859375, 0.100341796875, 0.11474609375, 0.129150390625, 0.1435546875, 0.157958984375, 0.17236328125, 0.186767578125, 0.201171875, 0.215576171875, 0.22998046875, 0.244384765625, 0.2587890625, 0.273193359375, 0.28759765625, 0.302001953125, 0.31640625, 0.330810546875, 0.34521484375, 0.359619140625, 0.3740234375, 0.388427734375, 0.40283203125, 0.417236328125, 0.431640625, 0.446044921875, 0.46044921875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 10.0, 12.0, 12.0, 24.0, 24.0, 35.0, 55.0, 88.0, 132.0, 207.0, 288.0, 529.0, 850.0, 1519.0, 2751.0, 5434.0, 11846.0, 30060.0, 103197.0, 629873.0, 2759403.0, 508793.0, 89640.0, 27298.0, 10831.0, 5018.0, 2689.0, 1420.0, 858.0, 473.0, 276.0, 191.0, 134.0, 99.0, 67.0, 48.0, 26.0, 18.0, 20.0, 9.0, 12.0, 4.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.888671875, -0.8574371337890625, -0.826202392578125, -0.7949676513671875, -0.76373291015625, -0.7324981689453125, -0.701263427734375, -0.6700286865234375, -0.6387939453125, -0.6075592041015625, -0.576324462890625, -0.5450897216796875, -0.51385498046875, -0.4826202392578125, -0.451385498046875, -0.4201507568359375, -0.388916015625, -0.3576812744140625, -0.326446533203125, -0.2952117919921875, -0.26397705078125, -0.2327423095703125, -0.201507568359375, -0.1702728271484375, -0.1390380859375, -0.1078033447265625, -0.076568603515625, -0.0453338623046875, -0.01409912109375, 0.0171356201171875, 0.048370361328125, 0.0796051025390625, 0.11083984375, 0.1420745849609375, 0.173309326171875, 0.2045440673828125, 0.23577880859375, 0.2670135498046875, 0.298248291015625, 0.3294830322265625, 0.3607177734375, 0.3919525146484375, 0.423187255859375, 0.4544219970703125, 0.48565673828125, 0.5168914794921875, 0.548126220703125, 0.5793609619140625, 0.610595703125, 0.6418304443359375, 0.673065185546875, 0.7042999267578125, 0.73553466796875, 0.7667694091796875, 0.798004150390625, 0.8292388916015625, 0.8604736328125, 0.8917083740234375, 0.922943115234375, 0.9541778564453125, 0.98541259765625, 1.0166473388671875, 1.047882080078125, 1.0791168212890625, 1.1103515625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 6.0, 12.0, 9.0, 17.0, 20.0, 23.0, 33.0, 55.0, 96.0, 118.0, 194.0, 353.0, 601.0, 830.0, 604.0, 408.0, 230.0, 148.0, 101.0, 58.0, 49.0, 36.0, 21.0, 13.0, 7.0, 10.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.427734375, -1.3898239135742188, -1.3519134521484375, -1.3140029907226562, -1.276092529296875, -1.2381820678710938, -1.2002716064453125, -1.1623611450195312, -1.12445068359375, -1.0865402221679688, -1.0486297607421875, -1.0107192993164062, -0.972808837890625, -0.9348983764648438, -0.8969879150390625, -0.8590774536132812, -0.8211669921875, -0.7832565307617188, -0.7453460693359375, -0.7074356079101562, -0.669525146484375, -0.6316146850585938, -0.5937042236328125, -0.5557937622070312, -0.51788330078125, -0.47997283935546875, -0.4420623779296875, -0.40415191650390625, -0.366241455078125, -0.32833099365234375, -0.2904205322265625, -0.25251007080078125, -0.214599609375, -0.17668914794921875, -0.1387786865234375, -0.10086822509765625, -0.062957763671875, -0.02504730224609375, 0.0128631591796875, 0.05077362060546875, 0.08868408203125, 0.12659454345703125, 0.1645050048828125, 0.20241546630859375, 0.240325927734375, 0.27823638916015625, 0.3161468505859375, 0.35405731201171875, 0.3919677734375, 0.42987823486328125, 0.4677886962890625, 0.5056991577148438, 0.543609619140625, 0.5815200805664062, 0.6194305419921875, 0.6573410034179688, 0.69525146484375, 0.7331619262695312, 0.7710723876953125, 0.8089828491210938, 0.846893310546875, 0.8848037719726562, 0.9227142333984375, 0.9606246948242188, 0.99853515625]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 1.0, 4.0, 5.0, 7.0, 15.0, 23.0, 36.0, 80.0, 125.0, 147.0, 162.0, 153.0, 109.0, 78.0, 21.0, 17.0, 5.0, 8.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.79780101776123, -8.510443687438965, -8.223085403442383, -7.935728073120117, -7.648370742797852, -7.361013412475586, -7.073655605316162, -6.786297798156738, -6.498940467834473, -6.211583137512207, -5.924225330352783, -5.636867523193359, -5.349510192871094, -5.062152862548828, -4.774795055389404, -4.4874372482299805, -4.200079917907715, -3.91272234916687, -3.6253647804260254, -3.3380072116851807, -3.050649642944336, -2.763292074203491, -2.4759345054626465, -2.1885769367218018, -1.901219367980957, -1.6138617992401123, -1.3265042304992676, -1.0391466617584229, -0.7517890930175781, -0.4644315242767334, -0.17707395553588867, 0.11028361320495605, 0.3976402282714844, 0.6849977970123291, 0.9723553657531738, 1.2597129344940186, 1.5470705032348633, 1.834428071975708, 2.1217856407165527, 2.4091432094573975, 2.696500778198242, 2.983858346939087, 3.2712159156799316, 3.5585734844207764, 3.845931053161621, 4.133288383483887, 4.4206461906433105, 4.708003997802734, 4.995361328125, 5.282718658447266, 5.5700764656066895, 5.857434272766113, 6.144791603088379, 6.4321489334106445, 6.719506740570068, 7.006864547729492, 7.294221878051758, 7.581579208374023, 7.868937015533447, 8.156294822692871, 8.443652153015137, 8.731009483337402, 9.018367767333984, 9.30572509765625, 9.593082427978516]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 3.0, 5.0, 5.0, 5.0, 10.0, 15.0, 19.0, 9.0, 13.0, 17.0, 29.0, 29.0, 28.0, 39.0, 24.0, 29.0, 42.0, 33.0, 38.0, 47.0, 35.0, 35.0, 61.0, 44.0, 39.0, 43.0, 34.0, 33.0, 30.0, 23.0, 29.0, 25.0, 28.0, 17.0, 13.0, 17.0, 7.0, 11.0, 11.0, 8.0, 6.0, 3.0, 3.0, 0.0, 3.0, 0.0, 6.0, 2.0, 0.0, 1.0, 3.0], "bins": [-3.247690200805664, -3.1539840698242188, -3.0602779388427734, -2.966571807861328, -2.872865676879883, -2.7791595458984375, -2.685453414916992, -2.591747283935547, -2.4980411529541016, -2.4043350219726562, -2.310628890991211, -2.2169227600097656, -2.1232166290283203, -2.029510498046875, -1.9358042478561401, -1.8420981168746948, -1.74839186668396, -1.6546857357025146, -1.5609796047210693, -1.467273473739624, -1.3735673427581787, -1.2798612117767334, -1.1861549615859985, -1.0924488306045532, -0.9987426996231079, -0.9050365686416626, -0.8113304376602173, -0.7176242470741272, -0.6239181160926819, -0.5302119851112366, -0.4365057945251465, -0.34279966354370117, -0.24909353256225586, -0.15538738667964935, -0.06168124079704285, 0.032024919986724854, 0.12573105096817017, 0.21943718194961548, 0.31314337253570557, 0.4068495035171509, 0.5005556344985962, 0.5942617654800415, 0.6879678964614868, 0.7816740870475769, 0.8753802180290222, 0.9690863490104675, 1.0627925395965576, 1.156498670578003, 1.2502048015594482, 1.3439109325408936, 1.4376170635223389, 1.5313231945037842, 1.6250293254852295, 1.7187354564666748, 1.8124417066574097, 1.906147837638855, 1.9998539686203003, 2.093560218811035, 2.1872663497924805, 2.280972480773926, 2.374678611755371, 2.4683847427368164, 2.5620908737182617, 2.655797004699707, 2.7495031356811523]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 1.0, 4.0, 5.0, 6.0, 5.0, 7.0, 15.0, 17.0, 28.0, 39.0, 52.0, 62.0, 92.0, 129.0, 189.0, 282.0, 402.0, 565.0, 1019.0, 1554.0, 2596.0, 4873.0, 9483.0, 19696.0, 41776.0, 91140.0, 181104.0, 263525.0, 212406.0, 113471.0, 53260.0, 24763.0, 11868.0, 5871.0, 3169.0, 1820.0, 1123.0, 712.0, 450.0, 267.0, 198.0, 139.0, 112.0, 52.0, 62.0, 40.0, 22.0, 17.0, 24.0, 15.0, 20.0, 5.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.5322265625, -0.515411376953125, -0.49859619140625, -0.481781005859375, -0.4649658203125, -0.448150634765625, -0.43133544921875, -0.414520263671875, -0.397705078125, -0.380889892578125, -0.36407470703125, -0.347259521484375, -0.3304443359375, -0.313629150390625, -0.29681396484375, -0.279998779296875, -0.26318359375, -0.246368408203125, -0.22955322265625, -0.212738037109375, -0.1959228515625, -0.179107666015625, -0.16229248046875, -0.145477294921875, -0.128662109375, -0.111846923828125, -0.09503173828125, -0.078216552734375, -0.0614013671875, -0.044586181640625, -0.02777099609375, -0.010955810546875, 0.005859375, 0.022674560546875, 0.03948974609375, 0.056304931640625, 0.0731201171875, 0.089935302734375, 0.10675048828125, 0.123565673828125, 0.140380859375, 0.157196044921875, 0.17401123046875, 0.190826416015625, 0.2076416015625, 0.224456787109375, 0.24127197265625, 0.258087158203125, 0.27490234375, 0.291717529296875, 0.30853271484375, 0.325347900390625, 0.3421630859375, 0.358978271484375, 0.37579345703125, 0.392608642578125, 0.409423828125, 0.426239013671875, 0.44305419921875, 0.459869384765625, 0.4766845703125, 0.493499755859375, 0.51031494140625, 0.527130126953125, 0.5439453125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 8.0, 7.0, 6.0, 4.0, 6.0, 13.0, 13.0, 12.0, 22.0, 15.0, 25.0, 21.0, 35.0, 30.0, 31.0, 27.0, 40.0, 39.0, 49.0, 38.0, 37.0, 48.0, 37.0, 35.0, 39.0, 32.0, 33.0, 44.0, 47.0, 31.0, 26.0, 21.0, 22.0, 13.0, 21.0, 14.0, 18.0, 12.0, 5.0, 9.0, 6.0, 4.0, 1.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.552734375, -0.5345230102539062, -0.5163116455078125, -0.49810028076171875, -0.479888916015625, -0.46167755126953125, -0.4434661865234375, -0.42525482177734375, -0.40704345703125, -0.38883209228515625, -0.3706207275390625, -0.35240936279296875, -0.334197998046875, -0.31598663330078125, -0.2977752685546875, -0.27956390380859375, -0.2613525390625, -0.24314117431640625, -0.2249298095703125, -0.20671844482421875, -0.188507080078125, -0.17029571533203125, -0.1520843505859375, -0.13387298583984375, -0.11566162109375, -0.09745025634765625, -0.0792388916015625, -0.06102752685546875, -0.042816162109375, -0.02460479736328125, -0.0063934326171875, 0.01181793212890625, 0.030029296875, 0.04824066162109375, 0.0664520263671875, 0.08466339111328125, 0.102874755859375, 0.12108612060546875, 0.1392974853515625, 0.15750885009765625, 0.17572021484375, 0.19393157958984375, 0.2121429443359375, 0.23035430908203125, 0.248565673828125, 0.26677703857421875, 0.2849884033203125, 0.30319976806640625, 0.3214111328125, 0.33962249755859375, 0.3578338623046875, 0.37604522705078125, 0.394256591796875, 0.41246795654296875, 0.4306793212890625, 0.44889068603515625, 0.46710205078125, 0.48531341552734375, 0.5035247802734375, 0.5217361450195312, 0.539947509765625, 0.5581588745117188, 0.5763702392578125, 0.5945816040039062, 0.61279296875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 2.0, 0.0, 3.0, 6.0, 4.0, 5.0, 13.0, 21.0, 24.0, 31.0, 73.0, 100.0, 154.0, 281.0, 424.0, 811.0, 1545.0, 3259.0, 6644.0, 15023.0, 36817.0, 92920.0, 223248.0, 349493.0, 187015.0, 76071.0, 30369.0, 12708.0, 5600.0, 2721.0, 1382.0, 740.0, 402.0, 219.0, 148.0, 95.0, 68.0, 33.0, 26.0, 16.0, 14.0, 10.0, 5.0, 8.0, 7.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.55322265625, -0.5344009399414062, -0.5155792236328125, -0.49675750732421875, -0.477935791015625, -0.45911407470703125, -0.4402923583984375, -0.42147064208984375, -0.40264892578125, -0.38382720947265625, -0.3650054931640625, -0.34618377685546875, -0.327362060546875, -0.30854034423828125, -0.2897186279296875, -0.27089691162109375, -0.2520751953125, -0.23325347900390625, -0.2144317626953125, -0.19561004638671875, -0.176788330078125, -0.15796661376953125, -0.1391448974609375, -0.12032318115234375, -0.10150146484375, -0.08267974853515625, -0.0638580322265625, -0.04503631591796875, -0.026214599609375, -0.00739288330078125, 0.0114288330078125, 0.03025054931640625, 0.049072265625, 0.06789398193359375, 0.0867156982421875, 0.10553741455078125, 0.124359130859375, 0.14318084716796875, 0.1620025634765625, 0.18082427978515625, 0.19964599609375, 0.21846771240234375, 0.2372894287109375, 0.25611114501953125, 0.274932861328125, 0.29375457763671875, 0.3125762939453125, 0.33139801025390625, 0.3502197265625, 0.36904144287109375, 0.3878631591796875, 0.40668487548828125, 0.425506591796875, 0.44432830810546875, 0.4631500244140625, 0.48197174072265625, 0.50079345703125, 0.5196151733398438, 0.5384368896484375, 0.5572586059570312, 0.576080322265625, 0.5949020385742188, 0.6137237548828125, 0.6325454711914062, 0.6513671875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 9.0, 8.0, 12.0, 9.0, 16.0, 14.0, 13.0, 18.0, 21.0, 23.0, 33.0, 29.0, 39.0, 28.0, 45.0, 44.0, 41.0, 44.0, 55.0, 47.0, 40.0, 48.0, 28.0, 45.0, 39.0, 34.0, 37.0, 19.0, 25.0, 22.0, 20.0, 17.0, 10.0, 16.0, 10.0, 6.0, 10.0, 8.0, 5.0, 5.0, 5.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.64453125, -1.594573974609375, -1.54461669921875, -1.494659423828125, -1.4447021484375, -1.394744873046875, -1.34478759765625, -1.294830322265625, -1.244873046875, -1.194915771484375, -1.14495849609375, -1.095001220703125, -1.0450439453125, -0.995086669921875, -0.94512939453125, -0.895172119140625, -0.84521484375, -0.795257568359375, -0.74530029296875, -0.695343017578125, -0.6453857421875, -0.595428466796875, -0.54547119140625, -0.495513916015625, -0.445556640625, -0.395599365234375, -0.34564208984375, -0.295684814453125, -0.2457275390625, -0.195770263671875, -0.14581298828125, -0.095855712890625, -0.0458984375, 0.004058837890625, 0.05401611328125, 0.103973388671875, 0.1539306640625, 0.203887939453125, 0.25384521484375, 0.303802490234375, 0.353759765625, 0.403717041015625, 0.45367431640625, 0.503631591796875, 0.5535888671875, 0.603546142578125, 0.65350341796875, 0.703460693359375, 0.75341796875, 0.803375244140625, 0.85333251953125, 0.903289794921875, 0.9532470703125, 1.003204345703125, 1.05316162109375, 1.103118896484375, 1.153076171875, 1.203033447265625, 1.25299072265625, 1.302947998046875, 1.3529052734375, 1.402862548828125, 1.45281982421875, 1.502777099609375, 1.552734375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 6.0, 8.0, 11.0, 19.0, 21.0, 34.0, 52.0, 75.0, 118.0, 193.0, 295.0, 455.0, 692.0, 1184.0, 2243.0, 4052.0, 7689.0, 15716.0, 33863.0, 77197.0, 172199.0, 341213.0, 213335.0, 96239.0, 42056.0, 19130.0, 9387.0, 4790.0, 2557.0, 1452.0, 829.0, 521.0, 345.0, 191.0, 135.0, 83.0, 48.0, 42.0, 31.0, 19.0, 11.0, 6.0, 8.0, 5.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.159423828125, -0.15438461303710938, -0.14934539794921875, -0.14430618286132812, -0.1392669677734375, -0.13422775268554688, -0.12918853759765625, -0.12414932250976562, -0.119110107421875, -0.11407089233398438, -0.10903167724609375, -0.10399246215820312, -0.0989532470703125, -0.09391403198242188, -0.08887481689453125, -0.08383560180664062, -0.07879638671875, -0.07375717163085938, -0.06871795654296875, -0.06367874145507812, -0.0586395263671875, -0.053600311279296875, -0.04856109619140625, -0.043521881103515625, -0.038482666015625, -0.033443450927734375, -0.02840423583984375, -0.023365020751953125, -0.0183258056640625, -0.013286590576171875, -0.00824737548828125, -0.003208160400390625, 0.0018310546875, 0.006870269775390625, 0.01190948486328125, 0.016948699951171875, 0.0219879150390625, 0.027027130126953125, 0.03206634521484375, 0.037105560302734375, 0.042144775390625, 0.047183990478515625, 0.05222320556640625, 0.057262420654296875, 0.0623016357421875, 0.06734085083007812, 0.07238006591796875, 0.07741928100585938, 0.08245849609375, 0.08749771118164062, 0.09253692626953125, 0.09757614135742188, 0.1026153564453125, 0.10765457153320312, 0.11269378662109375, 0.11773300170898438, 0.122772216796875, 0.12781143188476562, 0.13285064697265625, 0.13788986206054688, 0.1429290771484375, 0.14796829223632812, 0.15300750732421875, 0.15804672241210938, 0.1630859375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 5.0, 8.0, 8.0, 7.0, 13.0, 20.0, 22.0, 39.0, 54.0, 71.0, 76.0, 107.0, 113.0, 100.0, 83.0, 66.0, 43.0, 43.0, 30.0, 32.0, 11.0, 13.0, 12.0, 4.0, 6.0, 4.0, 5.0, 0.0, 2.0, 6.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.304285049438477e-05, -8.977577090263367e-05, -8.650869131088257e-05, -8.324161171913147e-05, -7.997453212738037e-05, -7.670745253562927e-05, -7.344037294387817e-05, -7.017329335212708e-05, -6.690621376037598e-05, -6.363913416862488e-05, -6.037205457687378e-05, -5.710497498512268e-05, -5.383789539337158e-05, -5.0570815801620483e-05, -4.7303736209869385e-05, -4.4036656618118286e-05, -4.076957702636719e-05, -3.750249743461609e-05, -3.423541784286499e-05, -3.096833825111389e-05, -2.7701258659362793e-05, -2.4434179067611694e-05, -2.1167099475860596e-05, -1.7900019884109497e-05, -1.4632940292358398e-05, -1.13658607006073e-05, -8.098781108856201e-06, -4.8317015171051025e-06, -1.564621925354004e-06, 1.7024576663970947e-06, 4.969537258148193e-06, 8.236616849899292e-06, 1.150369644165039e-05, 1.477077603340149e-05, 1.8037855625152588e-05, 2.1304935216903687e-05, 2.4572014808654785e-05, 2.7839094400405884e-05, 3.110617399215698e-05, 3.437325358390808e-05, 3.764033317565918e-05, 4.090741276741028e-05, 4.417449235916138e-05, 4.7441571950912476e-05, 5.0708651542663574e-05, 5.397573113441467e-05, 5.724281072616577e-05, 6.050989031791687e-05, 6.377696990966797e-05, 6.704404950141907e-05, 7.031112909317017e-05, 7.357820868492126e-05, 7.684528827667236e-05, 8.011236786842346e-05, 8.337944746017456e-05, 8.664652705192566e-05, 8.991360664367676e-05, 9.318068623542786e-05, 9.644776582717896e-05, 9.971484541893005e-05, 0.00010298192501068115, 0.00010624900460243225, 0.00010951608419418335, 0.00011278316378593445, 0.00011605024337768555]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 2.0, 4.0, 10.0, 9.0, 16.0, 15.0, 21.0, 31.0, 54.0, 52.0, 88.0, 131.0, 216.0, 281.0, 382.0, 577.0, 960.0, 1548.0, 2549.0, 4476.0, 8194.0, 15315.0, 30453.0, 63411.0, 130804.0, 248398.0, 270052.0, 136805.0, 65774.0, 31690.0, 15917.0, 8487.0, 4562.0, 2732.0, 1579.0, 1022.0, 652.0, 424.0, 274.0, 168.0, 116.0, 88.0, 57.0, 43.0, 32.0, 32.0, 17.0, 15.0, 8.0, 5.0, 1.0, 6.0, 1.0, 2.0, 3.0, 1.0], "bins": [-0.1617431640625, -0.15699005126953125, -0.1522369384765625, -0.14748382568359375, -0.142730712890625, -0.13797760009765625, -0.1332244873046875, -0.12847137451171875, -0.12371826171875, -0.11896514892578125, -0.1142120361328125, -0.10945892333984375, -0.104705810546875, -0.09995269775390625, -0.0951995849609375, -0.09044647216796875, -0.085693359375, -0.08094024658203125, -0.0761871337890625, -0.07143402099609375, -0.066680908203125, -0.06192779541015625, -0.0571746826171875, -0.05242156982421875, -0.04766845703125, -0.04291534423828125, -0.0381622314453125, -0.03340911865234375, -0.028656005859375, -0.02390289306640625, -0.0191497802734375, -0.01439666748046875, -0.0096435546875, -0.00489044189453125, -0.0001373291015625, 0.00461578369140625, 0.009368896484375, 0.01412200927734375, 0.0188751220703125, 0.02362823486328125, 0.02838134765625, 0.03313446044921875, 0.0378875732421875, 0.04264068603515625, 0.047393798828125, 0.05214691162109375, 0.0569000244140625, 0.06165313720703125, 0.06640625, 0.07115936279296875, 0.0759124755859375, 0.08066558837890625, 0.085418701171875, 0.09017181396484375, 0.0949249267578125, 0.09967803955078125, 0.10443115234375, 0.10918426513671875, 0.1139373779296875, 0.11869049072265625, 0.123443603515625, 0.12819671630859375, 0.1329498291015625, 0.13770294189453125, 0.1424560546875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 3.0, 3.0, 5.0, 8.0, 15.0, 13.0, 12.0, 15.0, 18.0, 16.0, 29.0, 33.0, 32.0, 50.0, 47.0, 44.0, 65.0, 62.0, 71.0, 84.0, 57.0, 62.0, 46.0, 38.0, 50.0, 25.0, 21.0, 14.0, 6.0, 19.0, 7.0, 3.0, 9.0, 6.0, 3.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2548828125, -0.2472209930419922, -0.23955917358398438, -0.23189735412597656, -0.22423553466796875, -0.21657371520996094, -0.20891189575195312, -0.2012500762939453, -0.1935882568359375, -0.1859264373779297, -0.17826461791992188, -0.17060279846191406, -0.16294097900390625, -0.15527915954589844, -0.14761734008789062, -0.1399555206298828, -0.132293701171875, -0.12463188171386719, -0.11697006225585938, -0.10930824279785156, -0.10164642333984375, -0.09398460388183594, -0.08632278442382812, -0.07866096496582031, -0.0709991455078125, -0.06333732604980469, -0.055675506591796875, -0.04801368713378906, -0.04035186767578125, -0.03269004821777344, -0.025028228759765625, -0.017366409301757812, -0.00970458984375, -0.0020427703857421875, 0.005619049072265625, 0.013280868530273438, 0.02094268798828125, 0.028604507446289062, 0.036266326904296875, 0.04392814636230469, 0.0515899658203125, 0.05925178527832031, 0.06691360473632812, 0.07457542419433594, 0.08223724365234375, 0.08989906311035156, 0.09756088256835938, 0.10522270202636719, 0.112884521484375, 0.12054634094238281, 0.12820816040039062, 0.13586997985839844, 0.14353179931640625, 0.15119361877441406, 0.15885543823242188, 0.1665172576904297, 0.1741790771484375, 0.1818408966064453, 0.18950271606445312, 0.19716453552246094, 0.20482635498046875, 0.21248817443847656, 0.22014999389648438, 0.2278118133544922, 0.2354736328125]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 10.0, 10.0, 17.0, 31.0, 44.0, 67.0, 96.0, 156.0, 145.0, 156.0, 112.0, 61.0, 44.0, 20.0, 8.0, 14.0, 5.0, 1.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.488615989685059, -6.310371398925781, -6.132126808166504, -5.953882217407227, -5.775637626647949, -5.597393035888672, -5.4191484451293945, -5.240903854370117, -5.06265926361084, -4.8844146728515625, -4.706170082092285, -4.527925491333008, -4.3496809005737305, -4.171436309814453, -3.993191719055176, -3.8149471282958984, -3.636702537536621, -3.4584579467773438, -3.2802133560180664, -3.101968765258789, -2.9237241744995117, -2.7454795837402344, -2.567234992980957, -2.3889904022216797, -2.2107458114624023, -2.032501220703125, -1.8542566299438477, -1.6760120391845703, -1.497767448425293, -1.3195228576660156, -1.1412782669067383, -0.9630336761474609, -0.7847895622253418, -0.6065449714660645, -0.4283003807067871, -0.25005578994750977, -0.07181119918823242, 0.10643339157104492, 0.28467798233032227, 0.4629225730895996, 0.641167163848877, 0.8194117546081543, 0.9976563453674316, 1.175900936126709, 1.3541455268859863, 1.5323901176452637, 1.710634708404541, 1.8888792991638184, 2.0671238899230957, 2.245368480682373, 2.4236130714416504, 2.6018576622009277, 2.780102252960205, 2.9583468437194824, 3.1365914344787598, 3.314836025238037, 3.4930806159973145, 3.671325206756592, 3.849569797515869, 4.0278143882751465, 4.206058979034424, 4.384303569793701, 4.5625481605529785, 4.740792751312256, 4.919037342071533]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 9.0, 5.0, 11.0, 6.0, 14.0, 14.0, 13.0, 19.0, 23.0, 25.0, 28.0, 20.0, 33.0, 32.0, 31.0, 39.0, 39.0, 52.0, 52.0, 40.0, 45.0, 49.0, 46.0, 50.0, 26.0, 36.0, 23.0, 26.0, 33.0, 31.0, 22.0, 27.0, 17.0, 17.0, 7.0, 9.0, 10.0, 4.0, 8.0, 2.0, 4.0, 5.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.037466526031494, -3.9095664024353027, -3.7816660404205322, -3.653765916824341, -3.5258655548095703, -3.397965431213379, -3.2700653076171875, -3.142165184020996, -3.0142648220062256, -2.886364698410034, -2.7584643363952637, -2.6305642127990723, -2.502664089202881, -2.3747637271881104, -2.246863603591919, -2.1189632415771484, -1.991063117980957, -1.863162875175476, -1.7352626323699951, -1.6073625087738037, -1.4794622659683228, -1.3515620231628418, -1.2236618995666504, -1.0957616567611694, -0.9678614139556885, -0.8399611711502075, -0.7120609879493713, -0.5841608047485352, -0.4562605619430542, -0.32836031913757324, -0.20046013593673706, -0.07255995273590088, 0.05534076690673828, 0.18324097990989685, 0.3111411929130554, 0.439041405916214, 0.5669416189193726, 0.6948418617248535, 0.8227420449256897, 0.9506422281265259, 1.0785424709320068, 1.2064427137374878, 1.3343429565429688, 1.4622430801391602, 1.5901433229446411, 1.718043565750122, 1.8459436893463135, 1.9738439321517944, 2.1017441749572754, 2.229644298553467, 2.3575446605682373, 2.4854447841644287, 2.613345146179199, 2.7412452697753906, 2.869145393371582, 2.9970455169677734, 3.124945878982544, 3.2528460025787354, 3.380746364593506, 3.5086464881896973, 3.6365466117858887, 3.764446973800659, 3.8923470973968506, 4.020247459411621, 4.1481475830078125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 8.0, 8.0, 10.0, 15.0, 17.0, 34.0, 41.0, 60.0, 103.0, 122.0, 171.0, 323.0, 460.0, 707.0, 1105.0, 1896.0, 3411.0, 6846.0, 16330.0, 49895.0, 172404.0, 490574.0, 1028135.0, 1203174.0, 749901.0, 315232.0, 101196.0, 30472.0, 10798.0, 4841.0, 2422.0, 1340.0, 819.0, 503.0, 311.0, 209.0, 115.0, 76.0, 72.0, 45.0, 35.0, 16.0, 12.0, 10.0, 2.0, 4.0, 3.0, 4.0, 2.0, 0.0, 2.0], "bins": [-0.67138671875, -0.6528701782226562, -0.6343536376953125, -0.6158370971679688, -0.597320556640625, -0.5788040161132812, -0.5602874755859375, -0.5417709350585938, -0.52325439453125, -0.5047378540039062, -0.4862213134765625, -0.46770477294921875, -0.449188232421875, -0.43067169189453125, -0.4121551513671875, -0.39363861083984375, -0.3751220703125, -0.35660552978515625, -0.3380889892578125, -0.31957244873046875, -0.301055908203125, -0.28253936767578125, -0.2640228271484375, -0.24550628662109375, -0.22698974609375, -0.20847320556640625, -0.1899566650390625, -0.17144012451171875, -0.152923583984375, -0.13440704345703125, -0.1158905029296875, -0.09737396240234375, -0.078857421875, -0.06034088134765625, -0.0418243408203125, -0.02330780029296875, -0.004791259765625, 0.01372528076171875, 0.0322418212890625, 0.05075836181640625, 0.06927490234375, 0.08779144287109375, 0.1063079833984375, 0.12482452392578125, 0.143341064453125, 0.16185760498046875, 0.1803741455078125, 0.19889068603515625, 0.2174072265625, 0.23592376708984375, 0.2544403076171875, 0.27295684814453125, 0.291473388671875, 0.30998992919921875, 0.3285064697265625, 0.34702301025390625, 0.36553955078125, 0.38405609130859375, 0.4025726318359375, 0.42108917236328125, 0.439605712890625, 0.45812225341796875, 0.4766387939453125, 0.49515533447265625, 0.513671875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 1.0, 6.0, 5.0, 12.0, 9.0, 8.0, 12.0, 9.0, 11.0, 8.0, 13.0, 16.0, 14.0, 21.0, 21.0, 21.0, 35.0, 16.0, 26.0, 34.0, 34.0, 42.0, 42.0, 34.0, 34.0, 32.0, 32.0, 49.0, 46.0, 47.0, 41.0, 32.0, 21.0, 34.0, 22.0, 27.0, 17.0, 16.0, 14.0, 15.0, 9.0, 7.0, 9.0, 13.0, 3.0, 8.0, 5.0, 7.0, 6.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.4814453125, -0.4664344787597656, -0.45142364501953125, -0.4364128112792969, -0.4214019775390625, -0.4063911437988281, -0.39138031005859375, -0.3763694763183594, -0.361358642578125, -0.3463478088378906, -0.33133697509765625, -0.3163261413574219, -0.3013153076171875, -0.2863044738769531, -0.27129364013671875, -0.2562828063964844, -0.24127197265625, -0.22626113891601562, -0.21125030517578125, -0.19623947143554688, -0.1812286376953125, -0.16621780395507812, -0.15120697021484375, -0.13619613647460938, -0.121185302734375, -0.10617446899414062, -0.09116363525390625, -0.07615280151367188, -0.0611419677734375, -0.046131134033203125, -0.03112030029296875, -0.016109466552734375, -0.0010986328125, 0.013912200927734375, 0.02892303466796875, 0.043933868408203125, 0.0589447021484375, 0.07395553588867188, 0.08896636962890625, 0.10397720336914062, 0.118988037109375, 0.13399887084960938, 0.14900970458984375, 0.16402053833007812, 0.1790313720703125, 0.19404220581054688, 0.20905303955078125, 0.22406387329101562, 0.23907470703125, 0.2540855407714844, 0.26909637451171875, 0.2841072082519531, 0.2991180419921875, 0.3141288757324219, 0.32913970947265625, 0.3441505432128906, 0.359161376953125, 0.3741722106933594, 0.38918304443359375, 0.4041938781738281, 0.4192047119140625, 0.4342155456542969, 0.44922637939453125, 0.4642372131347656, 0.479248046875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 6.0, 6.0, 15.0, 17.0, 35.0, 58.0, 98.0, 173.0, 310.0, 638.0, 1696.0, 6235.0, 45427.0, 1890588.0, 2190093.0, 49352.0, 6432.0, 1721.0, 638.0, 297.0, 176.0, 105.0, 59.0, 37.0, 27.0, 12.0, 11.0, 8.0, 10.0, 3.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4345703125, -1.3663177490234375, -1.298065185546875, -1.2298126220703125, -1.16156005859375, -1.0933074951171875, -1.025054931640625, -0.9568023681640625, -0.8885498046875, -0.8202972412109375, -0.752044677734375, -0.6837921142578125, -0.61553955078125, -0.5472869873046875, -0.479034423828125, -0.4107818603515625, -0.342529296875, -0.2742767333984375, -0.206024169921875, -0.1377716064453125, -0.06951904296875, -0.0012664794921875, 0.066986083984375, 0.1352386474609375, 0.2034912109375, 0.2717437744140625, 0.339996337890625, 0.4082489013671875, 0.47650146484375, 0.5447540283203125, 0.613006591796875, 0.6812591552734375, 0.74951171875, 0.8177642822265625, 0.886016845703125, 0.9542694091796875, 1.02252197265625, 1.0907745361328125, 1.159027099609375, 1.2272796630859375, 1.2955322265625, 1.3637847900390625, 1.432037353515625, 1.5002899169921875, 1.56854248046875, 1.6367950439453125, 1.705047607421875, 1.7733001708984375, 1.841552734375, 1.9098052978515625, 1.978057861328125, 2.0463104248046875, 2.11456298828125, 2.1828155517578125, 2.251068115234375, 2.3193206787109375, 2.3875732421875, 2.4558258056640625, 2.524078369140625, 2.5923309326171875, 2.66058349609375, 2.7288360595703125, 2.797088623046875, 2.8653411865234375, 2.93359375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 1.0, 4.0, 8.0, 7.0, 12.0, 16.0, 30.0, 25.0, 50.0, 93.0, 79.0, 124.0, 228.0, 273.0, 416.0, 471.0, 520.0, 458.0, 393.0, 270.0, 203.0, 114.0, 100.0, 49.0, 43.0, 23.0, 21.0, 10.0, 10.0, 6.0, 8.0, 4.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.6884765625, -1.6476058959960938, -1.6067352294921875, -1.5658645629882812, -1.524993896484375, -1.4841232299804688, -1.4432525634765625, -1.4023818969726562, -1.36151123046875, -1.3206405639648438, -1.2797698974609375, -1.2388992309570312, -1.198028564453125, -1.1571578979492188, -1.1162872314453125, -1.0754165649414062, -1.0345458984375, -0.9936752319335938, -0.9528045654296875, -0.9119338989257812, -0.871063232421875, -0.8301925659179688, -0.7893218994140625, -0.7484512329101562, -0.70758056640625, -0.6667098999023438, -0.6258392333984375, -0.5849685668945312, -0.544097900390625, -0.5032272338867188, -0.4623565673828125, -0.42148590087890625, -0.380615234375, -0.33974456787109375, -0.2988739013671875, -0.25800323486328125, -0.217132568359375, -0.17626190185546875, -0.1353912353515625, -0.09452056884765625, -0.05364990234375, -0.01277923583984375, 0.0280914306640625, 0.06896209716796875, 0.109832763671875, 0.15070343017578125, 0.1915740966796875, 0.23244476318359375, 0.2733154296875, 0.31418609619140625, 0.3550567626953125, 0.39592742919921875, 0.436798095703125, 0.47766876220703125, 0.5185394287109375, 0.5594100952148438, 0.60028076171875, 0.6411514282226562, 0.6820220947265625, 0.7228927612304688, 0.763763427734375, 0.8046340942382812, 0.8455047607421875, 0.8863754272460938, 0.92724609375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 4.0, 5.0, 10.0, 10.0, 9.0, 11.0, 20.0, 33.0, 49.0, 64.0, 94.0, 104.0, 105.0, 91.0, 93.0, 83.0, 72.0, 38.0, 24.0, 27.0, 15.0, 10.0, 8.0, 4.0, 4.0, 3.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.338584899902344, -12.021121978759766, -11.703660011291504, -11.386197090148926, -11.068734169006348, -10.751272201538086, -10.433809280395508, -10.11634635925293, -9.798884391784668, -9.48142147064209, -9.163959503173828, -8.84649658203125, -8.529033660888672, -8.21157169342041, -7.894108772277832, -7.576646327972412, -7.259183406829834, -6.941720962524414, -6.624258041381836, -6.306795597076416, -5.989333152770996, -5.671870231628418, -5.354407787322998, -5.036945343017578, -4.719482421875, -4.40201997756958, -4.084557056427002, -3.767094612121582, -3.449632167816162, -3.132169485092163, -2.814706802368164, -2.497244358062744, -2.179781436920166, -1.8623188734054565, -1.544856309890747, -1.227393627166748, -0.9099310636520386, -0.5924685001373291, -0.2750058174133301, 0.042456626892089844, 0.35991930961608887, 0.6773818731307983, 0.9948444962501526, 1.3123071193695068, 1.6297696828842163, 1.9472322463989258, 2.264694929122925, 2.5821573734283447, 2.8996200561523438, 3.2170827388763428, 3.5345451831817627, 3.8520078659057617, 4.169470310211182, 4.486932754516602, 4.80439567565918, 5.1218581199646, 5.4393205642700195, 5.7567830085754395, 6.074245929718018, 6.3917083740234375, 6.709170818328857, 7.026633262634277, 7.3440961837768555, 7.661558628082275, 7.9790215492248535]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 6.0, 4.0, 4.0, 12.0, 8.0, 11.0, 8.0, 17.0, 18.0, 13.0, 13.0, 26.0, 15.0, 23.0, 34.0, 36.0, 29.0, 30.0, 28.0, 42.0, 30.0, 45.0, 41.0, 31.0, 38.0, 48.0, 33.0, 41.0, 46.0, 29.0, 22.0, 20.0, 20.0, 20.0, 28.0, 26.0, 17.0, 9.0, 13.0, 17.0, 14.0, 17.0, 5.0, 6.0, 3.0, 2.0, 1.0, 5.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0], "bins": [-4.024127960205078, -3.9028236865997314, -3.7815194129943848, -3.660215139389038, -3.5389108657836914, -3.4176065921783447, -3.296302318572998, -3.1749982833862305, -3.0536937713623047, -2.932389497756958, -2.8110852241516113, -2.6897809505462646, -2.568476676940918, -2.4471724033355713, -2.3258681297302246, -2.204564094543457, -2.0832598209381104, -1.9619555473327637, -1.840651273727417, -1.7193470001220703, -1.5980427265167236, -1.476738452911377, -1.3554342985153198, -1.2341300249099731, -1.1128257513046265, -0.9915214776992798, -0.8702172040939331, -0.7489129900932312, -0.6276087164878845, -0.5063044428825378, -0.38500022888183594, -0.26369595527648926, -0.14239144325256348, -0.02108718454837799, 0.1002170741558075, 0.2215213179588318, 0.34282559156417847, 0.46412986516952515, 0.585434079170227, 0.7067383527755737, 0.8280426263809204, 0.9493468999862671, 1.0706511735916138, 1.191955327987671, 1.3132596015930176, 1.4345638751983643, 1.555868148803711, 1.6771724224090576, 1.7984766960144043, 1.919780969619751, 2.0410852432250977, 2.1623895168304443, 2.283693790435791, 2.4049980640411377, 2.5263023376464844, 2.647606372833252, 2.7689108848571777, 2.8902151584625244, 3.011519432067871, 3.1328237056732178, 3.2541279792785645, 3.375432252883911, 3.496736526489258, 3.6180405616760254, 3.739344835281372]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 13.0, 15.0, 17.0, 30.0, 34.0, 47.0, 56.0, 96.0, 157.0, 228.0, 326.0, 520.0, 756.0, 1252.0, 2056.0, 3483.0, 6271.0, 11960.0, 24953.0, 57450.0, 144306.0, 307643.0, 274508.0, 119398.0, 47989.0, 21121.0, 10280.0, 5498.0, 3012.0, 1820.0, 1093.0, 717.0, 474.0, 299.0, 213.0, 133.0, 96.0, 63.0, 52.0, 36.0, 27.0, 14.0, 12.0, 7.0, 7.0, 2.0, 8.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.385498046875, -0.3730201721191406, -0.36054229736328125, -0.3480644226074219, -0.3355865478515625, -0.3231086730957031, -0.31063079833984375, -0.2981529235839844, -0.285675048828125, -0.2731971740722656, -0.26071929931640625, -0.24824142456054688, -0.2357635498046875, -0.22328567504882812, -0.21080780029296875, -0.19832992553710938, -0.18585205078125, -0.17337417602539062, -0.16089630126953125, -0.14841842651367188, -0.1359405517578125, -0.12346267700195312, -0.11098480224609375, -0.09850692749023438, -0.086029052734375, -0.07355117797851562, -0.06107330322265625, -0.048595428466796875, -0.0361175537109375, -0.023639678955078125, -0.01116180419921875, 0.001316070556640625, 0.0137939453125, 0.026271820068359375, 0.03874969482421875, 0.051227569580078125, 0.0637054443359375, 0.07618331909179688, 0.08866119384765625, 0.10113906860351562, 0.113616943359375, 0.12609481811523438, 0.13857269287109375, 0.15105056762695312, 0.1635284423828125, 0.17600631713867188, 0.18848419189453125, 0.20096206665039062, 0.21343994140625, 0.22591781616210938, 0.23839569091796875, 0.2508735656738281, 0.2633514404296875, 0.2758293151855469, 0.28830718994140625, 0.3007850646972656, 0.313262939453125, 0.3257408142089844, 0.33821868896484375, 0.3506965637207031, 0.3631744384765625, 0.3756523132324219, 0.38813018798828125, 0.4006080627441406, 0.4130859375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 4.0, 4.0, 6.0, 4.0, 7.0, 9.0, 6.0, 7.0, 11.0, 18.0, 9.0, 20.0, 32.0, 20.0, 28.0, 26.0, 33.0, 27.0, 45.0, 33.0, 34.0, 40.0, 60.0, 42.0, 30.0, 38.0, 38.0, 32.0, 48.0, 32.0, 30.0, 41.0, 32.0, 24.0, 30.0, 18.0, 12.0, 9.0, 10.0, 12.0, 8.0, 10.0, 6.0, 5.0, 4.0, 4.0, 5.0, 3.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.67138671875, -0.6491012573242188, -0.6268157958984375, -0.6045303344726562, -0.582244873046875, -0.5599594116210938, -0.5376739501953125, -0.5153884887695312, -0.49310302734375, -0.47081756591796875, -0.4485321044921875, -0.42624664306640625, -0.403961181640625, -0.38167572021484375, -0.3593902587890625, -0.33710479736328125, -0.3148193359375, -0.29253387451171875, -0.2702484130859375, -0.24796295166015625, -0.225677490234375, -0.20339202880859375, -0.1811065673828125, -0.15882110595703125, -0.13653564453125, -0.11425018310546875, -0.0919647216796875, -0.06967926025390625, -0.047393798828125, -0.02510833740234375, -0.0028228759765625, 0.01946258544921875, 0.041748046875, 0.06403350830078125, 0.0863189697265625, 0.10860443115234375, 0.130889892578125, 0.15317535400390625, 0.1754608154296875, 0.19774627685546875, 0.22003173828125, 0.24231719970703125, 0.2646026611328125, 0.28688812255859375, 0.309173583984375, 0.33145904541015625, 0.3537445068359375, 0.37602996826171875, 0.3983154296875, 0.42060089111328125, 0.4428863525390625, 0.46517181396484375, 0.487457275390625, 0.5097427368164062, 0.5320281982421875, 0.5543136596679688, 0.57659912109375, 0.5988845825195312, 0.6211700439453125, 0.6434555053710938, 0.665740966796875, 0.6880264282226562, 0.7103118896484375, 0.7325973510742188, 0.7548828125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 6.0, 5.0, 12.0, 11.0, 18.0, 20.0, 33.0, 47.0, 94.0, 139.0, 236.0, 325.0, 622.0, 1141.0, 2291.0, 4976.0, 11956.0, 32816.0, 120442.0, 572947.0, 218814.0, 51367.0, 16938.0, 6685.0, 3029.0, 1588.0, 821.0, 495.0, 245.0, 165.0, 98.0, 59.0, 46.0, 23.0, 15.0, 9.0, 9.0, 7.0, 3.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 3.0], "bins": [-0.66552734375, -0.6478691101074219, -0.6302108764648438, -0.6125526428222656, -0.5948944091796875, -0.5772361755371094, -0.5595779418945312, -0.5419197082519531, -0.524261474609375, -0.5066032409667969, -0.48894500732421875, -0.4712867736816406, -0.4536285400390625, -0.4359703063964844, -0.41831207275390625, -0.4006538391113281, -0.38299560546875, -0.3653373718261719, -0.34767913818359375, -0.3300209045410156, -0.3123626708984375, -0.2947044372558594, -0.27704620361328125, -0.2593879699707031, -0.241729736328125, -0.22407150268554688, -0.20641326904296875, -0.18875503540039062, -0.1710968017578125, -0.15343856811523438, -0.13578033447265625, -0.11812210083007812, -0.1004638671875, -0.08280563354492188, -0.06514739990234375, -0.047489166259765625, -0.0298309326171875, -0.012172698974609375, 0.00548553466796875, 0.023143768310546875, 0.040802001953125, 0.058460235595703125, 0.07611846923828125, 0.09377670288085938, 0.1114349365234375, 0.12909317016601562, 0.14675140380859375, 0.16440963745117188, 0.18206787109375, 0.19972610473632812, 0.21738433837890625, 0.23504257202148438, 0.2527008056640625, 0.2703590393066406, 0.28801727294921875, 0.3056755065917969, 0.323333740234375, 0.3409919738769531, 0.35865020751953125, 0.3763084411621094, 0.3939666748046875, 0.4116249084472656, 0.42928314208984375, 0.4469413757324219, 0.464599609375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 3.0, 7.0, 7.0, 10.0, 8.0, 11.0, 19.0, 22.0, 30.0, 35.0, 46.0, 61.0, 71.0, 68.0, 81.0, 62.0, 75.0, 68.0, 62.0, 60.0, 49.0, 35.0, 20.0, 21.0, 21.0, 12.0, 9.0, 6.0, 8.0, 6.0, 4.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2421875, -2.16790771484375, -2.0936279296875, -2.01934814453125, -1.945068359375, -1.87078857421875, -1.7965087890625, -1.72222900390625, -1.64794921875, -1.57366943359375, -1.4993896484375, -1.42510986328125, -1.350830078125, -1.27655029296875, -1.2022705078125, -1.12799072265625, -1.0537109375, -0.97943115234375, -0.9051513671875, -0.83087158203125, -0.756591796875, -0.68231201171875, -0.6080322265625, -0.53375244140625, -0.45947265625, -0.38519287109375, -0.3109130859375, -0.23663330078125, -0.162353515625, -0.08807373046875, -0.0137939453125, 0.06048583984375, 0.134765625, 0.20904541015625, 0.2833251953125, 0.35760498046875, 0.431884765625, 0.50616455078125, 0.5804443359375, 0.65472412109375, 0.72900390625, 0.80328369140625, 0.8775634765625, 0.95184326171875, 1.026123046875, 1.10040283203125, 1.1746826171875, 1.24896240234375, 1.3232421875, 1.39752197265625, 1.4718017578125, 1.54608154296875, 1.620361328125, 1.69464111328125, 1.7689208984375, 1.84320068359375, 1.91748046875, 1.99176025390625, 2.0660400390625, 2.14031982421875, 2.214599609375, 2.28887939453125, 2.3631591796875, 2.43743896484375, 2.51171875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 4.0, 0.0, 2.0, 8.0, 10.0, 12.0, 30.0, 61.0, 118.0, 266.0, 909.0, 5758.0, 310986.0, 720982.0, 7626.0, 1154.0, 353.0, 162.0, 52.0, 27.0, 17.0, 6.0, 4.0, 3.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.75, -0.7266082763671875, -0.703216552734375, -0.6798248291015625, -0.65643310546875, -0.6330413818359375, -0.609649658203125, -0.5862579345703125, -0.5628662109375, -0.5394744873046875, -0.516082763671875, -0.4926910400390625, -0.46929931640625, -0.4459075927734375, -0.422515869140625, -0.3991241455078125, -0.375732421875, -0.3523406982421875, -0.328948974609375, -0.3055572509765625, -0.28216552734375, -0.2587738037109375, -0.235382080078125, -0.2119903564453125, -0.1885986328125, -0.1652069091796875, -0.141815185546875, -0.1184234619140625, -0.09503173828125, -0.0716400146484375, -0.048248291015625, -0.0248565673828125, -0.00146484375, 0.0219268798828125, 0.045318603515625, 0.0687103271484375, 0.09210205078125, 0.1154937744140625, 0.138885498046875, 0.1622772216796875, 0.1856689453125, 0.2090606689453125, 0.232452392578125, 0.2558441162109375, 0.27923583984375, 0.3026275634765625, 0.326019287109375, 0.3494110107421875, 0.372802734375, 0.3961944580078125, 0.419586181640625, 0.4429779052734375, 0.46636962890625, 0.4897613525390625, 0.513153076171875, 0.5365447998046875, 0.5599365234375, 0.5833282470703125, 0.606719970703125, 0.6301116943359375, 0.65350341796875, 0.6768951416015625, 0.700286865234375, 0.7236785888671875, 0.7470703125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 6.0, 2.0, 2.0, 1.0, 11.0, 7.0, 17.0, 18.0, 48.0, 49.0, 72.0, 99.0, 128.0, 138.0, 98.0, 81.0, 60.0, 40.0, 27.0, 20.0, 19.0, 13.0, 13.0, 14.0, 8.0, 2.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.020069122314453e-05, -5.807075649499893e-05, -5.594082176685333e-05, -5.381088703870773e-05, -5.1680952310562134e-05, -4.9551017582416534e-05, -4.7421082854270935e-05, -4.5291148126125336e-05, -4.3161213397979736e-05, -4.103127866983414e-05, -3.890134394168854e-05, -3.677140921354294e-05, -3.464147448539734e-05, -3.251153975725174e-05, -3.038160502910614e-05, -2.825167030096054e-05, -2.612173557281494e-05, -2.3991800844669342e-05, -2.1861866116523743e-05, -1.9731931388378143e-05, -1.7601996660232544e-05, -1.5472061932086945e-05, -1.3342127203941345e-05, -1.1212192475795746e-05, -9.082257747650146e-06, -6.952323019504547e-06, -4.822388291358948e-06, -2.6924535632133484e-06, -5.62518835067749e-07, 1.5674158930778503e-06, 3.6973506212234497e-06, 5.827285349369049e-06, 7.957220077514648e-06, 1.0087154805660248e-05, 1.2217089533805847e-05, 1.4347024261951447e-05, 1.6476958990097046e-05, 1.8606893718242645e-05, 2.0736828446388245e-05, 2.2866763174533844e-05, 2.4996697902679443e-05, 2.7126632630825043e-05, 2.9256567358970642e-05, 3.138650208711624e-05, 3.351643681526184e-05, 3.564637154340744e-05, 3.777630627155304e-05, 3.990624099969864e-05, 4.203617572784424e-05, 4.416611045598984e-05, 4.629604518413544e-05, 4.8425979912281036e-05, 5.0555914640426636e-05, 5.2685849368572235e-05, 5.4815784096717834e-05, 5.6945718824863434e-05, 5.907565355300903e-05, 6.120558828115463e-05, 6.333552300930023e-05, 6.546545773744583e-05, 6.759539246559143e-05, 6.972532719373703e-05, 7.185526192188263e-05, 7.398519665002823e-05, 7.611513137817383e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 5.0, 7.0, 11.0, 10.0, 15.0, 33.0, 35.0, 34.0, 53.0, 68.0, 134.0, 189.0, 368.0, 681.0, 1389.0, 3379.0, 10993.0, 56928.0, 646903.0, 282841.0, 32253.0, 7268.0, 2547.0, 1072.0, 553.0, 317.0, 163.0, 82.0, 62.0, 46.0, 23.0, 27.0, 18.0, 9.0, 7.0, 7.0, 6.0, 6.0, 1.0, 0.0, 2.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.335693359375, -0.3240547180175781, -0.31241607666015625, -0.3007774353027344, -0.2891387939453125, -0.2775001525878906, -0.26586151123046875, -0.2542228698730469, -0.242584228515625, -0.23094558715820312, -0.21930694580078125, -0.20766830444335938, -0.1960296630859375, -0.18439102172851562, -0.17275238037109375, -0.16111373901367188, -0.14947509765625, -0.13783645629882812, -0.12619781494140625, -0.11455917358398438, -0.1029205322265625, -0.09128189086914062, -0.07964324951171875, -0.06800460815429688, -0.056365966796875, -0.044727325439453125, -0.03308868408203125, -0.021450042724609375, -0.0098114013671875, 0.001827239990234375, 0.01346588134765625, 0.025104522705078125, 0.0367431640625, 0.048381805419921875, 0.06002044677734375, 0.07165908813476562, 0.0832977294921875, 0.09493637084960938, 0.10657501220703125, 0.11821365356445312, 0.129852294921875, 0.14149093627929688, 0.15312957763671875, 0.16476821899414062, 0.1764068603515625, 0.18804550170898438, 0.19968414306640625, 0.21132278442382812, 0.22296142578125, 0.23460006713867188, 0.24623870849609375, 0.2578773498535156, 0.2695159912109375, 0.2811546325683594, 0.29279327392578125, 0.3044319152832031, 0.316070556640625, 0.3277091979980469, 0.33934783935546875, 0.3509864807128906, 0.3626251220703125, 0.3742637634277344, 0.38590240478515625, 0.3975410461425781, 0.4091796875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 3.0, 4.0, 6.0, 6.0, 4.0, 9.0, 9.0, 7.0, 13.0, 9.0, 13.0, 12.0, 19.0, 21.0, 23.0, 32.0, 33.0, 35.0, 44.0, 47.0, 52.0, 82.0, 65.0, 65.0, 62.0, 52.0, 49.0, 34.0, 23.0, 23.0, 26.0, 24.0, 16.0, 15.0, 14.0, 10.0, 9.0, 3.0, 8.0, 8.0, 3.0, 3.0, 2.0, 4.0, 4.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.283203125, -0.274505615234375, -0.26580810546875, -0.257110595703125, -0.2484130859375, -0.239715576171875, -0.23101806640625, -0.222320556640625, -0.213623046875, -0.204925537109375, -0.19622802734375, -0.187530517578125, -0.1788330078125, -0.170135498046875, -0.16143798828125, -0.152740478515625, -0.14404296875, -0.135345458984375, -0.12664794921875, -0.117950439453125, -0.1092529296875, -0.100555419921875, -0.09185791015625, -0.083160400390625, -0.074462890625, -0.065765380859375, -0.05706787109375, -0.048370361328125, -0.0396728515625, -0.030975341796875, -0.02227783203125, -0.013580322265625, -0.0048828125, 0.003814697265625, 0.01251220703125, 0.021209716796875, 0.0299072265625, 0.038604736328125, 0.04730224609375, 0.055999755859375, 0.064697265625, 0.073394775390625, 0.08209228515625, 0.090789794921875, 0.0994873046875, 0.108184814453125, 0.11688232421875, 0.125579833984375, 0.13427734375, 0.142974853515625, 0.15167236328125, 0.160369873046875, 0.1690673828125, 0.177764892578125, 0.18646240234375, 0.195159912109375, 0.203857421875, 0.212554931640625, 0.22125244140625, 0.229949951171875, 0.2386474609375, 0.247344970703125, 0.25604248046875, 0.264739990234375, 0.2734375]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 8.0, 8.0, 17.0, 47.0, 75.0, 136.0, 220.0, 228.0, 115.0, 62.0, 42.0, 23.0, 8.0, 6.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.709936141967773, -6.403011798858643, -6.09608793258667, -5.789163589477539, -5.482239723205566, -5.1753153800964355, -4.868391036987305, -4.561467170715332, -4.254543304443359, -3.9476191997528076, -3.640695095062256, -3.333770751953125, -3.0268468856811523, -2.7199225425720215, -2.4129984378814697, -2.106074333190918, -1.799149990081787, -1.4922258853912354, -1.1853017807006836, -0.8783775568008423, -0.5714534521102905, -0.26452934741973877, 0.04239487648010254, 0.3493189811706543, 0.656243085861206, 0.9631671905517578, 1.2700912952423096, 1.5770155191421509, 1.8839396238327026, 2.190863609313965, 2.4977879524230957, 2.8047120571136475, 3.111636161804199, 3.418560266494751, 3.7254843711853027, 4.032408714294434, 4.339332580566406, 4.646256923675537, 4.953181266784668, 5.260105133056641, 5.567028999328613, 5.873953342437744, 6.180877208709717, 6.487801551818848, 6.79472541809082, 7.101649761199951, 7.408574104309082, 7.715497970581055, 8.022422790527344, 8.329346656799316, 8.636271476745605, 8.943195343017578, 9.25011920928955, 9.557043075561523, 9.863967895507812, 10.170891761779785, 10.477815628051758, 10.78473949432373, 11.09166431427002, 11.398588180541992, 11.705512046813965, 12.012435913085938, 12.319360733032227, 12.6262845993042, 12.933208465576172]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 0.0, 1.0, 4.0, 2.0, 3.0, 1.0, 11.0, 14.0, 5.0, 14.0, 15.0, 27.0, 22.0, 28.0, 34.0, 26.0, 38.0, 40.0, 54.0, 51.0, 68.0, 72.0, 72.0, 61.0, 53.0, 33.0, 41.0, 41.0, 38.0, 26.0, 21.0, 23.0, 10.0, 15.0, 11.0, 7.0, 11.0, 2.0, 3.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.169952392578125, -5.987324237823486, -5.804696083068848, -5.622067928314209, -5.43943977355957, -5.25681209564209, -5.074183464050293, -4.8915557861328125, -4.708927631378174, -4.526299476623535, -4.3436713218688965, -4.161043167114258, -3.9784152507781982, -3.7957870960235596, -3.613158941268921, -3.4305310249328613, -3.2479026317596436, -3.065274477005005, -2.882646322250366, -2.7000184059143066, -2.517390251159668, -2.3347620964050293, -2.1521339416503906, -1.9695059061050415, -1.7868777513504028, -1.6042495965957642, -1.421621561050415, -1.2389934062957764, -1.0563652515411377, -0.8737372159957886, -0.6911090612411499, -0.5084810256958008, -0.3258528709411621, -0.14322476089000702, 0.03940334916114807, 0.22203147411346436, 0.40465956926345825, 0.5872876644134521, 0.7699158191680908, 0.9525438547134399, 1.1351720094680786, 1.3178001642227173, 1.5004281997680664, 1.683056354522705, 1.8656845092773438, 2.0483126640319824, 2.230940818786621, 2.4135687351226807, 2.5961968898773193, 2.778825044631958, 2.9614531993865967, 3.1440811157226562, 3.326709270477295, 3.5093374252319336, 3.6919655799865723, 3.874593734741211, 4.05722188949585, 4.239850044250488, 4.422478199005127, 4.605106353759766, 4.787734508514404, 4.970362663269043, 5.152990341186523, 5.335618495941162, 5.518246650695801]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 7.0, 13.0, 5.0, 8.0, 17.0, 29.0, 17.0, 27.0, 36.0, 33.0, 76.0, 143.0, 252.0, 88.0, 50.0, 25.0, 27.0, 23.0, 15.0, 27.0, 15.0, 14.0, 11.0, 6.0, 9.0, 2.0, 8.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.0859375, -1.0559844970703125, -1.026031494140625, -0.9960784912109375, -0.96612548828125, -0.9361724853515625, -0.906219482421875, -0.8762664794921875, -0.8463134765625, -0.8163604736328125, -0.786407470703125, -0.7564544677734375, -0.72650146484375, -0.6965484619140625, -0.666595458984375, -0.6366424560546875, -0.606689453125, -0.5767364501953125, -0.546783447265625, -0.5168304443359375, -0.48687744140625, -0.4569244384765625, -0.426971435546875, -0.3970184326171875, -0.3670654296875, -0.3371124267578125, -0.307159423828125, -0.2772064208984375, -0.24725341796875, -0.2173004150390625, -0.187347412109375, -0.1573944091796875, -0.12744140625, -0.0974884033203125, -0.067535400390625, -0.0375823974609375, -0.00762939453125, 0.0223236083984375, 0.052276611328125, 0.0822296142578125, 0.1121826171875, 0.1421356201171875, 0.172088623046875, 0.2020416259765625, 0.23199462890625, 0.2619476318359375, 0.291900634765625, 0.3218536376953125, 0.351806640625, 0.3817596435546875, 0.411712646484375, 0.4416656494140625, 0.47161865234375, 0.5015716552734375, 0.531524658203125, 0.5614776611328125, 0.5914306640625, 0.6213836669921875, 0.651336669921875, 0.6812896728515625, 0.71124267578125, 0.7411956787109375, 0.771148681640625, 0.8011016845703125, 0.8310546875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 5.0, 4.0, 4.0, 5.0, 7.0, 13.0, 21.0, 21.0, 35.0, 54.0, 88.0, 161.0, 276.0, 508.0, 1037.0, 2443.0, 6545.0, 29227.0, 8266303.0, 66365.0, 9313.0, 3196.0, 1388.0, 688.0, 343.0, 203.0, 99.0, 65.0, 53.0, 35.0, 24.0, 21.0, 11.0, 9.0, 5.0, 4.0, 5.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.9354238510131836, -1.8499505519866943, -1.7644771337509155, -1.6790038347244263, -1.5935304164886475, -1.5080571174621582, -1.422583818435669, -1.3371105194091797, -1.2516371011734009, -1.1661638021469116, -1.0806903839111328, -0.9952170848846436, -0.9097437262535095, -0.8242703676223755, -0.7387970685958862, -0.6533237099647522, -0.5678503513336182, -0.48237699270248413, -0.3969036638736725, -0.31143033504486084, -0.2259569764137268, -0.14048361778259277, -0.055010318756103516, 0.030463039875030518, 0.11593639850616455, 0.2014097422361374, 0.28688308596611023, 0.3723564147949219, 0.4578297734260559, 0.5433031320571899, 0.6287764310836792, 0.7142497897148132, 0.7997229099273682, 0.8851962685585022, 0.9706696271896362, 1.0561429262161255, 1.1416163444519043, 1.2270896434783936, 1.3125629425048828, 1.398036241531372, 1.4835096597671509, 1.5689829587936401, 1.654456377029419, 1.7399296760559082, 1.8254029750823975, 1.9108763933181763, 1.9963496923446655, 2.0818231105804443, 2.1672964096069336, 2.252769708633423, 2.338243007659912, 2.4237165451049805, 2.5091898441314697, 2.594663143157959, 2.6801364421844482, 2.7656097412109375, 2.851083278656006, 2.936556577682495, 3.0220298767089844, 3.1075034141540527, 3.192976713180542, 3.2784500122070312, 3.3639233112335205, 3.4493966102600098, 3.534869909286499]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 6.0, 1.0, 3.0, 3.0, 5.0, 4.0, 2.0, 5.0, 2.0, 5.0, 6.0, 2.0, 2.0, 3.0, 6.0, 3.0, 5.0, 3.0, 0.0, 1.0, 0.0, 5.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.662826418876648, -1.6025762557983398, -1.5423260927200317, -1.4820759296417236, -1.4218257665634155, -1.3615756034851074, -1.3013255596160889, -1.2410752773284912, -1.1808252334594727, -1.1205750703811646, -1.0603249073028564, -1.0000747442245483, -0.9398245811462402, -0.8795744180679321, -0.8193243145942688, -0.7590741515159607, -0.6988239288330078, -0.6385737657546997, -0.5783236026763916, -0.5180734395980835, -0.4578233063220978, -0.3975731432437897, -0.33732300996780396, -0.27707284688949585, -0.21682268381118774, -0.15657252073287964, -0.09632237255573273, -0.036072224378585815, 0.02417793869972229, 0.0844281017780304, 0.1446782350540161, 0.20492839813232422, 0.2651784420013428, 0.3254286050796509, 0.385678768157959, 0.4459289014339447, 0.5061790943145752, 0.5664292573928833, 0.6266793608665466, 0.6869295239448547, 0.7471796870231628, 0.807429850101471, 0.867680013179779, 0.9279301166534424, 0.9881802797317505, 1.0484304428100586, 1.1086806058883667, 1.1689307689666748, 1.229180932044983, 1.289431095123291, 1.3496812582015991, 1.4099314212799072, 1.4701815843582153, 1.5304317474365234, 1.590681791305542, 1.6509320735931396, 1.7111821174621582, 1.7714322805404663, 1.8316824436187744, 1.8919326066970825, 1.9521827697753906, 2.012432813644409, 2.072683095932007, 2.1329331398010254, 2.193183422088623]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 7.0, 4.0, 8.0, 9.0, 11.0, 18.0, 20.0, 24.0, 19.0, 34.0, 27.0, 32.0, 35.0, 33.0, 34.0, 36.0, 48.0, 44.0, 56.0, 37.0, 44.0, 40.0, 68.0, 35.0, 35.0, 37.0, 30.0, 24.0, 32.0, 18.0, 18.0, 14.0, 11.0, 10.0, 17.0, 7.0, 5.0, 2.0, 4.0, 1.0, 6.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.482421875, -0.4685478210449219, -0.45467376708984375, -0.4407997131347656, -0.4269256591796875, -0.4130516052246094, -0.39917755126953125, -0.3853034973144531, -0.371429443359375, -0.3575553894042969, -0.34368133544921875, -0.3298072814941406, -0.3159332275390625, -0.3020591735839844, -0.28818511962890625, -0.2743110656738281, -0.26043701171875, -0.24656295776367188, -0.23268890380859375, -0.21881484985351562, -0.2049407958984375, -0.19106674194335938, -0.17719268798828125, -0.16331863403320312, -0.149444580078125, -0.13557052612304688, -0.12169647216796875, -0.10782241821289062, -0.0939483642578125, -0.08007431030273438, -0.06620025634765625, -0.052326202392578125, -0.0384521484375, -0.024578094482421875, -0.01070404052734375, 0.003170013427734375, 0.0170440673828125, 0.030918121337890625, 0.04479217529296875, 0.058666229248046875, 0.072540283203125, 0.08641433715820312, 0.10028839111328125, 0.11416244506835938, 0.1280364990234375, 0.14191055297851562, 0.15578460693359375, 0.16965866088867188, 0.18353271484375, 0.19740676879882812, 0.21128082275390625, 0.22515487670898438, 0.2390289306640625, 0.2529029846191406, 0.26677703857421875, 0.2806510925292969, 0.294525146484375, 0.3083992004394531, 0.32227325439453125, 0.3361473083496094, 0.3500213623046875, 0.3638954162597656, 0.37776947021484375, 0.3916435241699219, 0.405517578125]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 6.0, 3.0, 1.0, 7.0, 6.0, 5.0, 10.0, 15.0, 22.0, 26.0, 28.0, 51.0, 59.0, 93.0, 143.0, 247.0, 391.0, 732.0, 1648.0, 4386.0, 14716.0, 75983.0, 328654.0, 75014.0, 14282.0, 4286.0, 1618.0, 765.0, 395.0, 227.0, 145.0, 74.0, 55.0, 44.0, 31.0, 24.0, 14.0, 11.0, 7.0, 12.0, 8.0, 8.0, 2.0, 4.0, 2.0, 4.0, 3.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-12.84375, -12.4359130859375, -12.028076171875, -11.6202392578125, -11.21240234375, -10.8045654296875, -10.396728515625, -9.9888916015625, -9.5810546875, -9.1732177734375, -8.765380859375, -8.3575439453125, -7.94970703125, -7.5418701171875, -7.134033203125, -6.7261962890625, -6.318359375, -5.9105224609375, -5.502685546875, -5.0948486328125, -4.68701171875, -4.2791748046875, -3.871337890625, -3.4635009765625, -3.0556640625, -2.6478271484375, -2.239990234375, -1.8321533203125, -1.42431640625, -1.0164794921875, -0.608642578125, -0.2008056640625, 0.20703125, 0.6148681640625, 1.022705078125, 1.4305419921875, 1.83837890625, 2.2462158203125, 2.654052734375, 3.0618896484375, 3.4697265625, 3.8775634765625, 4.285400390625, 4.6932373046875, 5.10107421875, 5.5089111328125, 5.916748046875, 6.3245849609375, 6.732421875, 7.1402587890625, 7.548095703125, 7.9559326171875, 8.36376953125, 8.7716064453125, 9.179443359375, 9.5872802734375, 9.9951171875, 10.4029541015625, 10.810791015625, 11.2186279296875, 11.62646484375, 12.0343017578125, 12.442138671875, 12.8499755859375, 13.2578125]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 4.0, 3.0, 4.0, 5.0, 3.0, 8.0, 7.0, 8.0, 9.0, 12.0, 13.0, 17.0, 19.0, 13.0, 31.0, 24.0, 40.0, 29.0, 32.0, 25.0, 47.0, 44.0, 45.0, 39.0, 49.0, 47.0, 44.0, 44.0, 50.0, 26.0, 23.0, 31.0, 29.0, 27.0, 23.0, 26.0, 8.0, 14.0, 9.0, 11.0, 14.0, 8.0, 7.0, 5.0, 7.0, 3.0, 2.0, 5.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.611328125, -0.5914077758789062, -0.5714874267578125, -0.5515670776367188, -0.531646728515625, -0.5117263793945312, -0.4918060302734375, -0.47188568115234375, -0.45196533203125, -0.43204498291015625, -0.4121246337890625, -0.39220428466796875, -0.372283935546875, -0.35236358642578125, -0.3324432373046875, -0.31252288818359375, -0.2926025390625, -0.27268218994140625, -0.2527618408203125, -0.23284149169921875, -0.212921142578125, -0.19300079345703125, -0.1730804443359375, -0.15316009521484375, -0.13323974609375, -0.11331939697265625, -0.0933990478515625, -0.07347869873046875, -0.053558349609375, -0.03363800048828125, -0.0137176513671875, 0.00620269775390625, 0.026123046875, 0.04604339599609375, 0.0659637451171875, 0.08588409423828125, 0.105804443359375, 0.12572479248046875, 0.1456451416015625, 0.16556549072265625, 0.18548583984375, 0.20540618896484375, 0.2253265380859375, 0.24524688720703125, 0.265167236328125, 0.28508758544921875, 0.3050079345703125, 0.32492828369140625, 0.3448486328125, 0.36476898193359375, 0.3846893310546875, 0.40460968017578125, 0.424530029296875, 0.44445037841796875, 0.4643707275390625, 0.48429107666015625, 0.50421142578125, 0.5241317749023438, 0.5440521240234375, 0.5639724731445312, 0.583892822265625, 0.6038131713867188, 0.6237335205078125, 0.6436538696289062, 0.66357421875]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 1.0, 7.0, 1.0, 1.0, 8.0, 3.0, 6.0, 9.0, 6.0, 9.0, 12.0, 20.0, 22.0, 50.0, 57.0, 66.0, 44.0, 41.0, 32.0, 19.0, 18.0, 18.0, 5.0, 10.0, 6.0, 5.0, 6.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.864600658416748, -2.7792210578918457, -2.6938412189483643, -2.608461618423462, -2.5230817794799805, -2.437702178955078, -2.3523223400115967, -2.2669427394866943, -2.181562900543213, -2.0961833000183105, -2.010803461074829, -1.9254237413406372, -1.8400440216064453, -1.7546643018722534, -1.6692845821380615, -1.5839049816131592, -1.4985252618789673, -1.4131455421447754, -1.3277658224105835, -1.2423861026763916, -1.1570063829421997, -1.0716266632080078, -0.9862470030784607, -0.9008672833442688, -0.8154875636100769, -0.730107843875885, -0.6447281241416931, -0.559348464012146, -0.4739687144756317, -0.3885889947414398, -0.3032093048095703, -0.21782958507537842, -0.13244986534118652, -0.047070153057575226, 0.03830955922603607, 0.12368926405906677, 0.20906898379325867, 0.29444870352745056, 0.37982839345932007, 0.46520811319351196, 0.5505878329277039, 0.6359675526618958, 0.7213472723960876, 0.8067269325256348, 0.8921066522598267, 0.9774863719940186, 1.0628660917282104, 1.1482458114624023, 1.2336255311965942, 1.3190052509307861, 1.404384970664978, 1.48976469039917, 1.5751444101333618, 1.6605241298675537, 1.745903730392456, 1.8312835693359375, 1.9166631698608398, 2.002042770385742, 2.0874226093292236, 2.172802209854126, 2.2581820487976074, 2.3435616493225098, 2.428941488265991, 2.5143210887908936, 2.599700927734375]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 4.0, 2.0, 5.0, 4.0, 7.0, 8.0, 9.0, 12.0, 7.0, 19.0, 41.0, 86.0, 116.0, 48.0, 22.0, 16.0, 10.0, 10.0, 11.0, 7.0, 8.0, 8.0, 5.0, 4.0, 2.0, 0.0, 4.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.0783915519714355, -3.952740430831909, -3.8270890712738037, -3.7014379501342773, -3.575786590576172, -3.4501354694366455, -3.324484348297119, -3.1988329887390137, -3.0731818675994873, -2.947530746459961, -2.8218793869018555, -2.696228265762329, -2.5705771446228027, -2.4449257850646973, -2.319274663925171, -2.1936235427856445, -2.067972183227539, -1.9423209428787231, -1.8166697025299072, -1.6910185813903809, -1.565367341041565, -1.439716100692749, -1.3140649795532227, -1.1884137392044067, -1.0627624988555908, -0.9371112585067749, -0.8114600777626038, -0.6858088970184326, -0.5601576566696167, -0.4345064163208008, -0.30885523557662964, -0.1832040548324585, -0.05755281448364258, 0.06809839606285095, 0.19374960660934448, 0.319400817155838, 0.44505202770233154, 0.5707032680511475, 0.6963544487953186, 0.8220056295394897, 0.9476568698883057, 1.0733081102371216, 1.1989593505859375, 1.3246104717254639, 1.4502617120742798, 1.5759129524230957, 1.701564073562622, 1.827215313911438, 1.952866554260254, 2.0785176753997803, 2.2041690349578857, 2.329820156097412, 2.4554715156555176, 2.581122636795044, 2.7067737579345703, 2.832425117492676, 2.958076238632202, 3.0837273597717285, 3.209378719329834, 3.3350298404693604, 3.4606809616088867, 3.586332321166992, 3.7119834423065186, 3.837634563446045, 3.9632859230041504]}, "eval/loss": 1.776824951171875, "eval/bleu": 1.3741745601573323e-19, "eval/runtime": 2494.6636, "eval/samples_per_second": 5.917, "eval/steps_per_second": 0.74, "train/train_runtime": 68108.5497, "train/train_samples_per_second": 9.134, "train/train_steps_per_second": 0.071, "train/total_flos": 0.0, "train/train_loss": 2.012981654225308} \ No newline at end of file