diff --git "a/wandb/run-20220326_171130-bdf5nvyg/files/wandb-summary.json" "b/wandb/run-20220326_171130-bdf5nvyg/files/wandb-summary.json" --- "a/wandb/run-20220326_171130-bdf5nvyg/files/wandb-summary.json" +++ "b/wandb/run-20220326_171130-bdf5nvyg/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 0.0291, "train/learning_rate": 4.057803468208092e-05, "train/epoch": 8.97, "train/global_step": 2000, "_runtime": 46587, "_timestamp": 1648361277, "_step": 2003, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 7.0, 14.0, 11.0, 33.0, 45.0, 70.0, 106.0, 123.0, 134.0, 135.0, 98.0, 86.0, 46.0, 33.0, 18.0, 19.0, 8.0, 10.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3876301646232605, -0.3632458448410034, -0.33886149525642395, -0.3144771456718445, -0.2900928258895874, -0.2657085061073303, -0.24132415652275085, -0.21693982183933258, -0.1925554871559143, -0.16817115247249603, -0.14378681778907776, -0.11940248310565948, -0.09501814842224121, -0.07063381373882294, -0.04624947905540466, -0.02186514437198639, 0.0025191903114318848, 0.02690352499485016, 0.05128785967826843, 0.0756721943616867, 0.10005652904510498, 0.12444086372852325, 0.14882519841194153, 0.1732095330953598, 0.19759386777877808, 0.22197820246219635, 0.24636253714561462, 0.2707468867301941, 0.29513120651245117, 0.31951552629470825, 0.3438998758792877, 0.3682842254638672, 0.3926684856414795, 0.4170528054237366, 0.44143715500831604, 0.4658215045928955, 0.4902058243751526, 0.5145901441574097, 0.5389745235443115, 0.5633588433265686, 0.5877431631088257, 0.6121274828910828, 0.6365118026733398, 0.6608961820602417, 0.6852805018424988, 0.7096648216247559, 0.7340492010116577, 0.7584335207939148, 0.7828178405761719, 0.807202160358429, 0.831586480140686, 0.8559708595275879, 0.880355179309845, 0.904739499092102, 0.9291238784790039, 0.953508198261261, 0.9778925180435181, 1.00227689743042, 1.0266611576080322, 1.051045536994934, 1.075429916381836, 1.0998141765594482, 1.12419855594635, 1.1485828161239624, 1.1729671955108643]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 5.0, 7.0, 8.0, 15.0, 13.0, 17.0, 19.0, 17.0, 19.0, 32.0, 23.0, 32.0, 36.0, 37.0, 37.0, 51.0, 43.0, 49.0, 52.0, 40.0, 53.0, 31.0, 39.0, 33.0, 36.0, 29.0, 31.0, 33.0, 31.0, 29.0, 16.0, 15.0, 10.0, 17.0, 11.0, 8.0, 6.0, 8.0, 5.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.4541098475456238, -0.44089969992637634, -0.4276895523071289, -0.41447940468788147, -0.40126925706863403, -0.3880591094493866, -0.37484896183013916, -0.36163878440856934, -0.3484286665916443, -0.33521851897239685, -0.3220083713531494, -0.308798223733902, -0.29558807611465454, -0.2823779284954071, -0.26916778087615967, -0.25595760345458984, -0.2427474558353424, -0.22953730821609497, -0.21632716059684753, -0.2031170129776001, -0.18990686535835266, -0.17669671773910522, -0.1634865552186966, -0.15027640759944916, -0.13706625998020172, -0.12385611236095428, -0.11064596474170685, -0.09743580967187881, -0.08422566205263138, -0.07101551443338394, -0.05780535936355591, -0.04459521174430847, -0.031385064125061035, -0.01817491464316845, -0.004964765161275864, 0.008245386183261871, 0.021455533802509308, 0.034665681421756744, 0.04787583649158478, 0.061085984110832214, 0.07429613173007965, 0.08750627934932709, 0.10071642696857452, 0.11392658203840256, 0.1271367371082306, 0.14034688472747803, 0.15355703234672546, 0.1667671799659729, 0.17997732758522034, 0.19318747520446777, 0.2063976228237152, 0.21960777044296265, 0.23281791806221008, 0.24602806568145752, 0.25923824310302734, 0.2724483609199524, 0.2856585383415222, 0.29886868596076965, 0.3120788335800171, 0.3252889811992645, 0.33849912881851196, 0.3517092764377594, 0.36491942405700684, 0.37812960147857666, 0.3913397192955017]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 7.0, 9.0, 12.0, 19.0, 18.0, 34.0, 36.0, 61.0, 69.0, 119.0, 153.0, 214.0, 249.0, 430.0, 626.0, 943.0, 1458.0, 2439.0, 4160.0, 7758.0, 16710.0, 45290.0, 206331.0, 957434.0, 2092176.0, 665047.0, 132936.0, 32029.0, 12397.0, 6044.0, 3306.0, 2009.0, 1175.0, 787.0, 546.0, 341.0, 262.0, 174.0, 126.0, 89.0, 61.0, 54.0, 42.0, 31.0, 17.0, 15.0, 12.0, 11.0, 8.0, 5.0, 4.0, 4.0, 0.0, 1.0, 3.0], "bins": [-0.98974609375, -0.9600753784179688, -0.9304046630859375, -0.9007339477539062, -0.871063232421875, -0.8413925170898438, -0.8117218017578125, -0.7820510864257812, -0.75238037109375, -0.7227096557617188, -0.6930389404296875, -0.6633682250976562, -0.633697509765625, -0.6040267944335938, -0.5743560791015625, -0.5446853637695312, -0.5150146484375, -0.48534393310546875, -0.4556732177734375, -0.42600250244140625, -0.396331787109375, -0.36666107177734375, -0.3369903564453125, -0.30731964111328125, -0.27764892578125, -0.24797821044921875, -0.2183074951171875, -0.18863677978515625, -0.158966064453125, -0.12929534912109375, -0.0996246337890625, -0.06995391845703125, -0.040283203125, -0.01061248779296875, 0.0190582275390625, 0.04872894287109375, 0.078399658203125, 0.10807037353515625, 0.1377410888671875, 0.16741180419921875, 0.19708251953125, 0.22675323486328125, 0.2564239501953125, 0.28609466552734375, 0.315765380859375, 0.34543609619140625, 0.3751068115234375, 0.40477752685546875, 0.4344482421875, 0.46411895751953125, 0.4937896728515625, 0.5234603881835938, 0.553131103515625, 0.5828018188476562, 0.6124725341796875, 0.6421432495117188, 0.67181396484375, 0.7014846801757812, 0.7311553955078125, 0.7608261108398438, 0.790496826171875, 0.8201675415039062, 0.8498382568359375, 0.8795089721679688, 0.9091796875]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 8.0, 10.0, 10.0, 9.0, 23.0, 13.0, 11.0, 20.0, 27.0, 32.0, 29.0, 45.0, 39.0, 45.0, 43.0, 50.0, 43.0, 48.0, 65.0, 47.0, 40.0, 42.0, 40.0, 44.0, 31.0, 28.0, 29.0, 20.0, 19.0, 27.0, 13.0, 9.0, 18.0, 8.0, 9.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.8369140625, -0.8115768432617188, -0.7862396240234375, -0.7609024047851562, -0.735565185546875, -0.7102279663085938, -0.6848907470703125, -0.6595535278320312, -0.63421630859375, -0.6088790893554688, -0.5835418701171875, -0.5582046508789062, -0.532867431640625, -0.5075302124023438, -0.4821929931640625, -0.45685577392578125, -0.4315185546875, -0.40618133544921875, -0.3808441162109375, -0.35550689697265625, -0.330169677734375, -0.30483245849609375, -0.2794952392578125, -0.25415802001953125, -0.22882080078125, -0.20348358154296875, -0.1781463623046875, -0.15280914306640625, -0.127471923828125, -0.10213470458984375, -0.0767974853515625, -0.05146026611328125, -0.026123046875, -0.00078582763671875, 0.0245513916015625, 0.04988861083984375, 0.075225830078125, 0.10056304931640625, 0.1259002685546875, 0.15123748779296875, 0.17657470703125, 0.20191192626953125, 0.2272491455078125, 0.25258636474609375, 0.277923583984375, 0.30326080322265625, 0.3285980224609375, 0.35393524169921875, 0.3792724609375, 0.40460968017578125, 0.4299468994140625, 0.45528411865234375, 0.480621337890625, 0.5059585571289062, 0.5312957763671875, 0.5566329956054688, 0.58197021484375, 0.6073074340820312, 0.6326446533203125, 0.6579818725585938, 0.683319091796875, 0.7086563110351562, 0.7339935302734375, 0.7593307495117188, 0.78466796875]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 6.0, 10.0, 17.0, 25.0, 71.0, 172.0, 735.0, 95342.0, 4096145.0, 1327.0, 263.0, 87.0, 48.0, 11.0, 9.0, 3.0, 6.0, 4.0, 1.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.9296875, -10.4566650390625, -9.983642578125, -9.5106201171875, -9.03759765625, -8.5645751953125, -8.091552734375, -7.6185302734375, -7.1455078125, -6.6724853515625, -6.199462890625, -5.7264404296875, -5.25341796875, -4.7803955078125, -4.307373046875, -3.8343505859375, -3.361328125, -2.8883056640625, -2.415283203125, -1.9422607421875, -1.46923828125, -0.9962158203125, -0.523193359375, -0.0501708984375, 0.4228515625, 0.8958740234375, 1.368896484375, 1.8419189453125, 2.31494140625, 2.7879638671875, 3.260986328125, 3.7340087890625, 4.20703125, 4.6800537109375, 5.153076171875, 5.6260986328125, 6.09912109375, 6.5721435546875, 7.045166015625, 7.5181884765625, 7.9912109375, 8.4642333984375, 8.937255859375, 9.4102783203125, 9.88330078125, 10.3563232421875, 10.829345703125, 11.3023681640625, 11.775390625, 12.2484130859375, 12.721435546875, 13.1944580078125, 13.66748046875, 14.1405029296875, 14.613525390625, 15.0865478515625, 15.5595703125, 16.0325927734375, 16.505615234375, 16.9786376953125, 17.45166015625, 17.9246826171875, 18.397705078125, 18.8707275390625, 19.34375]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 3.0, 17.0, 34.0, 66.0, 108.0, 297.0, 1234.0, 1618.0, 393.0, 162.0, 73.0, 34.0, 17.0, 6.0, 5.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.642578125, -0.614776611328125, -0.58697509765625, -0.559173583984375, -0.5313720703125, -0.503570556640625, -0.47576904296875, -0.447967529296875, -0.420166015625, -0.392364501953125, -0.36456298828125, -0.336761474609375, -0.3089599609375, -0.281158447265625, -0.25335693359375, -0.225555419921875, -0.19775390625, -0.169952392578125, -0.14215087890625, -0.114349365234375, -0.0865478515625, -0.058746337890625, -0.03094482421875, -0.003143310546875, 0.024658203125, 0.052459716796875, 0.08026123046875, 0.108062744140625, 0.1358642578125, 0.163665771484375, 0.19146728515625, 0.219268798828125, 0.2470703125, 0.274871826171875, 0.30267333984375, 0.330474853515625, 0.3582763671875, 0.386077880859375, 0.41387939453125, 0.441680908203125, 0.469482421875, 0.497283935546875, 0.52508544921875, 0.552886962890625, 0.5806884765625, 0.608489990234375, 0.63629150390625, 0.664093017578125, 0.69189453125, 0.719696044921875, 0.74749755859375, 0.775299072265625, 0.8031005859375, 0.830902099609375, 0.85870361328125, 0.886505126953125, 0.914306640625, 0.942108154296875, 0.96990966796875, 0.997711181640625, 1.0255126953125, 1.053314208984375, 1.08111572265625, 1.108917236328125, 1.13671875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 1.0, 2.0, 1.0, 4.0, 5.0, 8.0, 6.0, 7.0, 8.0, 7.0, 16.0, 26.0, 32.0, 27.0, 36.0, 41.0, 44.0, 54.0, 64.0, 58.0, 79.0, 71.0, 63.0, 50.0, 46.0, 49.0, 38.0, 27.0, 22.0, 21.0, 23.0, 18.0, 7.0, 8.0, 6.0, 12.0, 3.0, 6.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.8187122941017151, -0.7897897958755493, -0.7608672380447388, -0.731944739818573, -0.7030221819877625, -0.6740996837615967, -0.6451771259307861, -0.6162546277046204, -0.5873321294784546, -0.5584096312522888, -0.5294870734214783, -0.5005645751953125, -0.47164201736450195, -0.4427195191383362, -0.413796991109848, -0.38487446308135986, -0.3559519052505493, -0.32702937722206116, -0.298106849193573, -0.2691843509674072, -0.24026180803775787, -0.21133928000926971, -0.18241676688194275, -0.1534942388534546, -0.12457171082496643, -0.09564918279647827, -0.06672666221857071, -0.03780414164066315, -0.008881613612174988, 0.02004091441631317, 0.04896342754364014, 0.0778859555721283, 0.10680842399597168, 0.13573095202445984, 0.164653480052948, 0.19357599318027496, 0.22249852120876312, 0.2514210343360901, 0.28034356236457825, 0.3092660903930664, 0.33818861842155457, 0.3671111464500427, 0.3960336744785309, 0.42495620250701904, 0.4538787007331848, 0.48280125856399536, 0.5117237567901611, 0.5406463146209717, 0.5695688128471375, 0.5984913110733032, 0.6274138689041138, 0.6563363671302795, 0.6852589249610901, 0.7141814231872559, 0.7431039810180664, 0.7720264792442322, 0.800948977470398, 0.8298714756965637, 0.8587940335273743, 0.88771653175354, 0.9166390895843506, 0.9455615878105164, 0.9744840860366821, 1.0034066438674927, 1.0323292016983032]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 2.0, 2.0, 3.0, 5.0, 2.0, 4.0, 6.0, 16.0, 8.0, 12.0, 16.0, 12.0, 28.0, 21.0, 23.0, 29.0, 39.0, 29.0, 32.0, 46.0, 34.0, 38.0, 27.0, 41.0, 40.0, 34.0, 38.0, 44.0, 27.0, 33.0, 31.0, 40.0, 29.0, 30.0, 29.0, 12.0, 22.0, 20.0, 11.0, 12.0, 19.0, 11.0, 6.0, 7.0, 7.0, 6.0, 2.0, 8.0, 5.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.6735132336616516, -0.6536933183670044, -0.633873462677002, -0.6140535473823547, -0.5942336320877075, -0.5744137167930603, -0.5545938014984131, -0.5347739458084106, -0.5149540305137634, -0.4951341152191162, -0.4753142297267914, -0.45549434423446655, -0.43567442893981934, -0.4158545136451721, -0.3960346281528473, -0.37621474266052246, -0.35639482736587524, -0.336574912071228, -0.3167550265789032, -0.29693514108657837, -0.27711522579193115, -0.25729531049728394, -0.2374754250049591, -0.21765552461147308, -0.19783562421798706, -0.17801572382450104, -0.15819582343101501, -0.138375923037529, -0.11855602264404297, -0.09873612225055695, -0.07891622185707092, -0.0590963214635849, -0.0392763614654541, -0.01945646107196808, 0.00036343932151794434, 0.020183339715003967, 0.04000324010848999, 0.05982314050197601, 0.07964304089546204, 0.09946294128894806, 0.11928284168243408, 0.1391027420759201, 0.15892264246940613, 0.17874254286289215, 0.19856244325637817, 0.2183823436498642, 0.23820224404335022, 0.25802212953567505, 0.27784204483032227, 0.2976619601249695, 0.3174818456172943, 0.33730173110961914, 0.35712164640426636, 0.3769415616989136, 0.3967614471912384, 0.41658133268356323, 0.43640124797821045, 0.45622116327285767, 0.4760410487651825, 0.4958609342575073, 0.5156808495521545, 0.5355007648468018, 0.5553206205368042, 0.5751405358314514, 0.5949604511260986]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 11.0, 9.0, 18.0, 18.0, 21.0, 48.0, 78.0, 91.0, 194.0, 284.0, 467.0, 793.0, 1384.0, 2380.0, 4272.0, 7801.0, 14299.0, 26719.0, 50692.0, 98325.0, 184878.0, 267765.0, 182278.0, 97247.0, 50489.0, 26184.0, 14172.0, 7768.0, 4223.0, 2396.0, 1282.0, 812.0, 472.0, 253.0, 149.0, 98.0, 73.0, 35.0, 29.0, 24.0, 19.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.36865234375, -0.3582649230957031, -0.34787750244140625, -0.3374900817871094, -0.3271026611328125, -0.3167152404785156, -0.30632781982421875, -0.2959403991699219, -0.285552978515625, -0.2751655578613281, -0.26477813720703125, -0.2543907165527344, -0.2440032958984375, -0.23361587524414062, -0.22322845458984375, -0.21284103393554688, -0.20245361328125, -0.19206619262695312, -0.18167877197265625, -0.17129135131835938, -0.1609039306640625, -0.15051651000976562, -0.14012908935546875, -0.12974166870117188, -0.119354248046875, -0.10896682739257812, -0.09857940673828125, -0.08819198608398438, -0.0778045654296875, -0.06741714477539062, -0.05702972412109375, -0.046642303466796875, -0.0362548828125, -0.025867462158203125, -0.01548004150390625, -0.005092620849609375, 0.0052947998046875, 0.015682220458984375, 0.02606964111328125, 0.036457061767578125, 0.046844482421875, 0.057231903076171875, 0.06761932373046875, 0.07800674438476562, 0.0883941650390625, 0.09878158569335938, 0.10916900634765625, 0.11955642700195312, 0.12994384765625, 0.14033126831054688, 0.15071868896484375, 0.16110610961914062, 0.1714935302734375, 0.18188095092773438, 0.19226837158203125, 0.20265579223632812, 0.213043212890625, 0.22343063354492188, 0.23381805419921875, 0.24420547485351562, 0.2545928955078125, 0.2649803161621094, 0.27536773681640625, 0.2857551574707031, 0.296142578125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 5.0, 1.0, 0.0, 3.0, 4.0, 3.0, 4.0, 4.0, 7.0, 11.0, 6.0, 16.0, 16.0, 15.0, 23.0, 25.0, 21.0, 20.0, 30.0, 39.0, 33.0, 46.0, 50.0, 40.0, 43.0, 43.0, 37.0, 31.0, 31.0, 50.0, 53.0, 34.0, 28.0, 33.0, 29.0, 26.0, 29.0, 20.0, 18.0, 12.0, 12.0, 9.0, 5.0, 13.0, 8.0, 4.0, 7.0, 7.0, 5.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.400390625, -0.3867301940917969, -0.37306976318359375, -0.3594093322753906, -0.3457489013671875, -0.3320884704589844, -0.31842803955078125, -0.3047676086425781, -0.291107177734375, -0.2774467468261719, -0.26378631591796875, -0.2501258850097656, -0.2364654541015625, -0.22280502319335938, -0.20914459228515625, -0.19548416137695312, -0.18182373046875, -0.16816329956054688, -0.15450286865234375, -0.14084243774414062, -0.1271820068359375, -0.11352157592773438, -0.09986114501953125, -0.08620071411132812, -0.072540283203125, -0.058879852294921875, -0.04521942138671875, -0.031558990478515625, -0.0178985595703125, -0.004238128662109375, 0.00942230224609375, 0.023082733154296875, 0.0367431640625, 0.050403594970703125, 0.06406402587890625, 0.07772445678710938, 0.0913848876953125, 0.10504531860351562, 0.11870574951171875, 0.13236618041992188, 0.146026611328125, 0.15968704223632812, 0.17334747314453125, 0.18700790405273438, 0.2006683349609375, 0.21432876586914062, 0.22798919677734375, 0.24164962768554688, 0.25531005859375, 0.2689704895019531, 0.28263092041015625, 0.2962913513183594, 0.3099517822265625, 0.3236122131347656, 0.33727264404296875, 0.3509330749511719, 0.364593505859375, 0.3782539367675781, 0.39191436767578125, 0.4055747985839844, 0.4192352294921875, 0.4328956604003906, 0.44655609130859375, 0.4602165222167969, 0.473876953125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 7.0, 8.0, 6.0, 7.0, 23.0, 27.0, 31.0, 42.0, 58.0, 109.0, 180.0, 252.0, 394.0, 761.0, 1186.0, 2217.0, 3883.0, 7908.0, 16756.0, 40037.0, 102536.0, 256795.0, 344224.0, 160451.0, 61950.0, 25293.0, 11210.0, 5383.0, 2817.0, 1584.0, 924.0, 528.0, 335.0, 207.0, 135.0, 90.0, 55.0, 40.0, 41.0, 16.0, 17.0, 13.0, 8.0, 7.0, 6.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.37744140625, -0.3657341003417969, -0.35402679443359375, -0.3423194885253906, -0.3306121826171875, -0.3189048767089844, -0.30719757080078125, -0.2954902648925781, -0.283782958984375, -0.2720756530761719, -0.26036834716796875, -0.24866104125976562, -0.2369537353515625, -0.22524642944335938, -0.21353912353515625, -0.20183181762695312, -0.19012451171875, -0.17841720581054688, -0.16670989990234375, -0.15500259399414062, -0.1432952880859375, -0.13158798217773438, -0.11988067626953125, -0.10817337036132812, -0.096466064453125, -0.08475875854492188, -0.07305145263671875, -0.061344146728515625, -0.0496368408203125, -0.037929534912109375, -0.02622222900390625, -0.014514923095703125, -0.0028076171875, 0.008899688720703125, 0.02060699462890625, 0.032314300537109375, 0.0440216064453125, 0.055728912353515625, 0.06743621826171875, 0.07914352416992188, 0.090850830078125, 0.10255813598632812, 0.11426544189453125, 0.12597274780273438, 0.1376800537109375, 0.14938735961914062, 0.16109466552734375, 0.17280197143554688, 0.18450927734375, 0.19621658325195312, 0.20792388916015625, 0.21963119506835938, 0.2313385009765625, 0.24304580688476562, 0.25475311279296875, 0.2664604187011719, 0.278167724609375, 0.2898750305175781, 0.30158233642578125, 0.3132896423339844, 0.3249969482421875, 0.3367042541503906, 0.34841156005859375, 0.3601188659667969, 0.371826171875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 4.0, 1.0, 1.0, 6.0, 2.0, 3.0, 10.0, 9.0, 6.0, 10.0, 15.0, 13.0, 23.0, 15.0, 31.0, 31.0, 23.0, 40.0, 38.0, 31.0, 46.0, 46.0, 52.0, 46.0, 48.0, 54.0, 50.0, 42.0, 35.0, 36.0, 31.0, 18.0, 35.0, 25.0, 24.0, 18.0, 18.0, 16.0, 11.0, 9.0, 6.0, 7.0, 4.0, 3.0, 4.0, 3.0, 4.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.88330078125, -0.8537826538085938, -0.8242645263671875, -0.7947463989257812, -0.765228271484375, -0.7357101440429688, -0.7061920166015625, -0.6766738891601562, -0.64715576171875, -0.6176376342773438, -0.5881195068359375, -0.5586013793945312, -0.529083251953125, -0.49956512451171875, -0.4700469970703125, -0.44052886962890625, -0.4110107421875, -0.38149261474609375, -0.3519744873046875, -0.32245635986328125, -0.292938232421875, -0.26342010498046875, -0.2339019775390625, -0.20438385009765625, -0.17486572265625, -0.14534759521484375, -0.1158294677734375, -0.08631134033203125, -0.056793212890625, -0.02727508544921875, 0.0022430419921875, 0.03176116943359375, 0.061279296875, 0.09079742431640625, 0.1203155517578125, 0.14983367919921875, 0.179351806640625, 0.20886993408203125, 0.2383880615234375, 0.26790618896484375, 0.29742431640625, 0.32694244384765625, 0.3564605712890625, 0.38597869873046875, 0.415496826171875, 0.44501495361328125, 0.4745330810546875, 0.5040512084960938, 0.5335693359375, 0.5630874633789062, 0.5926055908203125, 0.6221237182617188, 0.651641845703125, 0.6811599731445312, 0.7106781005859375, 0.7401962280273438, 0.76971435546875, 0.7992324829101562, 0.8287506103515625, 0.8582687377929688, 0.887786865234375, 0.9173049926757812, 0.9468231201171875, 0.9763412475585938, 1.005859375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 10.0, 10.0, 19.0, 25.0, 31.0, 60.0, 76.0, 129.0, 209.0, 376.0, 590.0, 996.0, 1827.0, 3486.0, 6530.0, 14318.0, 34102.0, 93546.0, 327155.0, 381779.0, 112086.0, 39016.0, 16064.0, 7600.0, 3795.0, 1938.0, 1115.0, 661.0, 352.0, 250.0, 147.0, 105.0, 55.0, 31.0, 27.0, 13.0, 10.0, 6.0, 5.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0924072265625, -0.08933448791503906, -0.08626174926757812, -0.08318901062011719, -0.08011627197265625, -0.07704353332519531, -0.07397079467773438, -0.07089805603027344, -0.0678253173828125, -0.06475257873535156, -0.061679840087890625, -0.05860710144042969, -0.05553436279296875, -0.05246162414550781, -0.049388885498046875, -0.04631614685058594, -0.043243408203125, -0.04017066955566406, -0.037097930908203125, -0.03402519226074219, -0.03095245361328125, -0.027879714965820312, -0.024806976318359375, -0.021734237670898438, -0.0186614990234375, -0.015588760375976562, -0.012516021728515625, -0.009443283081054688, -0.00637054443359375, -0.0032978057861328125, -0.000225067138671875, 0.0028476715087890625, 0.00592041015625, 0.008993148803710938, 0.012065887451171875, 0.015138626098632812, 0.01821136474609375, 0.021284103393554688, 0.024356842041015625, 0.027429580688476562, 0.0305023193359375, 0.03357505798339844, 0.036647796630859375, 0.03972053527832031, 0.04279327392578125, 0.04586601257324219, 0.048938751220703125, 0.05201148986816406, 0.055084228515625, 0.05815696716308594, 0.061229705810546875, 0.06430244445800781, 0.06737518310546875, 0.07044792175292969, 0.07352066040039062, 0.07659339904785156, 0.0796661376953125, 0.08273887634277344, 0.08581161499023438, 0.08888435363769531, 0.09195709228515625, 0.09502983093261719, 0.09810256958007812, 0.10117530822753906, 0.104248046875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 8.0, 4.0, 4.0, 10.0, 21.0, 22.0, 20.0, 37.0, 63.0, 79.0, 151.0, 149.0, 147.0, 94.0, 69.0, 43.0, 21.0, 15.0, 13.0, 11.0, 7.0, 3.0, 2.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000133514404296875, -0.0001292973756790161, -0.00012508034706115723, -0.00012086331844329834, -0.00011664628982543945, -0.00011242926120758057, -0.00010821223258972168, -0.00010399520397186279, -9.97781753540039e-05, -9.556114673614502e-05, -9.134411811828613e-05, -8.712708950042725e-05, -8.291006088256836e-05, -7.869303226470947e-05, -7.447600364685059e-05, -7.02589750289917e-05, -6.604194641113281e-05, -6.182491779327393e-05, -5.760788917541504e-05, -5.339086055755615e-05, -4.9173831939697266e-05, -4.495680332183838e-05, -4.073977470397949e-05, -3.6522746086120605e-05, -3.230571746826172e-05, -2.8088688850402832e-05, -2.3871660232543945e-05, -1.965463161468506e-05, -1.5437602996826172e-05, -1.1220574378967285e-05, -7.0035457611083984e-06, -2.7865171432495117e-06, 1.430511474609375e-06, 5.647540092468262e-06, 9.864568710327148e-06, 1.4081597328186035e-05, 1.8298625946044922e-05, 2.251565456390381e-05, 2.6732683181762695e-05, 3.094971179962158e-05, 3.516674041748047e-05, 3.9383769035339355e-05, 4.360079765319824e-05, 4.781782627105713e-05, 5.2034854888916016e-05, 5.62518835067749e-05, 6.046891212463379e-05, 6.468594074249268e-05, 6.890296936035156e-05, 7.311999797821045e-05, 7.733702659606934e-05, 8.155405521392822e-05, 8.577108383178711e-05, 8.9988112449646e-05, 9.420514106750488e-05, 9.842216968536377e-05, 0.00010263919830322266, 0.00010685622692108154, 0.00011107325553894043, 0.00011529028415679932, 0.0001195073127746582, 0.0001237243413925171, 0.00012794137001037598, 0.00013215839862823486, 0.00013637542724609375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 0.0, 5.0, 4.0, 3.0, 5.0, 8.0, 10.0, 7.0, 13.0, 27.0, 30.0, 56.0, 92.0, 155.0, 261.0, 708.0, 1847.0, 5382.0, 19756.0, 106952.0, 607182.0, 253731.0, 38411.0, 9144.0, 2840.0, 980.0, 420.0, 197.0, 125.0, 67.0, 30.0, 32.0, 21.0, 11.0, 12.0, 10.0, 9.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 0.0, 1.0], "bins": [-0.1925048828125, -0.18711471557617188, -0.18172454833984375, -0.17633438110351562, -0.1709442138671875, -0.16555404663085938, -0.16016387939453125, -0.15477371215820312, -0.149383544921875, -0.14399337768554688, -0.13860321044921875, -0.13321304321289062, -0.1278228759765625, -0.12243270874023438, -0.11704254150390625, -0.11165237426757812, -0.10626220703125, -0.10087203979492188, -0.09548187255859375, -0.09009170532226562, -0.0847015380859375, -0.07931137084960938, -0.07392120361328125, -0.06853103637695312, -0.063140869140625, -0.057750701904296875, -0.05236053466796875, -0.046970367431640625, -0.0415802001953125, -0.036190032958984375, -0.03079986572265625, -0.025409698486328125, -0.02001953125, -0.014629364013671875, -0.00923919677734375, -0.003849029541015625, 0.0015411376953125, 0.006931304931640625, 0.01232147216796875, 0.017711639404296875, 0.023101806640625, 0.028491973876953125, 0.03388214111328125, 0.039272308349609375, 0.0446624755859375, 0.050052642822265625, 0.05544281005859375, 0.060832977294921875, 0.06622314453125, 0.07161331176757812, 0.07700347900390625, 0.08239364624023438, 0.0877838134765625, 0.09317398071289062, 0.09856414794921875, 0.10395431518554688, 0.109344482421875, 0.11473464965820312, 0.12012481689453125, 0.12551498413085938, 0.1309051513671875, 0.13629531860351562, 0.14168548583984375, 0.14707565307617188, 0.1524658203125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 4.0, 8.0, 8.0, 10.0, 10.0, 9.0, 18.0, 23.0, 30.0, 18.0, 48.0, 38.0, 57.0, 86.0, 53.0, 66.0, 57.0, 72.0, 51.0, 58.0, 49.0, 39.0, 42.0, 30.0, 26.0, 12.0, 17.0, 9.0, 9.0, 9.0, 8.0, 5.0, 4.0, 5.0, 0.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.035308837890625, -0.03430652618408203, -0.03330421447753906, -0.032301902770996094, -0.031299591064453125, -0.030297279357910156, -0.029294967651367188, -0.02829265594482422, -0.02729034423828125, -0.02628803253173828, -0.025285720825195312, -0.024283409118652344, -0.023281097412109375, -0.022278785705566406, -0.021276473999023438, -0.02027416229248047, -0.0192718505859375, -0.01826953887939453, -0.017267227172851562, -0.016264915466308594, -0.015262603759765625, -0.014260292053222656, -0.013257980346679688, -0.012255668640136719, -0.01125335693359375, -0.010251045227050781, -0.009248733520507812, -0.008246421813964844, -0.007244110107421875, -0.006241798400878906, -0.0052394866943359375, -0.004237174987792969, -0.00323486328125, -0.0022325515747070312, -0.0012302398681640625, -0.00022792816162109375, 0.000774383544921875, 0.0017766952514648438, 0.0027790069580078125, 0.0037813186645507812, 0.00478363037109375, 0.005785942077636719, 0.0067882537841796875, 0.007790565490722656, 0.008792877197265625, 0.009795188903808594, 0.010797500610351562, 0.011799812316894531, 0.0128021240234375, 0.013804435729980469, 0.014806747436523438, 0.015809059143066406, 0.016811370849609375, 0.017813682556152344, 0.018815994262695312, 0.01981830596923828, 0.02082061767578125, 0.02182292938232422, 0.022825241088867188, 0.023827552795410156, 0.024829864501953125, 0.025832176208496094, 0.026834487915039062, 0.02783679962158203, 0.028839111328125]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 6.0, 2.0, 3.0, 9.0, 9.0, 9.0, 15.0, 19.0, 15.0, 23.0, 39.0, 49.0, 55.0, 66.0, 79.0, 76.0, 89.0, 77.0, 78.0, 65.0, 52.0, 39.0, 27.0, 33.0, 25.0, 14.0, 11.0, 8.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.5330137014389038, -0.5120462775230408, -0.49107885360717773, -0.4701114296913147, -0.44914403557777405, -0.428176611661911, -0.407209187746048, -0.3862417936325073, -0.3652743697166443, -0.34430694580078125, -0.3233395218849182, -0.3023720979690552, -0.2814047038555145, -0.2604372799396515, -0.23946985602378845, -0.2185024470090866, -0.19753500819206238, -0.17656758427619934, -0.1556001752614975, -0.13463275134563446, -0.11366533488035202, -0.09269791841506958, -0.07173049449920654, -0.0507630854845047, -0.029795661568641663, -0.008828243240714073, 0.012139175087213516, 0.033106595277786255, 0.054074011743068695, 0.07504142820835114, 0.09600885212421417, 0.11697626113891602, 0.13794368505477905, 0.1589111089706421, 0.17987851798534393, 0.20084594190120697, 0.2218133509159088, 0.24278077483177185, 0.2637481987476349, 0.28471559286117554, 0.3056830167770386, 0.3266504406929016, 0.34761786460876465, 0.3685852885246277, 0.38955268263816833, 0.41052010655403137, 0.4314875304698944, 0.45245492458343506, 0.4734223783016205, 0.4943898022174835, 0.5153571963310242, 0.5363246202468872, 0.5572920441627502, 0.5782594680786133, 0.5992268919944763, 0.6201943159103394, 0.6411617398262024, 0.6621291637420654, 0.6830965876579285, 0.7040640115737915, 0.7250314354896545, 0.7459988594055176, 0.7669662237167358, 0.7879336476325989, 0.8089010715484619]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 7.0, 1.0, 5.0, 5.0, 7.0, 10.0, 3.0, 10.0, 18.0, 12.0, 22.0, 25.0, 20.0, 24.0, 24.0, 34.0, 41.0, 39.0, 38.0, 33.0, 43.0, 44.0, 39.0, 38.0, 42.0, 29.0, 44.0, 42.0, 23.0, 32.0, 37.0, 24.0, 25.0, 14.0, 20.0, 20.0, 21.0, 12.0, 13.0, 13.0, 11.0, 8.0, 5.0, 7.0, 10.0, 7.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.38546091318130493, -0.37250885367393494, -0.35955679416656494, -0.34660470485687256, -0.33365264534950256, -0.32070058584213257, -0.3077485263347626, -0.2947964668273926, -0.2818443775177002, -0.2688923180103302, -0.2559402585029602, -0.24298818409442902, -0.23003610968589783, -0.21708405017852783, -0.20413199067115784, -0.19117991626262665, -0.17822785675525665, -0.16527579724788666, -0.15232372283935547, -0.13937166333198547, -0.12641958892345428, -0.11346752941608429, -0.1005154624581337, -0.0875633955001831, -0.07461132854223251, -0.06165926158428192, -0.04870719462633133, -0.035755131393671036, -0.022803064435720444, -0.00985100120306015, 0.003101065754890442, 0.016053132712841034, 0.029005199670791626, 0.04195726662874222, 0.05490933358669281, 0.0678613930940628, 0.080813467502594, 0.09376552700996399, 0.10671759396791458, 0.11966966092586517, 0.13262173533439636, 0.14557379484176636, 0.15852586925029755, 0.17147792875766754, 0.18443000316619873, 0.19738206267356873, 0.21033412218093872, 0.2232861965894699, 0.2362382560968399, 0.2491903156042099, 0.2621423900127411, 0.2750944495201111, 0.2880465090274811, 0.3009985685348511, 0.31395065784454346, 0.32690271735191345, 0.33985477685928345, 0.35280683636665344, 0.36575889587402344, 0.3787109851837158, 0.3916630446910858, 0.4046151041984558, 0.4175671637058258, 0.4305192232131958, 0.4434713125228882]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 5.0, 8.0, 6.0, 9.0, 12.0, 19.0, 31.0, 39.0, 59.0, 85.0, 121.0, 164.0, 244.0, 348.0, 544.0, 821.0, 1278.0, 1938.0, 3096.0, 5196.0, 8964.0, 16004.0, 33828.0, 130666.0, 621688.0, 146927.0, 36342.0, 16575.0, 9069.0, 5333.0, 3272.0, 2012.0, 1250.0, 841.0, 573.0, 375.0, 274.0, 192.0, 110.0, 80.0, 47.0, 40.0, 23.0, 15.0, 16.0, 12.0, 7.0, 1.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2744140625, -0.2651214599609375, -0.255828857421875, -0.2465362548828125, -0.23724365234375, -0.2279510498046875, -0.218658447265625, -0.2093658447265625, -0.2000732421875, -0.1907806396484375, -0.181488037109375, -0.1721954345703125, -0.16290283203125, -0.1536102294921875, -0.144317626953125, -0.1350250244140625, -0.125732421875, -0.1164398193359375, -0.107147216796875, -0.0978546142578125, -0.08856201171875, -0.0792694091796875, -0.069976806640625, -0.0606842041015625, -0.0513916015625, -0.0420989990234375, -0.032806396484375, -0.0235137939453125, -0.01422119140625, -0.0049285888671875, 0.004364013671875, 0.0136566162109375, 0.02294921875, 0.0322418212890625, 0.041534423828125, 0.0508270263671875, 0.06011962890625, 0.0694122314453125, 0.078704833984375, 0.0879974365234375, 0.0972900390625, 0.1065826416015625, 0.115875244140625, 0.1251678466796875, 0.13446044921875, 0.1437530517578125, 0.153045654296875, 0.1623382568359375, 0.171630859375, 0.1809234619140625, 0.190216064453125, 0.1995086669921875, 0.20880126953125, 0.2180938720703125, 0.227386474609375, 0.2366790771484375, 0.2459716796875, 0.2552642822265625, 0.264556884765625, 0.2738494873046875, 0.28314208984375, 0.2924346923828125, 0.301727294921875, 0.3110198974609375, 0.3203125]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 6.0, 3.0, 4.0, 5.0, 5.0, 4.0, 6.0, 7.0, 12.0, 14.0, 11.0, 14.0, 23.0, 19.0, 20.0, 24.0, 32.0, 38.0, 27.0, 30.0, 27.0, 33.0, 36.0, 37.0, 41.0, 39.0, 35.0, 34.0, 41.0, 39.0, 24.0, 27.0, 34.0, 35.0, 21.0, 26.0, 18.0, 17.0, 18.0, 13.0, 21.0, 10.0, 16.0, 7.0, 11.0, 8.0, 9.0, 2.0, 2.0, 4.0, 4.0, 3.0, 7.0, 3.0, 3.0, 2.0, 0.0, 2.0], "bins": [-0.603515625, -0.5846176147460938, -0.5657196044921875, -0.5468215942382812, -0.527923583984375, -0.5090255737304688, -0.4901275634765625, -0.47122955322265625, -0.45233154296875, -0.43343353271484375, -0.4145355224609375, -0.39563751220703125, -0.376739501953125, -0.35784149169921875, -0.3389434814453125, -0.32004547119140625, -0.3011474609375, -0.28224945068359375, -0.2633514404296875, -0.24445343017578125, -0.225555419921875, -0.20665740966796875, -0.1877593994140625, -0.16886138916015625, -0.14996337890625, -0.13106536865234375, -0.1121673583984375, -0.09326934814453125, -0.074371337890625, -0.05547332763671875, -0.0365753173828125, -0.01767730712890625, 0.001220703125, 0.02011871337890625, 0.0390167236328125, 0.05791473388671875, 0.076812744140625, 0.09571075439453125, 0.1146087646484375, 0.13350677490234375, 0.15240478515625, 0.17130279541015625, 0.1902008056640625, 0.20909881591796875, 0.227996826171875, 0.24689483642578125, 0.2657928466796875, 0.28469085693359375, 0.3035888671875, 0.32248687744140625, 0.3413848876953125, 0.36028289794921875, 0.379180908203125, 0.39807891845703125, 0.4169769287109375, 0.43587493896484375, 0.45477294921875, 0.47367095947265625, 0.4925689697265625, 0.5114669799804688, 0.530364990234375, 0.5492630004882812, 0.5681610107421875, 0.5870590209960938, 0.60595703125]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 3.0, 9.0, 2.0, 11.0, 10.0, 19.0, 26.0, 37.0, 56.0, 93.0, 143.0, 235.0, 399.0, 751.0, 1413.0, 3034.0, 7482.0, 23852.0, 223080.0, 730023.0, 39251.0, 10697.0, 4011.0, 1762.0, 910.0, 478.0, 254.0, 185.0, 99.0, 71.0, 43.0, 36.0, 18.0, 20.0, 11.0, 14.0, 9.0, 6.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.673828125, -0.6535110473632812, -0.6331939697265625, -0.6128768920898438, -0.592559814453125, -0.5722427368164062, -0.5519256591796875, -0.5316085815429688, -0.51129150390625, -0.49097442626953125, -0.4706573486328125, -0.45034027099609375, -0.430023193359375, -0.40970611572265625, -0.3893890380859375, -0.36907196044921875, -0.3487548828125, -0.32843780517578125, -0.3081207275390625, -0.28780364990234375, -0.267486572265625, -0.24716949462890625, -0.2268524169921875, -0.20653533935546875, -0.18621826171875, -0.16590118408203125, -0.1455841064453125, -0.12526702880859375, -0.104949951171875, -0.08463287353515625, -0.0643157958984375, -0.04399871826171875, -0.023681640625, -0.00336456298828125, 0.0169525146484375, 0.03726959228515625, 0.057586669921875, 0.07790374755859375, 0.0982208251953125, 0.11853790283203125, 0.13885498046875, 0.15917205810546875, 0.1794891357421875, 0.19980621337890625, 0.220123291015625, 0.24044036865234375, 0.2607574462890625, 0.28107452392578125, 0.3013916015625, 0.32170867919921875, 0.3420257568359375, 0.36234283447265625, 0.382659912109375, 0.40297698974609375, 0.4232940673828125, 0.44361114501953125, 0.46392822265625, 0.48424530029296875, 0.5045623779296875, 0.5248794555664062, 0.545196533203125, 0.5655136108398438, 0.5858306884765625, 0.6061477661132812, 0.62646484375]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 8.0, 5.0, 10.0, 4.0, 14.0, 11.0, 17.0, 25.0, 20.0, 28.0, 20.0, 28.0, 32.0, 23.0, 40.0, 40.0, 33.0, 46.0, 45.0, 44.0, 42.0, 36.0, 32.0, 34.0, 31.0, 33.0, 36.0, 25.0, 24.0, 37.0, 18.0, 22.0, 24.0, 17.0, 19.0, 13.0, 12.0, 11.0, 14.0, 3.0, 4.0, 7.0, 3.0, 1.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.64697265625, -0.6257858276367188, -0.6045989990234375, -0.5834121704101562, -0.562225341796875, -0.5410385131835938, -0.5198516845703125, -0.49866485595703125, -0.47747802734375, -0.45629119873046875, -0.4351043701171875, -0.41391754150390625, -0.392730712890625, -0.37154388427734375, -0.3503570556640625, -0.32917022705078125, -0.3079833984375, -0.28679656982421875, -0.2656097412109375, -0.24442291259765625, -0.223236083984375, -0.20204925537109375, -0.1808624267578125, -0.15967559814453125, -0.13848876953125, -0.11730194091796875, -0.0961151123046875, -0.07492828369140625, -0.053741455078125, -0.03255462646484375, -0.0113677978515625, 0.00981903076171875, 0.031005859375, 0.05219268798828125, 0.0733795166015625, 0.09456634521484375, 0.115753173828125, 0.13694000244140625, 0.1581268310546875, 0.17931365966796875, 0.20050048828125, 0.22168731689453125, 0.2428741455078125, 0.26406097412109375, 0.285247802734375, 0.30643463134765625, 0.3276214599609375, 0.34880828857421875, 0.3699951171875, 0.39118194580078125, 0.4123687744140625, 0.43355560302734375, 0.454742431640625, 0.47592926025390625, 0.4971160888671875, 0.5183029174804688, 0.53948974609375, 0.5606765747070312, 0.5818634033203125, 0.6030502319335938, 0.624237060546875, 0.6454238891601562, 0.6666107177734375, 0.6877975463867188, 0.708984375]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 3.0, 4.0, 7.0, 8.0, 11.0, 13.0, 37.0, 28.0, 47.0, 72.0, 109.0, 153.0, 253.0, 398.0, 673.0, 1063.0, 2010.0, 3854.0, 8248.0, 22190.0, 833306.0, 144839.0, 16914.0, 6730.0, 3249.0, 1743.0, 1001.0, 614.0, 308.0, 242.0, 128.0, 84.0, 60.0, 35.0, 23.0, 26.0, 14.0, 14.0, 12.0, 7.0, 9.0, 4.0, 4.0, 5.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4013671875, -0.38916015625, -0.376953125, -0.36474609375, -0.3525390625, -0.34033203125, -0.328125, -0.31591796875, -0.3037109375, -0.29150390625, -0.279296875, -0.26708984375, -0.2548828125, -0.24267578125, -0.23046875, -0.21826171875, -0.2060546875, -0.19384765625, -0.181640625, -0.16943359375, -0.1572265625, -0.14501953125, -0.1328125, -0.12060546875, -0.1083984375, -0.09619140625, -0.083984375, -0.07177734375, -0.0595703125, -0.04736328125, -0.03515625, -0.02294921875, -0.0107421875, 0.00146484375, 0.013671875, 0.02587890625, 0.0380859375, 0.05029296875, 0.0625, 0.07470703125, 0.0869140625, 0.09912109375, 0.111328125, 0.12353515625, 0.1357421875, 0.14794921875, 0.16015625, 0.17236328125, 0.1845703125, 0.19677734375, 0.208984375, 0.22119140625, 0.2333984375, 0.24560546875, 0.2578125, 0.27001953125, 0.2822265625, 0.29443359375, 0.306640625, 0.31884765625, 0.3310546875, 0.34326171875, 0.35546875, 0.36767578125, 0.3798828125]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 8.0, 5.0, 4.0, 18.0, 23.0, 67.0, 433.0, 324.0, 65.0, 27.0, 7.0, 4.0, 5.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.143880844116211e-05, -4.909280687570572e-05, -4.674680531024933e-05, -4.440080374479294e-05, -4.205480217933655e-05, -3.970880061388016e-05, -3.736279904842377e-05, -3.501679748296738e-05, -3.2670795917510986e-05, -3.0324794352054596e-05, -2.7978792786598206e-05, -2.5632791221141815e-05, -2.3286789655685425e-05, -2.0940788090229034e-05, -1.8594786524772644e-05, -1.6248784959316254e-05, -1.3902783393859863e-05, -1.1556781828403473e-05, -9.210780262947083e-06, -6.864778697490692e-06, -4.518777132034302e-06, -2.1727755665779114e-06, 1.73225998878479e-07, 2.5192275643348694e-06, 4.86522912979126e-06, 7.21123069524765e-06, 9.55723226070404e-06, 1.1903233826160431e-05, 1.4249235391616821e-05, 1.659523695707321e-05, 1.8941238522529602e-05, 2.1287240087985992e-05, 2.3633241653442383e-05, 2.5979243218898773e-05, 2.8325244784355164e-05, 3.0671246349811554e-05, 3.3017247915267944e-05, 3.5363249480724335e-05, 3.7709251046180725e-05, 4.0055252611637115e-05, 4.2401254177093506e-05, 4.4747255742549896e-05, 4.709325730800629e-05, 4.943925887346268e-05, 5.178526043891907e-05, 5.413126200437546e-05, 5.647726356983185e-05, 5.882326513528824e-05, 6.116926670074463e-05, 6.351526826620102e-05, 6.586126983165741e-05, 6.82072713971138e-05, 7.055327296257019e-05, 7.289927452802658e-05, 7.524527609348297e-05, 7.759127765893936e-05, 7.993727922439575e-05, 8.228328078985214e-05, 8.462928235530853e-05, 8.697528392076492e-05, 8.932128548622131e-05, 9.16672870516777e-05, 9.40132886171341e-05, 9.635929018259048e-05, 9.870529174804688e-05]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 4.0, 5.0, 9.0, 6.0, 7.0, 6.0, 12.0, 20.0, 33.0, 52.0, 109.0, 197.0, 373.0, 900.0, 2296.0, 6540.0, 25199.0, 945322.0, 52638.0, 9404.0, 3109.0, 1228.0, 530.0, 237.0, 129.0, 63.0, 42.0, 17.0, 14.0, 15.0, 8.0, 7.0, 9.0, 7.0, 3.0, 0.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.54931640625, -0.5334663391113281, -0.5176162719726562, -0.5017662048339844, -0.4859161376953125, -0.4700660705566406, -0.45421600341796875, -0.4383659362792969, -0.422515869140625, -0.4066658020019531, -0.39081573486328125, -0.3749656677246094, -0.3591156005859375, -0.3432655334472656, -0.32741546630859375, -0.3115653991699219, -0.29571533203125, -0.2798652648925781, -0.26401519775390625, -0.24816513061523438, -0.2323150634765625, -0.21646499633789062, -0.20061492919921875, -0.18476486206054688, -0.168914794921875, -0.15306472778320312, -0.13721466064453125, -0.12136459350585938, -0.1055145263671875, -0.08966445922851562, -0.07381439208984375, -0.057964324951171875, -0.0421142578125, -0.026264190673828125, -0.01041412353515625, 0.005435943603515625, 0.0212860107421875, 0.037136077880859375, 0.05298614501953125, 0.06883621215820312, 0.084686279296875, 0.10053634643554688, 0.11638641357421875, 0.13223648071289062, 0.1480865478515625, 0.16393661499023438, 0.17978668212890625, 0.19563674926757812, 0.21148681640625, 0.22733688354492188, 0.24318695068359375, 0.2590370178222656, 0.2748870849609375, 0.2907371520996094, 0.30658721923828125, 0.3224372863769531, 0.338287353515625, 0.3541374206542969, 0.36998748779296875, 0.3858375549316406, 0.4016876220703125, 0.4175376892089844, 0.43338775634765625, 0.4492378234863281, 0.465087890625]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 7.0, 3.0, 6.0, 2.0, 4.0, 5.0, 7.0, 7.0, 13.0, 18.0, 44.0, 71.0, 364.0, 301.0, 70.0, 23.0, 12.0, 6.0, 10.0, 3.0, 4.0, 6.0, 4.0, 6.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1396484375, -0.13498306274414062, -0.13031768798828125, -0.12565231323242188, -0.1209869384765625, -0.11632156372070312, -0.11165618896484375, -0.10699081420898438, -0.102325439453125, -0.09766006469726562, -0.09299468994140625, -0.08832931518554688, -0.0836639404296875, -0.07899856567382812, -0.07433319091796875, -0.06966781616210938, -0.06500244140625, -0.060337066650390625, -0.05567169189453125, -0.051006317138671875, -0.0463409423828125, -0.041675567626953125, -0.03701019287109375, -0.032344818115234375, -0.027679443359375, -0.023014068603515625, -0.01834869384765625, -0.013683319091796875, -0.0090179443359375, -0.004352569580078125, 0.00031280517578125, 0.004978179931640625, 0.0096435546875, 0.014308929443359375, 0.01897430419921875, 0.023639678955078125, 0.0283050537109375, 0.032970428466796875, 0.03763580322265625, 0.042301177978515625, 0.046966552734375, 0.051631927490234375, 0.05629730224609375, 0.060962677001953125, 0.0656280517578125, 0.07029342651367188, 0.07495880126953125, 0.07962417602539062, 0.08428955078125, 0.08895492553710938, 0.09362030029296875, 0.09828567504882812, 0.1029510498046875, 0.10761642456054688, 0.11228179931640625, 0.11694717407226562, 0.121612548828125, 0.12627792358398438, 0.13094329833984375, 0.13560867309570312, 0.1402740478515625, 0.14493942260742188, 0.14960479736328125, 0.15427017211914062, 0.158935546875]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 2.0, 5.0, 12.0, 11.0, 27.0, 41.0, 59.0, 96.0, 114.0, 131.0, 141.0, 116.0, 100.0, 58.0, 33.0, 34.0, 10.0, 14.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8285374045372009, -0.765209436416626, -0.7018814086914062, -0.6385534405708313, -0.5752254724502563, -0.5118974447250366, -0.44856947660446167, -0.38524147868156433, -0.321913480758667, -0.25858548283576965, -0.1952574998140335, -0.13192951679229736, -0.06860151886940002, -0.0052735209465026855, 0.058054447174072266, 0.1213824450969696, 0.18471044301986694, 0.24803844094276428, 0.3113664388656616, 0.3746944069862366, 0.4380224049091339, 0.5013504028320312, 0.5646783709526062, 0.6280063390731812, 0.6913343667984009, 0.7546623349189758, 0.8179903626441956, 0.8813183307647705, 0.9446463584899902, 1.00797438621521, 1.0713022947311401, 1.1346303224563599, 1.1979584693908691, 1.2612864971160889, 1.324614405632019, 1.3879424333572388, 1.4512704610824585, 1.5145983695983887, 1.5779263973236084, 1.6412544250488281, 1.7045824527740479, 1.7679104804992676, 1.8312383890151978, 1.8945664167404175, 1.9578944444656372, 2.0212223529815674, 2.084550380706787, 2.147878408432007, 2.2112064361572266, 2.2745344638824463, 2.337862491607666, 2.4011902809143066, 2.4645183086395264, 2.527846336364746, 2.591174364089966, 2.6545023918151855, 2.717830181121826, 2.781158208847046, 2.8444862365722656, 2.9078140258789062, 2.971142053604126, 3.0344700813293457, 3.0977981090545654, 3.161126136779785, 3.224454164505005]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 2.0, 6.0, 5.0, 9.0, 13.0, 9.0, 17.0, 18.0, 28.0, 14.0, 27.0, 35.0, 27.0, 32.0, 41.0, 32.0, 47.0, 38.0, 45.0, 42.0, 43.0, 46.0, 40.0, 41.0, 49.0, 29.0, 32.0, 16.0, 36.0, 26.0, 23.0, 12.0, 27.0, 14.0, 15.0, 15.0, 8.0, 6.0, 11.0, 6.0, 5.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-1.222510814666748, -1.1859544515609741, -1.1493980884552002, -1.1128418445587158, -1.076285481452942, -1.039729118347168, -1.003172755241394, -0.9666163921356201, -0.930060088634491, -0.893503725528717, -0.8569474220275879, -0.820391058921814, -0.78383469581604, -0.7472783923149109, -0.710722029209137, -0.6741657257080078, -0.6376093626022339, -0.60105299949646, -0.5644966959953308, -0.5279403328895569, -0.49138399958610535, -0.4548276662826538, -0.4182713031768799, -0.38171496987342834, -0.3451586365699768, -0.30860230326652527, -0.27204596996307373, -0.2354896068572998, -0.19893327355384827, -0.16237694025039673, -0.125820592045784, -0.08926424384117126, -0.05270791053771973, -0.01615156978368759, 0.020404770970344543, 0.05696111172437668, 0.09351745247840881, 0.13007378578186035, 0.16663013398647308, 0.20318648219108582, 0.23974281549453735, 0.2762991487979889, 0.31285548210144043, 0.34941184520721436, 0.3859681785106659, 0.42252451181411743, 0.45908087491989136, 0.4956372082233429, 0.5321935415267944, 0.5687499046325684, 0.6053062081336975, 0.6418625712394714, 0.6784188747406006, 0.7149752378463745, 0.7515316009521484, 0.7880879640579224, 0.8246442675590515, 0.8612006306648254, 0.8977569341659546, 0.9343132972717285, 0.9708696603775024, 1.0074260234832764, 1.0439822673797607, 1.0805386304855347, 1.1170949935913086]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 5.0, 7.0, 7.0, 8.0, 10.0, 9.0, 12.0, 17.0, 21.0, 22.0, 45.0, 52.0, 69.0, 81.0, 122.0, 166.0, 246.0, 345.0, 500.0, 774.0, 1089.0, 1660.0, 2489.0, 4136.0, 6603.0, 11718.0, 23532.0, 56748.0, 167425.0, 507049.0, 1309284.0, 1342966.0, 503013.0, 151380.0, 52459.0, 21658.0, 11168.0, 6402.0, 3775.0, 2395.0, 1555.0, 987.0, 717.0, 475.0, 343.0, 220.0, 149.0, 108.0, 59.0, 71.0, 39.0, 29.0, 25.0, 14.0, 13.0, 5.0, 5.0, 7.0, 4.0, 2.0, 5.0], "bins": [-0.5390625, -0.5231971740722656, -0.5073318481445312, -0.4914665222167969, -0.4756011962890625, -0.4597358703613281, -0.44387054443359375, -0.4280052185058594, -0.412139892578125, -0.3962745666503906, -0.38040924072265625, -0.3645439147949219, -0.3486785888671875, -0.3328132629394531, -0.31694793701171875, -0.3010826110839844, -0.28521728515625, -0.2693519592285156, -0.25348663330078125, -0.23762130737304688, -0.2217559814453125, -0.20589065551757812, -0.19002532958984375, -0.17416000366210938, -0.158294677734375, -0.14242935180664062, -0.12656402587890625, -0.11069869995117188, -0.0948333740234375, -0.07896804809570312, -0.06310272216796875, -0.047237396240234375, -0.0313720703125, -0.015506744384765625, 0.00035858154296875, 0.016223907470703125, 0.0320892333984375, 0.047954559326171875, 0.06381988525390625, 0.07968521118164062, 0.095550537109375, 0.11141586303710938, 0.12728118896484375, 0.14314651489257812, 0.1590118408203125, 0.17487716674804688, 0.19074249267578125, 0.20660781860351562, 0.22247314453125, 0.23833847045898438, 0.25420379638671875, 0.2700691223144531, 0.2859344482421875, 0.3017997741699219, 0.31766510009765625, 0.3335304260253906, 0.349395751953125, 0.3652610778808594, 0.38112640380859375, 0.3969917297363281, 0.4128570556640625, 0.4287223815917969, 0.44458770751953125, 0.4604530334472656, 0.476318359375]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 6.0, 6.0, 9.0, 6.0, 5.0, 7.0, 10.0, 15.0, 15.0, 20.0, 19.0, 17.0, 45.0, 24.0, 22.0, 26.0, 40.0, 43.0, 41.0, 51.0, 39.0, 41.0, 50.0, 23.0, 43.0, 48.0, 34.0, 30.0, 35.0, 24.0, 28.0, 28.0, 20.0, 15.0, 19.0, 11.0, 18.0, 8.0, 10.0, 5.0, 11.0, 11.0, 4.0, 6.0, 4.0, 3.0, 2.0, 1.0, 4.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4169921875, -0.40225982666015625, -0.3875274658203125, -0.37279510498046875, -0.358062744140625, -0.34333038330078125, -0.3285980224609375, -0.31386566162109375, -0.29913330078125, -0.28440093994140625, -0.2696685791015625, -0.25493621826171875, -0.240203857421875, -0.22547149658203125, -0.2107391357421875, -0.19600677490234375, -0.1812744140625, -0.16654205322265625, -0.1518096923828125, -0.13707733154296875, -0.122344970703125, -0.10761260986328125, -0.0928802490234375, -0.07814788818359375, -0.06341552734375, -0.04868316650390625, -0.0339508056640625, -0.01921844482421875, -0.004486083984375, 0.01024627685546875, 0.0249786376953125, 0.03971099853515625, 0.054443359375, 0.06917572021484375, 0.0839080810546875, 0.09864044189453125, 0.113372802734375, 0.12810516357421875, 0.1428375244140625, 0.15756988525390625, 0.17230224609375, 0.18703460693359375, 0.2017669677734375, 0.21649932861328125, 0.231231689453125, 0.24596405029296875, 0.2606964111328125, 0.27542877197265625, 0.2901611328125, 0.30489349365234375, 0.3196258544921875, 0.33435821533203125, 0.349090576171875, 0.36382293701171875, 0.3785552978515625, 0.39328765869140625, 0.40802001953125, 0.42275238037109375, 0.4374847412109375, 0.45221710205078125, 0.466949462890625, 0.48168182373046875, 0.4964141845703125, 0.5111465454101562, 0.52587890625]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 7.0, 8.0, 12.0, 11.0, 22.0, 47.0, 136.0, 360.0, 2878.0, 3699217.0, 489424.0, 1706.0, 256.0, 101.0, 41.0, 22.0, 22.0, 9.0, 8.0, 2.0, 2.0, 4.0], "bins": [-8.3359375, -8.175369262695312, -8.014801025390625, -7.8542327880859375, -7.69366455078125, -7.5330963134765625, -7.372528076171875, -7.2119598388671875, -7.0513916015625, -6.8908233642578125, -6.730255126953125, -6.5696868896484375, -6.40911865234375, -6.2485504150390625, -6.087982177734375, -5.9274139404296875, -5.766845703125, -5.6062774658203125, -5.445709228515625, -5.2851409912109375, -5.12457275390625, -4.9640045166015625, -4.803436279296875, -4.6428680419921875, -4.4822998046875, -4.3217315673828125, -4.161163330078125, -4.0005950927734375, -3.84002685546875, -3.6794586181640625, -3.518890380859375, -3.3583221435546875, -3.19775390625, -3.0371856689453125, -2.876617431640625, -2.7160491943359375, -2.55548095703125, -2.3949127197265625, -2.234344482421875, -2.0737762451171875, -1.9132080078125, -1.7526397705078125, -1.592071533203125, -1.4315032958984375, -1.27093505859375, -1.1103668212890625, -0.949798583984375, -0.7892303466796875, -0.628662109375, -0.4680938720703125, -0.307525634765625, -0.1469573974609375, 0.01361083984375, 0.1741790771484375, 0.334747314453125, 0.4953155517578125, 0.6558837890625, 0.8164520263671875, 0.977020263671875, 1.1375885009765625, 1.29815673828125, 1.4587249755859375, 1.619293212890625, 1.7798614501953125, 1.9404296875]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 2.0, 7.0, 8.0, 9.0, 24.0, 30.0, 34.0, 50.0, 89.0, 115.0, 224.0, 405.0, 713.0, 903.0, 586.0, 344.0, 202.0, 104.0, 65.0, 46.0, 32.0, 37.0, 14.0, 10.0, 9.0, 7.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.495361328125, -0.4842033386230469, -0.47304534912109375, -0.4618873596191406, -0.4507293701171875, -0.4395713806152344, -0.42841339111328125, -0.4172554016113281, -0.406097412109375, -0.3949394226074219, -0.38378143310546875, -0.3726234436035156, -0.3614654541015625, -0.3503074645996094, -0.33914947509765625, -0.3279914855957031, -0.31683349609375, -0.3056755065917969, -0.29451751708984375, -0.2833595275878906, -0.2722015380859375, -0.2610435485839844, -0.24988555908203125, -0.23872756958007812, -0.227569580078125, -0.21641159057617188, -0.20525360107421875, -0.19409561157226562, -0.1829376220703125, -0.17177963256835938, -0.16062164306640625, -0.14946365356445312, -0.1383056640625, -0.12714767456054688, -0.11598968505859375, -0.10483169555664062, -0.0936737060546875, -0.08251571655273438, -0.07135772705078125, -0.060199737548828125, -0.049041748046875, -0.037883758544921875, -0.02672576904296875, -0.015567779541015625, -0.0044097900390625, 0.006748199462890625, 0.01790618896484375, 0.029064178466796875, 0.04022216796875, 0.051380157470703125, 0.06253814697265625, 0.07369613647460938, 0.0848541259765625, 0.09601211547851562, 0.10717010498046875, 0.11832809448242188, 0.129486083984375, 0.14064407348632812, 0.15180206298828125, 0.16296005249023438, 0.1741180419921875, 0.18527603149414062, 0.19643402099609375, 0.20759201049804688, 0.21875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 1.0, 3.0, 7.0, 8.0, 12.0, 7.0, 9.0, 13.0, 23.0, 23.0, 26.0, 35.0, 30.0, 48.0, 38.0, 45.0, 57.0, 50.0, 72.0, 53.0, 64.0, 46.0, 48.0, 45.0, 40.0, 28.0, 22.0, 35.0, 23.0, 12.0, 13.0, 9.0, 8.0, 11.0, 8.0, 8.0, 3.0, 5.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 4.0], "bins": [-0.7299134135246277, -0.7101702094078064, -0.6904270648956299, -0.6706838607788086, -0.6509406566619873, -0.631197452545166, -0.6114543080329895, -0.5917111039161682, -0.5719678997993469, -0.5522246956825256, -0.5324815511703491, -0.5127383470535278, -0.49299514293670654, -0.47325196862220764, -0.45350879430770874, -0.43376559019088745, -0.41402241587638855, -0.39427924156188965, -0.37453603744506836, -0.35479286313056946, -0.33504965901374817, -0.31530648469924927, -0.295563280582428, -0.2758201062679291, -0.2560769319534302, -0.23633374273777008, -0.21659055352210999, -0.19684737920761108, -0.1771041750907898, -0.1573610007762909, -0.1376178115606308, -0.1178746223449707, -0.09813141822814941, -0.07838822901248932, -0.05864504352211952, -0.038901858031749725, -0.01915866881608963, 0.0005845203995704651, 0.020327702164649963, 0.04007089138031006, 0.059814080595970154, 0.07955726981163025, 0.09930045902729034, 0.11904364079236984, 0.13878682255744934, 0.15853002667427063, 0.17827320098876953, 0.19801639020442963, 0.21775957942008972, 0.23750276863574982, 0.2572459578514099, 0.2769891321659088, 0.2967323362827301, 0.316475510597229, 0.3362187147140503, 0.3559618890285492, 0.3757050633430481, 0.395448237657547, 0.4151914417743683, 0.4349346160888672, 0.4546778202056885, 0.4744209945201874, 0.4941641688346863, 0.5139073729515076, 0.5336505770683289]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 7.0, 5.0, 11.0, 10.0, 11.0, 12.0, 19.0, 14.0, 10.0, 24.0, 20.0, 27.0, 23.0, 23.0, 29.0, 34.0, 45.0, 32.0, 40.0, 46.0, 36.0, 30.0, 33.0, 38.0, 49.0, 35.0, 35.0, 35.0, 31.0, 32.0, 21.0, 22.0, 17.0, 20.0, 17.0, 19.0, 14.0, 11.0, 15.0, 14.0, 10.0, 8.0, 9.0, 6.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.5025136470794678, -0.4869573712348938, -0.4714011251926422, -0.45584484934806824, -0.44028857350349426, -0.4247323274612427, -0.4091760516166687, -0.3936197757720947, -0.37806349992752075, -0.3625072240829468, -0.3469509780406952, -0.3313947021961212, -0.31583842635154724, -0.30028218030929565, -0.2847259044647217, -0.2691696286201477, -0.2536133825778961, -0.23805712163448334, -0.22250084578990936, -0.20694458484649658, -0.1913883090019226, -0.17583204805850983, -0.16027578711509705, -0.14471951127052307, -0.1291632503271103, -0.11360698193311691, -0.09805071353912354, -0.08249445259571075, -0.06693818420171738, -0.051381915807724, -0.03582565486431122, -0.02026938647031784, -0.004713088274002075, 0.010843178257346153, 0.02639944478869438, 0.04195570945739746, 0.05751197785139084, 0.07306824624538422, 0.088624507188797, 0.10418077558279037, 0.11973704397678375, 0.13529330492019653, 0.1508495807647705, 0.1664058417081833, 0.18196210265159607, 0.19751837849617004, 0.21307463943958282, 0.2286309003829956, 0.24418717622756958, 0.25974345207214355, 0.27529969811439514, 0.2908559739589691, 0.3064122498035431, 0.3219684958457947, 0.33752477169036865, 0.3530810475349426, 0.3686373233795166, 0.3841935992240906, 0.39974984526634216, 0.41530612111091614, 0.4308623969554901, 0.4464186429977417, 0.4619749188423157, 0.47753119468688965, 0.49308744072914124]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 8.0, 8.0, 15.0, 22.0, 43.0, 42.0, 95.0, 160.0, 242.0, 385.0, 624.0, 1164.0, 1912.0, 3639.0, 6653.0, 13725.0, 29220.0, 68968.0, 180824.0, 374304.0, 217507.0, 82269.0, 34168.0, 15545.0, 7712.0, 4087.0, 2171.0, 1201.0, 730.0, 439.0, 269.0, 154.0, 96.0, 63.0, 36.0, 24.0, 16.0, 10.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25634765625, -0.24670791625976562, -0.23706817626953125, -0.22742843627929688, -0.2177886962890625, -0.20814895629882812, -0.19850921630859375, -0.18886947631835938, -0.179229736328125, -0.16958999633789062, -0.15995025634765625, -0.15031051635742188, -0.1406707763671875, -0.13103103637695312, -0.12139129638671875, -0.11175155639648438, -0.10211181640625, -0.09247207641601562, -0.08283233642578125, -0.07319259643554688, -0.0635528564453125, -0.053913116455078125, -0.04427337646484375, -0.034633636474609375, -0.024993896484375, -0.015354156494140625, -0.00571441650390625, 0.003925323486328125, 0.0135650634765625, 0.023204803466796875, 0.03284454345703125, 0.042484283447265625, 0.0521240234375, 0.061763763427734375, 0.07140350341796875, 0.08104324340820312, 0.0906829833984375, 0.10032272338867188, 0.10996246337890625, 0.11960220336914062, 0.129241943359375, 0.13888168334960938, 0.14852142333984375, 0.15816116333007812, 0.1678009033203125, 0.17744064331054688, 0.18708038330078125, 0.19672012329101562, 0.20635986328125, 0.21599960327148438, 0.22563934326171875, 0.23527908325195312, 0.2449188232421875, 0.2545585632324219, 0.26419830322265625, 0.2738380432128906, 0.283477783203125, 0.2931175231933594, 0.30275726318359375, 0.3123970031738281, 0.3220367431640625, 0.3316764831542969, 0.34131622314453125, 0.3509559631347656, 0.360595703125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 8.0, 1.0, 2.0, 8.0, 12.0, 5.0, 11.0, 12.0, 20.0, 20.0, 20.0, 25.0, 24.0, 29.0, 29.0, 39.0, 35.0, 35.0, 39.0, 39.0, 39.0, 26.0, 38.0, 39.0, 52.0, 31.0, 45.0, 30.0, 35.0, 29.0, 28.0, 25.0, 24.0, 17.0, 22.0, 19.0, 13.0, 15.0, 16.0, 8.0, 9.0, 10.0, 5.0, 5.0, 2.0, 4.0, 3.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4013671875, -0.3893928527832031, -0.37741851806640625, -0.3654441833496094, -0.3534698486328125, -0.3414955139160156, -0.32952117919921875, -0.3175468444824219, -0.305572509765625, -0.2935981750488281, -0.28162384033203125, -0.2696495056152344, -0.2576751708984375, -0.24570083618164062, -0.23372650146484375, -0.22175216674804688, -0.20977783203125, -0.19780349731445312, -0.18582916259765625, -0.17385482788085938, -0.1618804931640625, -0.14990615844726562, -0.13793182373046875, -0.12595748901367188, -0.113983154296875, -0.10200881958007812, -0.09003448486328125, -0.07806015014648438, -0.0660858154296875, -0.054111480712890625, -0.04213714599609375, -0.030162811279296875, -0.0181884765625, -0.006214141845703125, 0.00576019287109375, 0.017734527587890625, 0.0297088623046875, 0.041683197021484375, 0.05365753173828125, 0.06563186645507812, 0.077606201171875, 0.08958053588867188, 0.10155487060546875, 0.11352920532226562, 0.1255035400390625, 0.13747787475585938, 0.14945220947265625, 0.16142654418945312, 0.17340087890625, 0.18537521362304688, 0.19734954833984375, 0.20932388305664062, 0.2212982177734375, 0.23327255249023438, 0.24524688720703125, 0.2572212219238281, 0.269195556640625, 0.2811698913574219, 0.29314422607421875, 0.3051185607910156, 0.3170928955078125, 0.3290672302246094, 0.34104156494140625, 0.3530158996582031, 0.364990234375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 2.0, 4.0, 4.0, 5.0, 15.0, 15.0, 17.0, 23.0, 20.0, 24.0, 54.0, 61.0, 96.0, 162.0, 251.0, 357.0, 653.0, 1104.0, 1841.0, 3642.0, 7782.0, 18648.0, 50077.0, 164468.0, 435110.0, 246313.0, 72261.0, 24874.0, 10143.0, 4703.0, 2410.0, 1310.0, 775.0, 453.0, 327.0, 198.0, 113.0, 86.0, 53.0, 34.0, 17.0, 15.0, 14.0, 9.0, 5.0, 4.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2763671875, -0.2663764953613281, -0.25638580322265625, -0.24639511108398438, -0.2364044189453125, -0.22641372680664062, -0.21642303466796875, -0.20643234252929688, -0.196441650390625, -0.18645095825195312, -0.17646026611328125, -0.16646957397460938, -0.1564788818359375, -0.14648818969726562, -0.13649749755859375, -0.12650680541992188, -0.11651611328125, -0.10652542114257812, -0.09653472900390625, -0.08654403686523438, -0.0765533447265625, -0.06656265258789062, -0.05657196044921875, -0.046581268310546875, -0.036590576171875, -0.026599884033203125, -0.01660919189453125, -0.006618499755859375, 0.0033721923828125, 0.013362884521484375, 0.02335357666015625, 0.033344268798828125, 0.0433349609375, 0.053325653076171875, 0.06331634521484375, 0.07330703735351562, 0.0832977294921875, 0.09328842163085938, 0.10327911376953125, 0.11326980590820312, 0.123260498046875, 0.13325119018554688, 0.14324188232421875, 0.15323257446289062, 0.1632232666015625, 0.17321395874023438, 0.18320465087890625, 0.19319534301757812, 0.20318603515625, 0.21317672729492188, 0.22316741943359375, 0.23315811157226562, 0.2431488037109375, 0.2531394958496094, 0.26313018798828125, 0.2731208801269531, 0.283111572265625, 0.2931022644042969, 0.30309295654296875, 0.3130836486816406, 0.3230743408203125, 0.3330650329589844, 0.34305572509765625, 0.3530464172363281, 0.363037109375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 6.0, 9.0, 12.0, 9.0, 14.0, 12.0, 18.0, 23.0, 20.0, 29.0, 17.0, 29.0, 35.0, 36.0, 35.0, 34.0, 49.0, 39.0, 41.0, 41.0, 54.0, 42.0, 43.0, 48.0, 41.0, 36.0, 34.0, 26.0, 27.0, 21.0, 15.0, 15.0, 14.0, 13.0, 14.0, 11.0, 10.0, 9.0, 9.0, 1.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7001953125, -0.674530029296875, -0.64886474609375, -0.623199462890625, -0.5975341796875, -0.571868896484375, -0.54620361328125, -0.520538330078125, -0.494873046875, -0.469207763671875, -0.44354248046875, -0.417877197265625, -0.3922119140625, -0.366546630859375, -0.34088134765625, -0.315216064453125, -0.28955078125, -0.263885498046875, -0.23822021484375, -0.212554931640625, -0.1868896484375, -0.161224365234375, -0.13555908203125, -0.109893798828125, -0.084228515625, -0.058563232421875, -0.03289794921875, -0.007232666015625, 0.0184326171875, 0.044097900390625, 0.06976318359375, 0.095428466796875, 0.12109375, 0.146759033203125, 0.17242431640625, 0.198089599609375, 0.2237548828125, 0.249420166015625, 0.27508544921875, 0.300750732421875, 0.326416015625, 0.352081298828125, 0.37774658203125, 0.403411865234375, 0.4290771484375, 0.454742431640625, 0.48040771484375, 0.506072998046875, 0.53173828125, 0.557403564453125, 0.58306884765625, 0.608734130859375, 0.6343994140625, 0.660064697265625, 0.68572998046875, 0.711395263671875, 0.737060546875, 0.762725830078125, 0.78839111328125, 0.814056396484375, 0.8397216796875, 0.865386962890625, 0.89105224609375, 0.916717529296875, 0.9423828125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 4.0, 8.0, 11.0, 11.0, 13.0, 16.0, 28.0, 23.0, 52.0, 67.0, 85.0, 108.0, 159.0, 265.0, 416.0, 639.0, 981.0, 1590.0, 2817.0, 5319.0, 11360.0, 31992.0, 151446.0, 652031.0, 135713.0, 29980.0, 11058.0, 5346.0, 2666.0, 1589.0, 952.0, 566.0, 401.0, 251.0, 156.0, 125.0, 75.0, 65.0, 41.0, 30.0, 15.0, 18.0, 15.0, 16.0, 8.0, 10.0, 6.0, 6.0, 1.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.10675048828125, -0.10346317291259766, -0.10017585754394531, -0.09688854217529297, -0.09360122680664062, -0.09031391143798828, -0.08702659606933594, -0.0837392807006836, -0.08045196533203125, -0.0771646499633789, -0.07387733459472656, -0.07059001922607422, -0.06730270385742188, -0.06401538848876953, -0.06072807312011719, -0.057440757751464844, -0.0541534423828125, -0.050866127014160156, -0.04757881164550781, -0.04429149627685547, -0.041004180908203125, -0.03771686553955078, -0.03442955017089844, -0.031142234802246094, -0.02785491943359375, -0.024567604064941406, -0.021280288696289062, -0.01799297332763672, -0.014705657958984375, -0.011418342590332031, -0.008131027221679688, -0.004843711853027344, -0.001556396484375, 0.0017309188842773438, 0.0050182342529296875, 0.008305549621582031, 0.011592864990234375, 0.014880180358886719, 0.018167495727539062, 0.021454811096191406, 0.02474212646484375, 0.028029441833496094, 0.03131675720214844, 0.03460407257080078, 0.037891387939453125, 0.04117870330810547, 0.04446601867675781, 0.047753334045410156, 0.0510406494140625, 0.054327964782714844, 0.05761528015136719, 0.06090259552001953, 0.06418991088867188, 0.06747722625732422, 0.07076454162597656, 0.0740518569946289, 0.07733917236328125, 0.0806264877319336, 0.08391380310058594, 0.08720111846923828, 0.09048843383789062, 0.09377574920654297, 0.09706306457519531, 0.10035037994384766, 0.1036376953125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 7.0, 2.0, 7.0, 7.0, 20.0, 35.0, 58.0, 103.0, 167.0, 230.0, 163.0, 78.0, 44.0, 24.0, 19.0, 8.0, 7.0, 5.0, 3.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010031461715698242, -9.664241224527359e-05, -9.297020733356476e-05, -8.929800242185593e-05, -8.56257975101471e-05, -8.195359259843826e-05, -7.828138768672943e-05, -7.46091827750206e-05, -7.093697786331177e-05, -6.726477295160294e-05, -6.35925680398941e-05, -5.992036312818527e-05, -5.624815821647644e-05, -5.257595330476761e-05, -4.890374839305878e-05, -4.5231543481349945e-05, -4.155933856964111e-05, -3.788713365793228e-05, -3.421492874622345e-05, -3.054272383451462e-05, -2.6870518922805786e-05, -2.3198314011096954e-05, -1.9526109099388123e-05, -1.585390418767929e-05, -1.2181699275970459e-05, -8.509494364261627e-06, -4.837289452552795e-06, -1.1650845408439636e-06, 2.507120370864868e-06, 6.1793252825737e-06, 9.851530194282532e-06, 1.3523735105991364e-05, 1.7195940017700195e-05, 2.0868144929409027e-05, 2.454034984111786e-05, 2.821255475282669e-05, 3.188475966453552e-05, 3.5556964576244354e-05, 3.9229169487953186e-05, 4.290137439966202e-05, 4.657357931137085e-05, 5.024578422307968e-05, 5.391798913478851e-05, 5.7590194046497345e-05, 6.126239895820618e-05, 6.493460386991501e-05, 6.860680878162384e-05, 7.227901369333267e-05, 7.59512186050415e-05, 7.962342351675034e-05, 8.329562842845917e-05, 8.6967833340168e-05, 9.064003825187683e-05, 9.431224316358566e-05, 9.79844480752945e-05, 0.00010165665298700333, 0.00010532885789871216, 0.00010900106281042099, 0.00011267326772212982, 0.00011634547263383865, 0.00012001767754554749, 0.00012368988245725632, 0.00012736208736896515, 0.00013103429228067398, 0.0001347064971923828]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 1.0, 4.0, 3.0, 6.0, 11.0, 15.0, 17.0, 19.0, 26.0, 47.0, 55.0, 84.0, 157.0, 194.0, 301.0, 494.0, 763.0, 1237.0, 2165.0, 3987.0, 8976.0, 27337.0, 150649.0, 649452.0, 155883.0, 27745.0, 9086.0, 4126.0, 2159.0, 1315.0, 785.0, 505.0, 322.0, 208.0, 138.0, 81.0, 60.0, 39.0, 26.0, 26.0, 16.0, 13.0, 7.0, 6.0, 5.0, 3.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.10504150390625, -0.10190677642822266, -0.09877204895019531, -0.09563732147216797, -0.09250259399414062, -0.08936786651611328, -0.08623313903808594, -0.0830984115600586, -0.07996368408203125, -0.0768289566040039, -0.07369422912597656, -0.07055950164794922, -0.06742477416992188, -0.06429004669189453, -0.06115531921386719, -0.058020591735839844, -0.0548858642578125, -0.051751136779785156, -0.04861640930175781, -0.04548168182373047, -0.042346954345703125, -0.03921222686767578, -0.03607749938964844, -0.032942771911621094, -0.02980804443359375, -0.026673316955566406, -0.023538589477539062, -0.02040386199951172, -0.017269134521484375, -0.014134407043457031, -0.010999679565429688, -0.007864952087402344, -0.004730224609375, -0.0015954971313476562, 0.0015392303466796875, 0.004673957824707031, 0.007808685302734375, 0.010943412780761719, 0.014078140258789062, 0.017212867736816406, 0.02034759521484375, 0.023482322692871094, 0.026617050170898438, 0.02975177764892578, 0.032886505126953125, 0.03602123260498047, 0.03915596008300781, 0.042290687561035156, 0.0454254150390625, 0.048560142517089844, 0.05169486999511719, 0.05482959747314453, 0.057964324951171875, 0.06109905242919922, 0.06423377990722656, 0.0673685073852539, 0.07050323486328125, 0.0736379623413086, 0.07677268981933594, 0.07990741729736328, 0.08304214477539062, 0.08617687225341797, 0.08931159973144531, 0.09244632720947266, 0.0955810546875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 2.0, 2.0, 3.0, 3.0, 6.0, 5.0, 7.0, 10.0, 14.0, 23.0, 34.0, 36.0, 53.0, 81.0, 113.0, 119.0, 143.0, 110.0, 54.0, 33.0, 34.0, 26.0, 21.0, 13.0, 8.0, 6.0, 6.0, 8.0, 9.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.029693603515625, -0.028784751892089844, -0.027875900268554688, -0.02696704864501953, -0.026058197021484375, -0.02514934539794922, -0.024240493774414062, -0.023331642150878906, -0.02242279052734375, -0.021513938903808594, -0.020605087280273438, -0.01969623565673828, -0.018787384033203125, -0.01787853240966797, -0.016969680786132812, -0.016060829162597656, -0.0151519775390625, -0.014243125915527344, -0.013334274291992188, -0.012425422668457031, -0.011516571044921875, -0.010607719421386719, -0.009698867797851562, -0.008790016174316406, -0.00788116455078125, -0.006972312927246094, -0.0060634613037109375, -0.005154609680175781, -0.004245758056640625, -0.0033369064331054688, -0.0024280548095703125, -0.0015192031860351562, -0.0006103515625, 0.00029850006103515625, 0.0012073516845703125, 0.0021162033081054688, 0.003025054931640625, 0.003933906555175781, 0.0048427581787109375, 0.005751609802246094, 0.00666046142578125, 0.007569313049316406, 0.008478164672851562, 0.009387016296386719, 0.010295867919921875, 0.011204719543457031, 0.012113571166992188, 0.013022422790527344, 0.0139312744140625, 0.014840126037597656, 0.015748977661132812, 0.01665782928466797, 0.017566680908203125, 0.01847553253173828, 0.019384384155273438, 0.020293235778808594, 0.02120208740234375, 0.022110939025878906, 0.023019790649414062, 0.02392864227294922, 0.024837493896484375, 0.02574634552001953, 0.026655197143554688, 0.027564048767089844, 0.028472900390625]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 5.0, 2.0, 4.0, 5.0, 6.0, 10.0, 12.0, 27.0, 30.0, 44.0, 42.0, 64.0, 75.0, 88.0, 114.0, 96.0, 86.0, 74.0, 62.0, 46.0, 28.0, 22.0, 13.0, 13.0, 11.0, 9.0, 5.0, 5.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6447384357452393, -0.6256654858589172, -0.6065924763679504, -0.5875195264816284, -0.5684465169906616, -0.5493735671043396, -0.5303005576133728, -0.5112276077270508, -0.49215462803840637, -0.47308164834976196, -0.45400866866111755, -0.43493568897247314, -0.4158627390861511, -0.3967897295951843, -0.3777167797088623, -0.3586438000202179, -0.3395708203315735, -0.3204978406429291, -0.30142486095428467, -0.28235188126564026, -0.26327890157699585, -0.24420593678951263, -0.22513297200202942, -0.206059992313385, -0.1869870126247406, -0.1679140329360962, -0.14884105324745178, -0.12976808845996857, -0.11069510877132416, -0.09162212908267975, -0.07254915684461594, -0.053476184606552124, -0.03440326452255249, -0.01533028855919838, 0.003742687404155731, 0.022815663367509842, 0.04188863933086395, 0.06096161901950836, 0.08003459125757217, 0.09910756349563599, 0.1181805431842804, 0.1372535228729248, 0.1563265025615692, 0.17539946734905243, 0.19447244703769684, 0.21354542672634125, 0.23261839151382446, 0.25169137120246887, 0.2707643508911133, 0.2898373305797577, 0.3089103102684021, 0.3279832899570465, 0.3470562696456909, 0.36612921953201294, 0.38520219922065735, 0.40427517890930176, 0.42334815859794617, 0.4424211382865906, 0.461494117975235, 0.4805670976638794, 0.4996400475502014, 0.5187130570411682, 0.5377860069274902, 0.556859016418457, 0.575931966304779]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 3.0, 5.0, 6.0, 6.0, 8.0, 13.0, 10.0, 5.0, 17.0, 16.0, 14.0, 11.0, 24.0, 28.0, 26.0, 33.0, 39.0, 25.0, 43.0, 40.0, 37.0, 34.0, 29.0, 42.0, 40.0, 44.0, 44.0, 37.0, 33.0, 27.0, 31.0, 31.0, 25.0, 20.0, 33.0, 20.0, 9.0, 15.0, 15.0, 15.0, 9.0, 7.0, 5.0, 7.0, 10.0, 4.0, 3.0, 3.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.3684399724006653, -0.35713109374046326, -0.34582218527793884, -0.3345133066177368, -0.3232043981552124, -0.3118955194950104, -0.30058664083480835, -0.28927773237228394, -0.2779688239097595, -0.2666599452495575, -0.2553510367870331, -0.24404215812683105, -0.23273324966430664, -0.22142437100410461, -0.2101154774427414, -0.19880658388137817, -0.18749770522117615, -0.17618881165981293, -0.1648799180984497, -0.15357103943824768, -0.14226213097572327, -0.13095325231552124, -0.11964435875415802, -0.1083354651927948, -0.09702657163143158, -0.08571767807006836, -0.07440878450870514, -0.06309989839792252, -0.051791004836559296, -0.040482111275196075, -0.029173225164413452, -0.017864331603050232, -0.006555438041687012, 0.004753453657031059, 0.01606234535574913, 0.027371235191822052, 0.03868012875318527, 0.04998902231454849, 0.061297908425331116, 0.07260680198669434, 0.08391569554805756, 0.09522458910942078, 0.106533482670784, 0.11784236878156662, 0.12915125489234924, 0.14046016335487366, 0.15176904201507568, 0.1630779355764389, 0.17438682913780212, 0.18569572269916534, 0.19700461626052856, 0.2083134949207306, 0.219622403383255, 0.23093128204345703, 0.24224017560482025, 0.25354906916618347, 0.2648579478263855, 0.2761668264865875, 0.28747573494911194, 0.29878461360931396, 0.3100935220718384, 0.3214024007320404, 0.33271127939224243, 0.34402018785476685, 0.35532909631729126]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 7.0, 10.0, 15.0, 27.0, 55.0, 95.0, 217.0, 477.0, 1161.0, 3462.0, 12160.0, 56790.0, 519045.0, 394525.0, 45378.0, 10233.0, 3021.0, 1067.0, 432.0, 163.0, 106.0, 54.0, 26.0, 14.0, 10.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.8046875, -0.7850303649902344, -0.7653732299804688, -0.7457160949707031, -0.7260589599609375, -0.7064018249511719, -0.6867446899414062, -0.6670875549316406, -0.647430419921875, -0.6277732849121094, -0.6081161499023438, -0.5884590148925781, -0.5688018798828125, -0.5491447448730469, -0.5294876098632812, -0.5098304748535156, -0.49017333984375, -0.4705162048339844, -0.45085906982421875, -0.4312019348144531, -0.4115447998046875, -0.3918876647949219, -0.37223052978515625, -0.3525733947753906, -0.332916259765625, -0.3132591247558594, -0.29360198974609375, -0.2739448547363281, -0.2542877197265625, -0.23463058471679688, -0.21497344970703125, -0.19531631469726562, -0.1756591796875, -0.15600204467773438, -0.13634490966796875, -0.11668777465820312, -0.0970306396484375, -0.07737350463867188, -0.05771636962890625, -0.038059234619140625, -0.018402099609375, 0.001255035400390625, 0.02091217041015625, 0.040569305419921875, 0.0602264404296875, 0.07988357543945312, 0.09954071044921875, 0.11919784545898438, 0.13885498046875, 0.15851211547851562, 0.17816925048828125, 0.19782638549804688, 0.2174835205078125, 0.23714065551757812, 0.25679779052734375, 0.2764549255371094, 0.296112060546875, 0.3157691955566406, 0.33542633056640625, 0.3550834655761719, 0.3747406005859375, 0.3943977355957031, 0.41405487060546875, 0.4337120056152344, 0.453369140625]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 3.0, 2.0, 7.0, 8.0, 10.0, 8.0, 16.0, 16.0, 11.0, 20.0, 20.0, 20.0, 33.0, 37.0, 46.0, 31.0, 52.0, 41.0, 40.0, 42.0, 52.0, 53.0, 50.0, 46.0, 39.0, 35.0, 34.0, 55.0, 33.0, 29.0, 18.0, 17.0, 19.0, 13.0, 11.0, 13.0, 9.0, 2.0, 10.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.76953125, -0.7452239990234375, -0.720916748046875, -0.6966094970703125, -0.67230224609375, -0.6479949951171875, -0.623687744140625, -0.5993804931640625, -0.5750732421875, -0.5507659912109375, -0.526458740234375, -0.5021514892578125, -0.47784423828125, -0.4535369873046875, -0.429229736328125, -0.4049224853515625, -0.380615234375, -0.3563079833984375, -0.332000732421875, -0.3076934814453125, -0.28338623046875, -0.2590789794921875, -0.234771728515625, -0.2104644775390625, -0.1861572265625, -0.1618499755859375, -0.137542724609375, -0.1132354736328125, -0.08892822265625, -0.0646209716796875, -0.040313720703125, -0.0160064697265625, 0.00830078125, 0.0326080322265625, 0.056915283203125, 0.0812225341796875, 0.10552978515625, 0.1298370361328125, 0.154144287109375, 0.1784515380859375, 0.2027587890625, 0.2270660400390625, 0.251373291015625, 0.2756805419921875, 0.29998779296875, 0.3242950439453125, 0.348602294921875, 0.3729095458984375, 0.397216796875, 0.4215240478515625, 0.445831298828125, 0.4701385498046875, 0.49444580078125, 0.5187530517578125, 0.543060302734375, 0.5673675537109375, 0.5916748046875, 0.6159820556640625, 0.640289306640625, 0.6645965576171875, 0.68890380859375, 0.7132110595703125, 0.737518310546875, 0.7618255615234375, 0.7861328125]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 8.0, 7.0, 12.0, 5.0, 13.0, 26.0, 14.0, 33.0, 47.0, 59.0, 71.0, 80.0, 105.0, 211.0, 1513.0, 232948.0, 810363.0, 2289.0, 243.0, 122.0, 86.0, 61.0, 53.0, 38.0, 32.0, 22.0, 29.0, 16.0, 11.0, 10.0, 5.0, 5.0, 4.0, 4.0, 5.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.30078125, -2.221649169921875, -2.14251708984375, -2.063385009765625, -1.9842529296875, -1.905120849609375, -1.82598876953125, -1.746856689453125, -1.667724609375, -1.588592529296875, -1.50946044921875, -1.430328369140625, -1.3511962890625, -1.272064208984375, -1.19293212890625, -1.113800048828125, -1.03466796875, -0.955535888671875, -0.87640380859375, -0.797271728515625, -0.7181396484375, -0.639007568359375, -0.55987548828125, -0.480743408203125, -0.401611328125, -0.322479248046875, -0.24334716796875, -0.164215087890625, -0.0850830078125, -0.005950927734375, 0.07318115234375, 0.152313232421875, 0.2314453125, 0.310577392578125, 0.38970947265625, 0.468841552734375, 0.5479736328125, 0.627105712890625, 0.70623779296875, 0.785369873046875, 0.864501953125, 0.943634033203125, 1.02276611328125, 1.101898193359375, 1.1810302734375, 1.260162353515625, 1.33929443359375, 1.418426513671875, 1.49755859375, 1.576690673828125, 1.65582275390625, 1.734954833984375, 1.8140869140625, 1.893218994140625, 1.97235107421875, 2.051483154296875, 2.130615234375, 2.209747314453125, 2.28887939453125, 2.368011474609375, 2.4471435546875, 2.526275634765625, 2.60540771484375, 2.684539794921875, 2.763671875]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 9.0, 7.0, 6.0, 9.0, 11.0, 14.0, 15.0, 20.0, 36.0, 26.0, 35.0, 43.0, 52.0, 60.0, 57.0, 52.0, 51.0, 56.0, 57.0, 49.0, 54.0, 46.0, 39.0, 42.0, 28.0, 29.0, 29.0, 16.0, 11.0, 8.0, 9.0, 7.0, 4.0, 5.0, 5.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.97412109375, -0.9403610229492188, -0.9066009521484375, -0.8728408813476562, -0.839080810546875, -0.8053207397460938, -0.7715606689453125, -0.7378005981445312, -0.70404052734375, -0.6702804565429688, -0.6365203857421875, -0.6027603149414062, -0.569000244140625, -0.5352401733398438, -0.5014801025390625, -0.46772003173828125, -0.4339599609375, -0.40019989013671875, -0.3664398193359375, -0.33267974853515625, -0.298919677734375, -0.26515960693359375, -0.2313995361328125, -0.19763946533203125, -0.16387939453125, -0.13011932373046875, -0.0963592529296875, -0.06259918212890625, -0.028839111328125, 0.00492095947265625, 0.0386810302734375, 0.07244110107421875, 0.106201171875, 0.13996124267578125, 0.1737213134765625, 0.20748138427734375, 0.241241455078125, 0.27500152587890625, 0.3087615966796875, 0.34252166748046875, 0.37628173828125, 0.41004180908203125, 0.4438018798828125, 0.47756195068359375, 0.511322021484375, 0.5450820922851562, 0.5788421630859375, 0.6126022338867188, 0.6463623046875, 0.6801223754882812, 0.7138824462890625, 0.7476425170898438, 0.781402587890625, 0.8151626586914062, 0.8489227294921875, 0.8826828002929688, 0.91644287109375, 0.9502029418945312, 0.9839630126953125, 1.0177230834960938, 1.051483154296875, 1.0852432250976562, 1.1190032958984375, 1.1527633666992188, 1.1865234375]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 6.0, 6.0, 11.0, 19.0, 41.0, 70.0, 119.0, 264.0, 554.0, 1612.0, 7568.0, 386850.0, 639733.0, 8780.0, 1783.0, 591.0, 249.0, 114.0, 78.0, 43.0, 24.0, 13.0, 4.0, 8.0, 8.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8369140625, -0.8115768432617188, -0.7862396240234375, -0.7609024047851562, -0.735565185546875, -0.7102279663085938, -0.6848907470703125, -0.6595535278320312, -0.63421630859375, -0.6088790893554688, -0.5835418701171875, -0.5582046508789062, -0.532867431640625, -0.5075302124023438, -0.4821929931640625, -0.45685577392578125, -0.4315185546875, -0.40618133544921875, -0.3808441162109375, -0.35550689697265625, -0.330169677734375, -0.30483245849609375, -0.2794952392578125, -0.25415802001953125, -0.22882080078125, -0.20348358154296875, -0.1781463623046875, -0.15280914306640625, -0.127471923828125, -0.10213470458984375, -0.0767974853515625, -0.05146026611328125, -0.026123046875, -0.00078582763671875, 0.0245513916015625, 0.04988861083984375, 0.075225830078125, 0.10056304931640625, 0.1259002685546875, 0.15123748779296875, 0.17657470703125, 0.20191192626953125, 0.2272491455078125, 0.25258636474609375, 0.277923583984375, 0.30326080322265625, 0.3285980224609375, 0.35393524169921875, 0.3792724609375, 0.40460968017578125, 0.4299468994140625, 0.45528411865234375, 0.480621337890625, 0.5059585571289062, 0.5312957763671875, 0.5566329956054688, 0.58197021484375, 0.6073074340820312, 0.6326446533203125, 0.6579818725585938, 0.683319091796875, 0.7086563110351562, 0.7339935302734375, 0.7593307495117188, 0.78466796875]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 13.0, 13.0, 20.0, 33.0, 56.0, 108.0, 227.0, 258.0, 120.0, 63.0, 34.0, 24.0, 15.0, 7.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4286251068115234e-05, -4.2183324694633484e-05, -4.0080398321151733e-05, -3.797747194766998e-05, -3.587454557418823e-05, -3.377161920070648e-05, -3.166869282722473e-05, -2.956576645374298e-05, -2.746284008026123e-05, -2.535991370677948e-05, -2.325698733329773e-05, -2.115406095981598e-05, -1.905113458633423e-05, -1.6948208212852478e-05, -1.4845281839370728e-05, -1.2742355465888977e-05, -1.0639429092407227e-05, -8.536502718925476e-06, -6.433576345443726e-06, -4.330649971961975e-06, -2.2277235984802246e-06, -1.2479722499847412e-07, 1.9781291484832764e-06, 4.081055521965027e-06, 6.183981895446777e-06, 8.286908268928528e-06, 1.0389834642410278e-05, 1.2492761015892029e-05, 1.459568738937378e-05, 1.669861376285553e-05, 1.880154013633728e-05, 2.090446650981903e-05, 2.300739288330078e-05, 2.5110319256782532e-05, 2.7213245630264282e-05, 2.9316172003746033e-05, 3.141909837722778e-05, 3.3522024750709534e-05, 3.5624951124191284e-05, 3.7727877497673035e-05, 3.9830803871154785e-05, 4.1933730244636536e-05, 4.4036656618118286e-05, 4.613958299160004e-05, 4.824250936508179e-05, 5.034543573856354e-05, 5.244836211204529e-05, 5.455128848552704e-05, 5.665421485900879e-05, 5.875714123249054e-05, 6.086006760597229e-05, 6.296299397945404e-05, 6.506592035293579e-05, 6.716884672641754e-05, 6.927177309989929e-05, 7.137469947338104e-05, 7.347762584686279e-05, 7.558055222034454e-05, 7.76834785938263e-05, 7.978640496730804e-05, 8.18893313407898e-05, 8.399225771427155e-05, 8.60951840877533e-05, 8.819811046123505e-05, 9.03010368347168e-05]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 2.0, 3.0, 5.0, 9.0, 13.0, 13.0, 32.0, 69.0, 373.0, 136424.0, 910927.0, 526.0, 82.0, 23.0, 16.0, 10.0, 7.0, 6.0, 4.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.13671875, -2.0577392578125, -1.978759765625, -1.8997802734375, -1.82080078125, -1.7418212890625, -1.662841796875, -1.5838623046875, -1.5048828125, -1.4259033203125, -1.346923828125, -1.2679443359375, -1.18896484375, -1.1099853515625, -1.031005859375, -0.9520263671875, -0.873046875, -0.7940673828125, -0.715087890625, -0.6361083984375, -0.55712890625, -0.4781494140625, -0.399169921875, -0.3201904296875, -0.2412109375, -0.1622314453125, -0.083251953125, -0.0042724609375, 0.07470703125, 0.1536865234375, 0.232666015625, 0.3116455078125, 0.390625, 0.4696044921875, 0.548583984375, 0.6275634765625, 0.70654296875, 0.7855224609375, 0.864501953125, 0.9434814453125, 1.0224609375, 1.1014404296875, 1.180419921875, 1.2593994140625, 1.33837890625, 1.4173583984375, 1.496337890625, 1.5753173828125, 1.654296875, 1.7332763671875, 1.812255859375, 1.8912353515625, 1.97021484375, 2.0491943359375, 2.128173828125, 2.2071533203125, 2.2861328125, 2.3651123046875, 2.444091796875, 2.5230712890625, 2.60205078125, 2.6810302734375, 2.760009765625, 2.8389892578125, 2.91796875]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 2.0, 3.0, 9.0, 18.0, 17.0, 28.0, 50.0, 70.0, 129.0, 183.0, 174.0, 123.0, 73.0, 38.0, 28.0, 15.0, 13.0, 7.0, 6.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.19775390625, -0.19240379333496094, -0.18705368041992188, -0.1817035675048828, -0.17635345458984375, -0.1710033416748047, -0.16565322875976562, -0.16030311584472656, -0.1549530029296875, -0.14960289001464844, -0.14425277709960938, -0.1389026641845703, -0.13355255126953125, -0.1282024383544922, -0.12285232543945312, -0.11750221252441406, -0.112152099609375, -0.10680198669433594, -0.10145187377929688, -0.09610176086425781, -0.09075164794921875, -0.08540153503417969, -0.08005142211914062, -0.07470130920410156, -0.0693511962890625, -0.06400108337402344, -0.058650970458984375, -0.05330085754394531, -0.04795074462890625, -0.04260063171386719, -0.037250518798828125, -0.03190040588378906, -0.02655029296875, -0.021200180053710938, -0.015850067138671875, -0.010499954223632812, -0.00514984130859375, 0.0002002716064453125, 0.005550384521484375, 0.010900497436523438, 0.0162506103515625, 0.021600723266601562, 0.026950836181640625, 0.03230094909667969, 0.03765106201171875, 0.04300117492675781, 0.048351287841796875, 0.05370140075683594, 0.059051513671875, 0.06440162658691406, 0.06975173950195312, 0.07510185241699219, 0.08045196533203125, 0.08580207824707031, 0.09115219116210938, 0.09650230407714844, 0.1018524169921875, 0.10720252990722656, 0.11255264282226562, 0.11790275573730469, 0.12325286865234375, 0.1286029815673828, 0.13395309448242188, 0.13930320739746094, 0.1446533203125]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 12.0, 326.0, 653.0, 30.0], "bins": [-29.97443962097168, -29.492164611816406, -29.009889602661133, -28.52761459350586, -28.045339584350586, -27.563064575195312, -27.08078956604004, -26.598514556884766, -26.116239547729492, -25.63396453857422, -25.151689529418945, -24.669414520263672, -24.1871395111084, -23.704864501953125, -23.22258949279785, -22.740314483642578, -22.258041381835938, -21.775766372680664, -21.29349136352539, -20.811216354370117, -20.328941345214844, -19.84666633605957, -19.364391326904297, -18.882116317749023, -18.39984130859375, -17.917566299438477, -17.435291290283203, -16.95301628112793, -16.470741271972656, -15.988466262817383, -15.50619125366211, -15.023917198181152, -14.541641235351562, -14.059366226196289, -13.577091217041016, -13.094816207885742, -12.612541198730469, -12.130266189575195, -11.647991180419922, -11.165717124938965, -10.683442115783691, -10.201167106628418, -9.718892097473145, -9.236617088317871, -8.754342079162598, -8.27206802368164, -7.789792537689209, -7.307518005371094, -6.825242519378662, -6.342967510223389, -5.860692501068115, -5.37841796875, -4.896142959594727, -4.413867950439453, -3.9315929412841797, -3.4493181705474854, -2.967043399810791, -2.4847683906555176, -2.0024936199188232, -1.5202186107635498, -1.037943720817566, -0.555668830871582, -0.0733938217163086, 0.40888094902038574, 0.8911560773849487]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 6.0, 7.0, 5.0, 11.0, 7.0, 10.0, 14.0, 21.0, 17.0, 25.0, 25.0, 36.0, 36.0, 30.0, 40.0, 39.0, 41.0, 44.0, 37.0, 41.0, 50.0, 39.0, 46.0, 46.0, 46.0, 31.0, 37.0, 33.0, 23.0, 24.0, 29.0, 20.0, 21.0, 14.0, 10.0, 11.0, 11.0, 11.0, 5.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4293893575668335, -1.3908299207687378, -1.352270483970642, -1.3137109279632568, -1.2751514911651611, -1.2365920543670654, -1.1980326175689697, -1.159473180770874, -1.1209137439727783, -1.0823543071746826, -1.043794870376587, -1.0052353143692017, -0.966675877571106, -0.9281164407730103, -0.8895570039749146, -0.8509975671768188, -0.8124380111694336, -0.7738785743713379, -0.7353190779685974, -0.6967596411705017, -0.6582001447677612, -0.6196407079696655, -0.5810812711715698, -0.5425218343734741, -0.5039623379707336, -0.46540287137031555, -0.42684340476989746, -0.38828396797180176, -0.34972450137138367, -0.3111650347709656, -0.2726055979728699, -0.23404613137245178, -0.19548654556274414, -0.15692707896232605, -0.11836762726306915, -0.07980816811323166, -0.041248708963394165, -0.0026892423629760742, 0.03587020933628082, 0.07442966103553772, 0.11298912763595581, 0.1515485942363739, 0.1901080459356308, 0.2286674976348877, 0.2672269642353058, 0.3057864308357239, 0.3443458676338196, 0.38290533423423767, 0.42146480083465576, 0.46002426743507385, 0.49858373403549194, 0.5371431708335876, 0.5757026672363281, 0.6142621040344238, 0.6528215408325195, 0.6913809776306152, 0.7299404740333557, 0.7684999108314514, 0.8070594072341919, 0.8456188440322876, 0.8841782808303833, 0.9227377772331238, 0.9612972140312195, 0.99985671043396, 1.0384161472320557]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 7.0, 8.0, 2.0, 14.0, 18.0, 15.0, 31.0, 44.0, 53.0, 70.0, 125.0, 169.0, 278.0, 473.0, 806.0, 1541.0, 3621.0, 9158.0, 34100.0, 319470.0, 2851335.0, 884202.0, 66267.0, 13480.0, 4625.0, 2045.0, 972.0, 499.0, 306.0, 183.0, 112.0, 73.0, 42.0, 49.0, 22.0, 16.0, 16.0, 16.0, 3.0, 4.0, 5.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.1962890625, -1.1617889404296875, -1.127288818359375, -1.0927886962890625, -1.05828857421875, -1.0237884521484375, -0.989288330078125, -0.9547882080078125, -0.9202880859375, -0.8857879638671875, -0.851287841796875, -0.8167877197265625, -0.78228759765625, -0.7477874755859375, -0.713287353515625, -0.6787872314453125, -0.644287109375, -0.6097869873046875, -0.575286865234375, -0.5407867431640625, -0.50628662109375, -0.4717864990234375, -0.437286376953125, -0.4027862548828125, -0.3682861328125, -0.3337860107421875, -0.299285888671875, -0.2647857666015625, -0.23028564453125, -0.1957855224609375, -0.161285400390625, -0.1267852783203125, -0.09228515625, -0.0577850341796875, -0.023284912109375, 0.0112152099609375, 0.04571533203125, 0.0802154541015625, 0.114715576171875, 0.1492156982421875, 0.1837158203125, 0.2182159423828125, 0.252716064453125, 0.2872161865234375, 0.32171630859375, 0.3562164306640625, 0.390716552734375, 0.4252166748046875, 0.459716796875, 0.4942169189453125, 0.528717041015625, 0.5632171630859375, 0.59771728515625, 0.6322174072265625, 0.666717529296875, 0.7012176513671875, 0.7357177734375, 0.7702178955078125, 0.804718017578125, 0.8392181396484375, 0.87371826171875, 0.9082183837890625, 0.942718505859375, 0.9772186279296875, 1.01171875]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 3.0, 5.0, 4.0, 5.0, 14.0, 12.0, 16.0, 12.0, 23.0, 15.0, 26.0, 40.0, 45.0, 37.0, 41.0, 40.0, 50.0, 62.0, 71.0, 58.0, 39.0, 57.0, 62.0, 42.0, 31.0, 38.0, 35.0, 26.0, 22.0, 21.0, 9.0, 15.0, 6.0, 7.0, 2.0, 1.0, 0.0, 3.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.55712890625, -0.539581298828125, -0.52203369140625, -0.504486083984375, -0.4869384765625, -0.469390869140625, -0.45184326171875, -0.434295654296875, -0.416748046875, -0.399200439453125, -0.38165283203125, -0.364105224609375, -0.3465576171875, -0.329010009765625, -0.31146240234375, -0.293914794921875, -0.2763671875, -0.258819580078125, -0.24127197265625, -0.223724365234375, -0.2061767578125, -0.188629150390625, -0.17108154296875, -0.153533935546875, -0.135986328125, -0.118438720703125, -0.10089111328125, -0.083343505859375, -0.0657958984375, -0.048248291015625, -0.03070068359375, -0.013153076171875, 0.00439453125, 0.021942138671875, 0.03948974609375, 0.057037353515625, 0.0745849609375, 0.092132568359375, 0.10968017578125, 0.127227783203125, 0.144775390625, 0.162322998046875, 0.17987060546875, 0.197418212890625, 0.2149658203125, 0.232513427734375, 0.25006103515625, 0.267608642578125, 0.28515625, 0.302703857421875, 0.32025146484375, 0.337799072265625, 0.3553466796875, 0.372894287109375, 0.39044189453125, 0.407989501953125, 0.425537109375, 0.443084716796875, 0.46063232421875, 0.478179931640625, 0.4957275390625, 0.513275146484375, 0.53082275390625, 0.548370361328125, 0.56591796875]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 10.0, 14.0, 14.0, 45.0, 67.0, 142.0, 369.0, 1081.0, 12186.0, 4016352.0, 159832.0, 3046.0, 666.0, 217.0, 112.0, 58.0, 27.0, 26.0, 4.0, 5.0, 5.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.529296875, -3.418182373046875, -3.30706787109375, -3.195953369140625, -3.0848388671875, -2.973724365234375, -2.86260986328125, -2.751495361328125, -2.640380859375, -2.529266357421875, -2.41815185546875, -2.307037353515625, -2.1959228515625, -2.084808349609375, -1.97369384765625, -1.862579345703125, -1.75146484375, -1.640350341796875, -1.52923583984375, -1.418121337890625, -1.3070068359375, -1.195892333984375, -1.08477783203125, -0.973663330078125, -0.862548828125, -0.751434326171875, -0.64031982421875, -0.529205322265625, -0.4180908203125, -0.306976318359375, -0.19586181640625, -0.084747314453125, 0.0263671875, 0.137481689453125, 0.24859619140625, 0.359710693359375, 0.4708251953125, 0.581939697265625, 0.69305419921875, 0.804168701171875, 0.915283203125, 1.026397705078125, 1.13751220703125, 1.248626708984375, 1.3597412109375, 1.470855712890625, 1.58197021484375, 1.693084716796875, 1.80419921875, 1.915313720703125, 2.02642822265625, 2.137542724609375, 2.2486572265625, 2.359771728515625, 2.47088623046875, 2.582000732421875, 2.693115234375, 2.804229736328125, 2.91534423828125, 3.026458740234375, 3.1375732421875, 3.248687744140625, 3.35980224609375, 3.470916748046875, 3.58203125]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 8.0, 7.0, 12.0, 23.0, 44.0, 86.0, 118.0, 304.0, 784.0, 1413.0, 728.0, 254.0, 136.0, 71.0, 44.0, 22.0, 9.0, 6.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58154296875, -0.564666748046875, -0.54779052734375, -0.530914306640625, -0.5140380859375, -0.497161865234375, -0.48028564453125, -0.463409423828125, -0.446533203125, -0.429656982421875, -0.41278076171875, -0.395904541015625, -0.3790283203125, -0.362152099609375, -0.34527587890625, -0.328399658203125, -0.3115234375, -0.294647216796875, -0.27777099609375, -0.260894775390625, -0.2440185546875, -0.227142333984375, -0.21026611328125, -0.193389892578125, -0.176513671875, -0.159637451171875, -0.14276123046875, -0.125885009765625, -0.1090087890625, -0.092132568359375, -0.07525634765625, -0.058380126953125, -0.04150390625, -0.024627685546875, -0.00775146484375, 0.009124755859375, 0.0260009765625, 0.042877197265625, 0.05975341796875, 0.076629638671875, 0.093505859375, 0.110382080078125, 0.12725830078125, 0.144134521484375, 0.1610107421875, 0.177886962890625, 0.19476318359375, 0.211639404296875, 0.228515625, 0.245391845703125, 0.26226806640625, 0.279144287109375, 0.2960205078125, 0.312896728515625, 0.32977294921875, 0.346649169921875, 0.363525390625, 0.380401611328125, 0.39727783203125, 0.414154052734375, 0.4310302734375, 0.447906494140625, 0.46478271484375, 0.481658935546875, 0.49853515625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 6.0, 4.0, 10.0, 10.0, 8.0, 14.0, 14.0, 15.0, 24.0, 31.0, 39.0, 43.0, 62.0, 74.0, 51.0, 87.0, 72.0, 82.0, 63.0, 50.0, 50.0, 52.0, 25.0, 29.0, 16.0, 15.0, 10.0, 8.0, 7.0, 12.0, 1.0, 2.0, 5.0, 1.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.83104407787323, -0.807985246181488, -0.7849264144897461, -0.7618675231933594, -0.7388086915016174, -0.7157498598098755, -0.6926909685134888, -0.6696321368217468, -0.6465733051300049, -0.6235144734382629, -0.600455641746521, -0.5773967504501343, -0.5543379187583923, -0.5312790870666504, -0.5082201957702637, -0.48516136407852173, -0.4621025323867798, -0.43904370069503784, -0.4159848392009735, -0.3929259777069092, -0.36986714601516724, -0.3468083143234253, -0.32374945282936096, -0.30069059133529663, -0.2776317596435547, -0.25457292795181274, -0.2315140664577484, -0.20845521986484528, -0.18539637327194214, -0.162337526679039, -0.13927868008613586, -0.11621983349323273, -0.09316104650497437, -0.07010219991207123, -0.04704335331916809, -0.023984506726264954, -0.0009256601333618164, 0.02213318645954132, 0.04519203305244446, 0.0682508796453476, 0.09130972623825073, 0.11436857283115387, 0.137427419424057, 0.16048626601696014, 0.18354511260986328, 0.20660395920276642, 0.22966280579566956, 0.2527216672897339, 0.27578049898147583, 0.2988393306732178, 0.3218981921672821, 0.34495705366134644, 0.3680158853530884, 0.3910747170448303, 0.41413357853889465, 0.437192440032959, 0.4602512717247009, 0.48331010341644287, 0.5063689947128296, 0.5294278264045715, 0.5524866580963135, 0.5755454897880554, 0.5986043214797974, 0.6216632127761841, 0.644722044467926]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 1.0, 5.0, 6.0, 5.0, 7.0, 7.0, 10.0, 14.0, 6.0, 24.0, 16.0, 20.0, 30.0, 29.0, 34.0, 25.0, 37.0, 52.0, 34.0, 34.0, 47.0, 49.0, 32.0, 42.0, 37.0, 39.0, 44.0, 39.0, 35.0, 45.0, 22.0, 26.0, 11.0, 18.0, 18.0, 22.0, 20.0, 18.0, 10.0, 5.0, 8.0, 2.0, 7.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.4986001253128052, -0.4820749759674072, -0.4655498266220093, -0.4490247070789337, -0.43249955773353577, -0.4159744083881378, -0.39944928884506226, -0.3829241394996643, -0.36639899015426636, -0.3498738408088684, -0.33334869146347046, -0.3168235719203949, -0.30029842257499695, -0.283773273229599, -0.26724815368652344, -0.2507230043411255, -0.23419785499572754, -0.2176727056503296, -0.20114757120609283, -0.18462243676185608, -0.16809728741645813, -0.15157213807106018, -0.13504700362682343, -0.11852186173200607, -0.10199671983718872, -0.08547157794237137, -0.06894643604755402, -0.052421294152736664, -0.03589615225791931, -0.01937101036310196, -0.002845868468284607, 0.013679273426532745, 0.030204355716705322, 0.046729497611522675, 0.06325463950634003, 0.07977978140115738, 0.09630492329597473, 0.11283006519079208, 0.12935520708560944, 0.1458803415298462, 0.16240549087524414, 0.1789306402206421, 0.19545577466487885, 0.2119809091091156, 0.22850605845451355, 0.2450312077999115, 0.26155632734298706, 0.278081476688385, 0.29460662603378296, 0.3111317753791809, 0.32765692472457886, 0.3441820442676544, 0.36070719361305237, 0.3772323429584503, 0.3937574625015259, 0.41028261184692383, 0.4268077611923218, 0.4433329105377197, 0.4598580598831177, 0.47638317942619324, 0.4929083287715912, 0.5094334483146667, 0.5259585976600647, 0.5424837470054626, 0.5590088963508606]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 4.0, 7.0, 5.0, 3.0, 8.0, 19.0, 26.0, 49.0, 76.0, 126.0, 240.0, 448.0, 840.0, 1742.0, 3667.0, 8376.0, 22438.0, 72684.0, 356065.0, 447374.0, 90220.0, 26176.0, 9751.0, 4200.0, 1932.0, 977.0, 481.0, 268.0, 148.0, 78.0, 46.0, 19.0, 18.0, 15.0, 12.0, 7.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3896484375, -0.37786865234375, -0.3660888671875, -0.35430908203125, -0.342529296875, -0.33074951171875, -0.3189697265625, -0.30718994140625, -0.29541015625, -0.28363037109375, -0.2718505859375, -0.26007080078125, -0.248291015625, -0.23651123046875, -0.2247314453125, -0.21295166015625, -0.201171875, -0.18939208984375, -0.1776123046875, -0.16583251953125, -0.154052734375, -0.14227294921875, -0.1304931640625, -0.11871337890625, -0.10693359375, -0.09515380859375, -0.0833740234375, -0.07159423828125, -0.059814453125, -0.04803466796875, -0.0362548828125, -0.02447509765625, -0.0126953125, -0.00091552734375, 0.0108642578125, 0.02264404296875, 0.034423828125, 0.04620361328125, 0.0579833984375, 0.06976318359375, 0.08154296875, 0.09332275390625, 0.1051025390625, 0.11688232421875, 0.128662109375, 0.14044189453125, 0.1522216796875, 0.16400146484375, 0.17578125, 0.18756103515625, 0.1993408203125, 0.21112060546875, 0.222900390625, 0.23468017578125, 0.2464599609375, 0.25823974609375, 0.27001953125, 0.28179931640625, 0.2935791015625, 0.30535888671875, 0.317138671875, 0.32891845703125, 0.3406982421875, 0.35247802734375, 0.3642578125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 7.0, 2.0, 3.0, 5.0, 5.0, 5.0, 5.0, 10.0, 10.0, 12.0, 15.0, 22.0, 21.0, 26.0, 37.0, 44.0, 35.0, 37.0, 48.0, 42.0, 50.0, 48.0, 61.0, 52.0, 39.0, 45.0, 31.0, 46.0, 38.0, 28.0, 34.0, 19.0, 26.0, 11.0, 23.0, 18.0, 8.0, 9.0, 11.0, 5.0, 0.0, 4.0, 5.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.333740234375, -0.32274627685546875, -0.3117523193359375, -0.30075836181640625, -0.289764404296875, -0.27877044677734375, -0.2677764892578125, -0.25678253173828125, -0.24578857421875, -0.23479461669921875, -0.2238006591796875, -0.21280670166015625, -0.201812744140625, -0.19081878662109375, -0.1798248291015625, -0.16883087158203125, -0.1578369140625, -0.14684295654296875, -0.1358489990234375, -0.12485504150390625, -0.113861083984375, -0.10286712646484375, -0.0918731689453125, -0.08087921142578125, -0.06988525390625, -0.05889129638671875, -0.0478973388671875, -0.03690338134765625, -0.025909423828125, -0.01491546630859375, -0.0039215087890625, 0.00707244873046875, 0.01806640625, 0.02906036376953125, 0.0400543212890625, 0.05104827880859375, 0.062042236328125, 0.07303619384765625, 0.0840301513671875, 0.09502410888671875, 0.10601806640625, 0.11701202392578125, 0.1280059814453125, 0.13899993896484375, 0.149993896484375, 0.16098785400390625, 0.1719818115234375, 0.18297576904296875, 0.1939697265625, 0.20496368408203125, 0.2159576416015625, 0.22695159912109375, 0.237945556640625, 0.24893951416015625, 0.2599334716796875, 0.27092742919921875, 0.28192138671875, 0.29291534423828125, 0.3039093017578125, 0.31490325927734375, 0.325897216796875, 0.33689117431640625, 0.3478851318359375, 0.35887908935546875, 0.369873046875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 4.0, 4.0, 9.0, 11.0, 11.0, 11.0, 15.0, 32.0, 38.0, 59.0, 99.0, 166.0, 257.0, 404.0, 681.0, 1244.0, 2378.0, 4857.0, 10812.0, 27035.0, 80949.0, 326876.0, 423965.0, 108995.0, 34196.0, 13085.0, 5941.0, 2887.0, 1497.0, 792.0, 463.0, 283.0, 169.0, 116.0, 60.0, 49.0, 34.0, 26.0, 16.0, 16.0, 8.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.229736328125, -0.2223529815673828, -0.21496963500976562, -0.20758628845214844, -0.20020294189453125, -0.19281959533691406, -0.18543624877929688, -0.1780529022216797, -0.1706695556640625, -0.1632862091064453, -0.15590286254882812, -0.14851951599121094, -0.14113616943359375, -0.13375282287597656, -0.12636947631835938, -0.11898612976074219, -0.111602783203125, -0.10421943664550781, -0.09683609008789062, -0.08945274353027344, -0.08206939697265625, -0.07468605041503906, -0.06730270385742188, -0.05991935729980469, -0.0525360107421875, -0.04515266418457031, -0.037769317626953125, -0.030385971069335938, -0.02300262451171875, -0.015619277954101562, -0.008235931396484375, -0.0008525848388671875, 0.00653076171875, 0.013914108276367188, 0.021297454833984375, 0.028680801391601562, 0.03606414794921875, 0.04344749450683594, 0.050830841064453125, 0.05821418762207031, 0.0655975341796875, 0.07298088073730469, 0.08036422729492188, 0.08774757385253906, 0.09513092041015625, 0.10251426696777344, 0.10989761352539062, 0.11728096008300781, 0.124664306640625, 0.1320476531982422, 0.13943099975585938, 0.14681434631347656, 0.15419769287109375, 0.16158103942871094, 0.16896438598632812, 0.1763477325439453, 0.1837310791015625, 0.1911144256591797, 0.19849777221679688, 0.20588111877441406, 0.21326446533203125, 0.22064781188964844, 0.22803115844726562, 0.2354145050048828, 0.2427978515625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 4.0, 4.0, 0.0, 2.0, 4.0, 4.0, 3.0, 4.0, 7.0, 14.0, 8.0, 17.0, 14.0, 22.0, 27.0, 22.0, 48.0, 40.0, 38.0, 44.0, 46.0, 51.0, 49.0, 44.0, 44.0, 60.0, 50.0, 57.0, 47.0, 40.0, 42.0, 24.0, 26.0, 19.0, 23.0, 21.0, 8.0, 8.0, 6.0, 8.0, 6.0, 4.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59228515625, -0.5702362060546875, -0.548187255859375, -0.5261383056640625, -0.50408935546875, -0.4820404052734375, -0.459991455078125, -0.4379425048828125, -0.4158935546875, -0.3938446044921875, -0.371795654296875, -0.3497467041015625, -0.32769775390625, -0.3056488037109375, -0.283599853515625, -0.2615509033203125, -0.239501953125, -0.2174530029296875, -0.195404052734375, -0.1733551025390625, -0.15130615234375, -0.1292572021484375, -0.107208251953125, -0.0851593017578125, -0.0631103515625, -0.0410614013671875, -0.019012451171875, 0.0030364990234375, 0.02508544921875, 0.0471343994140625, 0.069183349609375, 0.0912322998046875, 0.11328125, 0.1353302001953125, 0.157379150390625, 0.1794281005859375, 0.20147705078125, 0.2235260009765625, 0.245574951171875, 0.2676239013671875, 0.2896728515625, 0.3117218017578125, 0.333770751953125, 0.3558197021484375, 0.37786865234375, 0.3999176025390625, 0.421966552734375, 0.4440155029296875, 0.466064453125, 0.4881134033203125, 0.510162353515625, 0.5322113037109375, 0.55426025390625, 0.5763092041015625, 0.598358154296875, 0.6204071044921875, 0.6424560546875, 0.6645050048828125, 0.686553955078125, 0.7086029052734375, 0.73065185546875, 0.7527008056640625, 0.774749755859375, 0.7967987060546875, 0.81884765625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 2.0, 5.0, 11.0, 7.0, 11.0, 13.0, 14.0, 19.0, 32.0, 46.0, 49.0, 77.0, 119.0, 210.0, 304.0, 479.0, 723.0, 1260.0, 2189.0, 4131.0, 7877.0, 17466.0, 49685.0, 242886.0, 546789.0, 117656.0, 30648.0, 12306.0, 5767.0, 3140.0, 1765.0, 935.0, 664.0, 390.0, 255.0, 171.0, 120.0, 84.0, 60.0, 59.0, 31.0, 21.0, 21.0, 10.0, 10.0, 12.0, 10.0, 4.0, 5.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.082275390625, -0.0798044204711914, -0.07733345031738281, -0.07486248016357422, -0.07239151000976562, -0.06992053985595703, -0.06744956970214844, -0.06497859954833984, -0.06250762939453125, -0.060036659240722656, -0.05756568908691406, -0.05509471893310547, -0.052623748779296875, -0.05015277862548828, -0.04768180847167969, -0.045210838317871094, -0.0427398681640625, -0.040268898010253906, -0.03779792785644531, -0.03532695770263672, -0.032855987548828125, -0.03038501739501953, -0.027914047241210938, -0.025443077087402344, -0.02297210693359375, -0.020501136779785156, -0.018030166625976562, -0.015559196472167969, -0.013088226318359375, -0.010617256164550781, -0.008146286010742188, -0.005675315856933594, -0.003204345703125, -0.0007333755493164062, 0.0017375946044921875, 0.004208564758300781, 0.006679534912109375, 0.009150505065917969, 0.011621475219726562, 0.014092445373535156, 0.01656341552734375, 0.019034385681152344, 0.021505355834960938, 0.02397632598876953, 0.026447296142578125, 0.02891826629638672, 0.03138923645019531, 0.033860206604003906, 0.0363311767578125, 0.038802146911621094, 0.04127311706542969, 0.04374408721923828, 0.046215057373046875, 0.04868602752685547, 0.05115699768066406, 0.053627967834472656, 0.05609893798828125, 0.058569908142089844, 0.06104087829589844, 0.06351184844970703, 0.06598281860351562, 0.06845378875732422, 0.07092475891113281, 0.0733957290649414, 0.07586669921875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 3.0, 2.0, 5.0, 4.0, 6.0, 10.0, 10.0, 37.0, 38.0, 43.0, 97.0, 149.0, 173.0, 166.0, 80.0, 58.0, 32.0, 25.0, 11.0, 13.0, 9.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.92605972290039e-05, -6.683077663183212e-05, -6.440095603466034e-05, -6.197113543748856e-05, -5.954131484031677e-05, -5.711149424314499e-05, -5.4681673645973206e-05, -5.225185304880142e-05, -4.982203245162964e-05, -4.7392211854457855e-05, -4.496239125728607e-05, -4.253257066011429e-05, -4.0102750062942505e-05, -3.767292946577072e-05, -3.524310886859894e-05, -3.2813288271427155e-05, -3.038346767425537e-05, -2.7953647077083588e-05, -2.5523826479911804e-05, -2.309400588274002e-05, -2.0664185285568237e-05, -1.8234364688396454e-05, -1.580454409122467e-05, -1.3374723494052887e-05, -1.0944902896881104e-05, -8.51508229970932e-06, -6.085261702537537e-06, -3.655441105365753e-06, -1.2256205081939697e-06, 1.2042000889778137e-06, 3.634020686149597e-06, 6.063841283321381e-06, 8.493661880493164e-06, 1.0923482477664948e-05, 1.3353303074836731e-05, 1.5783123672008514e-05, 1.8212944269180298e-05, 2.064276486635208e-05, 2.3072585463523865e-05, 2.5502406060695648e-05, 2.793222665786743e-05, 3.0362047255039215e-05, 3.2791867852211e-05, 3.522168844938278e-05, 3.7651509046554565e-05, 4.008132964372635e-05, 4.251115024089813e-05, 4.4940970838069916e-05, 4.73707914352417e-05, 4.980061203241348e-05, 5.2230432629585266e-05, 5.466025322675705e-05, 5.709007382392883e-05, 5.9519894421100616e-05, 6.19497150182724e-05, 6.437953561544418e-05, 6.680935621261597e-05, 6.923917680978775e-05, 7.166899740695953e-05, 7.409881800413132e-05, 7.65286386013031e-05, 7.895845919847488e-05, 8.138827979564667e-05, 8.381810039281845e-05, 8.624792098999023e-05]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 4.0, 2.0, 5.0, 7.0, 9.0, 14.0, 21.0, 31.0, 36.0, 61.0, 73.0, 125.0, 203.0, 313.0, 460.0, 700.0, 1174.0, 2010.0, 3703.0, 7175.0, 17370.0, 54141.0, 286383.0, 524272.0, 101385.0, 27131.0, 10453.0, 4843.0, 2536.0, 1431.0, 863.0, 584.0, 378.0, 187.0, 125.0, 115.0, 78.0, 43.0, 38.0, 26.0, 12.0, 13.0, 8.0, 4.0, 4.0, 3.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.079833984375, -0.07727622985839844, -0.07471847534179688, -0.07216072082519531, -0.06960296630859375, -0.06704521179199219, -0.06448745727539062, -0.06192970275878906, -0.0593719482421875, -0.05681419372558594, -0.054256439208984375, -0.05169868469238281, -0.04914093017578125, -0.04658317565917969, -0.044025421142578125, -0.04146766662597656, -0.038909912109375, -0.03635215759277344, -0.033794403076171875, -0.031236648559570312, -0.02867889404296875, -0.026121139526367188, -0.023563385009765625, -0.021005630493164062, -0.0184478759765625, -0.015890121459960938, -0.013332366943359375, -0.010774612426757812, -0.00821685791015625, -0.0056591033935546875, -0.003101348876953125, -0.0005435943603515625, 0.00201416015625, 0.0045719146728515625, 0.007129669189453125, 0.009687423706054688, 0.01224517822265625, 0.014802932739257812, 0.017360687255859375, 0.019918441772460938, 0.0224761962890625, 0.025033950805664062, 0.027591705322265625, 0.030149459838867188, 0.03270721435546875, 0.03526496887207031, 0.037822723388671875, 0.04038047790527344, 0.042938232421875, 0.04549598693847656, 0.048053741455078125, 0.05061149597167969, 0.05316925048828125, 0.05572700500488281, 0.058284759521484375, 0.06084251403808594, 0.0634002685546875, 0.06595802307128906, 0.06851577758789062, 0.07107353210449219, 0.07363128662109375, 0.07618904113769531, 0.07874679565429688, 0.08130455017089844, 0.0838623046875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 3.0, 6.0, 1.0, 2.0, 5.0, 3.0, 10.0, 10.0, 13.0, 15.0, 25.0, 32.0, 47.0, 70.0, 92.0, 87.0, 124.0, 103.0, 98.0, 60.0, 49.0, 32.0, 27.0, 19.0, 13.0, 10.0, 11.0, 7.0, 5.0, 1.0, 3.0, 3.0, 7.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.020782470703125, -0.02012157440185547, -0.019460678100585938, -0.018799781799316406, -0.018138885498046875, -0.017477989196777344, -0.016817092895507812, -0.01615619659423828, -0.01549530029296875, -0.014834403991699219, -0.014173507690429688, -0.013512611389160156, -0.012851715087890625, -0.012190818786621094, -0.011529922485351562, -0.010869026184082031, -0.0102081298828125, -0.009547233581542969, -0.008886337280273438, -0.008225440979003906, -0.007564544677734375, -0.006903648376464844, -0.0062427520751953125, -0.005581855773925781, -0.00492095947265625, -0.004260063171386719, -0.0035991668701171875, -0.0029382705688476562, -0.002277374267578125, -0.0016164779663085938, -0.0009555816650390625, -0.00029468536376953125, 0.0003662109375, 0.0010271072387695312, 0.0016880035400390625, 0.0023488998413085938, 0.003009796142578125, 0.0036706924438476562, 0.0043315887451171875, 0.004992485046386719, 0.00565338134765625, 0.006314277648925781, 0.0069751739501953125, 0.007636070251464844, 0.008296966552734375, 0.008957862854003906, 0.009618759155273438, 0.010279655456542969, 0.0109405517578125, 0.011601448059082031, 0.012262344360351562, 0.012923240661621094, 0.013584136962890625, 0.014245033264160156, 0.014905929565429688, 0.015566825866699219, 0.01622772216796875, 0.01688861846923828, 0.017549514770507812, 0.018210411071777344, 0.018871307373046875, 0.019532203674316406, 0.020193099975585938, 0.02085399627685547, 0.021514892578125]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 8.0, 21.0, 19.0, 37.0, 70.0, 129.0, 178.0, 202.0, 148.0, 87.0, 34.0, 37.0, 7.0, 12.0, 5.0, 4.0, 3.0, 2.0, 0.0, 2.0], "bins": [-1.5704151391983032, -1.5396970510482788, -1.5089788436889648, -1.4782607555389404, -1.4475425481796265, -1.416824460029602, -1.386106252670288, -1.3553881645202637, -1.3246699571609497, -1.2939518690109253, -1.2632336616516113, -1.232515573501587, -1.201797366142273, -1.1710792779922485, -1.1403610706329346, -1.1096429824829102, -1.0789248943328857, -1.0482068061828613, -1.0174885988235474, -0.9867704510688782, -0.956052303314209, -0.9253341555595398, -0.8946160078048706, -0.8638979196548462, -0.8331797122955322, -0.802461564540863, -0.7717434167861938, -0.7410252690315247, -0.7103071212768555, -0.6795889735221863, -0.6488708257675171, -0.6181527376174927, -0.5874344706535339, -0.5567163228988647, -0.5259981751441956, -0.49528002738952637, -0.4645618796348572, -0.433843731880188, -0.4031256139278412, -0.372407466173172, -0.3416893184185028, -0.3109711706638336, -0.28025302290916443, -0.24953489005565643, -0.21881674230098724, -0.18809859454631805, -0.15738046169281006, -0.12666231393814087, -0.09594416618347168, -0.06522601842880249, -0.0345078781247139, -0.003789737820625305, 0.026928409934043884, 0.057646557688713074, 0.08836469054222107, 0.11908283829689026, 0.14980098605155945, 0.18051913380622864, 0.21123728156089783, 0.24195541441440582, 0.2726735472679138, 0.303391695022583, 0.3341098427772522, 0.3648279905319214, 0.3955461382865906]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 0.0, 7.0, 8.0, 7.0, 9.0, 10.0, 11.0, 14.0, 29.0, 37.0, 35.0, 55.0, 49.0, 64.0, 61.0, 68.0, 68.0, 63.0, 66.0, 51.0, 52.0, 67.0, 36.0, 25.0, 30.0, 28.0, 19.0, 15.0, 6.0, 7.0, 3.0, 3.0, 2.0, 5.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3037736415863037, -0.2891065776348114, -0.2744395136833191, -0.25977247953414917, -0.24510540068149567, -0.23043835163116455, -0.21577128767967224, -0.20110422372817993, -0.18643715977668762, -0.1717700958251953, -0.1571030467748642, -0.1424359828233719, -0.12776891887187958, -0.11310186237096786, -0.09843480587005615, -0.08376774191856384, -0.06910069286823273, -0.054433632642030716, -0.039766572415828705, -0.025099515914916992, -0.010432455688714981, 0.00423460453748703, 0.018901661038398743, 0.03356872498989105, 0.048235781490802765, 0.06290283799171448, 0.07756990194320679, 0.0922369584441185, 0.10690401494503021, 0.12157107889652252, 0.13623812794685364, 0.15090519189834595, 0.16557225584983826, 0.18023931980133057, 0.19490636885166168, 0.209573432803154, 0.2242404967546463, 0.23890754580497742, 0.2535746097564697, 0.26824167370796204, 0.28290873765945435, 0.29757580161094666, 0.31224286556243896, 0.3269098997116089, 0.3415769636631012, 0.3562440276145935, 0.3709110915660858, 0.3855781555175781, 0.40024518966674805, 0.41491225361824036, 0.42957931756973267, 0.4442463517189026, 0.4589134156703949, 0.4735804796218872, 0.4882475435733795, 0.5029146075248718, 0.5175817012786865, 0.5322487354278564, 0.5469158291816711, 0.5615828633308411, 0.5762499570846558, 0.5909169912338257, 0.6055840253829956, 0.6202511191368103, 0.6349181532859802]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 8.0, 10.0, 22.0, 29.0, 44.0, 89.0, 193.0, 412.0, 744.0, 1823.0, 4231.0, 11604.0, 35419.0, 133798.0, 529750.0, 244669.0, 57609.0, 17366.0, 6205.0, 2474.0, 1098.0, 464.0, 244.0, 106.0, 61.0, 29.0, 28.0, 11.0, 5.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.460693359375, -0.4451789855957031, -0.42966461181640625, -0.4141502380371094, -0.3986358642578125, -0.3831214904785156, -0.36760711669921875, -0.3520927429199219, -0.336578369140625, -0.3210639953613281, -0.30554962158203125, -0.2900352478027344, -0.2745208740234375, -0.2590065002441406, -0.24349212646484375, -0.22797775268554688, -0.21246337890625, -0.19694900512695312, -0.18143463134765625, -0.16592025756835938, -0.1504058837890625, -0.13489151000976562, -0.11937713623046875, -0.10386276245117188, -0.088348388671875, -0.07283401489257812, -0.05731964111328125, -0.041805267333984375, -0.0262908935546875, -0.010776519775390625, 0.00473785400390625, 0.020252227783203125, 0.0357666015625, 0.051280975341796875, 0.06679534912109375, 0.08230972290039062, 0.0978240966796875, 0.11333847045898438, 0.12885284423828125, 0.14436721801757812, 0.159881591796875, 0.17539596557617188, 0.19091033935546875, 0.20642471313476562, 0.2219390869140625, 0.23745346069335938, 0.25296783447265625, 0.2684822082519531, 0.28399658203125, 0.2995109558105469, 0.31502532958984375, 0.3305397033691406, 0.3460540771484375, 0.3615684509277344, 0.37708282470703125, 0.3925971984863281, 0.408111572265625, 0.4236259460449219, 0.43914031982421875, 0.4546546936035156, 0.4701690673828125, 0.4856834411621094, 0.5011978149414062, 0.5167121887207031, 0.5322265625]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 5.0, 7.0, 5.0, 9.0, 12.0, 15.0, 11.0, 18.0, 24.0, 39.0, 32.0, 50.0, 52.0, 61.0, 75.0, 53.0, 65.0, 74.0, 56.0, 50.0, 45.0, 37.0, 37.0, 36.0, 29.0, 21.0, 27.0, 19.0, 15.0, 5.0, 5.0, 5.0, 6.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6396484375, -0.6125640869140625, -0.585479736328125, -0.5583953857421875, -0.53131103515625, -0.5042266845703125, -0.477142333984375, -0.4500579833984375, -0.4229736328125, -0.3958892822265625, -0.368804931640625, -0.3417205810546875, -0.31463623046875, -0.2875518798828125, -0.260467529296875, -0.2333831787109375, -0.206298828125, -0.1792144775390625, -0.152130126953125, -0.1250457763671875, -0.09796142578125, -0.0708770751953125, -0.043792724609375, -0.0167083740234375, 0.0103759765625, 0.0374603271484375, 0.064544677734375, 0.0916290283203125, 0.11871337890625, 0.1457977294921875, 0.172882080078125, 0.1999664306640625, 0.22705078125, 0.2541351318359375, 0.281219482421875, 0.3083038330078125, 0.33538818359375, 0.3624725341796875, 0.389556884765625, 0.4166412353515625, 0.4437255859375, 0.4708099365234375, 0.497894287109375, 0.5249786376953125, 0.55206298828125, 0.5791473388671875, 0.606231689453125, 0.6333160400390625, 0.660400390625, 0.6874847412109375, 0.714569091796875, 0.7416534423828125, 0.76873779296875, 0.7958221435546875, 0.822906494140625, 0.8499908447265625, 0.8770751953125, 0.9041595458984375, 0.931243896484375, 0.9583282470703125, 0.98541259765625, 1.0124969482421875, 1.039581298828125, 1.0666656494140625, 1.09375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 3.0, 3.0, 8.0, 7.0, 11.0, 18.0, 7.0, 16.0, 15.0, 16.0, 17.0, 16.0, 26.0, 20.0, 34.0, 37.0, 66.0, 85.0, 170.0, 528.0, 5001.0, 938560.0, 101560.0, 1612.0, 269.0, 102.0, 51.0, 56.0, 33.0, 32.0, 22.0, 29.0, 30.0, 19.0, 15.0, 11.0, 11.0, 6.0, 11.0, 5.0, 1.0, 0.0, 3.0, 3.0, 4.0, 3.0, 0.0, 4.0, 1.0, 1.0, 1.0, 3.0, 1.0], "bins": [-2.533203125, -2.45599365234375, -2.3787841796875, -2.30157470703125, -2.224365234375, -2.14715576171875, -2.0699462890625, -1.99273681640625, -1.91552734375, -1.83831787109375, -1.7611083984375, -1.68389892578125, -1.606689453125, -1.52947998046875, -1.4522705078125, -1.37506103515625, -1.2978515625, -1.22064208984375, -1.1434326171875, -1.06622314453125, -0.989013671875, -0.91180419921875, -0.8345947265625, -0.75738525390625, -0.68017578125, -0.60296630859375, -0.5257568359375, -0.44854736328125, -0.371337890625, -0.29412841796875, -0.2169189453125, -0.13970947265625, -0.0625, 0.01470947265625, 0.0919189453125, 0.16912841796875, 0.246337890625, 0.32354736328125, 0.4007568359375, 0.47796630859375, 0.55517578125, 0.63238525390625, 0.7095947265625, 0.78680419921875, 0.864013671875, 0.94122314453125, 1.0184326171875, 1.09564208984375, 1.1728515625, 1.25006103515625, 1.3272705078125, 1.40447998046875, 1.481689453125, 1.55889892578125, 1.6361083984375, 1.71331787109375, 1.79052734375, 1.86773681640625, 1.9449462890625, 2.02215576171875, 2.099365234375, 2.17657470703125, 2.2537841796875, 2.33099365234375, 2.408203125]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 0.0, 4.0, 4.0, 5.0, 3.0, 9.0, 8.0, 12.0, 13.0, 6.0, 26.0, 15.0, 12.0, 14.0, 28.0, 36.0, 30.0, 31.0, 31.0, 35.0, 37.0, 44.0, 50.0, 42.0, 44.0, 41.0, 49.0, 33.0, 40.0, 32.0, 26.0, 29.0, 21.0, 31.0, 25.0, 28.0, 28.0, 17.0, 9.0, 9.0, 9.0, 10.0, 7.0, 4.0, 4.0, 1.0, 3.0, 6.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.62548828125, -0.6050796508789062, -0.5846710205078125, -0.5642623901367188, -0.543853759765625, -0.5234451293945312, -0.5030364990234375, -0.48262786865234375, -0.46221923828125, -0.44181060791015625, -0.4214019775390625, -0.40099334716796875, -0.380584716796875, -0.36017608642578125, -0.3397674560546875, -0.31935882568359375, -0.2989501953125, -0.27854156494140625, -0.2581329345703125, -0.23772430419921875, -0.217315673828125, -0.19690704345703125, -0.1764984130859375, -0.15608978271484375, -0.13568115234375, -0.11527252197265625, -0.0948638916015625, -0.07445526123046875, -0.054046630859375, -0.03363800048828125, -0.0132293701171875, 0.00717926025390625, 0.027587890625, 0.04799652099609375, 0.0684051513671875, 0.08881378173828125, 0.109222412109375, 0.12963104248046875, 0.1500396728515625, 0.17044830322265625, 0.19085693359375, 0.21126556396484375, 0.2316741943359375, 0.25208282470703125, 0.272491455078125, 0.29290008544921875, 0.3133087158203125, 0.33371734619140625, 0.3541259765625, 0.37453460693359375, 0.3949432373046875, 0.41535186767578125, 0.435760498046875, 0.45616912841796875, 0.4765777587890625, 0.49698638916015625, 0.51739501953125, 0.5378036499023438, 0.5582122802734375, 0.5786209106445312, 0.599029541015625, 0.6194381713867188, 0.6398468017578125, 0.6602554321289062, 0.6806640625]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 1.0, 0.0, 0.0, 4.0, 4.0, 7.0, 6.0, 11.0, 19.0, 31.0, 52.0, 142.0, 380.0, 1578.0, 10398.0, 391662.0, 629109.0, 12673.0, 1735.0, 426.0, 164.0, 70.0, 34.0, 15.0, 7.0, 10.0, 4.0, 7.0, 4.0, 4.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58447265625, -0.5662307739257812, -0.5479888916015625, -0.5297470092773438, -0.511505126953125, -0.49326324462890625, -0.4750213623046875, -0.45677947998046875, -0.43853759765625, -0.42029571533203125, -0.4020538330078125, -0.38381195068359375, -0.365570068359375, -0.34732818603515625, -0.3290863037109375, -0.31084442138671875, -0.2926025390625, -0.27436065673828125, -0.2561187744140625, -0.23787689208984375, -0.219635009765625, -0.20139312744140625, -0.1831512451171875, -0.16490936279296875, -0.14666748046875, -0.12842559814453125, -0.1101837158203125, -0.09194183349609375, -0.073699951171875, -0.05545806884765625, -0.0372161865234375, -0.01897430419921875, -0.000732421875, 0.01750946044921875, 0.0357513427734375, 0.05399322509765625, 0.072235107421875, 0.09047698974609375, 0.1087188720703125, 0.12696075439453125, 0.14520263671875, 0.16344451904296875, 0.1816864013671875, 0.19992828369140625, 0.218170166015625, 0.23641204833984375, 0.2546539306640625, 0.27289581298828125, 0.2911376953125, 0.30937957763671875, 0.3276214599609375, 0.34586334228515625, 0.364105224609375, 0.38234710693359375, 0.4005889892578125, 0.41883087158203125, 0.43707275390625, 0.45531463623046875, 0.4735565185546875, 0.49179840087890625, 0.510040283203125, 0.5282821655273438, 0.5465240478515625, 0.5647659301757812, 0.5830078125]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 2.0, 3.0, 7.0, 7.0, 12.0, 13.0, 19.0, 31.0, 57.0, 76.0, 138.0, 186.0, 133.0, 92.0, 69.0, 54.0, 38.0, 20.0, 16.0, 4.0, 5.0, 3.0, 5.0, 1.0, 4.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.364418029785156e-05, -5.222298204898834e-05, -5.080178380012512e-05, -4.93805855512619e-05, -4.795938730239868e-05, -4.653818905353546e-05, -4.511699080467224e-05, -4.369579255580902e-05, -4.22745943069458e-05, -4.085339605808258e-05, -3.943219780921936e-05, -3.801099956035614e-05, -3.658980131149292e-05, -3.51686030626297e-05, -3.374740481376648e-05, -3.232620656490326e-05, -3.090500831604004e-05, -2.948381006717682e-05, -2.80626118183136e-05, -2.664141356945038e-05, -2.5220215320587158e-05, -2.3799017071723938e-05, -2.2377818822860718e-05, -2.0956620573997498e-05, -1.9535422325134277e-05, -1.8114224076271057e-05, -1.6693025827407837e-05, -1.5271827578544617e-05, -1.3850629329681396e-05, -1.2429431080818176e-05, -1.1008232831954956e-05, -9.587034583091736e-06, -8.165836334228516e-06, -6.744638085365295e-06, -5.323439836502075e-06, -3.902241587638855e-06, -2.4810433387756348e-06, -1.0598450899124146e-06, 3.6135315895080566e-07, 1.7825514078140259e-06, 3.203749656677246e-06, 4.624947905540466e-06, 6.0461461544036865e-06, 7.467344403266907e-06, 8.888542652130127e-06, 1.0309740900993347e-05, 1.1730939149856567e-05, 1.3152137398719788e-05, 1.4573335647583008e-05, 1.5994533896446228e-05, 1.7415732145309448e-05, 1.883693039417267e-05, 2.025812864303589e-05, 2.167932689189911e-05, 2.310052514076233e-05, 2.452172338962555e-05, 2.594292163848877e-05, 2.736411988735199e-05, 2.878531813621521e-05, 3.020651638507843e-05, 3.162771463394165e-05, 3.304891288280487e-05, 3.447011113166809e-05, 3.589130938053131e-05, 3.731250762939453e-05]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 6.0, 6.0, 5.0, 8.0, 17.0, 14.0, 32.0, 36.0, 71.0, 120.0, 233.0, 472.0, 1101.0, 3132.0, 10412.0, 51576.0, 524025.0, 401830.0, 41485.0, 9141.0, 2788.0, 1077.0, 427.0, 233.0, 116.0, 52.0, 52.0, 29.0, 16.0, 9.0, 7.0, 5.0, 4.0, 7.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.225830078125, -0.21828842163085938, -0.21074676513671875, -0.20320510864257812, -0.1956634521484375, -0.18812179565429688, -0.18058013916015625, -0.17303848266601562, -0.165496826171875, -0.15795516967773438, -0.15041351318359375, -0.14287185668945312, -0.1353302001953125, -0.12778854370117188, -0.12024688720703125, -0.11270523071289062, -0.10516357421875, -0.09762191772460938, -0.09008026123046875, -0.08253860473632812, -0.0749969482421875, -0.06745529174804688, -0.05991363525390625, -0.052371978759765625, -0.044830322265625, -0.037288665771484375, -0.02974700927734375, -0.022205352783203125, -0.0146636962890625, -0.007122039794921875, 0.00041961669921875, 0.007961273193359375, 0.0155029296875, 0.023044586181640625, 0.03058624267578125, 0.038127899169921875, 0.0456695556640625, 0.053211212158203125, 0.06075286865234375, 0.06829452514648438, 0.075836181640625, 0.08337783813476562, 0.09091949462890625, 0.09846115112304688, 0.1060028076171875, 0.11354446411132812, 0.12108612060546875, 0.12862777709960938, 0.13616943359375, 0.14371109008789062, 0.15125274658203125, 0.15879440307617188, 0.1663360595703125, 0.17387771606445312, 0.18141937255859375, 0.18896102905273438, 0.196502685546875, 0.20404434204101562, 0.21158599853515625, 0.21912765502929688, 0.2266693115234375, 0.23421096801757812, 0.24175262451171875, 0.24929428100585938, 0.2568359375]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 2.0, 6.0, 4.0, 6.0, 14.0, 11.0, 19.0, 35.0, 51.0, 73.0, 92.0, 110.0, 145.0, 118.0, 101.0, 58.0, 49.0, 30.0, 21.0, 10.0, 9.0, 7.0, 4.0, 4.0, 1.0, 5.0, 5.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1195068359375, -0.11593341827392578, -0.11236000061035156, -0.10878658294677734, -0.10521316528320312, -0.1016397476196289, -0.09806632995605469, -0.09449291229248047, -0.09091949462890625, -0.08734607696533203, -0.08377265930175781, -0.0801992416381836, -0.07662582397460938, -0.07305240631103516, -0.06947898864746094, -0.06590557098388672, -0.0623321533203125, -0.05875873565673828, -0.05518531799316406, -0.051611900329589844, -0.048038482666015625, -0.044465065002441406, -0.04089164733886719, -0.03731822967529297, -0.03374481201171875, -0.03017139434814453, -0.026597976684570312, -0.023024559020996094, -0.019451141357421875, -0.015877723693847656, -0.012304306030273438, -0.008730888366699219, -0.005157470703125, -0.0015840530395507812, 0.0019893646240234375, 0.005562782287597656, 0.009136199951171875, 0.012709617614746094, 0.016283035278320312, 0.01985645294189453, 0.02342987060546875, 0.02700328826904297, 0.030576705932617188, 0.034150123596191406, 0.037723541259765625, 0.041296958923339844, 0.04487037658691406, 0.04844379425048828, 0.0520172119140625, 0.05559062957763672, 0.05916404724121094, 0.06273746490478516, 0.06631088256835938, 0.0698843002319336, 0.07345771789550781, 0.07703113555908203, 0.08060455322265625, 0.08417797088623047, 0.08775138854980469, 0.0913248062133789, 0.09489822387695312, 0.09847164154052734, 0.10204505920410156, 0.10561847686767578, 0.10919189453125]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 10.0, 16.0, 87.0, 330.0, 399.0, 131.0, 32.0, 10.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1274315118789673, -0.9687736630439758, -0.8101158142089844, -0.6514579653739929, -0.49280011653900146, -0.33414226770401, -0.17548441886901855, -0.016826510429382324, 0.14183127880096436, 0.3004891276359558, 0.45914697647094727, 0.6178048253059387, 0.7764626741409302, 0.9351205229759216, 1.093778371810913, 1.2524362802505493, 1.411094069480896, 1.5697519779205322, 1.728409767150879, 1.8870675563812256, 2.0457253456115723, 2.204383373260498, 2.3630411624908447, 2.5216989517211914, 2.680356979370117, 2.839014768600464, 2.9976725578308105, 3.1563305854797363, 3.314988374710083, 3.4736461639404297, 3.6323041915893555, 3.790961980819702, 3.9496192932128906, 4.108277320861816, 4.266934871673584, 4.42559289932251, 4.584250450134277, 4.742908477783203, 4.901566505432129, 5.060224533081055, 5.218882083892822, 5.377540111541748, 5.536197662353516, 5.694855690002441, 5.853513717651367, 6.012171268463135, 6.1708292961120605, 6.329486846923828, 6.488144874572754, 6.64680290222168, 6.805460453033447, 6.964118480682373, 7.122776031494141, 7.281434059143066, 7.440092086791992, 7.598750114440918, 7.7574076652526855, 7.916065692901611, 8.074723243713379, 8.233381271362305, 8.39203929901123, 8.550697326660156, 8.709354400634766, 8.868012428283691, 9.026670455932617]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 6.0, 5.0, 6.0, 7.0, 8.0, 10.0, 17.0, 24.0, 16.0, 25.0, 25.0, 27.0, 44.0, 44.0, 40.0, 49.0, 43.0, 45.0, 46.0, 62.0, 57.0, 61.0, 46.0, 40.0, 48.0, 40.0, 34.0, 26.0, 22.0, 15.0, 8.0, 9.0, 12.0, 9.0, 13.0, 5.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.974365234375, -0.9396013617515564, -0.9048374891281128, -0.8700736165046692, -0.8353097438812256, -0.800545871257782, -0.7657819986343384, -0.7310181260108948, -0.6962542533874512, -0.6614903807640076, -0.626726508140564, -0.5919626355171204, -0.5571987628936768, -0.5224348902702332, -0.48767101764678955, -0.45290714502334595, -0.41814327239990234, -0.38337939977645874, -0.34861552715301514, -0.31385165452957153, -0.27908778190612793, -0.24432390928268433, -0.20956003665924072, -0.17479616403579712, -0.14003229141235352, -0.10526841878890991, -0.07050454616546631, -0.035740673542022705, -0.0009768009185791016, 0.0337870717048645, 0.0685509443283081, 0.10331481695175171, 0.13807857036590576, 0.17284244298934937, 0.20760631561279297, 0.24237018823623657, 0.2771340608596802, 0.3118979334831238, 0.3466618061065674, 0.381425678730011, 0.4161895513534546, 0.4509534239768982, 0.4857172966003418, 0.5204811692237854, 0.555245041847229, 0.5900089144706726, 0.6247727870941162, 0.6595366597175598, 0.6943005323410034, 0.729064404964447, 0.7638282775878906, 0.7985921502113342, 0.8333560228347778, 0.8681198954582214, 0.902883768081665, 0.9376476407051086, 0.9724115133285522, 1.0071754455566406, 1.0419392585754395, 1.0767030715942383, 1.1114670038223267, 1.146230936050415, 1.1809947490692139, 1.2157585620880127, 1.250522494316101]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 1.0, 3.0, 8.0, 7.0, 9.0, 13.0, 21.0, 24.0, 21.0, 28.0, 28.0, 46.0, 43.0, 78.0, 107.0, 202.0, 457.0, 1279.0, 4402.0, 25744.0, 679866.0, 3316614.0, 148913.0, 11811.0, 2800.0, 883.0, 324.0, 155.0, 83.0, 69.0, 55.0, 38.0, 35.0, 25.0, 23.0, 17.0, 13.0, 8.0, 5.0, 6.0, 7.0, 3.0, 4.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3193359375, -1.277191162109375, -1.23504638671875, -1.192901611328125, -1.1507568359375, -1.108612060546875, -1.06646728515625, -1.024322509765625, -0.982177734375, -0.940032958984375, -0.89788818359375, -0.855743408203125, -0.8135986328125, -0.771453857421875, -0.72930908203125, -0.687164306640625, -0.64501953125, -0.602874755859375, -0.56072998046875, -0.518585205078125, -0.4764404296875, -0.434295654296875, -0.39215087890625, -0.350006103515625, -0.307861328125, -0.265716552734375, -0.22357177734375, -0.181427001953125, -0.1392822265625, -0.097137451171875, -0.05499267578125, -0.012847900390625, 0.029296875, 0.071441650390625, 0.11358642578125, 0.155731201171875, 0.1978759765625, 0.240020751953125, 0.28216552734375, 0.324310302734375, 0.366455078125, 0.408599853515625, 0.45074462890625, 0.492889404296875, 0.5350341796875, 0.577178955078125, 0.61932373046875, 0.661468505859375, 0.70361328125, 0.745758056640625, 0.78790283203125, 0.830047607421875, 0.8721923828125, 0.914337158203125, 0.95648193359375, 0.998626708984375, 1.040771484375, 1.082916259765625, 1.12506103515625, 1.167205810546875, 1.2093505859375, 1.251495361328125, 1.29364013671875, 1.335784912109375, 1.3779296875]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [5.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 4.0, 7.0, 6.0, 10.0, 9.0, 11.0, 12.0, 13.0, 22.0, 20.0, 23.0, 16.0, 27.0, 36.0, 42.0, 43.0, 30.0, 36.0, 45.0, 44.0, 41.0, 47.0, 51.0, 33.0, 36.0, 37.0, 47.0, 34.0, 33.0, 22.0, 31.0, 16.0, 21.0, 11.0, 12.0, 14.0, 11.0, 5.0, 4.0, 10.0, 9.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.351806640625, -0.3396186828613281, -0.32743072509765625, -0.3152427673339844, -0.3030548095703125, -0.2908668518066406, -0.27867889404296875, -0.2664909362792969, -0.254302978515625, -0.24211502075195312, -0.22992706298828125, -0.21773910522460938, -0.2055511474609375, -0.19336318969726562, -0.18117523193359375, -0.16898727416992188, -0.15679931640625, -0.14461135864257812, -0.13242340087890625, -0.12023544311523438, -0.1080474853515625, -0.09585952758789062, -0.08367156982421875, -0.07148361206054688, -0.059295654296875, -0.047107696533203125, -0.03491973876953125, -0.022731781005859375, -0.0105438232421875, 0.001644134521484375, 0.01383209228515625, 0.026020050048828125, 0.0382080078125, 0.050395965576171875, 0.06258392333984375, 0.07477188110351562, 0.0869598388671875, 0.09914779663085938, 0.11133575439453125, 0.12352371215820312, 0.135711669921875, 0.14789962768554688, 0.16008758544921875, 0.17227554321289062, 0.1844635009765625, 0.19665145874023438, 0.20883941650390625, 0.22102737426757812, 0.23321533203125, 0.24540328979492188, 0.25759124755859375, 0.2697792053222656, 0.2819671630859375, 0.2941551208496094, 0.30634307861328125, 0.3185310363769531, 0.330718994140625, 0.3429069519042969, 0.35509490966796875, 0.3672828674316406, 0.3794708251953125, 0.3916587829589844, 0.40384674072265625, 0.4160346984863281, 0.42822265625]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 2.0, 3.0, 6.0, 6.0, 6.0, 4.0, 18.0, 25.0, 34.0, 45.0, 94.0, 248.0, 529.0, 1868.0, 12356.0, 1044320.0, 3112868.0, 18441.0, 2316.0, 590.0, 242.0, 84.0, 51.0, 34.0, 22.0, 25.0, 11.0, 5.0, 9.0, 4.0, 5.0, 1.0, 7.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.248046875, -2.187408447265625, -2.12677001953125, -2.066131591796875, -2.0054931640625, -1.944854736328125, -1.88421630859375, -1.823577880859375, -1.762939453125, -1.702301025390625, -1.64166259765625, -1.581024169921875, -1.5203857421875, -1.459747314453125, -1.39910888671875, -1.338470458984375, -1.27783203125, -1.217193603515625, -1.15655517578125, -1.095916748046875, -1.0352783203125, -0.974639892578125, -0.91400146484375, -0.853363037109375, -0.792724609375, -0.732086181640625, -0.67144775390625, -0.610809326171875, -0.5501708984375, -0.489532470703125, -0.42889404296875, -0.368255615234375, -0.3076171875, -0.246978759765625, -0.18634033203125, -0.125701904296875, -0.0650634765625, -0.004425048828125, 0.05621337890625, 0.116851806640625, 0.177490234375, 0.238128662109375, 0.29876708984375, 0.359405517578125, 0.4200439453125, 0.480682373046875, 0.54132080078125, 0.601959228515625, 0.66259765625, 0.723236083984375, 0.78387451171875, 0.844512939453125, 0.9051513671875, 0.965789794921875, 1.02642822265625, 1.087066650390625, 1.147705078125, 1.208343505859375, 1.26898193359375, 1.329620361328125, 1.3902587890625, 1.450897216796875, 1.51153564453125, 1.572174072265625, 1.6328125]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 2.0, 6.0, 6.0, 5.0, 7.0, 16.0, 19.0, 18.0, 20.0, 52.0, 63.0, 118.0, 198.0, 368.0, 600.0, 824.0, 705.0, 452.0, 208.0, 140.0, 79.0, 50.0, 35.0, 31.0, 20.0, 12.0, 5.0, 5.0, 3.0, 5.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2291259765625, -0.2204914093017578, -0.21185684204101562, -0.20322227478027344, -0.19458770751953125, -0.18595314025878906, -0.17731857299804688, -0.1686840057373047, -0.1600494384765625, -0.1514148712158203, -0.14278030395507812, -0.13414573669433594, -0.12551116943359375, -0.11687660217285156, -0.10824203491210938, -0.09960746765136719, -0.090972900390625, -0.08233833312988281, -0.07370376586914062, -0.06506919860839844, -0.05643463134765625, -0.04780006408691406, -0.039165496826171875, -0.030530929565429688, -0.0218963623046875, -0.013261795043945312, -0.004627227783203125, 0.0040073394775390625, 0.01264190673828125, 0.021276473999023438, 0.029911041259765625, 0.03854560852050781, 0.04718017578125, 0.05581474304199219, 0.06444931030273438, 0.07308387756347656, 0.08171844482421875, 0.09035301208496094, 0.09898757934570312, 0.10762214660644531, 0.1162567138671875, 0.12489128112792969, 0.13352584838867188, 0.14216041564941406, 0.15079498291015625, 0.15942955017089844, 0.16806411743164062, 0.1766986846923828, 0.185333251953125, 0.1939678192138672, 0.20260238647460938, 0.21123695373535156, 0.21987152099609375, 0.22850608825683594, 0.23714065551757812, 0.2457752227783203, 0.2544097900390625, 0.2630443572998047, 0.2716789245605469, 0.28031349182128906, 0.28894805908203125, 0.29758262634277344, 0.3062171936035156, 0.3148517608642578, 0.323486328125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 4.0, 12.0, 10.0, 7.0, 16.0, 23.0, 30.0, 38.0, 40.0, 65.0, 69.0, 81.0, 87.0, 99.0, 76.0, 67.0, 67.0, 51.0, 36.0, 33.0, 24.0, 15.0, 11.0, 10.0, 13.0, 2.0, 4.0, 0.0, 1.0, 2.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.8920860886573792, -0.8672125935554504, -0.8423390984535217, -0.817465603351593, -0.7925920486450195, -0.7677185535430908, -0.7428450584411621, -0.7179715633392334, -0.6930980682373047, -0.668224573135376, -0.6433510780334473, -0.6184775829315186, -0.5936040878295898, -0.5687305331230164, -0.5438570380210876, -0.5189835429191589, -0.4941100478172302, -0.4692365527153015, -0.4443630576133728, -0.4194895327091217, -0.394616037607193, -0.3697425425052643, -0.3448690176010132, -0.3199955224990845, -0.29512202739715576, -0.27024853229522705, -0.24537502229213715, -0.22050151228904724, -0.19562801718711853, -0.17075452208518982, -0.14588101208209991, -0.12100750207901001, -0.09613394737243652, -0.07126044481992722, -0.04638694226741791, -0.0215134397149086, 0.003360062837600708, 0.028233565390110016, 0.053107067942619324, 0.07798057794570923, 0.10285407304763794, 0.12772756814956665, 0.15260107815265656, 0.17747458815574646, 0.20234808325767517, 0.22722157835960388, 0.252095103263855, 0.2769685983657837, 0.3018420934677124, 0.3267155885696411, 0.3515890836715698, 0.3764626085758209, 0.40133610367774963, 0.42620959877967834, 0.45108312368392944, 0.47595661878585815, 0.5008301138877869, 0.5257036089897156, 0.5505771040916443, 0.575450599193573, 0.6003241539001465, 0.6251976490020752, 0.6500711441040039, 0.6749446392059326, 0.6998181343078613]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 3.0, 4.0, 5.0, 6.0, 5.0, 7.0, 9.0, 14.0, 12.0, 8.0, 8.0, 12.0, 12.0, 19.0, 20.0, 24.0, 30.0, 23.0, 22.0, 24.0, 30.0, 33.0, 20.0, 42.0, 38.0, 33.0, 36.0, 41.0, 32.0, 34.0, 40.0, 42.0, 46.0, 28.0, 24.0, 19.0, 31.0, 22.0, 18.0, 20.0, 11.0, 16.0, 13.0, 16.0, 7.0, 6.0, 11.0, 4.0, 11.0, 4.0, 7.0, 3.0, 0.0, 3.0, 1.0, 0.0, 4.0, 2.0, 2.0, 1.0], "bins": [-0.32875192165374756, -0.3162781596183777, -0.3038043975830078, -0.29133060574531555, -0.2788568437099457, -0.2663830816745758, -0.25390928983688354, -0.24143552780151367, -0.2289617657661438, -0.21648800373077393, -0.20401422679424286, -0.1915404498577118, -0.17906668782234192, -0.16659292578697205, -0.15411914885044098, -0.1416453719139099, -0.12917160987854004, -0.11669784039258957, -0.1042240709066391, -0.09175030142068863, -0.07927653193473816, -0.06680276244878769, -0.05432899296283722, -0.04185522347688675, -0.02938145399093628, -0.01690768450498581, -0.004433915019035339, 0.00803985446691513, 0.0205136239528656, 0.03298739343881607, 0.04546116292476654, 0.05793493241071701, 0.07040867209434509, 0.08288244158029556, 0.09535621106624603, 0.1078299805521965, 0.12030375003814697, 0.13277751207351685, 0.1452512890100479, 0.15772506594657898, 0.17019882798194885, 0.18267259001731873, 0.1951463669538498, 0.20762014389038086, 0.22009390592575073, 0.2325676679611206, 0.24504144489765167, 0.25751522183418274, 0.2699889838695526, 0.2824627459049225, 0.29493653774261475, 0.3074102997779846, 0.3198840618133545, 0.33235782384872437, 0.34483158588409424, 0.3573053777217865, 0.36977913975715637, 0.38225290179252625, 0.3947266936302185, 0.4072004556655884, 0.41967421770095825, 0.4321479797363281, 0.444621741771698, 0.45709553360939026, 0.46956929564476013]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 0.0, 3.0, 2.0, 2.0, 6.0, 4.0, 9.0, 12.0, 13.0, 24.0, 46.0, 80.0, 125.0, 212.0, 372.0, 704.0, 1382.0, 2819.0, 5973.0, 14546.0, 46400.0, 379651.0, 509661.0, 56375.0, 17018.0, 6781.0, 3116.0, 1508.0, 785.0, 418.0, 218.0, 108.0, 70.0, 39.0, 25.0, 19.0, 11.0, 7.0, 7.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.307373046875, -0.2967987060546875, -0.286224365234375, -0.2756500244140625, -0.26507568359375, -0.2545013427734375, -0.243927001953125, -0.2333526611328125, -0.2227783203125, -0.2122039794921875, -0.201629638671875, -0.1910552978515625, -0.18048095703125, -0.1699066162109375, -0.159332275390625, -0.1487579345703125, -0.13818359375, -0.1276092529296875, -0.117034912109375, -0.1064605712890625, -0.09588623046875, -0.0853118896484375, -0.074737548828125, -0.0641632080078125, -0.0535888671875, -0.0430145263671875, -0.032440185546875, -0.0218658447265625, -0.01129150390625, -0.0007171630859375, 0.009857177734375, 0.0204315185546875, 0.031005859375, 0.0415802001953125, 0.052154541015625, 0.0627288818359375, 0.07330322265625, 0.0838775634765625, 0.094451904296875, 0.1050262451171875, 0.1156005859375, 0.1261749267578125, 0.136749267578125, 0.1473236083984375, 0.15789794921875, 0.1684722900390625, 0.179046630859375, 0.1896209716796875, 0.2001953125, 0.2107696533203125, 0.221343994140625, 0.2319183349609375, 0.24249267578125, 0.2530670166015625, 0.263641357421875, 0.2742156982421875, 0.2847900390625, 0.2953643798828125, 0.305938720703125, 0.3165130615234375, 0.32708740234375, 0.3376617431640625, 0.348236083984375, 0.3588104248046875, 0.369384765625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 2.0, 3.0, 3.0, 8.0, 4.0, 6.0, 7.0, 12.0, 11.0, 7.0, 11.0, 18.0, 15.0, 30.0, 24.0, 22.0, 31.0, 40.0, 32.0, 33.0, 38.0, 30.0, 51.0, 34.0, 39.0, 40.0, 42.0, 50.0, 53.0, 35.0, 32.0, 24.0, 35.0, 25.0, 30.0, 14.0, 14.0, 20.0, 16.0, 10.0, 13.0, 7.0, 9.0, 5.0, 8.0, 3.0, 4.0, 2.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0], "bins": [-0.2705078125, -0.26219940185546875, -0.2538909912109375, -0.24558258056640625, -0.237274169921875, -0.22896575927734375, -0.2206573486328125, -0.21234893798828125, -0.20404052734375, -0.19573211669921875, -0.1874237060546875, -0.17911529541015625, -0.170806884765625, -0.16249847412109375, -0.1541900634765625, -0.14588165283203125, -0.1375732421875, -0.12926483154296875, -0.1209564208984375, -0.11264801025390625, -0.104339599609375, -0.09603118896484375, -0.0877227783203125, -0.07941436767578125, -0.07110595703125, -0.06279754638671875, -0.0544891357421875, -0.04618072509765625, -0.037872314453125, -0.02956390380859375, -0.0212554931640625, -0.01294708251953125, -0.004638671875, 0.00366973876953125, 0.0119781494140625, 0.02028656005859375, 0.028594970703125, 0.03690338134765625, 0.0452117919921875, 0.05352020263671875, 0.06182861328125, 0.07013702392578125, 0.0784454345703125, 0.08675384521484375, 0.095062255859375, 0.10337066650390625, 0.1116790771484375, 0.11998748779296875, 0.1282958984375, 0.13660430908203125, 0.1449127197265625, 0.15322113037109375, 0.161529541015625, 0.16983795166015625, 0.1781463623046875, 0.18645477294921875, 0.19476318359375, 0.20307159423828125, 0.2113800048828125, 0.21968841552734375, 0.227996826171875, 0.23630523681640625, 0.2446136474609375, 0.25292205810546875, 0.26123046875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 1.0, 5.0, 7.0, 7.0, 14.0, 20.0, 31.0, 74.0, 115.0, 219.0, 475.0, 1068.0, 2595.0, 7475.0, 26844.0, 166340.0, 685719.0, 124685.0, 22402.0, 6364.0, 2256.0, 902.0, 441.0, 236.0, 117.0, 54.0, 37.0, 21.0, 13.0, 4.0, 6.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.3076171875, -0.29940032958984375, -0.2911834716796875, -0.28296661376953125, -0.274749755859375, -0.26653289794921875, -0.2583160400390625, -0.25009918212890625, -0.24188232421875, -0.23366546630859375, -0.2254486083984375, -0.21723175048828125, -0.209014892578125, -0.20079803466796875, -0.1925811767578125, -0.18436431884765625, -0.1761474609375, -0.16793060302734375, -0.1597137451171875, -0.15149688720703125, -0.143280029296875, -0.13506317138671875, -0.1268463134765625, -0.11862945556640625, -0.11041259765625, -0.10219573974609375, -0.0939788818359375, -0.08576202392578125, -0.077545166015625, -0.06932830810546875, -0.0611114501953125, -0.05289459228515625, -0.044677734375, -0.03646087646484375, -0.0282440185546875, -0.02002716064453125, -0.011810302734375, -0.00359344482421875, 0.0046234130859375, 0.01284027099609375, 0.02105712890625, 0.02927398681640625, 0.0374908447265625, 0.04570770263671875, 0.053924560546875, 0.06214141845703125, 0.0703582763671875, 0.07857513427734375, 0.0867919921875, 0.09500885009765625, 0.1032257080078125, 0.11144256591796875, 0.119659423828125, 0.12787628173828125, 0.1360931396484375, 0.14430999755859375, 0.15252685546875, 0.16074371337890625, 0.1689605712890625, 0.17717742919921875, 0.185394287109375, 0.19361114501953125, 0.2018280029296875, 0.21004486083984375, 0.21826171875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 2.0, 4.0, 6.0, 7.0, 5.0, 17.0, 11.0, 20.0, 19.0, 12.0, 15.0, 25.0, 24.0, 42.0, 29.0, 42.0, 39.0, 33.0, 30.0, 50.0, 52.0, 42.0, 55.0, 51.0, 39.0, 41.0, 40.0, 38.0, 31.0, 23.0, 33.0, 11.0, 29.0, 18.0, 15.0, 8.0, 9.0, 4.0, 6.0, 7.0, 1.0, 8.0, 4.0, 1.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.56689453125, -0.5503463745117188, -0.5337982177734375, -0.5172500610351562, -0.500701904296875, -0.48415374755859375, -0.4676055908203125, -0.45105743408203125, -0.43450927734375, -0.41796112060546875, -0.4014129638671875, -0.38486480712890625, -0.368316650390625, -0.35176849365234375, -0.3352203369140625, -0.31867218017578125, -0.3021240234375, -0.28557586669921875, -0.2690277099609375, -0.25247955322265625, -0.235931396484375, -0.21938323974609375, -0.2028350830078125, -0.18628692626953125, -0.16973876953125, -0.15319061279296875, -0.1366424560546875, -0.12009429931640625, -0.103546142578125, -0.08699798583984375, -0.0704498291015625, -0.05390167236328125, -0.037353515625, -0.02080535888671875, -0.0042572021484375, 0.01229095458984375, 0.028839111328125, 0.04538726806640625, 0.0619354248046875, 0.07848358154296875, 0.09503173828125, 0.11157989501953125, 0.1281280517578125, 0.14467620849609375, 0.161224365234375, 0.17777252197265625, 0.1943206787109375, 0.21086883544921875, 0.2274169921875, 0.24396514892578125, 0.2605133056640625, 0.27706146240234375, 0.293609619140625, 0.31015777587890625, 0.3267059326171875, 0.34325408935546875, 0.35980224609375, 0.37635040283203125, 0.3928985595703125, 0.40944671630859375, 0.425994873046875, 0.44254302978515625, 0.4590911865234375, 0.47563934326171875, 0.4921875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 5.0, 4.0, 11.0, 13.0, 23.0, 27.0, 43.0, 92.0, 153.0, 238.0, 442.0, 840.0, 1617.0, 3552.0, 8423.0, 26941.0, 166429.0, 675432.0, 127183.0, 22862.0, 7648.0, 3195.0, 1602.0, 773.0, 439.0, 219.0, 142.0, 74.0, 47.0, 31.0, 25.0, 7.0, 8.0, 9.0, 6.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06512451171875, -0.0628347396850586, -0.06054496765136719, -0.05825519561767578, -0.055965423583984375, -0.05367565155029297, -0.05138587951660156, -0.049096107482910156, -0.04680633544921875, -0.044516563415527344, -0.04222679138183594, -0.03993701934814453, -0.037647247314453125, -0.03535747528076172, -0.03306770324707031, -0.030777931213378906, -0.0284881591796875, -0.026198387145996094, -0.023908615112304688, -0.02161884307861328, -0.019329071044921875, -0.01703929901123047, -0.014749526977539062, -0.012459754943847656, -0.01016998291015625, -0.007880210876464844, -0.0055904388427734375, -0.0033006668090820312, -0.001010894775390625, 0.0012788772583007812, 0.0035686492919921875, 0.005858421325683594, 0.008148193359375, 0.010437965393066406, 0.012727737426757812, 0.015017509460449219, 0.017307281494140625, 0.01959705352783203, 0.021886825561523438, 0.024176597595214844, 0.02646636962890625, 0.028756141662597656, 0.031045913696289062, 0.03333568572998047, 0.035625457763671875, 0.03791522979736328, 0.04020500183105469, 0.042494773864746094, 0.0447845458984375, 0.047074317932128906, 0.04936408996582031, 0.05165386199951172, 0.053943634033203125, 0.05623340606689453, 0.05852317810058594, 0.060812950134277344, 0.06310272216796875, 0.06539249420166016, 0.06768226623535156, 0.06997203826904297, 0.07226181030273438, 0.07455158233642578, 0.07684135437011719, 0.0791311264038086, 0.0814208984375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 3.0, 8.0, 1.0, 10.0, 16.0, 36.0, 46.0, 81.0, 132.0, 204.0, 180.0, 109.0, 74.0, 27.0, 15.0, 20.0, 10.0, 9.0, 5.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.863739013671875e-05, -4.6819448471069336e-05, -4.500150680541992e-05, -4.318356513977051e-05, -4.1365623474121094e-05, -3.954768180847168e-05, -3.7729740142822266e-05, -3.591179847717285e-05, -3.409385681152344e-05, -3.2275915145874023e-05, -3.045797348022461e-05, -2.8640031814575195e-05, -2.682209014892578e-05, -2.5004148483276367e-05, -2.3186206817626953e-05, -2.136826515197754e-05, -1.9550323486328125e-05, -1.773238182067871e-05, -1.5914440155029297e-05, -1.4096498489379883e-05, -1.2278556823730469e-05, -1.0460615158081055e-05, -8.64267349243164e-06, -6.8247318267822266e-06, -5.0067901611328125e-06, -3.1888484954833984e-06, -1.3709068298339844e-06, 4.470348358154297e-07, 2.2649765014648438e-06, 4.082918167114258e-06, 5.900859832763672e-06, 7.718801498413086e-06, 9.5367431640625e-06, 1.1354684829711914e-05, 1.3172626495361328e-05, 1.4990568161010742e-05, 1.6808509826660156e-05, 1.862645149230957e-05, 2.0444393157958984e-05, 2.22623348236084e-05, 2.4080276489257812e-05, 2.5898218154907227e-05, 2.771615982055664e-05, 2.9534101486206055e-05, 3.135204315185547e-05, 3.316998481750488e-05, 3.49879264831543e-05, 3.680586814880371e-05, 3.8623809814453125e-05, 4.044175148010254e-05, 4.225969314575195e-05, 4.407763481140137e-05, 4.589557647705078e-05, 4.7713518142700195e-05, 4.953145980834961e-05, 5.1349401473999023e-05, 5.316734313964844e-05, 5.498528480529785e-05, 5.6803226470947266e-05, 5.862116813659668e-05, 6.0439109802246094e-05, 6.225705146789551e-05, 6.407499313354492e-05, 6.589293479919434e-05, 6.771087646484375e-05]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 6.0, 6.0, 15.0, 21.0, 20.0, 43.0, 80.0, 129.0, 178.0, 354.0, 615.0, 1223.0, 2427.0, 5814.0, 16088.0, 71607.0, 587889.0, 304330.0, 38836.0, 10616.0, 4224.0, 1889.0, 909.0, 504.0, 296.0, 152.0, 93.0, 64.0, 41.0, 22.0, 17.0, 17.0, 5.0, 7.0, 8.0, 1.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.096923828125, -0.09421825408935547, -0.09151268005371094, -0.0888071060180664, -0.08610153198242188, -0.08339595794677734, -0.08069038391113281, -0.07798480987548828, -0.07527923583984375, -0.07257366180419922, -0.06986808776855469, -0.06716251373291016, -0.06445693969726562, -0.061751365661621094, -0.05904579162597656, -0.05634021759033203, -0.0536346435546875, -0.05092906951904297, -0.04822349548339844, -0.045517921447753906, -0.042812347412109375, -0.040106773376464844, -0.03740119934082031, -0.03469562530517578, -0.03199005126953125, -0.02928447723388672, -0.026578903198242188, -0.023873329162597656, -0.021167755126953125, -0.018462181091308594, -0.015756607055664062, -0.013051033020019531, -0.010345458984375, -0.007639884948730469, -0.0049343109130859375, -0.0022287368774414062, 0.000476837158203125, 0.0031824111938476562, 0.0058879852294921875, 0.008593559265136719, 0.01129913330078125, 0.014004707336425781, 0.016710281372070312, 0.019415855407714844, 0.022121429443359375, 0.024827003479003906, 0.027532577514648438, 0.03023815155029297, 0.0329437255859375, 0.03564929962158203, 0.03835487365722656, 0.041060447692871094, 0.043766021728515625, 0.046471595764160156, 0.04917716979980469, 0.05188274383544922, 0.05458831787109375, 0.05729389190673828, 0.05999946594238281, 0.06270503997802734, 0.06541061401367188, 0.0681161880493164, 0.07082176208496094, 0.07352733612060547, 0.07623291015625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 3.0, 2.0, 2.0, 8.0, 4.0, 6.0, 3.0, 5.0, 13.0, 17.0, 25.0, 36.0, 43.0, 41.0, 62.0, 65.0, 87.0, 115.0, 79.0, 76.0, 76.0, 50.0, 50.0, 29.0, 23.0, 20.0, 17.0, 12.0, 8.0, 6.0, 6.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0140533447265625, -0.013564348220825195, -0.01307535171508789, -0.012586355209350586, -0.012097358703613281, -0.011608362197875977, -0.011119365692138672, -0.010630369186401367, -0.010141372680664062, -0.009652376174926758, -0.009163379669189453, -0.008674383163452148, -0.008185386657714844, -0.007696390151977539, -0.007207393646240234, -0.00671839714050293, -0.006229400634765625, -0.00574040412902832, -0.005251407623291016, -0.004762411117553711, -0.004273414611816406, -0.0037844181060791016, -0.003295421600341797, -0.002806425094604492, -0.0023174285888671875, -0.0018284320831298828, -0.0013394355773925781, -0.0008504390716552734, -0.00036144256591796875, 0.00012755393981933594, 0.0006165504455566406, 0.0011055469512939453, 0.00159454345703125, 0.0020835399627685547, 0.0025725364685058594, 0.003061532974243164, 0.0035505294799804688, 0.0040395259857177734, 0.004528522491455078, 0.005017518997192383, 0.0055065155029296875, 0.005995512008666992, 0.006484508514404297, 0.0069735050201416016, 0.007462501525878906, 0.007951498031616211, 0.008440494537353516, 0.00892949104309082, 0.009418487548828125, 0.00990748405456543, 0.010396480560302734, 0.010885477066040039, 0.011374473571777344, 0.011863470077514648, 0.012352466583251953, 0.012841463088989258, 0.013330459594726562, 0.013819456100463867, 0.014308452606201172, 0.014797449111938477, 0.015286445617675781, 0.015775442123413086, 0.01626443862915039, 0.016753435134887695, 0.017242431640625]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 9.0, 7.0, 18.0, 24.0, 48.0, 70.0, 92.0, 151.0, 157.0, 146.0, 107.0, 57.0, 62.0, 20.0, 14.0, 7.0, 3.0, 6.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.031504511833191, -1.0077131986618042, -0.9839218258857727, -0.9601304531097412, -0.9363391399383545, -0.912547767162323, -0.8887563943862915, -0.8649650812149048, -0.8411737084388733, -0.8173823356628418, -0.7935910224914551, -0.7697996497154236, -0.7460082769393921, -0.7222169637680054, -0.6984255909919739, -0.6746342182159424, -0.6508429050445557, -0.6270515322685242, -0.6032602190971375, -0.579468846321106, -0.5556775331497192, -0.5318861603736877, -0.5080947875976562, -0.48430344462394714, -0.46051210165023804, -0.43672075867652893, -0.4129294157028198, -0.38913804292678833, -0.3653466999530792, -0.3415553569793701, -0.3177639842033386, -0.2939726412296295, -0.2701812982559204, -0.2463899552822113, -0.222598597407341, -0.1988072395324707, -0.1750158965587616, -0.1512245535850525, -0.1274331957101822, -0.10364183783531189, -0.07985049486160278, -0.05605914443731308, -0.032267794013023376, -0.008476443588733673, 0.01531490683555603, 0.039106257259845734, 0.06289760768413544, 0.08668896555900574, 0.11048030853271484, 0.13427165150642395, 0.15806300938129425, 0.18185436725616455, 0.20564571022987366, 0.22943705320358276, 0.25322842597961426, 0.27701976895332336, 0.30081111192703247, 0.3246024549007416, 0.3483937978744507, 0.3721851706504822, 0.3959765136241913, 0.4197678565979004, 0.4435592293739319, 0.467350572347641, 0.4911419153213501]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 2.0, 7.0, 3.0, 11.0, 9.0, 6.0, 7.0, 12.0, 23.0, 9.0, 12.0, 22.0, 22.0, 38.0, 24.0, 28.0, 33.0, 35.0, 44.0, 38.0, 43.0, 40.0, 42.0, 47.0, 38.0, 54.0, 53.0, 37.0, 38.0, 27.0, 24.0, 31.0, 21.0, 22.0, 13.0, 15.0, 15.0, 9.0, 11.0, 8.0, 9.0, 2.0, 8.0, 5.0, 2.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.2611023485660553, -0.2527869939804077, -0.24447165429592133, -0.23615631461143494, -0.22784097492694855, -0.21952563524246216, -0.21121028065681458, -0.20289494097232819, -0.1945796012878418, -0.1862642616033554, -0.17794890701770782, -0.16963356733322144, -0.16131822764873505, -0.15300288796424866, -0.14468753337860107, -0.13637219369411469, -0.1280568391084671, -0.11974149197340012, -0.11142615228891373, -0.10311080515384674, -0.09479546546936035, -0.08648011833429337, -0.07816477119922638, -0.06984943151473999, -0.061534084379673004, -0.053218740969896317, -0.04490339756011963, -0.03658805042505264, -0.028272707015275955, -0.019957363605499268, -0.011642016470432281, -0.003326673060655594, 0.004988670349121094, 0.013304014690220356, 0.021619359031319618, 0.029934704303741455, 0.03825004771351814, 0.04656539112329483, 0.054880738258361816, 0.0631960779428482, 0.07151142507791519, 0.07982677221298218, 0.08814211189746857, 0.09645745903253555, 0.10477280616760254, 0.11308814585208893, 0.12140349298715591, 0.1297188401222229, 0.1380341798067093, 0.14634951949119568, 0.15466487407684326, 0.16298021376132965, 0.17129555344581604, 0.17961090803146362, 0.18792624771595, 0.1962415874004364, 0.20455694198608398, 0.21287228167057037, 0.22118763625621796, 0.22950297594070435, 0.23781831562519073, 0.24613365530967712, 0.2544490098953247, 0.2627643644809723, 0.2710796892642975]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 3.0, 6.0, 8.0, 11.0, 28.0, 32.0, 63.0, 123.0, 158.0, 233.0, 424.0, 724.0, 1270.0, 2386.0, 4843.0, 10383.0, 26918.0, 87242.0, 436713.0, 359499.0, 74644.0, 24005.0, 9420.0, 4403.0, 2132.0, 1214.0, 657.0, 380.0, 217.0, 145.0, 95.0, 61.0, 53.0, 28.0, 14.0, 5.0, 7.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.541015625, -0.5255317687988281, -0.5100479125976562, -0.4945640563964844, -0.4790802001953125, -0.4635963439941406, -0.44811248779296875, -0.4326286315917969, -0.417144775390625, -0.4016609191894531, -0.38617706298828125, -0.3706932067871094, -0.3552093505859375, -0.3397254943847656, -0.32424163818359375, -0.3087577819824219, -0.29327392578125, -0.2777900695800781, -0.26230621337890625, -0.24682235717773438, -0.2313385009765625, -0.21585464477539062, -0.20037078857421875, -0.18488693237304688, -0.169403076171875, -0.15391921997070312, -0.13843536376953125, -0.12295150756835938, -0.1074676513671875, -0.09198379516601562, -0.07649993896484375, -0.061016082763671875, -0.0455322265625, -0.030048370361328125, -0.01456451416015625, 0.000919342041015625, 0.0164031982421875, 0.031887054443359375, 0.04737091064453125, 0.06285476684570312, 0.078338623046875, 0.09382247924804688, 0.10930633544921875, 0.12479019165039062, 0.1402740478515625, 0.15575790405273438, 0.17124176025390625, 0.18672561645507812, 0.20220947265625, 0.21769332885742188, 0.23317718505859375, 0.24866104125976562, 0.2641448974609375, 0.2796287536621094, 0.29511260986328125, 0.3105964660644531, 0.326080322265625, 0.3415641784667969, 0.35704803466796875, 0.3725318908691406, 0.3880157470703125, 0.4034996032714844, 0.41898345947265625, 0.4344673156738281, 0.449951171875]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 7.0, 1.0, 5.0, 10.0, 7.0, 6.0, 13.0, 7.0, 6.0, 15.0, 18.0, 20.0, 26.0, 20.0, 29.0, 29.0, 31.0, 40.0, 46.0, 40.0, 50.0, 58.0, 42.0, 39.0, 51.0, 57.0, 49.0, 31.0, 39.0, 34.0, 29.0, 28.0, 19.0, 20.0, 19.0, 10.0, 13.0, 11.0, 8.0, 3.0, 2.0, 5.0, 2.0, 1.0, 2.0, 6.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.52197265625, -0.5042266845703125, -0.486480712890625, -0.4687347412109375, -0.45098876953125, -0.4332427978515625, -0.415496826171875, -0.3977508544921875, -0.3800048828125, -0.3622589111328125, -0.344512939453125, -0.3267669677734375, -0.30902099609375, -0.2912750244140625, -0.273529052734375, -0.2557830810546875, -0.238037109375, -0.2202911376953125, -0.202545166015625, -0.1847991943359375, -0.16705322265625, -0.1493072509765625, -0.131561279296875, -0.1138153076171875, -0.0960693359375, -0.0783233642578125, -0.060577392578125, -0.0428314208984375, -0.02508544921875, -0.0073394775390625, 0.010406494140625, 0.0281524658203125, 0.0458984375, 0.0636444091796875, 0.081390380859375, 0.0991363525390625, 0.11688232421875, 0.1346282958984375, 0.152374267578125, 0.1701202392578125, 0.1878662109375, 0.2056121826171875, 0.223358154296875, 0.2411041259765625, 0.25885009765625, 0.2765960693359375, 0.294342041015625, 0.3120880126953125, 0.329833984375, 0.3475799560546875, 0.365325927734375, 0.3830718994140625, 0.40081787109375, 0.4185638427734375, 0.436309814453125, 0.4540557861328125, 0.4718017578125, 0.4895477294921875, 0.507293701171875, 0.5250396728515625, 0.54278564453125, 0.5605316162109375, 0.578277587890625, 0.5960235595703125, 0.61376953125]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 6.0, 11.0, 9.0, 9.0, 9.0, 11.0, 14.0, 23.0, 19.0, 26.0, 30.0, 24.0, 49.0, 75.0, 104.0, 203.0, 488.0, 3290.0, 165546.0, 868652.0, 8463.0, 810.0, 225.0, 104.0, 73.0, 61.0, 31.0, 37.0, 24.0, 30.0, 22.0, 13.0, 16.0, 14.0, 8.0, 7.0, 3.0, 4.0, 6.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.037109375, -1.97747802734375, -1.9178466796875, -1.85821533203125, -1.798583984375, -1.73895263671875, -1.6793212890625, -1.61968994140625, -1.56005859375, -1.50042724609375, -1.4407958984375, -1.38116455078125, -1.321533203125, -1.26190185546875, -1.2022705078125, -1.14263916015625, -1.0830078125, -1.02337646484375, -0.9637451171875, -0.90411376953125, -0.844482421875, -0.78485107421875, -0.7252197265625, -0.66558837890625, -0.60595703125, -0.54632568359375, -0.4866943359375, -0.42706298828125, -0.367431640625, -0.30780029296875, -0.2481689453125, -0.18853759765625, -0.12890625, -0.06927490234375, -0.0096435546875, 0.04998779296875, 0.109619140625, 0.16925048828125, 0.2288818359375, 0.28851318359375, 0.34814453125, 0.40777587890625, 0.4674072265625, 0.52703857421875, 0.586669921875, 0.64630126953125, 0.7059326171875, 0.76556396484375, 0.8251953125, 0.88482666015625, 0.9444580078125, 1.00408935546875, 1.063720703125, 1.12335205078125, 1.1829833984375, 1.24261474609375, 1.30224609375, 1.36187744140625, 1.4215087890625, 1.48114013671875, 1.540771484375, 1.60040283203125, 1.6600341796875, 1.71966552734375, 1.779296875]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 4.0, 4.0, 7.0, 9.0, 8.0, 18.0, 8.0, 14.0, 25.0, 27.0, 20.0, 23.0, 22.0, 24.0, 33.0, 51.0, 41.0, 44.0, 42.0, 54.0, 37.0, 44.0, 54.0, 32.0, 38.0, 33.0, 32.0, 43.0, 25.0, 16.0, 29.0, 22.0, 20.0, 20.0, 21.0, 10.0, 8.0, 10.0, 4.0, 9.0, 3.0, 1.0, 2.0, 1.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.55908203125, -0.5419692993164062, -0.5248565673828125, -0.5077438354492188, -0.490631103515625, -0.47351837158203125, -0.4564056396484375, -0.43929290771484375, -0.42218017578125, -0.40506744384765625, -0.3879547119140625, -0.37084197998046875, -0.353729248046875, -0.33661651611328125, -0.3195037841796875, -0.30239105224609375, -0.2852783203125, -0.26816558837890625, -0.2510528564453125, -0.23394012451171875, -0.216827392578125, -0.19971466064453125, -0.1826019287109375, -0.16548919677734375, -0.14837646484375, -0.13126373291015625, -0.1141510009765625, -0.09703826904296875, -0.079925537109375, -0.06281280517578125, -0.0457000732421875, -0.02858734130859375, -0.011474609375, 0.00563812255859375, 0.0227508544921875, 0.03986358642578125, 0.056976318359375, 0.07408905029296875, 0.0912017822265625, 0.10831451416015625, 0.12542724609375, 0.14253997802734375, 0.1596527099609375, 0.17676544189453125, 0.193878173828125, 0.21099090576171875, 0.2281036376953125, 0.24521636962890625, 0.2623291015625, 0.27944183349609375, 0.2965545654296875, 0.31366729736328125, 0.330780029296875, 0.34789276123046875, 0.3650054931640625, 0.38211822509765625, 0.39923095703125, 0.41634368896484375, 0.4334564208984375, 0.45056915283203125, 0.467681884765625, 0.48479461669921875, 0.5019073486328125, 0.5190200805664062, 0.5361328125]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 3.0, 14.0, 12.0, 10.0, 12.0, 18.0, 46.0, 91.0, 136.0, 222.0, 446.0, 1143.0, 3696.0, 18137.0, 204581.0, 758259.0, 50736.0, 7534.0, 2004.0, 728.0, 295.0, 180.0, 82.0, 69.0, 34.0, 30.0, 11.0, 4.0, 6.0, 4.0, 4.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2403564453125, -0.2311992645263672, -0.22204208374023438, -0.21288490295410156, -0.20372772216796875, -0.19457054138183594, -0.18541336059570312, -0.1762561798095703, -0.1670989990234375, -0.1579418182373047, -0.14878463745117188, -0.13962745666503906, -0.13047027587890625, -0.12131309509277344, -0.11215591430664062, -0.10299873352050781, -0.093841552734375, -0.08468437194824219, -0.07552719116210938, -0.06637001037597656, -0.05721282958984375, -0.04805564880371094, -0.038898468017578125, -0.029741287231445312, -0.0205841064453125, -0.011426925659179688, -0.002269744873046875, 0.0068874359130859375, 0.01604461669921875, 0.025201797485351562, 0.034358978271484375, 0.04351615905761719, 0.05267333984375, 0.06183052062988281, 0.07098770141601562, 0.08014488220214844, 0.08930206298828125, 0.09845924377441406, 0.10761642456054688, 0.11677360534667969, 0.1259307861328125, 0.1350879669189453, 0.14424514770507812, 0.15340232849121094, 0.16255950927734375, 0.17171669006347656, 0.18087387084960938, 0.1900310516357422, 0.199188232421875, 0.2083454132080078, 0.21750259399414062, 0.22665977478027344, 0.23581695556640625, 0.24497413635253906, 0.2541313171386719, 0.2632884979248047, 0.2724456787109375, 0.2816028594970703, 0.2907600402832031, 0.29991722106933594, 0.30907440185546875, 0.31823158264160156, 0.3273887634277344, 0.3365459442138672, 0.345703125]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 7.0, 14.0, 14.0, 17.0, 41.0, 61.0, 101.0, 217.0, 245.0, 111.0, 66.0, 35.0, 23.0, 18.0, 10.0, 11.0, 4.0, 2.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.51207160949707e-05, -4.339125007390976e-05, -4.1661784052848816e-05, -3.993231803178787e-05, -3.820285201072693e-05, -3.6473385989665985e-05, -3.474391996860504e-05, -3.30144539475441e-05, -3.1284987926483154e-05, -2.955552190542221e-05, -2.7826055884361267e-05, -2.6096589863300323e-05, -2.436712384223938e-05, -2.2637657821178436e-05, -2.0908191800117493e-05, -1.917872577905655e-05, -1.7449259757995605e-05, -1.5719793736934662e-05, -1.3990327715873718e-05, -1.2260861694812775e-05, -1.0531395673751831e-05, -8.801929652690887e-06, -7.072463631629944e-06, -5.342997610569e-06, -3.6135315895080566e-06, -1.884065568447113e-06, -1.5459954738616943e-07, 1.5748664736747742e-06, 3.3043324947357178e-06, 5.033798515796661e-06, 6.763264536857605e-06, 8.492730557918549e-06, 1.0222196578979492e-05, 1.1951662600040436e-05, 1.368112862110138e-05, 1.5410594642162323e-05, 1.7140060663223267e-05, 1.886952668428421e-05, 2.0598992705345154e-05, 2.2328458726406097e-05, 2.405792474746704e-05, 2.5787390768527985e-05, 2.7516856789588928e-05, 2.9246322810649872e-05, 3.0975788831710815e-05, 3.270525485277176e-05, 3.44347208738327e-05, 3.6164186894893646e-05, 3.789365291595459e-05, 3.9623118937015533e-05, 4.135258495807648e-05, 4.308205097913742e-05, 4.4811517000198364e-05, 4.654098302125931e-05, 4.827044904232025e-05, 4.9999915063381195e-05, 5.172938108444214e-05, 5.345884710550308e-05, 5.5188313126564026e-05, 5.691777914762497e-05, 5.864724516868591e-05, 6.037671118974686e-05, 6.21061772108078e-05, 6.383564323186874e-05, 6.556510925292969e-05]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 5.0, 4.0, 3.0, 5.0, 14.0, 17.0, 35.0, 40.0, 74.0, 112.0, 205.0, 442.0, 969.0, 2701.0, 10977.0, 67243.0, 671012.0, 256012.0, 29611.0, 5867.0, 1716.0, 757.0, 327.0, 165.0, 99.0, 60.0, 25.0, 22.0, 14.0, 11.0, 2.0, 5.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.278076171875, -0.2707176208496094, -0.26335906982421875, -0.2560005187988281, -0.2486419677734375, -0.24128341674804688, -0.23392486572265625, -0.22656631469726562, -0.219207763671875, -0.21184921264648438, -0.20449066162109375, -0.19713211059570312, -0.1897735595703125, -0.18241500854492188, -0.17505645751953125, -0.16769790649414062, -0.16033935546875, -0.15298080444335938, -0.14562225341796875, -0.13826370239257812, -0.1309051513671875, -0.12354660034179688, -0.11618804931640625, -0.10882949829101562, -0.101470947265625, -0.09411239624023438, -0.08675384521484375, -0.07939529418945312, -0.0720367431640625, -0.06467819213867188, -0.05731964111328125, -0.049961090087890625, -0.0426025390625, -0.035243988037109375, -0.02788543701171875, -0.020526885986328125, -0.0131683349609375, -0.005809783935546875, 0.00154876708984375, 0.008907318115234375, 0.016265869140625, 0.023624420166015625, 0.03098297119140625, 0.038341522216796875, 0.0457000732421875, 0.053058624267578125, 0.06041717529296875, 0.06777572631835938, 0.07513427734375, 0.08249282836914062, 0.08985137939453125, 0.09720993041992188, 0.1045684814453125, 0.11192703247070312, 0.11928558349609375, 0.12664413452148438, 0.134002685546875, 0.14136123657226562, 0.14871978759765625, 0.15607833862304688, 0.1634368896484375, 0.17079544067382812, 0.17815399169921875, 0.18551254272460938, 0.19287109375]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 11.0, 10.0, 11.0, 25.0, 19.0, 39.0, 46.0, 47.0, 64.0, 79.0, 124.0, 135.0, 97.0, 72.0, 46.0, 45.0, 34.0, 30.0, 18.0, 14.0, 14.0, 11.0, 4.0, 3.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.069091796875, -0.06655502319335938, -0.06401824951171875, -0.061481475830078125, -0.0589447021484375, -0.056407928466796875, -0.05387115478515625, -0.051334381103515625, -0.048797607421875, -0.046260833740234375, -0.04372406005859375, -0.041187286376953125, -0.0386505126953125, -0.036113739013671875, -0.03357696533203125, -0.031040191650390625, -0.02850341796875, -0.025966644287109375, -0.02342987060546875, -0.020893096923828125, -0.0183563232421875, -0.015819549560546875, -0.01328277587890625, -0.010746002197265625, -0.008209228515625, -0.005672454833984375, -0.00313568115234375, -0.000598907470703125, 0.0019378662109375, 0.004474639892578125, 0.00701141357421875, 0.009548187255859375, 0.0120849609375, 0.014621734619140625, 0.01715850830078125, 0.019695281982421875, 0.0222320556640625, 0.024768829345703125, 0.02730560302734375, 0.029842376708984375, 0.032379150390625, 0.034915924072265625, 0.03745269775390625, 0.039989471435546875, 0.0425262451171875, 0.045063018798828125, 0.04759979248046875, 0.050136566162109375, 0.05267333984375, 0.055210113525390625, 0.05774688720703125, 0.060283660888671875, 0.0628204345703125, 0.06535720825195312, 0.06789398193359375, 0.07043075561523438, 0.072967529296875, 0.07550430297851562, 0.07804107666015625, 0.08057785034179688, 0.0831146240234375, 0.08565139770507812, 0.08818817138671875, 0.09072494506835938, 0.09326171875]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 17.0, 26.0, 57.0, 108.0, 168.0, 214.0, 187.0, 105.0, 63.0, 30.0, 11.0, 7.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-3.356729507446289, -3.2915191650390625, -3.226308822631836, -3.1610984802246094, -3.095888137817383, -3.0306777954101562, -2.9654674530029297, -2.900257110595703, -2.8350467681884766, -2.76983642578125, -2.7046260833740234, -2.639415740966797, -2.5742053985595703, -2.5089950561523438, -2.443784713745117, -2.3785743713378906, -2.313363790512085, -2.2481534481048584, -2.182943105697632, -2.1177327632904053, -2.0525224208831787, -1.9873120784759521, -1.922101616859436, -1.8568912744522095, -1.791680932044983, -1.7264705896377563, -1.6612602472305298, -1.5960499048233032, -1.530839443206787, -1.4656291007995605, -1.400418758392334, -1.3352084159851074, -1.2699980735778809, -1.2047877311706543, -1.1395773887634277, -1.0743670463562012, -1.0091567039489746, -0.9439463019371033, -0.8787358999252319, -0.8135255575180054, -0.7483152747154236, -0.683104932308197, -0.6178945302963257, -0.5526841878890991, -0.48747384548187256, -0.422263503074646, -0.35705313086509705, -0.2918427586555481, -0.22663241624832153, -0.16142205893993378, -0.09621170163154602, -0.031001344323158264, 0.03420901298522949, 0.09941935539245605, 0.164629727602005, 0.22984009981155396, 0.2950504422187805, 0.3602607846260071, 0.42547115683555603, 0.490681529045105, 0.5558918714523315, 0.6211022138595581, 0.6863125562667847, 0.751522958278656, 0.8167333006858826]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 5.0, 6.0, 6.0, 12.0, 13.0, 15.0, 21.0, 26.0, 32.0, 21.0, 29.0, 23.0, 34.0, 32.0, 34.0, 34.0, 47.0, 48.0, 43.0, 44.0, 44.0, 43.0, 43.0, 31.0, 47.0, 38.0, 24.0, 23.0, 36.0, 23.0, 21.0, 20.0, 14.0, 17.0, 9.0, 10.0, 5.0, 5.0, 4.0, 4.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.0977847576141357, -1.0669280290603638, -1.0360713005065918, -1.0052146911621094, -0.9743579626083374, -0.9435012340545654, -0.9126445055007935, -0.8817878365516663, -0.8509311676025391, -0.8200744390487671, -0.7892177700996399, -0.7583610415458679, -0.7275043725967407, -0.6966476440429688, -0.6657909154891968, -0.6349342465400696, -0.6040775179862976, -0.5732207894325256, -0.5423641204833984, -0.5115073919296265, -0.48065072298049927, -0.4497939944267273, -0.4189372956752777, -0.3880805969238281, -0.35722389817237854, -0.32636719942092896, -0.29551050066947937, -0.2646538019180298, -0.233797088265419, -0.20294038951396942, -0.17208367586135864, -0.14122697710990906, -0.11037033796310425, -0.07951363921165466, -0.04865693300962448, -0.0178002268075943, 0.013056471943855286, 0.04391317069530487, 0.07476988434791565, 0.10562658309936523, 0.13648328185081482, 0.1673399806022644, 0.198196679353714, 0.22905339300632477, 0.25991010665893555, 0.29076677560806274, 0.3216235041618347, 0.3524802029132843, 0.3833369016647339, 0.41419360041618347, 0.44505029916763306, 0.47590702772140503, 0.5067636966705322, 0.5376204252243042, 0.5684771537780762, 0.5993338227272034, 0.6301904916763306, 0.6610472202301025, 0.6919038891792297, 0.7227606177330017, 0.7536172866821289, 0.7844740152359009, 0.8153307437896729, 0.8461874127388, 0.877044141292572]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 7.0, 5.0, 11.0, 10.0, 18.0, 22.0, 36.0, 34.0, 70.0, 87.0, 147.0, 194.0, 314.0, 440.0, 716.0, 1209.0, 2018.0, 4164.0, 9704.0, 31775.0, 219662.0, 1857966.0, 1798921.0, 216637.0, 31515.0, 9273.0, 4090.0, 2041.0, 1186.0, 712.0, 431.0, 251.0, 184.0, 110.0, 90.0, 62.0, 52.0, 35.0, 21.0, 15.0, 19.0, 8.0, 6.0, 3.0, 6.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.68896484375, -0.6692733764648438, -0.6495819091796875, -0.6298904418945312, -0.610198974609375, -0.5905075073242188, -0.5708160400390625, -0.5511245727539062, -0.53143310546875, -0.5117416381835938, -0.4920501708984375, -0.47235870361328125, -0.452667236328125, -0.43297576904296875, -0.4132843017578125, -0.39359283447265625, -0.3739013671875, -0.35420989990234375, -0.3345184326171875, -0.31482696533203125, -0.295135498046875, -0.27544403076171875, -0.2557525634765625, -0.23606109619140625, -0.21636962890625, -0.19667816162109375, -0.1769866943359375, -0.15729522705078125, -0.137603759765625, -0.11791229248046875, -0.0982208251953125, -0.07852935791015625, -0.058837890625, -0.03914642333984375, -0.0194549560546875, 0.00023651123046875, 0.019927978515625, 0.03961944580078125, 0.0593109130859375, 0.07900238037109375, 0.09869384765625, 0.11838531494140625, 0.1380767822265625, 0.15776824951171875, 0.177459716796875, 0.19715118408203125, 0.2168426513671875, 0.23653411865234375, 0.2562255859375, 0.27591705322265625, 0.2956085205078125, 0.31529998779296875, 0.334991455078125, 0.35468292236328125, 0.3743743896484375, 0.39406585693359375, 0.41375732421875, 0.43344879150390625, 0.4531402587890625, 0.47283172607421875, 0.492523193359375, 0.5122146606445312, 0.5319061279296875, 0.5515975952148438, 0.5712890625]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 8.0, 1.0, 5.0, 12.0, 10.0, 5.0, 10.0, 9.0, 24.0, 24.0, 33.0, 19.0, 34.0, 45.0, 43.0, 35.0, 39.0, 56.0, 45.0, 51.0, 47.0, 50.0, 51.0, 50.0, 50.0, 37.0, 39.0, 37.0, 23.0, 19.0, 25.0, 12.0, 11.0, 9.0, 11.0, 9.0, 7.0, 4.0, 5.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.401123046875, -0.38814544677734375, -0.3751678466796875, -0.36219024658203125, -0.349212646484375, -0.33623504638671875, -0.3232574462890625, -0.31027984619140625, -0.29730224609375, -0.28432464599609375, -0.2713470458984375, -0.25836944580078125, -0.245391845703125, -0.23241424560546875, -0.2194366455078125, -0.20645904541015625, -0.1934814453125, -0.18050384521484375, -0.1675262451171875, -0.15454864501953125, -0.141571044921875, -0.12859344482421875, -0.1156158447265625, -0.10263824462890625, -0.08966064453125, -0.07668304443359375, -0.0637054443359375, -0.05072784423828125, -0.037750244140625, -0.02477264404296875, -0.0117950439453125, 0.00118255615234375, 0.01416015625, 0.02713775634765625, 0.0401153564453125, 0.05309295654296875, 0.066070556640625, 0.07904815673828125, 0.0920257568359375, 0.10500335693359375, 0.11798095703125, 0.13095855712890625, 0.1439361572265625, 0.15691375732421875, 0.169891357421875, 0.18286895751953125, 0.1958465576171875, 0.20882415771484375, 0.2218017578125, 0.23477935791015625, 0.2477569580078125, 0.26073455810546875, 0.273712158203125, 0.28668975830078125, 0.2996673583984375, 0.31264495849609375, 0.32562255859375, 0.33860015869140625, 0.3515777587890625, 0.36455535888671875, 0.377532958984375, 0.39051055908203125, 0.4034881591796875, 0.41646575927734375, 0.429443359375]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 6.0, 2.0, 5.0, 9.0, 7.0, 17.0, 32.0, 36.0, 40.0, 83.0, 183.0, 506.0, 2428.0, 35553.0, 4098063.0, 53300.0, 3004.0, 572.0, 190.0, 93.0, 57.0, 36.0, 20.0, 11.0, 12.0, 4.0, 10.0, 1.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-2.75390625, -2.689178466796875, -2.62445068359375, -2.559722900390625, -2.4949951171875, -2.430267333984375, -2.36553955078125, -2.300811767578125, -2.236083984375, -2.171356201171875, -2.10662841796875, -2.041900634765625, -1.9771728515625, -1.912445068359375, -1.84771728515625, -1.782989501953125, -1.71826171875, -1.653533935546875, -1.58880615234375, -1.524078369140625, -1.4593505859375, -1.394622802734375, -1.32989501953125, -1.265167236328125, -1.200439453125, -1.135711669921875, -1.07098388671875, -1.006256103515625, -0.9415283203125, -0.876800537109375, -0.81207275390625, -0.747344970703125, -0.6826171875, -0.617889404296875, -0.55316162109375, -0.488433837890625, -0.4237060546875, -0.358978271484375, -0.29425048828125, -0.229522705078125, -0.164794921875, -0.100067138671875, -0.03533935546875, 0.029388427734375, 0.0941162109375, 0.158843994140625, 0.22357177734375, 0.288299560546875, 0.35302734375, 0.417755126953125, 0.48248291015625, 0.547210693359375, 0.6119384765625, 0.676666259765625, 0.74139404296875, 0.806121826171875, 0.870849609375, 0.935577392578125, 1.00030517578125, 1.065032958984375, 1.1297607421875, 1.194488525390625, 1.25921630859375, 1.323944091796875, 1.388671875]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 3.0, 8.0, 6.0, 15.0, 23.0, 23.0, 39.0, 64.0, 69.0, 123.0, 164.0, 323.0, 515.0, 706.0, 685.0, 492.0, 284.0, 182.0, 101.0, 77.0, 47.0, 26.0, 20.0, 25.0, 8.0, 4.0, 5.0, 9.0, 4.0, 6.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.205078125, -0.1992053985595703, -0.19333267211914062, -0.18745994567871094, -0.18158721923828125, -0.17571449279785156, -0.16984176635742188, -0.1639690399169922, -0.1580963134765625, -0.1522235870361328, -0.14635086059570312, -0.14047813415527344, -0.13460540771484375, -0.12873268127441406, -0.12285995483398438, -0.11698722839355469, -0.111114501953125, -0.10524177551269531, -0.09936904907226562, -0.09349632263183594, -0.08762359619140625, -0.08175086975097656, -0.07587814331054688, -0.07000541687011719, -0.0641326904296875, -0.05825996398925781, -0.052387237548828125, -0.04651451110839844, -0.04064178466796875, -0.03476905822753906, -0.028896331787109375, -0.023023605346679688, -0.01715087890625, -0.011278152465820312, -0.005405426025390625, 0.0004673004150390625, 0.00634002685546875, 0.012212753295898438, 0.018085479736328125, 0.023958206176757812, 0.0298309326171875, 0.03570365905761719, 0.041576385498046875, 0.04744911193847656, 0.05332183837890625, 0.05919456481933594, 0.06506729125976562, 0.07094001770019531, 0.076812744140625, 0.08268547058105469, 0.08855819702148438, 0.09443092346191406, 0.10030364990234375, 0.10617637634277344, 0.11204910278320312, 0.11792182922363281, 0.1237945556640625, 0.1296672821044922, 0.13554000854492188, 0.14141273498535156, 0.14728546142578125, 0.15315818786621094, 0.15903091430664062, 0.1649036407470703, 0.1707763671875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 7.0, 10.0, 7.0, 9.0, 10.0, 14.0, 16.0, 23.0, 24.0, 36.0, 47.0, 63.0, 67.0, 77.0, 86.0, 90.0, 79.0, 69.0, 67.0, 52.0, 32.0, 28.0, 19.0, 21.0, 16.0, 9.0, 4.0, 4.0, 4.0, 3.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.5770387649536133, -0.5583838820457458, -0.5397289991378784, -0.521074116230011, -0.5024192333221436, -0.48376432061195374, -0.4651094377040863, -0.4464545249938965, -0.42779964208602905, -0.4091447591781616, -0.3904898762702942, -0.37183499336242676, -0.35318008065223694, -0.3345251977443695, -0.3158703148365021, -0.29721540212631226, -0.2785605490207672, -0.2599056661128998, -0.24125076830387115, -0.22259588539600372, -0.2039409875869751, -0.18528610467910767, -0.16663122177124023, -0.1479763239622116, -0.12932144105434418, -0.11066655069589615, -0.09201166033744812, -0.07335677742958069, -0.05470188707113266, -0.03604699671268463, -0.0173921138048172, 0.0012627840042114258, 0.019917666912078857, 0.038572557270526886, 0.057227443903684616, 0.07588233053684235, 0.09453722089529037, 0.1131921112537384, 0.13184699416160583, 0.15050189197063446, 0.1691567748785019, 0.18781165778636932, 0.20646655559539795, 0.22512143850326538, 0.2437763214111328, 0.26243120431900024, 0.2810860872268677, 0.2997409999370575, 0.3183958828449249, 0.33705076575279236, 0.3557056486606598, 0.3743605613708496, 0.39301544427871704, 0.4116703271865845, 0.4303252100944519, 0.44898009300231934, 0.46763497591018677, 0.4862898588180542, 0.5049447417259216, 0.5235996246337891, 0.5422545075416565, 0.5609093904495239, 0.5795643329620361, 0.5982192158699036, 0.616874098777771]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 11.0, 10.0, 11.0, 15.0, 15.0, 14.0, 27.0, 23.0, 28.0, 33.0, 39.0, 50.0, 39.0, 43.0, 45.0, 49.0, 58.0, 55.0, 53.0, 48.0, 29.0, 46.0, 41.0, 20.0, 30.0, 29.0, 25.0, 14.0, 23.0, 16.0, 7.0, 16.0, 9.0, 9.0, 5.0, 9.0, 4.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.42027556896209717, -0.4064575135707855, -0.3926394581794739, -0.37882140278816223, -0.3650033473968506, -0.35118532180786133, -0.3373672366142273, -0.32354921102523804, -0.3097311556339264, -0.29591310024261475, -0.2820950448513031, -0.26827698945999146, -0.2544589340686798, -0.24064089357852936, -0.2268228381872177, -0.21300479769706726, -0.19918672740459442, -0.18536867201328278, -0.17155061662197113, -0.15773257613182068, -0.14391452074050903, -0.1300964653491974, -0.11627840995788574, -0.1024603620171547, -0.08864230662584305, -0.0748242512345314, -0.061006203293800354, -0.04718814790248871, -0.03337009623646736, -0.019552044570446014, -0.005733989179134369, 0.00808405876159668, 0.021902114152908325, 0.03572016581892967, 0.04953821748495102, 0.06335627287626266, 0.07717432081699371, 0.09099237620830536, 0.104810431599617, 0.11862847954034805, 0.1324465274810791, 0.14626458287239075, 0.1600826382637024, 0.17390069365501404, 0.1877187341451645, 0.20153678953647614, 0.21535484492778778, 0.22917288541793823, 0.24299095571041107, 0.2568089962005615, 0.27062705159187317, 0.2844451069831848, 0.29826316237449646, 0.3120812177658081, 0.32589927315711975, 0.3397173285484314, 0.35353538393974304, 0.3673534393310547, 0.38117149472236633, 0.394989550113678, 0.4088076055049896, 0.42262566089630127, 0.4364436864852905, 0.4502617418766022, 0.4640797972679138]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 6.0, 4.0, 6.0, 8.0, 6.0, 5.0, 4.0, 14.0, 13.0, 16.0, 28.0, 36.0, 75.0, 175.0, 391.0, 967.0, 2536.0, 8676.0, 31924.0, 141065.0, 506859.0, 274868.0, 58989.0, 14934.0, 4325.0, 1521.0, 594.0, 240.0, 103.0, 45.0, 34.0, 26.0, 14.0, 10.0, 10.0, 5.0, 8.0, 1.0, 2.0, 4.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.1181640625, -0.11431694030761719, -0.11046981811523438, -0.10662269592285156, -0.10277557373046875, -0.09892845153808594, -0.09508132934570312, -0.09123420715332031, -0.0873870849609375, -0.08353996276855469, -0.07969284057617188, -0.07584571838378906, -0.07199859619140625, -0.06815147399902344, -0.06430435180664062, -0.06045722961425781, -0.056610107421875, -0.05276298522949219, -0.048915863037109375, -0.04506874084472656, -0.04122161865234375, -0.03737449645996094, -0.033527374267578125, -0.029680252075195312, -0.0258331298828125, -0.021986007690429688, -0.018138885498046875, -0.014291763305664062, -0.01044464111328125, -0.0065975189208984375, -0.002750396728515625, 0.0010967254638671875, 0.00494384765625, 0.008790969848632812, 0.012638092041015625, 0.016485214233398438, 0.02033233642578125, 0.024179458618164062, 0.028026580810546875, 0.03187370300292969, 0.0357208251953125, 0.03956794738769531, 0.043415069580078125, 0.04726219177246094, 0.05110931396484375, 0.05495643615722656, 0.058803558349609375, 0.06265068054199219, 0.066497802734375, 0.07034492492675781, 0.07419204711914062, 0.07803916931152344, 0.08188629150390625, 0.08573341369628906, 0.08958053588867188, 0.09342765808105469, 0.0972747802734375, 0.10112190246582031, 0.10496902465820312, 0.10881614685058594, 0.11266326904296875, 0.11651039123535156, 0.12035751342773438, 0.12420463562011719, 0.1280517578125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 6.0, 6.0, 6.0, 11.0, 10.0, 21.0, 22.0, 28.0, 30.0, 33.0, 50.0, 40.0, 73.0, 54.0, 72.0, 67.0, 65.0, 64.0, 49.0, 50.0, 46.0, 33.0, 26.0, 27.0, 27.0, 22.0, 15.0, 17.0, 10.0, 9.0, 5.0, 6.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.452880859375, -0.44149017333984375, -0.4300994873046875, -0.41870880126953125, -0.407318115234375, -0.39592742919921875, -0.3845367431640625, -0.37314605712890625, -0.36175537109375, -0.35036468505859375, -0.3389739990234375, -0.32758331298828125, -0.316192626953125, -0.30480194091796875, -0.2934112548828125, -0.28202056884765625, -0.2706298828125, -0.25923919677734375, -0.2478485107421875, -0.23645782470703125, -0.225067138671875, -0.21367645263671875, -0.2022857666015625, -0.19089508056640625, -0.17950439453125, -0.16811370849609375, -0.1567230224609375, -0.14533233642578125, -0.133941650390625, -0.12255096435546875, -0.1111602783203125, -0.09976959228515625, -0.08837890625, -0.07698822021484375, -0.0655975341796875, -0.05420684814453125, -0.042816162109375, -0.03142547607421875, -0.0200347900390625, -0.00864410400390625, 0.00274658203125, 0.01413726806640625, 0.0255279541015625, 0.03691864013671875, 0.048309326171875, 0.05970001220703125, 0.0710906982421875, 0.08248138427734375, 0.0938720703125, 0.10526275634765625, 0.1166534423828125, 0.12804412841796875, 0.139434814453125, 0.15082550048828125, 0.1622161865234375, 0.17360687255859375, 0.18499755859375, 0.19638824462890625, 0.2077789306640625, 0.21916961669921875, 0.230560302734375, 0.24195098876953125, 0.2533416748046875, 0.26473236083984375, 0.276123046875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 2.0, 5.0, 8.0, 5.0, 11.0, 14.0, 27.0, 29.0, 43.0, 53.0, 101.0, 147.0, 212.0, 324.0, 505.0, 861.0, 1467.0, 2712.0, 5330.0, 11361.0, 25948.0, 62793.0, 155751.0, 301892.0, 266840.0, 123158.0, 49130.0, 20485.0, 9269.0, 4386.0, 2354.0, 1306.0, 757.0, 455.0, 270.0, 160.0, 111.0, 86.0, 53.0, 40.0, 27.0, 24.0, 14.0, 12.0, 8.0, 3.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.06536865234375, -0.06343793869018555, -0.061507225036621094, -0.05957651138305664, -0.05764579772949219, -0.055715084075927734, -0.05378437042236328, -0.05185365676879883, -0.049922943115234375, -0.04799222946166992, -0.04606151580810547, -0.044130802154541016, -0.04220008850097656, -0.04026937484741211, -0.038338661193847656, -0.0364079475402832, -0.03447723388671875, -0.0325465202331543, -0.030615806579589844, -0.02868509292602539, -0.026754379272460938, -0.024823665618896484, -0.02289295196533203, -0.020962238311767578, -0.019031524658203125, -0.017100811004638672, -0.015170097351074219, -0.013239383697509766, -0.011308670043945312, -0.00937795639038086, -0.007447242736816406, -0.005516529083251953, -0.0035858154296875, -0.0016551017761230469, 0.00027561187744140625, 0.0022063255310058594, 0.0041370391845703125, 0.006067752838134766, 0.007998466491699219, 0.009929180145263672, 0.011859893798828125, 0.013790607452392578, 0.01572132110595703, 0.017652034759521484, 0.019582748413085938, 0.02151346206665039, 0.023444175720214844, 0.025374889373779297, 0.02730560302734375, 0.029236316680908203, 0.031167030334472656, 0.03309774398803711, 0.03502845764160156, 0.036959171295166016, 0.03888988494873047, 0.04082059860229492, 0.042751312255859375, 0.04468202590942383, 0.04661273956298828, 0.048543453216552734, 0.05047416687011719, 0.05240488052368164, 0.054335594177246094, 0.05626630783081055, 0.058197021484375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 3.0, 2.0, 4.0, 7.0, 7.0, 2.0, 6.0, 12.0, 10.0, 18.0, 17.0, 21.0, 19.0, 27.0, 33.0, 44.0, 28.0, 42.0, 36.0, 48.0, 39.0, 37.0, 43.0, 56.0, 47.0, 45.0, 40.0, 34.0, 34.0, 31.0, 34.0, 38.0, 27.0, 21.0, 23.0, 17.0, 9.0, 4.0, 12.0, 8.0, 3.0, 1.0, 7.0, 3.0, 2.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52978515625, -0.5133056640625, -0.496826171875, -0.4803466796875, -0.4638671875, -0.4473876953125, -0.430908203125, -0.4144287109375, -0.39794921875, -0.3814697265625, -0.364990234375, -0.3485107421875, -0.33203125, -0.3155517578125, -0.299072265625, -0.2825927734375, -0.26611328125, -0.2496337890625, -0.233154296875, -0.2166748046875, -0.2001953125, -0.1837158203125, -0.167236328125, -0.1507568359375, -0.13427734375, -0.1177978515625, -0.101318359375, -0.0848388671875, -0.068359375, -0.0518798828125, -0.035400390625, -0.0189208984375, -0.00244140625, 0.0140380859375, 0.030517578125, 0.0469970703125, 0.0634765625, 0.0799560546875, 0.096435546875, 0.1129150390625, 0.12939453125, 0.1458740234375, 0.162353515625, 0.1788330078125, 0.1953125, 0.2117919921875, 0.228271484375, 0.2447509765625, 0.26123046875, 0.2777099609375, 0.294189453125, 0.3106689453125, 0.3271484375, 0.3436279296875, 0.360107421875, 0.3765869140625, 0.39306640625, 0.4095458984375, 0.426025390625, 0.4425048828125, 0.458984375, 0.4754638671875, 0.491943359375, 0.5084228515625, 0.52490234375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 3.0, 3.0, 5.0, 10.0, 11.0, 7.0, 23.0, 20.0, 26.0, 38.0, 61.0, 102.0, 150.0, 230.0, 335.0, 560.0, 1087.0, 2040.0, 4306.0, 10447.0, 33585.0, 157022.0, 543862.0, 225814.0, 45149.0, 13166.0, 5079.0, 2322.0, 1225.0, 719.0, 377.0, 235.0, 148.0, 131.0, 76.0, 52.0, 28.0, 30.0, 16.0, 21.0, 12.0, 7.0, 9.0, 4.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.03485107421875, -0.0338139533996582, -0.032776832580566406, -0.03173971176147461, -0.030702590942382812, -0.029665470123291016, -0.02862834930419922, -0.027591228485107422, -0.026554107666015625, -0.025516986846923828, -0.02447986602783203, -0.023442745208740234, -0.022405624389648438, -0.02136850357055664, -0.020331382751464844, -0.019294261932373047, -0.01825714111328125, -0.017220020294189453, -0.016182899475097656, -0.01514577865600586, -0.014108657836914062, -0.013071537017822266, -0.012034416198730469, -0.010997295379638672, -0.009960174560546875, -0.008923053741455078, -0.007885932922363281, -0.006848812103271484, -0.0058116912841796875, -0.004774570465087891, -0.0037374496459960938, -0.002700328826904297, -0.0016632080078125, -0.0006260871887207031, 0.00041103363037109375, 0.0014481544494628906, 0.0024852752685546875, 0.0035223960876464844, 0.004559516906738281, 0.005596637725830078, 0.006633758544921875, 0.007670879364013672, 0.008708000183105469, 0.009745121002197266, 0.010782241821289062, 0.01181936264038086, 0.012856483459472656, 0.013893604278564453, 0.01493072509765625, 0.015967845916748047, 0.017004966735839844, 0.01804208755493164, 0.019079208374023438, 0.020116329193115234, 0.02115345001220703, 0.022190570831298828, 0.023227691650390625, 0.024264812469482422, 0.02530193328857422, 0.026339054107666016, 0.027376174926757812, 0.02841329574584961, 0.029450416564941406, 0.030487537384033203, 0.031524658203125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 1.0, 3.0, 2.0, 12.0, 9.0, 8.0, 8.0, 7.0, 17.0, 20.0, 37.0, 34.0, 36.0, 47.0, 67.0, 66.0, 58.0, 93.0, 86.0, 74.0, 70.0, 48.0, 40.0, 35.0, 21.0, 20.0, 11.0, 17.0, 16.0, 9.0, 7.0, 2.0, 5.0, 5.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4722347259521484e-05, -1.425575464963913e-05, -1.3789162039756775e-05, -1.332256942987442e-05, -1.2855976819992065e-05, -1.238938421010971e-05, -1.1922791600227356e-05, -1.1456198990345001e-05, -1.0989606380462646e-05, -1.0523013770580292e-05, -1.0056421160697937e-05, -9.589828550815582e-06, -9.123235940933228e-06, -8.656643331050873e-06, -8.190050721168518e-06, -7.723458111286163e-06, -7.256865501403809e-06, -6.790272891521454e-06, -6.323680281639099e-06, -5.857087671756744e-06, -5.39049506187439e-06, -4.923902451992035e-06, -4.45730984210968e-06, -3.9907172322273254e-06, -3.5241246223449707e-06, -3.057532012462616e-06, -2.5909394025802612e-06, -2.1243467926979065e-06, -1.6577541828155518e-06, -1.191161572933197e-06, -7.245689630508423e-07, -2.5797635316848755e-07, 2.086162567138672e-07, 6.752088665962219e-07, 1.1418014764785767e-06, 1.6083940863609314e-06, 2.074986696243286e-06, 2.541579306125641e-06, 3.0081719160079956e-06, 3.4747645258903503e-06, 3.941357135772705e-06, 4.40794974565506e-06, 4.8745423555374146e-06, 5.341134965419769e-06, 5.807727575302124e-06, 6.274320185184479e-06, 6.7409127950668335e-06, 7.207505404949188e-06, 7.674098014831543e-06, 8.140690624713898e-06, 8.607283234596252e-06, 9.073875844478607e-06, 9.540468454360962e-06, 1.0007061064243317e-05, 1.0473653674125671e-05, 1.0940246284008026e-05, 1.1406838893890381e-05, 1.1873431503772736e-05, 1.234002411365509e-05, 1.2806616723537445e-05, 1.32732093334198e-05, 1.3739801943302155e-05, 1.420639455318451e-05, 1.4672987163066864e-05, 1.5139579772949219e-05]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 5.0, 8.0, 11.0, 9.0, 6.0, 14.0, 39.0, 31.0, 47.0, 98.0, 140.0, 189.0, 298.0, 429.0, 693.0, 1200.0, 2306.0, 4778.0, 11426.0, 34695.0, 136828.0, 445190.0, 300610.0, 73181.0, 20974.0, 7581.0, 3405.0, 1751.0, 916.0, 557.0, 379.0, 230.0, 160.0, 110.0, 82.0, 57.0, 34.0, 26.0, 13.0, 13.0, 8.0, 6.0, 8.0, 3.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.02960205078125, -0.028699159622192383, -0.027796268463134766, -0.02689337730407715, -0.02599048614501953, -0.025087594985961914, -0.024184703826904297, -0.02328181266784668, -0.022378921508789062, -0.021476030349731445, -0.020573139190673828, -0.01967024803161621, -0.018767356872558594, -0.017864465713500977, -0.01696157455444336, -0.016058683395385742, -0.015155792236328125, -0.014252901077270508, -0.01335000991821289, -0.012447118759155273, -0.011544227600097656, -0.010641336441040039, -0.009738445281982422, -0.008835554122924805, -0.007932662963867188, -0.00702977180480957, -0.006126880645751953, -0.005223989486694336, -0.004321098327636719, -0.0034182071685791016, -0.0025153160095214844, -0.0016124248504638672, -0.00070953369140625, 0.0001933574676513672, 0.0010962486267089844, 0.0019991397857666016, 0.0029020309448242188, 0.003804922103881836, 0.004707813262939453, 0.00561070442199707, 0.0065135955810546875, 0.007416486740112305, 0.008319377899169922, 0.009222269058227539, 0.010125160217285156, 0.011028051376342773, 0.01193094253540039, 0.012833833694458008, 0.013736724853515625, 0.014639616012573242, 0.01554250717163086, 0.016445398330688477, 0.017348289489746094, 0.01825118064880371, 0.019154071807861328, 0.020056962966918945, 0.020959854125976562, 0.02186274528503418, 0.022765636444091797, 0.023668527603149414, 0.02457141876220703, 0.02547430992126465, 0.026377201080322266, 0.027280092239379883, 0.0281829833984375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 3.0, 6.0, 8.0, 15.0, 21.0, 16.0, 30.0, 48.0, 46.0, 61.0, 62.0, 85.0, 97.0, 89.0, 71.0, 69.0, 56.0, 51.0, 38.0, 29.0, 30.0, 21.0, 10.0, 9.0, 6.0, 6.0, 7.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0089569091796875, -0.008688926696777344, -0.008420944213867188, -0.008152961730957031, -0.007884979248046875, -0.007616996765136719, -0.0073490142822265625, -0.007081031799316406, -0.00681304931640625, -0.006545066833496094, -0.0062770843505859375, -0.006009101867675781, -0.005741119384765625, -0.005473136901855469, -0.0052051544189453125, -0.004937171936035156, -0.004669189453125, -0.004401206970214844, -0.0041332244873046875, -0.0038652420043945312, -0.003597259521484375, -0.0033292770385742188, -0.0030612945556640625, -0.0027933120727539062, -0.00252532958984375, -0.0022573471069335938, -0.0019893646240234375, -0.0017213821411132812, -0.001453399658203125, -0.0011854171752929688, -0.0009174346923828125, -0.0006494522094726562, -0.0003814697265625, -0.00011348724365234375, 0.0001544952392578125, 0.00042247772216796875, 0.000690460205078125, 0.0009584426879882812, 0.0012264251708984375, 0.0014944076538085938, 0.00176239013671875, 0.0020303726196289062, 0.0022983551025390625, 0.0025663375854492188, 0.002834320068359375, 0.0031023025512695312, 0.0033702850341796875, 0.0036382675170898438, 0.00390625, 0.004174232482910156, 0.0044422149658203125, 0.004710197448730469, 0.004978179931640625, 0.005246162414550781, 0.0055141448974609375, 0.005782127380371094, 0.00605010986328125, 0.006318092346191406, 0.0065860748291015625, 0.006854057312011719, 0.007122039794921875, 0.007390022277832031, 0.0076580047607421875, 0.007925987243652344, 0.0081939697265625]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 8.0, 12.0, 18.0, 13.0, 36.0, 54.0, 85.0, 113.0, 131.0, 144.0, 128.0, 103.0, 50.0, 37.0, 19.0, 18.0, 12.0, 7.0, 2.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.7224206328392029, -0.7034595012664795, -0.6844983696937561, -0.6655372381210327, -0.6465761065483093, -0.6276149749755859, -0.6086538434028625, -0.5896927118301392, -0.5707315802574158, -0.5517704486846924, -0.532809317111969, -0.5138481855392456, -0.4948870539665222, -0.47592592239379883, -0.45696479082107544, -0.43800365924835205, -0.4190424978733063, -0.4000813663005829, -0.3811202347278595, -0.3621591031551361, -0.3431979715824127, -0.32423684000968933, -0.30527567863464355, -0.28631454706192017, -0.2673534154891968, -0.2483922839164734, -0.22943115234375, -0.2104700207710266, -0.19150888919830322, -0.17254775762557983, -0.15358661115169525, -0.13462547957897186, -0.11566436290740967, -0.09670323133468628, -0.07774209976196289, -0.058780960738658905, -0.039819829165935516, -0.020858697593212128, -0.001897558569908142, 0.017063573002815247, 0.036024704575538635, 0.054985836148262024, 0.07394696772098541, 0.0929081067442894, 0.11186923831701279, 0.13083037734031677, 0.14979150891304016, 0.16875264048576355, 0.18771377205848694, 0.20667490363121033, 0.22563603520393372, 0.2445971667766571, 0.2635582983493805, 0.2825194299221039, 0.30148059129714966, 0.32044172286987305, 0.33940285444259644, 0.3583639860153198, 0.3773251175880432, 0.3962862491607666, 0.41524738073349, 0.4342085123062134, 0.45316964387893677, 0.47213077545166016, 0.49109190702438354]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 7.0, 5.0, 11.0, 5.0, 12.0, 16.0, 13.0, 17.0, 26.0, 40.0, 26.0, 37.0, 48.0, 53.0, 39.0, 48.0, 62.0, 55.0, 63.0, 49.0, 47.0, 42.0, 37.0, 33.0, 29.0, 29.0, 29.0, 19.0, 21.0, 12.0, 18.0, 11.0, 9.0, 8.0, 9.0, 4.0, 5.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2719714939594269, -0.2628169655799866, -0.25366243720054626, -0.24450792372226715, -0.23535341024398804, -0.22619888186454773, -0.21704435348510742, -0.20788982510566711, -0.198735311627388, -0.1895807832479477, -0.18042626976966858, -0.17127174139022827, -0.16211721301078796, -0.15296269953250885, -0.14380817115306854, -0.13465365767478943, -0.12549912929534912, -0.11634460836648941, -0.1071900874376297, -0.09803555905818939, -0.08888103812932968, -0.07972651720046997, -0.07057198882102966, -0.06141746789216995, -0.05226294696331024, -0.04310842603445053, -0.03395390138030052, -0.024799378588795662, -0.015644855797290802, -0.006490334868431091, 0.002664189785718918, 0.011818714439868927, 0.020973265171051025, 0.030127787962555885, 0.039282310754060745, 0.048436835408210754, 0.057591356337070465, 0.06674587726593018, 0.07590040564537048, 0.0850549265742302, 0.0942094475030899, 0.10336396843194962, 0.11251848936080933, 0.12167301774024963, 0.13082754611968994, 0.13998205959796906, 0.14913658797740936, 0.15829110145568848, 0.16744562983512878, 0.1766001582145691, 0.1857546716928482, 0.1949092000722885, 0.20406371355056763, 0.21321824193000793, 0.22237277030944824, 0.23152729868888855, 0.24068181216716766, 0.24983634054660797, 0.2589908540248871, 0.2681453824043274, 0.2772999107837677, 0.286454439163208, 0.2956089377403259, 0.30476346611976624, 0.31391799449920654]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 5.0, 4.0, 2.0, 4.0, 7.0, 15.0, 9.0, 23.0, 48.0, 113.0, 835.0, 10105.0, 846268.0, 186736.0, 3793.0, 406.0, 94.0, 35.0, 13.0, 13.0, 7.0, 5.0, 8.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.271484375, -1.225799560546875, -1.18011474609375, -1.134429931640625, -1.0887451171875, -1.043060302734375, -0.99737548828125, -0.951690673828125, -0.906005859375, -0.860321044921875, -0.81463623046875, -0.768951416015625, -0.7232666015625, -0.677581787109375, -0.63189697265625, -0.586212158203125, -0.54052734375, -0.494842529296875, -0.44915771484375, -0.403472900390625, -0.3577880859375, -0.312103271484375, -0.26641845703125, -0.220733642578125, -0.175048828125, -0.129364013671875, -0.08367919921875, -0.037994384765625, 0.0076904296875, 0.053375244140625, 0.09906005859375, 0.144744873046875, 0.1904296875, 0.236114501953125, 0.28179931640625, 0.327484130859375, 0.3731689453125, 0.418853759765625, 0.46453857421875, 0.510223388671875, 0.555908203125, 0.601593017578125, 0.64727783203125, 0.692962646484375, 0.7386474609375, 0.784332275390625, 0.83001708984375, 0.875701904296875, 0.92138671875, 0.967071533203125, 1.01275634765625, 1.058441162109375, 1.1041259765625, 1.149810791015625, 1.19549560546875, 1.241180419921875, 1.286865234375, 1.332550048828125, 1.37823486328125, 1.423919677734375, 1.4696044921875, 1.515289306640625, 1.56097412109375, 1.606658935546875, 1.65234375]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 4.0, 3.0, 12.0, 13.0, 14.0, 20.0, 22.0, 26.0, 49.0, 55.0, 57.0, 62.0, 78.0, 54.0, 84.0, 82.0, 66.0, 62.0, 51.0, 30.0, 36.0, 26.0, 26.0, 20.0, 15.0, 11.0, 10.0, 6.0, 3.0, 2.0, 4.0, 0.0, 0.0, 4.0, 2.0, 1.0], "bins": [-0.9970703125, -0.9735107421875, -0.949951171875, -0.9263916015625, -0.90283203125, -0.8792724609375, -0.855712890625, -0.8321533203125, -0.80859375, -0.7850341796875, -0.761474609375, -0.7379150390625, -0.71435546875, -0.6907958984375, -0.667236328125, -0.6436767578125, -0.6201171875, -0.5965576171875, -0.572998046875, -0.5494384765625, -0.52587890625, -0.5023193359375, -0.478759765625, -0.4552001953125, -0.431640625, -0.4080810546875, -0.384521484375, -0.3609619140625, -0.33740234375, -0.3138427734375, -0.290283203125, -0.2667236328125, -0.2431640625, -0.2196044921875, -0.196044921875, -0.1724853515625, -0.14892578125, -0.1253662109375, -0.101806640625, -0.0782470703125, -0.0546875, -0.0311279296875, -0.007568359375, 0.0159912109375, 0.03955078125, 0.0631103515625, 0.086669921875, 0.1102294921875, 0.1337890625, 0.1573486328125, 0.180908203125, 0.2044677734375, 0.22802734375, 0.2515869140625, 0.275146484375, 0.2987060546875, 0.322265625, 0.3458251953125, 0.369384765625, 0.3929443359375, 0.41650390625, 0.4400634765625, 0.463623046875, 0.4871826171875, 0.5107421875]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 6.0, 6.0, 3.0, 4.0, 6.0, 9.0, 11.0, 17.0, 17.0, 36.0, 35.0, 62.0, 64.0, 77.0, 108.0, 147.0, 225.0, 424.0, 1008.0, 3239.0, 20842.0, 536162.0, 462398.0, 18382.0, 3018.0, 972.0, 441.0, 226.0, 138.0, 110.0, 87.0, 65.0, 45.0, 29.0, 26.0, 19.0, 19.0, 21.0, 14.0, 12.0, 5.0, 7.0, 2.0, 3.0, 1.0, 3.0, 2.0, 2.0, 5.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.80712890625, -0.78265380859375, -0.7581787109375, -0.73370361328125, -0.709228515625, -0.68475341796875, -0.6602783203125, -0.63580322265625, -0.611328125, -0.58685302734375, -0.5623779296875, -0.53790283203125, -0.513427734375, -0.48895263671875, -0.4644775390625, -0.44000244140625, -0.41552734375, -0.39105224609375, -0.3665771484375, -0.34210205078125, -0.317626953125, -0.29315185546875, -0.2686767578125, -0.24420166015625, -0.2197265625, -0.19525146484375, -0.1707763671875, -0.14630126953125, -0.121826171875, -0.09735107421875, -0.0728759765625, -0.04840087890625, -0.02392578125, 0.00054931640625, 0.0250244140625, 0.04949951171875, 0.073974609375, 0.09844970703125, 0.1229248046875, 0.14739990234375, 0.171875, 0.19635009765625, 0.2208251953125, 0.24530029296875, 0.269775390625, 0.29425048828125, 0.3187255859375, 0.34320068359375, 0.36767578125, 0.39215087890625, 0.4166259765625, 0.44110107421875, 0.465576171875, 0.49005126953125, 0.5145263671875, 0.53900146484375, 0.5634765625, 0.58795166015625, 0.6124267578125, 0.63690185546875, 0.661376953125, 0.68585205078125, 0.7103271484375, 0.73480224609375, 0.75927734375]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 8.0, 7.0, 2.0, 9.0, 4.0, 8.0, 15.0, 15.0, 24.0, 24.0, 19.0, 32.0, 33.0, 33.0, 27.0, 39.0, 29.0, 44.0, 39.0, 46.0, 49.0, 37.0, 42.0, 37.0, 46.0, 39.0, 39.0, 36.0, 33.0, 26.0, 23.0, 14.0, 24.0, 12.0, 13.0, 15.0, 12.0, 12.0, 7.0, 6.0, 8.0, 2.0, 2.0, 2.0, 1.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.4794921875, -0.4650001525878906, -0.45050811767578125, -0.4360160827636719, -0.4215240478515625, -0.4070320129394531, -0.39253997802734375, -0.3780479431152344, -0.363555908203125, -0.3490638732910156, -0.33457183837890625, -0.3200798034667969, -0.3055877685546875, -0.2910957336425781, -0.27660369873046875, -0.2621116638183594, -0.24761962890625, -0.23312759399414062, -0.21863555908203125, -0.20414352416992188, -0.1896514892578125, -0.17515945434570312, -0.16066741943359375, -0.14617538452148438, -0.131683349609375, -0.11719131469726562, -0.10269927978515625, -0.08820724487304688, -0.0737152099609375, -0.059223175048828125, -0.04473114013671875, -0.030239105224609375, -0.0157470703125, -0.001255035400390625, 0.01323699951171875, 0.027729034423828125, 0.0422210693359375, 0.056713104248046875, 0.07120513916015625, 0.08569717407226562, 0.100189208984375, 0.11468124389648438, 0.12917327880859375, 0.14366531372070312, 0.1581573486328125, 0.17264938354492188, 0.18714141845703125, 0.20163345336914062, 0.21612548828125, 0.23061752319335938, 0.24510955810546875, 0.2596015930175781, 0.2740936279296875, 0.2885856628417969, 0.30307769775390625, 0.3175697326660156, 0.332061767578125, 0.3465538024902344, 0.36104583740234375, 0.3755378723144531, 0.3900299072265625, 0.4045219421386719, 0.41901397705078125, 0.4335060119628906, 0.447998046875]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 6.0, 2.0, 3.0, 0.0, 7.0, 14.0, 19.0, 33.0, 47.0, 85.0, 158.0, 267.0, 553.0, 1050.0, 2634.0, 8157.0, 43231.0, 521077.0, 423389.0, 36126.0, 7241.0, 2428.0, 974.0, 498.0, 217.0, 146.0, 74.0, 35.0, 35.0, 23.0, 11.0, 10.0, 6.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1510009765625, -0.145599365234375, -0.14019775390625, -0.134796142578125, -0.12939453125, -0.123992919921875, -0.11859130859375, -0.113189697265625, -0.1077880859375, -0.102386474609375, -0.09698486328125, -0.091583251953125, -0.086181640625, -0.080780029296875, -0.07537841796875, -0.069976806640625, -0.0645751953125, -0.059173583984375, -0.05377197265625, -0.048370361328125, -0.04296875, -0.037567138671875, -0.03216552734375, -0.026763916015625, -0.0213623046875, -0.015960693359375, -0.01055908203125, -0.005157470703125, 0.000244140625, 0.005645751953125, 0.01104736328125, 0.016448974609375, 0.0218505859375, 0.027252197265625, 0.03265380859375, 0.038055419921875, 0.04345703125, 0.048858642578125, 0.05426025390625, 0.059661865234375, 0.0650634765625, 0.070465087890625, 0.07586669921875, 0.081268310546875, 0.086669921875, 0.092071533203125, 0.09747314453125, 0.102874755859375, 0.1082763671875, 0.113677978515625, 0.11907958984375, 0.124481201171875, 0.1298828125, 0.135284423828125, 0.14068603515625, 0.146087646484375, 0.1514892578125, 0.156890869140625, 0.16229248046875, 0.167694091796875, 0.173095703125, 0.178497314453125, 0.18389892578125, 0.189300537109375, 0.1947021484375]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 5.0, 8.0, 22.0, 26.0, 50.0, 96.0, 92.0, 180.0, 164.0, 139.0, 87.0, 46.0, 23.0, 24.0, 4.0, 10.0, 8.0, 8.0, 0.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8371810913085938e-05, -2.7325935661792755e-05, -2.6280060410499573e-05, -2.523418515920639e-05, -2.4188309907913208e-05, -2.3142434656620026e-05, -2.2096559405326843e-05, -2.105068415403366e-05, -2.000480890274048e-05, -1.8958933651447296e-05, -1.7913058400154114e-05, -1.686718314886093e-05, -1.582130789756775e-05, -1.4775432646274567e-05, -1.3729557394981384e-05, -1.2683682143688202e-05, -1.163780689239502e-05, -1.0591931641101837e-05, -9.546056389808655e-06, -8.500181138515472e-06, -7.45430588722229e-06, -6.408430635929108e-06, -5.362555384635925e-06, -4.316680133342743e-06, -3.2708048820495605e-06, -2.224929630756378e-06, -1.1790543794631958e-06, -1.3317912817001343e-07, 9.126961231231689e-07, 1.9585713744163513e-06, 3.0044466257095337e-06, 4.050321877002716e-06, 5.0961971282958984e-06, 6.142072379589081e-06, 7.187947630882263e-06, 8.233822882175446e-06, 9.279698133468628e-06, 1.032557338476181e-05, 1.1371448636054993e-05, 1.2417323887348175e-05, 1.3463199138641357e-05, 1.450907438993454e-05, 1.5554949641227722e-05, 1.6600824892520905e-05, 1.7646700143814087e-05, 1.869257539510727e-05, 1.973845064640045e-05, 2.0784325897693634e-05, 2.1830201148986816e-05, 2.287607640028e-05, 2.392195165157318e-05, 2.4967826902866364e-05, 2.6013702154159546e-05, 2.7059577405452728e-05, 2.810545265674591e-05, 2.9151327908039093e-05, 3.0197203159332275e-05, 3.124307841062546e-05, 3.228895366191864e-05, 3.333482891321182e-05, 3.4380704164505005e-05, 3.542657941579819e-05, 3.647245466709137e-05, 3.751832991838455e-05, 3.8564205169677734e-05]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 6.0, 15.0, 16.0, 24.0, 51.0, 86.0, 192.0, 496.0, 1472.0, 7047.0, 81881.0, 880274.0, 68381.0, 6385.0, 1403.0, 474.0, 165.0, 83.0, 44.0, 24.0, 10.0, 11.0, 5.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2427978515625, -0.2342700958251953, -0.22574234008789062, -0.21721458435058594, -0.20868682861328125, -0.20015907287597656, -0.19163131713867188, -0.1831035614013672, -0.1745758056640625, -0.1660480499267578, -0.15752029418945312, -0.14899253845214844, -0.14046478271484375, -0.13193702697753906, -0.12340927124023438, -0.11488151550292969, -0.106353759765625, -0.09782600402832031, -0.08929824829101562, -0.08077049255371094, -0.07224273681640625, -0.06371498107910156, -0.055187225341796875, -0.04665946960449219, -0.0381317138671875, -0.029603958129882812, -0.021076202392578125, -0.012548446655273438, -0.00402069091796875, 0.0045070648193359375, 0.013034820556640625, 0.021562576293945312, 0.03009033203125, 0.03861808776855469, 0.047145843505859375, 0.05567359924316406, 0.06420135498046875, 0.07272911071777344, 0.08125686645507812, 0.08978462219238281, 0.0983123779296875, 0.10684013366699219, 0.11536788940429688, 0.12389564514160156, 0.13242340087890625, 0.14095115661621094, 0.14947891235351562, 0.1580066680908203, 0.166534423828125, 0.1750621795654297, 0.18358993530273438, 0.19211769104003906, 0.20064544677734375, 0.20917320251464844, 0.21770095825195312, 0.2262287139892578, 0.2347564697265625, 0.2432842254638672, 0.2518119812011719, 0.26033973693847656, 0.26886749267578125, 0.27739524841308594, 0.2859230041503906, 0.2944507598876953, 0.302978515625]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 9.0, 14.0, 17.0, 24.0, 30.0, 37.0, 77.0, 115.0, 137.0, 141.0, 120.0, 89.0, 60.0, 38.0, 30.0, 22.0, 8.0, 11.0, 4.0, 6.0, 2.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0816650390625, -0.07934761047363281, -0.07703018188476562, -0.07471275329589844, -0.07239532470703125, -0.07007789611816406, -0.06776046752929688, -0.06544303894042969, -0.0631256103515625, -0.06080818176269531, -0.058490753173828125, -0.05617332458496094, -0.05385589599609375, -0.05153846740722656, -0.049221038818359375, -0.04690361022949219, -0.044586181640625, -0.04226875305175781, -0.039951324462890625, -0.03763389587402344, -0.03531646728515625, -0.03299903869628906, -0.030681610107421875, -0.028364181518554688, -0.0260467529296875, -0.023729324340820312, -0.021411895751953125, -0.019094467163085938, -0.01677703857421875, -0.014459609985351562, -0.012142181396484375, -0.009824752807617188, -0.00750732421875, -0.0051898956298828125, -0.002872467041015625, -0.0005550384521484375, 0.00176239013671875, 0.0040798187255859375, 0.006397247314453125, 0.008714675903320312, 0.0110321044921875, 0.013349533081054688, 0.015666961669921875, 0.017984390258789062, 0.02030181884765625, 0.022619247436523438, 0.024936676025390625, 0.027254104614257812, 0.029571533203125, 0.03188896179199219, 0.034206390380859375, 0.03652381896972656, 0.03884124755859375, 0.04115867614746094, 0.043476104736328125, 0.04579353332519531, 0.0481109619140625, 0.05042839050292969, 0.052745819091796875, 0.05506324768066406, 0.05738067626953125, 0.05969810485839844, 0.062015533447265625, 0.06433296203613281, 0.066650390625]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 8.0, 5.0, 20.0, 31.0, 56.0, 124.0, 167.0, 198.0, 176.0, 100.0, 54.0, 24.0, 23.0, 8.0, 8.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.3839874267578125, -2.330397844314575, -2.276808261871338, -2.2232186794281006, -2.1696290969848633, -2.116039752960205, -2.0624501705169678, -2.0088605880737305, -1.9552710056304932, -1.9016814231872559, -1.8480918407440186, -1.7945023775100708, -1.7409127950668335, -1.6873232126235962, -1.6337337493896484, -1.5801441669464111, -1.5265545845031738, -1.4729650020599365, -1.4193754196166992, -1.3657859563827515, -1.3121963739395142, -1.2586067914962769, -1.205017328262329, -1.1514277458190918, -1.0978381633758545, -1.0442485809326172, -0.9906590580940247, -0.9370695352554321, -0.8834799528121948, -0.8298903703689575, -0.776300847530365, -0.7227113246917725, -0.6691218614578247, -0.6155322790145874, -0.5619427561759949, -0.5083532333374023, -0.45476365089416504, -0.4011740982532501, -0.3475845456123352, -0.2939949929714203, -0.24040544033050537, -0.18681588768959045, -0.13322633504867554, -0.07963678240776062, -0.026047229766845703, 0.027542322874069214, 0.08113187551498413, 0.13472142815589905, 0.18831098079681396, 0.24190053343772888, 0.2954900860786438, 0.3490796387195587, 0.40266919136047363, 0.45625874400138855, 0.5098482966423035, 0.563437819480896, 0.6170274019241333, 0.6706169843673706, 0.7242065072059631, 0.7777960300445557, 0.831385612487793, 0.8849751949310303, 0.9385647177696228, 0.9921542406082153, 1.0457438230514526]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 7.0, 9.0, 11.0, 5.0, 14.0, 13.0, 17.0, 24.0, 22.0, 17.0, 29.0, 38.0, 28.0, 38.0, 34.0, 49.0, 47.0, 50.0, 40.0, 45.0, 42.0, 49.0, 54.0, 42.0, 34.0, 32.0, 35.0, 27.0, 34.0, 19.0, 16.0, 19.0, 10.0, 7.0, 12.0, 5.0, 8.0, 7.0, 8.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.0464414358139038, -1.017364740371704, -0.9882881045341492, -0.9592114686965942, -0.9301348328590393, -0.9010581970214844, -0.8719815015792847, -0.8429048657417297, -0.8138282299041748, -0.7847515940666199, -0.7556748986244202, -0.7265982627868652, -0.6975216269493103, -0.6684449911117554, -0.6393682956695557, -0.6102916598320007, -0.581214964389801, -0.5521383285522461, -0.5230616331100464, -0.49398499727249146, -0.4649083614349365, -0.4358316957950592, -0.4067550301551819, -0.37767839431762695, -0.34860172867774963, -0.3195250630378723, -0.2904484272003174, -0.26137176156044006, -0.23229511082172394, -0.2032184600830078, -0.1741417944431305, -0.14506514370441437, -0.11598849296569824, -0.08691184222698212, -0.057835184037685394, -0.028758525848388672, 0.0003181248903274536, 0.02939477562904358, 0.0584714412689209, 0.08754809200763702, 0.11662474274635315, 0.14570139348506927, 0.1747780442237854, 0.20385470986366272, 0.23293136060237885, 0.26200801134109497, 0.2910846769809723, 0.3201613426208496, 0.34923797845840454, 0.37831464409828186, 0.4073912799358368, 0.4364679455757141, 0.46554458141326904, 0.49462124705314636, 0.5236979126930237, 0.5527745485305786, 0.5818512439727783, 0.6109278798103333, 0.640004575252533, 0.6690812110900879, 0.6981578469276428, 0.7272344827651978, 0.7563111782073975, 0.7853878140449524, 0.8144644498825073]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 2.0, 3.0, 2.0, 8.0, 11.0, 12.0, 18.0, 17.0, 30.0, 44.0, 84.0, 148.0, 252.0, 420.0, 866.0, 1984.0, 5307.0, 22586.0, 291870.0, 3278108.0, 548591.0, 32675.0, 6592.0, 2362.0, 1017.0, 504.0, 288.0, 165.0, 96.0, 74.0, 43.0, 31.0, 18.0, 16.0, 8.0, 9.0, 10.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.97412109375, -0.948883056640625, -0.92364501953125, -0.898406982421875, -0.8731689453125, -0.847930908203125, -0.82269287109375, -0.797454833984375, -0.772216796875, -0.746978759765625, -0.72174072265625, -0.696502685546875, -0.6712646484375, -0.646026611328125, -0.62078857421875, -0.595550537109375, -0.5703125, -0.545074462890625, -0.51983642578125, -0.494598388671875, -0.4693603515625, -0.444122314453125, -0.41888427734375, -0.393646240234375, -0.368408203125, -0.343170166015625, -0.31793212890625, -0.292694091796875, -0.2674560546875, -0.242218017578125, -0.21697998046875, -0.191741943359375, -0.16650390625, -0.141265869140625, -0.11602783203125, -0.090789794921875, -0.0655517578125, -0.040313720703125, -0.01507568359375, 0.010162353515625, 0.035400390625, 0.060638427734375, 0.08587646484375, 0.111114501953125, 0.1363525390625, 0.161590576171875, 0.18682861328125, 0.212066650390625, 0.2373046875, 0.262542724609375, 0.28778076171875, 0.313018798828125, 0.3382568359375, 0.363494873046875, 0.38873291015625, 0.413970947265625, 0.439208984375, 0.464447021484375, 0.48968505859375, 0.514923095703125, 0.5401611328125, 0.565399169921875, 0.59063720703125, 0.615875244140625, 0.64111328125]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 6.0, 10.0, 7.0, 10.0, 14.0, 22.0, 20.0, 19.0, 24.0, 25.0, 42.0, 51.0, 28.0, 40.0, 62.0, 47.0, 52.0, 53.0, 51.0, 54.0, 45.0, 46.0, 29.0, 41.0, 25.0, 37.0, 25.0, 20.0, 20.0, 11.0, 16.0, 8.0, 4.0, 8.0, 11.0, 5.0, 1.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.34619140625, -0.3344459533691406, -0.32270050048828125, -0.3109550476074219, -0.2992095947265625, -0.2874641418457031, -0.27571868896484375, -0.2639732360839844, -0.252227783203125, -0.24048233032226562, -0.22873687744140625, -0.21699142456054688, -0.2052459716796875, -0.19350051879882812, -0.18175506591796875, -0.17000961303710938, -0.15826416015625, -0.14651870727539062, -0.13477325439453125, -0.12302780151367188, -0.1112823486328125, -0.09953689575195312, -0.08779144287109375, -0.07604598999023438, -0.064300537109375, -0.052555084228515625, -0.04080963134765625, -0.029064178466796875, -0.0173187255859375, -0.005573272705078125, 0.00617218017578125, 0.017917633056640625, 0.0296630859375, 0.041408538818359375, 0.05315399169921875, 0.06489944458007812, 0.0766448974609375, 0.08839035034179688, 0.10013580322265625, 0.11188125610351562, 0.123626708984375, 0.13537216186523438, 0.14711761474609375, 0.15886306762695312, 0.1706085205078125, 0.18235397338867188, 0.19409942626953125, 0.20584487915039062, 0.21759033203125, 0.22933578491210938, 0.24108123779296875, 0.2528266906738281, 0.2645721435546875, 0.2763175964355469, 0.28806304931640625, 0.2998085021972656, 0.311553955078125, 0.3232994079589844, 0.33504486083984375, 0.3467903137207031, 0.3585357666015625, 0.3702812194824219, 0.38202667236328125, 0.3937721252441406, 0.405517578125]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 6.0, 4.0, 7.0, 7.0, 8.0, 11.0, 22.0, 36.0, 55.0, 105.0, 240.0, 635.0, 1947.0, 8942.0, 106969.0, 3898122.0, 162376.0, 11231.0, 2323.0, 675.0, 263.0, 119.0, 71.0, 44.0, 14.0, 13.0, 10.0, 10.0, 5.0, 3.0, 0.0, 3.0, 7.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.08984375, -1.0583038330078125, -1.026763916015625, -0.9952239990234375, -0.96368408203125, -0.9321441650390625, -0.900604248046875, -0.8690643310546875, -0.8375244140625, -0.8059844970703125, -0.774444580078125, -0.7429046630859375, -0.71136474609375, -0.6798248291015625, -0.648284912109375, -0.6167449951171875, -0.585205078125, -0.5536651611328125, -0.522125244140625, -0.4905853271484375, -0.45904541015625, -0.4275054931640625, -0.395965576171875, -0.3644256591796875, -0.3328857421875, -0.3013458251953125, -0.269805908203125, -0.2382659912109375, -0.20672607421875, -0.1751861572265625, -0.143646240234375, -0.1121063232421875, -0.08056640625, -0.0490264892578125, -0.017486572265625, 0.0140533447265625, 0.04559326171875, 0.0771331787109375, 0.108673095703125, 0.1402130126953125, 0.1717529296875, 0.2032928466796875, 0.234832763671875, 0.2663726806640625, 0.29791259765625, 0.3294525146484375, 0.360992431640625, 0.3925323486328125, 0.424072265625, 0.4556121826171875, 0.487152099609375, 0.5186920166015625, 0.55023193359375, 0.5817718505859375, 0.613311767578125, 0.6448516845703125, 0.6763916015625, 0.7079315185546875, 0.739471435546875, 0.7710113525390625, 0.80255126953125, 0.8340911865234375, 0.865631103515625, 0.8971710205078125, 0.9287109375]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 3.0, 2.0, 6.0, 8.0, 7.0, 12.0, 14.0, 20.0, 22.0, 33.0, 30.0, 60.0, 91.0, 106.0, 204.0, 303.0, 419.0, 592.0, 676.0, 484.0, 331.0, 215.0, 118.0, 80.0, 71.0, 43.0, 31.0, 18.0, 16.0, 17.0, 12.0, 6.0, 4.0, 5.0, 1.0, 1.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.154052734375, -0.14966964721679688, -0.14528656005859375, -0.14090347290039062, -0.1365203857421875, -0.13213729858398438, -0.12775421142578125, -0.12337112426757812, -0.118988037109375, -0.11460494995117188, -0.11022186279296875, -0.10583877563476562, -0.1014556884765625, -0.09707260131835938, -0.09268951416015625, -0.08830642700195312, -0.08392333984375, -0.07954025268554688, -0.07515716552734375, -0.07077407836914062, -0.0663909912109375, -0.062007904052734375, -0.05762481689453125, -0.053241729736328125, -0.048858642578125, -0.044475555419921875, -0.04009246826171875, -0.035709381103515625, -0.0313262939453125, -0.026943206787109375, -0.02256011962890625, -0.018177032470703125, -0.0137939453125, -0.009410858154296875, -0.00502777099609375, -0.000644683837890625, 0.0037384033203125, 0.008121490478515625, 0.01250457763671875, 0.016887664794921875, 0.021270751953125, 0.025653839111328125, 0.03003692626953125, 0.034420013427734375, 0.0388031005859375, 0.043186187744140625, 0.04756927490234375, 0.051952362060546875, 0.05633544921875, 0.060718536376953125, 0.06510162353515625, 0.06948471069335938, 0.0738677978515625, 0.07825088500976562, 0.08263397216796875, 0.08701705932617188, 0.091400146484375, 0.09578323364257812, 0.10016632080078125, 0.10454940795898438, 0.1089324951171875, 0.11331558227539062, 0.11769866943359375, 0.12208175659179688, 0.12646484375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 4.0, 3.0, 8.0, 16.0, 17.0, 26.0, 40.0, 63.0, 86.0, 108.0, 125.0, 123.0, 128.0, 89.0, 48.0, 38.0, 27.0, 15.0, 8.0, 9.0, 11.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4996727705001831, -0.4749203324317932, -0.4501679241657257, -0.4254155158996582, -0.4006630778312683, -0.3759106397628784, -0.3511582314968109, -0.3264058232307434, -0.3016533851623535, -0.2769009470939636, -0.2521485388278961, -0.22739611566066742, -0.20264369249343872, -0.17789126932621002, -0.15313884615898132, -0.12838642299175262, -0.10363399982452393, -0.07888157665729523, -0.05412915349006653, -0.02937673032283783, -0.004624307155609131, 0.020128116011619568, 0.04488053917884827, 0.06963296234607697, 0.09438538551330566, 0.11913780868053436, 0.14389023184776306, 0.16864265501499176, 0.19339507818222046, 0.21814750134944916, 0.24289992451667786, 0.26765233278274536, 0.29240477085113525, 0.31715720891952515, 0.34190961718559265, 0.36666202545166016, 0.39141446352005005, 0.41616690158843994, 0.44091930985450745, 0.46567171812057495, 0.49042415618896484, 0.5151765942573547, 0.5399290323257446, 0.5646814107894897, 0.5894338488578796, 0.6141862869262695, 0.6389386653900146, 0.6636911034584045, 0.6884435415267944, 0.7131959795951843, 0.7379484176635742, 0.7627007961273193, 0.7874532341957092, 0.8122056722640991, 0.8369580507278442, 0.8617104887962341, 0.886462926864624, 0.9112153649330139, 0.9359678030014038, 0.9607201814651489, 0.9854726195335388, 1.0102250576019287, 1.0349774360656738, 1.0597299337387085, 1.0844823122024536]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 6.0, 5.0, 5.0, 6.0, 7.0, 14.0, 9.0, 23.0, 23.0, 26.0, 21.0, 34.0, 39.0, 51.0, 43.0, 53.0, 41.0, 51.0, 52.0, 38.0, 53.0, 41.0, 48.0, 39.0, 37.0, 38.0, 33.0, 34.0, 21.0, 21.0, 19.0, 21.0, 13.0, 11.0, 6.0, 4.0, 6.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.3821377158164978, -0.36959391832351685, -0.3570501208305359, -0.34450632333755493, -0.33196255564689636, -0.3194187581539154, -0.30687496066093445, -0.2943311631679535, -0.28178736567497253, -0.2692435681819916, -0.2566997706890106, -0.24415598809719086, -0.2316121906042099, -0.21906840801239014, -0.20652461051940918, -0.19398081302642822, -0.18143703043460846, -0.1688932329416275, -0.15634945034980774, -0.14380565285682678, -0.13126185536384583, -0.11871806532144547, -0.1061742752790451, -0.09363047778606415, -0.08108668774366379, -0.06854289770126343, -0.05599910020828247, -0.04345531016588211, -0.030911516398191452, -0.018367722630500793, -0.005823932588100433, 0.006719864904880524, 0.019263654947280884, 0.03180744871497154, 0.0443512424826622, 0.05689503252506256, 0.06943883001804352, 0.08198262006044388, 0.09452641010284424, 0.1070702075958252, 0.11961399763822556, 0.13215778768062592, 0.14470158517360687, 0.15724536776542664, 0.1697891652584076, 0.18233296275138855, 0.1948767602443695, 0.20742055773735046, 0.21996434032917023, 0.23250813782215118, 0.24505192041397095, 0.2575957179069519, 0.27013951539993286, 0.2826833128929138, 0.2952271103858948, 0.30777090787887573, 0.3203146755695343, 0.33285847306251526, 0.3454022705554962, 0.3579460382461548, 0.37048983573913574, 0.3830336332321167, 0.39557743072509766, 0.4081212282180786, 0.42066502571105957]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 7.0, 5.0, 14.0, 25.0, 55.0, 106.0, 234.0, 799.0, 3063.0, 14945.0, 232115.0, 747663.0, 41345.0, 5966.0, 1464.0, 425.0, 171.0, 65.0, 36.0, 21.0, 12.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2176513671875, -0.2096576690673828, -0.20166397094726562, -0.19367027282714844, -0.18567657470703125, -0.17768287658691406, -0.16968917846679688, -0.1616954803466797, -0.1537017822265625, -0.1457080841064453, -0.13771438598632812, -0.12972068786621094, -0.12172698974609375, -0.11373329162597656, -0.10573959350585938, -0.09774589538574219, -0.089752197265625, -0.08175849914550781, -0.07376480102539062, -0.06577110290527344, -0.05777740478515625, -0.04978370666503906, -0.041790008544921875, -0.03379631042480469, -0.0258026123046875, -0.017808914184570312, -0.009815216064453125, -0.0018215179443359375, 0.00617218017578125, 0.014165878295898438, 0.022159576416015625, 0.030153274536132812, 0.03814697265625, 0.04614067077636719, 0.054134368896484375, 0.06212806701660156, 0.07012176513671875, 0.07811546325683594, 0.08610916137695312, 0.09410285949707031, 0.1020965576171875, 0.11009025573730469, 0.11808395385742188, 0.12607765197753906, 0.13407135009765625, 0.14206504821777344, 0.15005874633789062, 0.1580524444580078, 0.166046142578125, 0.1740398406982422, 0.18203353881835938, 0.19002723693847656, 0.19802093505859375, 0.20601463317871094, 0.21400833129882812, 0.2220020294189453, 0.2299957275390625, 0.2379894256591797, 0.24598312377929688, 0.25397682189941406, 0.26197052001953125, 0.26996421813964844, 0.2779579162597656, 0.2859516143798828, 0.2939453125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 5.0, 3.0, 10.0, 7.0, 9.0, 17.0, 15.0, 16.0, 27.0, 27.0, 33.0, 45.0, 52.0, 45.0, 49.0, 55.0, 52.0, 55.0, 61.0, 46.0, 45.0, 48.0, 45.0, 27.0, 35.0, 41.0, 31.0, 18.0, 20.0, 17.0, 12.0, 6.0, 10.0, 4.0, 5.0, 4.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.266845703125, -0.257568359375, -0.248291015625, -0.239013671875, -0.229736328125, -0.220458984375, -0.211181640625, -0.201904296875, -0.192626953125, -0.183349609375, -0.174072265625, -0.164794921875, -0.155517578125, -0.146240234375, -0.136962890625, -0.127685546875, -0.118408203125, -0.109130859375, -0.099853515625, -0.090576171875, -0.081298828125, -0.072021484375, -0.062744140625, -0.053466796875, -0.044189453125, -0.034912109375, -0.025634765625, -0.016357421875, -0.007080078125, 0.002197265625, 0.011474609375, 0.020751953125, 0.030029296875, 0.039306640625, 0.048583984375, 0.057861328125, 0.067138671875, 0.076416015625, 0.085693359375, 0.094970703125, 0.104248046875, 0.113525390625, 0.122802734375, 0.132080078125, 0.141357421875, 0.150634765625, 0.159912109375, 0.169189453125, 0.178466796875, 0.187744140625, 0.197021484375, 0.206298828125, 0.215576171875, 0.224853515625, 0.234130859375, 0.243408203125, 0.252685546875, 0.261962890625, 0.271240234375, 0.280517578125, 0.289794921875, 0.299072265625, 0.308349609375, 0.317626953125, 0.326904296875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 5.0, 3.0, 3.0, 4.0, 14.0, 31.0, 48.0, 98.0, 179.0, 439.0, 1132.0, 3394.0, 12458.0, 75622.0, 564616.0, 339878.0, 39032.0, 7788.0, 2355.0, 803.0, 312.0, 159.0, 92.0, 41.0, 19.0, 8.0, 9.0, 6.0, 4.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1439208984375, -0.13940048217773438, -0.13488006591796875, -0.13035964965820312, -0.1258392333984375, -0.12131881713867188, -0.11679840087890625, -0.11227798461914062, -0.107757568359375, -0.10323715209960938, -0.09871673583984375, -0.09419631958007812, -0.0896759033203125, -0.08515548706054688, -0.08063507080078125, -0.07611465454101562, -0.07159423828125, -0.06707382202148438, -0.06255340576171875, -0.058032989501953125, -0.0535125732421875, -0.048992156982421875, -0.04447174072265625, -0.039951324462890625, -0.035430908203125, -0.030910491943359375, -0.02639007568359375, -0.021869659423828125, -0.0173492431640625, -0.012828826904296875, -0.00830841064453125, -0.003787994384765625, 0.000732421875, 0.005252838134765625, 0.00977325439453125, 0.014293670654296875, 0.0188140869140625, 0.023334503173828125, 0.02785491943359375, 0.032375335693359375, 0.036895751953125, 0.041416168212890625, 0.04593658447265625, 0.050457000732421875, 0.0549774169921875, 0.059497833251953125, 0.06401824951171875, 0.06853866577148438, 0.07305908203125, 0.07757949829101562, 0.08209991455078125, 0.08662033081054688, 0.0911407470703125, 0.09566116333007812, 0.10018157958984375, 0.10470199584960938, 0.109222412109375, 0.11374282836914062, 0.11826324462890625, 0.12278366088867188, 0.1273040771484375, 0.13182449340820312, 0.13634490966796875, 0.14086532592773438, 0.1453857421875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 10.0, 6.0, 7.0, 5.0, 13.0, 11.0, 9.0, 15.0, 22.0, 23.0, 30.0, 21.0, 32.0, 39.0, 42.0, 39.0, 41.0, 43.0, 47.0, 42.0, 39.0, 45.0, 37.0, 39.0, 39.0, 32.0, 40.0, 34.0, 26.0, 26.0, 25.0, 20.0, 24.0, 18.0, 12.0, 7.0, 9.0, 9.0, 6.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0], "bins": [-0.4892578125, -0.4744834899902344, -0.45970916748046875, -0.4449348449707031, -0.4301605224609375, -0.4153861999511719, -0.40061187744140625, -0.3858375549316406, -0.371063232421875, -0.3562889099121094, -0.34151458740234375, -0.3267402648925781, -0.3119659423828125, -0.2971916198730469, -0.28241729736328125, -0.2676429748535156, -0.25286865234375, -0.23809432983398438, -0.22332000732421875, -0.20854568481445312, -0.1937713623046875, -0.17899703979492188, -0.16422271728515625, -0.14944839477539062, -0.134674072265625, -0.11989974975585938, -0.10512542724609375, -0.09035110473632812, -0.0755767822265625, -0.060802459716796875, -0.04602813720703125, -0.031253814697265625, -0.0164794921875, -0.001705169677734375, 0.01306915283203125, 0.027843475341796875, 0.0426177978515625, 0.057392120361328125, 0.07216644287109375, 0.08694076538085938, 0.101715087890625, 0.11648941040039062, 0.13126373291015625, 0.14603805541992188, 0.1608123779296875, 0.17558670043945312, 0.19036102294921875, 0.20513534545898438, 0.21990966796875, 0.23468399047851562, 0.24945831298828125, 0.2642326354980469, 0.2790069580078125, 0.2937812805175781, 0.30855560302734375, 0.3233299255371094, 0.338104248046875, 0.3528785705566406, 0.36765289306640625, 0.3824272155761719, 0.3972015380859375, 0.4119758605957031, 0.42675018310546875, 0.4415245056152344, 0.456298828125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 1.0, 2.0, 0.0, 5.0, 6.0, 7.0, 10.0, 15.0, 31.0, 46.0, 78.0, 192.0, 444.0, 1023.0, 3173.0, 12004.0, 77550.0, 614746.0, 297476.0, 32032.0, 6423.0, 2003.0, 670.0, 309.0, 139.0, 73.0, 36.0, 19.0, 13.0, 8.0, 12.0, 5.0, 0.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.061370849609375, -0.05982828140258789, -0.05828571319580078, -0.05674314498901367, -0.05520057678222656, -0.05365800857543945, -0.052115440368652344, -0.050572872161865234, -0.049030303955078125, -0.047487735748291016, -0.045945167541503906, -0.0444025993347168, -0.04286003112792969, -0.04131746292114258, -0.03977489471435547, -0.03823232650756836, -0.03668975830078125, -0.03514719009399414, -0.03360462188720703, -0.03206205368041992, -0.030519485473632812, -0.028976917266845703, -0.027434349060058594, -0.025891780853271484, -0.024349212646484375, -0.022806644439697266, -0.021264076232910156, -0.019721508026123047, -0.018178939819335938, -0.016636371612548828, -0.015093803405761719, -0.01355123519897461, -0.0120086669921875, -0.01046609878540039, -0.008923530578613281, -0.007380962371826172, -0.0058383941650390625, -0.004295825958251953, -0.0027532577514648438, -0.0012106895446777344, 0.000331878662109375, 0.0018744468688964844, 0.0034170150756835938, 0.004959583282470703, 0.0065021514892578125, 0.008044719696044922, 0.009587287902832031, 0.01112985610961914, 0.01267242431640625, 0.01421499252319336, 0.01575756072998047, 0.017300128936767578, 0.018842697143554688, 0.020385265350341797, 0.021927833557128906, 0.023470401763916016, 0.025012969970703125, 0.026555538177490234, 0.028098106384277344, 0.029640674591064453, 0.031183242797851562, 0.03272581100463867, 0.03426837921142578, 0.03581094741821289, 0.037353515625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 3.0, 4.0, 9.0, 12.0, 12.0, 21.0, 29.0, 41.0, 62.0, 98.0, 114.0, 110.0, 108.0, 107.0, 92.0, 58.0, 41.0, 23.0, 19.0, 13.0, 9.0, 6.0, 7.0, 3.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5272369384765625e-05, -2.454407513141632e-05, -2.3815780878067017e-05, -2.3087486624717712e-05, -2.2359192371368408e-05, -2.1630898118019104e-05, -2.09026038646698e-05, -2.0174309611320496e-05, -1.944601535797119e-05, -1.8717721104621887e-05, -1.7989426851272583e-05, -1.726113259792328e-05, -1.6532838344573975e-05, -1.580454409122467e-05, -1.5076249837875366e-05, -1.4347955584526062e-05, -1.3619661331176758e-05, -1.2891367077827454e-05, -1.216307282447815e-05, -1.1434778571128845e-05, -1.0706484317779541e-05, -9.978190064430237e-06, -9.249895811080933e-06, -8.521601557731628e-06, -7.793307304382324e-06, -7.06501305103302e-06, -6.336718797683716e-06, -5.608424544334412e-06, -4.880130290985107e-06, -4.151836037635803e-06, -3.423541784286499e-06, -2.695247530937195e-06, -1.9669532775878906e-06, -1.2386590242385864e-06, -5.103647708892822e-07, 2.1792948246002197e-07, 9.462237358093262e-07, 1.6745179891586304e-06, 2.4028122425079346e-06, 3.1311064958572388e-06, 3.859400749206543e-06, 4.587695002555847e-06, 5.315989255905151e-06, 6.0442835092544556e-06, 6.77257776260376e-06, 7.500872015953064e-06, 8.229166269302368e-06, 8.957460522651672e-06, 9.685754776000977e-06, 1.041404902935028e-05, 1.1142343282699585e-05, 1.187063753604889e-05, 1.2598931789398193e-05, 1.3327226042747498e-05, 1.4055520296096802e-05, 1.4783814549446106e-05, 1.551210880279541e-05, 1.6240403056144714e-05, 1.696869730949402e-05, 1.7696991562843323e-05, 1.8425285816192627e-05, 1.915358006954193e-05, 1.9881874322891235e-05, 2.061016857624054e-05, 2.1338462829589844e-05]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 5.0, 13.0, 17.0, 38.0, 45.0, 75.0, 119.0, 217.0, 374.0, 856.0, 1748.0, 4041.0, 11957.0, 52254.0, 309540.0, 520008.0, 114975.0, 21360.0, 6231.0, 2412.0, 1060.0, 519.0, 277.0, 149.0, 87.0, 59.0, 31.0, 27.0, 18.0, 12.0, 9.0, 6.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.03338623046875, -0.03224372863769531, -0.031101226806640625, -0.029958724975585938, -0.02881622314453125, -0.027673721313476562, -0.026531219482421875, -0.025388717651367188, -0.0242462158203125, -0.023103713989257812, -0.021961212158203125, -0.020818710327148438, -0.01967620849609375, -0.018533706665039062, -0.017391204833984375, -0.016248703002929688, -0.015106201171875, -0.013963699340820312, -0.012821197509765625, -0.011678695678710938, -0.01053619384765625, -0.009393692016601562, -0.008251190185546875, -0.0071086883544921875, -0.0059661865234375, -0.0048236846923828125, -0.003681182861328125, -0.0025386810302734375, -0.00139617919921875, -0.0002536773681640625, 0.000888824462890625, 0.0020313262939453125, 0.003173828125, 0.0043163299560546875, 0.005458831787109375, 0.0066013336181640625, 0.00774383544921875, 0.008886337280273438, 0.010028839111328125, 0.011171340942382812, 0.0123138427734375, 0.013456344604492188, 0.014598846435546875, 0.015741348266601562, 0.01688385009765625, 0.018026351928710938, 0.019168853759765625, 0.020311355590820312, 0.021453857421875, 0.022596359252929688, 0.023738861083984375, 0.024881362915039062, 0.02602386474609375, 0.027166366577148438, 0.028308868408203125, 0.029451370239257812, 0.0305938720703125, 0.03173637390136719, 0.032878875732421875, 0.03402137756347656, 0.03516387939453125, 0.03630638122558594, 0.037448883056640625, 0.03859138488769531, 0.03973388671875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 2.0, 5.0, 2.0, 5.0, 2.0, 6.0, 6.0, 2.0, 8.0, 21.0, 19.0, 20.0, 38.0, 48.0, 41.0, 65.0, 60.0, 82.0, 97.0, 64.0, 75.0, 81.0, 60.0, 61.0, 40.0, 25.0, 17.0, 20.0, 11.0, 7.0, 2.0, 5.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.008697509765625, -0.008423209190368652, -0.008148908615112305, -0.007874608039855957, -0.007600307464599609, -0.007326006889343262, -0.007051706314086914, -0.006777405738830566, -0.006503105163574219, -0.006228804588317871, -0.0059545040130615234, -0.005680203437805176, -0.005405902862548828, -0.0051316022872924805, -0.004857301712036133, -0.004583001136779785, -0.0043087005615234375, -0.00403439998626709, -0.003760099411010742, -0.0034857988357543945, -0.003211498260498047, -0.0029371976852416992, -0.0026628971099853516, -0.002388596534729004, -0.0021142959594726562, -0.0018399953842163086, -0.001565694808959961, -0.0012913942337036133, -0.0010170936584472656, -0.000742793083190918, -0.0004684925079345703, -0.00019419193267822266, 8.0108642578125e-05, 0.00035440921783447266, 0.0006287097930908203, 0.000903010368347168, 0.0011773109436035156, 0.0014516115188598633, 0.001725912094116211, 0.0020002126693725586, 0.0022745132446289062, 0.002548813819885254, 0.0028231143951416016, 0.0030974149703979492, 0.003371715545654297, 0.0036460161209106445, 0.003920316696166992, 0.00419461727142334, 0.0044689178466796875, 0.004743218421936035, 0.005017518997192383, 0.0052918195724487305, 0.005566120147705078, 0.005840420722961426, 0.0061147212982177734, 0.006389021873474121, 0.006663322448730469, 0.006937623023986816, 0.007211923599243164, 0.007486224174499512, 0.007760524749755859, 0.008034825325012207, 0.008309125900268555, 0.008583426475524902, 0.00885772705078125]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 6.0, 8.0, 15.0, 56.0, 109.0, 209.0, 259.0, 186.0, 81.0, 39.0, 19.0, 13.0, 2.0, 2.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.48781993985176086, -0.45624569058418274, -0.4246714413166046, -0.3930971920490265, -0.36152294278144836, -0.32994869351387024, -0.2983744442462921, -0.266800194978714, -0.23522594571113586, -0.20365169644355774, -0.17207744717597961, -0.1405031979084015, -0.10892894864082336, -0.07735469937324524, -0.045780450105667114, -0.01420620083808899, 0.017368048429489136, 0.04894229769706726, 0.08051654696464539, 0.11209079623222351, 0.14366504549980164, 0.17523929476737976, 0.20681354403495789, 0.238387793302536, 0.26996204257011414, 0.30153629183769226, 0.3331105411052704, 0.3646847903728485, 0.39625903964042664, 0.42783328890800476, 0.4594075381755829, 0.490981787443161, 0.522555947303772, 0.5541301965713501, 0.5857044458389282, 0.6172786951065063, 0.6488529443740845, 0.6804271936416626, 0.7120014429092407, 0.7435756921768188, 0.775149941444397, 0.8067241907119751, 0.8382984399795532, 0.8698726892471313, 0.9014469385147095, 0.9330211877822876, 0.9645954370498657, 0.9961696863174438, 1.027743935585022, 1.0593181848526, 1.0908924341201782, 1.1224666833877563, 1.1540409326553345, 1.1856151819229126, 1.2171894311904907, 1.2487636804580688, 1.280337929725647, 1.311912178993225, 1.3434864282608032, 1.3750606775283813, 1.4066349267959595, 1.4382091760635376, 1.4697834253311157, 1.5013576745986938, 1.532931923866272]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 8.0, 2.0, 6.0, 4.0, 8.0, 12.0, 14.0, 19.0, 17.0, 35.0, 23.0, 28.0, 36.0, 59.0, 46.0, 53.0, 54.0, 68.0, 43.0, 44.0, 53.0, 48.0, 45.0, 41.0, 47.0, 34.0, 32.0, 24.0, 21.0, 21.0, 14.0, 7.0, 11.0, 4.0, 9.0, 2.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25737351179122925, -0.24833428859710693, -0.2392950803041458, -0.2302558720111847, -0.22121664881706238, -0.21217742562294006, -0.20313821732997894, -0.19409900903701782, -0.1850597858428955, -0.1760205626487732, -0.16698135435581207, -0.15794214606285095, -0.14890292286872864, -0.13986369967460632, -0.1308244913816452, -0.12178527563810349, -0.11274605989456177, -0.10370684415102005, -0.09466762840747833, -0.08562841266393661, -0.0765891969203949, -0.06754998117685318, -0.05851076543331146, -0.049471549689769745, -0.04043233394622803, -0.03139311820268631, -0.022353902459144592, -0.013314686715602875, -0.004275470972061157, 0.00476374477148056, 0.013802960515022278, 0.022842176258563995, 0.03188139200210571, 0.04092060774564743, 0.04995982348918915, 0.058999039232730865, 0.06803825497627258, 0.0770774707198143, 0.08611668646335602, 0.09515590220689774, 0.10419511795043945, 0.11323433369398117, 0.12227354943752289, 0.131312757730484, 0.14035198092460632, 0.14939120411872864, 0.15843041241168976, 0.16746962070465088, 0.1765088438987732, 0.1855480670928955, 0.19458727538585663, 0.20362648367881775, 0.21266570687294006, 0.22170493006706238, 0.2307441383600235, 0.23978334665298462, 0.24882256984710693, 0.25786179304122925, 0.26690101623535156, 0.2759402096271515, 0.2849794328212738, 0.2940186560153961, 0.30305784940719604, 0.31209707260131836, 0.3211362957954407]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 1.0, 2.0, 3.0, 4.0, 4.0, 4.0, 5.0, 3.0, 8.0, 6.0, 8.0, 14.0, 28.0, 59.0, 103.0, 301.0, 1090.0, 5431.0, 84746.0, 919838.0, 32321.0, 3374.0, 761.0, 235.0, 82.0, 38.0, 15.0, 14.0, 11.0, 9.0, 4.0, 3.0, 4.0, 5.0, 5.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0908203125, -1.053680419921875, -1.01654052734375, -0.979400634765625, -0.9422607421875, -0.905120849609375, -0.86798095703125, -0.830841064453125, -0.793701171875, -0.756561279296875, -0.71942138671875, -0.682281494140625, -0.6451416015625, -0.608001708984375, -0.57086181640625, -0.533721923828125, -0.49658203125, -0.459442138671875, -0.42230224609375, -0.385162353515625, -0.3480224609375, -0.310882568359375, -0.27374267578125, -0.236602783203125, -0.199462890625, -0.162322998046875, -0.12518310546875, -0.088043212890625, -0.0509033203125, -0.013763427734375, 0.02337646484375, 0.060516357421875, 0.09765625, 0.134796142578125, 0.17193603515625, 0.209075927734375, 0.2462158203125, 0.283355712890625, 0.32049560546875, 0.357635498046875, 0.394775390625, 0.431915283203125, 0.46905517578125, 0.506195068359375, 0.5433349609375, 0.580474853515625, 0.61761474609375, 0.654754638671875, 0.69189453125, 0.729034423828125, 0.76617431640625, 0.803314208984375, 0.8404541015625, 0.877593994140625, 0.91473388671875, 0.951873779296875, 0.989013671875, 1.026153564453125, 1.06329345703125, 1.100433349609375, 1.1375732421875, 1.174713134765625, 1.21185302734375, 1.248992919921875, 1.2861328125]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 8.0, 2.0, 3.0, 9.0, 6.0, 7.0, 9.0, 18.0, 16.0, 19.0, 25.0, 32.0, 34.0, 54.0, 58.0, 50.0, 51.0, 66.0, 59.0, 57.0, 55.0, 56.0, 48.0, 37.0, 36.0, 43.0, 34.0, 27.0, 18.0, 15.0, 16.0, 5.0, 5.0, 6.0, 9.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.5732421875, -0.5546722412109375, -0.536102294921875, -0.5175323486328125, -0.49896240234375, -0.4803924560546875, -0.461822509765625, -0.4432525634765625, -0.4246826171875, -0.4061126708984375, -0.387542724609375, -0.3689727783203125, -0.35040283203125, -0.3318328857421875, -0.313262939453125, -0.2946929931640625, -0.276123046875, -0.2575531005859375, -0.238983154296875, -0.2204132080078125, -0.20184326171875, -0.1832733154296875, -0.164703369140625, -0.1461334228515625, -0.1275634765625, -0.1089935302734375, -0.090423583984375, -0.0718536376953125, -0.05328369140625, -0.0347137451171875, -0.016143798828125, 0.0024261474609375, 0.02099609375, 0.0395660400390625, 0.058135986328125, 0.0767059326171875, 0.09527587890625, 0.1138458251953125, 0.132415771484375, 0.1509857177734375, 0.1695556640625, 0.1881256103515625, 0.206695556640625, 0.2252655029296875, 0.24383544921875, 0.2624053955078125, 0.280975341796875, 0.2995452880859375, 0.318115234375, 0.3366851806640625, 0.355255126953125, 0.3738250732421875, 0.39239501953125, 0.4109649658203125, 0.429534912109375, 0.4481048583984375, 0.4666748046875, 0.4852447509765625, 0.503814697265625, 0.5223846435546875, 0.54095458984375, 0.5595245361328125, 0.578094482421875, 0.5966644287109375, 0.615234375]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 3.0, 7.0, 6.0, 9.0, 13.0, 18.0, 27.0, 49.0, 55.0, 114.0, 224.0, 420.0, 1006.0, 3496.0, 19034.0, 533953.0, 467514.0, 17471.0, 3279.0, 957.0, 399.0, 200.0, 97.0, 69.0, 33.0, 27.0, 16.0, 9.0, 9.0, 12.0, 10.0, 5.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.87841796875, -0.85400390625, -0.82958984375, -0.80517578125, -0.78076171875, -0.75634765625, -0.73193359375, -0.70751953125, -0.68310546875, -0.65869140625, -0.63427734375, -0.60986328125, -0.58544921875, -0.56103515625, -0.53662109375, -0.51220703125, -0.48779296875, -0.46337890625, -0.43896484375, -0.41455078125, -0.39013671875, -0.36572265625, -0.34130859375, -0.31689453125, -0.29248046875, -0.26806640625, -0.24365234375, -0.21923828125, -0.19482421875, -0.17041015625, -0.14599609375, -0.12158203125, -0.09716796875, -0.07275390625, -0.04833984375, -0.02392578125, 0.00048828125, 0.02490234375, 0.04931640625, 0.07373046875, 0.09814453125, 0.12255859375, 0.14697265625, 0.17138671875, 0.19580078125, 0.22021484375, 0.24462890625, 0.26904296875, 0.29345703125, 0.31787109375, 0.34228515625, 0.36669921875, 0.39111328125, 0.41552734375, 0.43994140625, 0.46435546875, 0.48876953125, 0.51318359375, 0.53759765625, 0.56201171875, 0.58642578125, 0.61083984375, 0.63525390625, 0.65966796875, 0.68408203125]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 6.0, 7.0, 4.0, 7.0, 7.0, 18.0, 14.0, 16.0, 22.0, 25.0, 23.0, 30.0, 31.0, 33.0, 38.0, 48.0, 64.0, 54.0, 63.0, 62.0, 60.0, 59.0, 51.0, 36.0, 40.0, 33.0, 30.0, 17.0, 26.0, 16.0, 16.0, 12.0, 13.0, 7.0, 7.0, 2.0, 6.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7529296875, -0.731781005859375, -0.71063232421875, -0.689483642578125, -0.6683349609375, -0.647186279296875, -0.62603759765625, -0.604888916015625, -0.583740234375, -0.562591552734375, -0.54144287109375, -0.520294189453125, -0.4991455078125, -0.477996826171875, -0.45684814453125, -0.435699462890625, -0.41455078125, -0.393402099609375, -0.37225341796875, -0.351104736328125, -0.3299560546875, -0.308807373046875, -0.28765869140625, -0.266510009765625, -0.245361328125, -0.224212646484375, -0.20306396484375, -0.181915283203125, -0.1607666015625, -0.139617919921875, -0.11846923828125, -0.097320556640625, -0.076171875, -0.055023193359375, -0.03387451171875, -0.012725830078125, 0.0084228515625, 0.029571533203125, 0.05072021484375, 0.071868896484375, 0.093017578125, 0.114166259765625, 0.13531494140625, 0.156463623046875, 0.1776123046875, 0.198760986328125, 0.21990966796875, 0.241058349609375, 0.26220703125, 0.283355712890625, 0.30450439453125, 0.325653076171875, 0.3468017578125, 0.367950439453125, 0.38909912109375, 0.410247802734375, 0.431396484375, 0.452545166015625, 0.47369384765625, 0.494842529296875, 0.5159912109375, 0.537139892578125, 0.55828857421875, 0.579437255859375, 0.6005859375]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 9.0, 10.0, 15.0, 25.0, 50.0, 94.0, 275.0, 920.0, 5642.0, 231303.0, 796145.0, 11864.0, 1599.0, 353.0, 122.0, 47.0, 35.0, 20.0, 8.0, 5.0, 3.0, 5.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.341796875, -0.3308219909667969, -0.31984710693359375, -0.3088722229003906, -0.2978973388671875, -0.2869224548339844, -0.27594757080078125, -0.2649726867675781, -0.253997802734375, -0.24302291870117188, -0.23204803466796875, -0.22107315063476562, -0.2100982666015625, -0.19912338256835938, -0.18814849853515625, -0.17717361450195312, -0.16619873046875, -0.15522384643554688, -0.14424896240234375, -0.13327407836914062, -0.1222991943359375, -0.11132431030273438, -0.10034942626953125, -0.08937454223632812, -0.078399658203125, -0.06742477416992188, -0.05644989013671875, -0.045475006103515625, -0.0345001220703125, -0.023525238037109375, -0.01255035400390625, -0.001575469970703125, 0.0093994140625, 0.020374298095703125, 0.03134918212890625, 0.042324066162109375, 0.0532989501953125, 0.06427383422851562, 0.07524871826171875, 0.08622360229492188, 0.097198486328125, 0.10817337036132812, 0.11914825439453125, 0.13012313842773438, 0.1410980224609375, 0.15207290649414062, 0.16304779052734375, 0.17402267456054688, 0.18499755859375, 0.19597244262695312, 0.20694732666015625, 0.21792221069335938, 0.2288970947265625, 0.23987197875976562, 0.25084686279296875, 0.2618217468261719, 0.272796630859375, 0.2837715148925781, 0.29474639892578125, 0.3057212829589844, 0.3166961669921875, 0.3276710510253906, 0.33864593505859375, 0.3496208190917969, 0.360595703125]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 8.0, 10.0, 16.0, 20.0, 42.0, 49.0, 85.0, 117.0, 148.0, 163.0, 93.0, 82.0, 51.0, 34.0, 26.0, 17.0, 13.0, 9.0, 10.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1054019927978516e-05, -3.013666719198227e-05, -2.9219314455986023e-05, -2.8301961719989777e-05, -2.738460898399353e-05, -2.6467256247997284e-05, -2.5549903512001038e-05, -2.463255077600479e-05, -2.3715198040008545e-05, -2.27978453040123e-05, -2.1880492568016052e-05, -2.0963139832019806e-05, -2.004578709602356e-05, -1.9128434360027313e-05, -1.8211081624031067e-05, -1.729372888803482e-05, -1.6376376152038574e-05, -1.5459023416042328e-05, -1.4541670680046082e-05, -1.3624317944049835e-05, -1.2706965208053589e-05, -1.1789612472057343e-05, -1.0872259736061096e-05, -9.95490700006485e-06, -9.037554264068604e-06, -8.120201528072357e-06, -7.202848792076111e-06, -6.2854960560798645e-06, -5.368143320083618e-06, -4.450790584087372e-06, -3.5334378480911255e-06, -2.616085112094879e-06, -1.6987323760986328e-06, -7.813796401023865e-07, 1.3597309589385986e-07, 1.0533258318901062e-06, 1.9706785678863525e-06, 2.888031303882599e-06, 3.8053840398788452e-06, 4.7227367758750916e-06, 5.640089511871338e-06, 6.557442247867584e-06, 7.4747949838638306e-06, 8.392147719860077e-06, 9.309500455856323e-06, 1.022685319185257e-05, 1.1144205927848816e-05, 1.2061558663845062e-05, 1.2978911399841309e-05, 1.3896264135837555e-05, 1.4813616871833801e-05, 1.5730969607830048e-05, 1.6648322343826294e-05, 1.756567507982254e-05, 1.8483027815818787e-05, 1.9400380551815033e-05, 2.031773328781128e-05, 2.1235086023807526e-05, 2.2152438759803772e-05, 2.306979149580002e-05, 2.3987144231796265e-05, 2.490449696779251e-05, 2.5821849703788757e-05, 2.6739202439785004e-05, 2.765655517578125e-05]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 7.0, 6.0, 4.0, 2.0, 13.0, 9.0, 15.0, 33.0, 47.0, 125.0, 222.0, 707.0, 2740.0, 26955.0, 880016.0, 129885.0, 5913.0, 1151.0, 366.0, 155.0, 67.0, 43.0, 29.0, 14.0, 6.0, 8.0, 9.0, 2.0, 4.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.243896484375, -0.23440933227539062, -0.22492218017578125, -0.21543502807617188, -0.2059478759765625, -0.19646072387695312, -0.18697357177734375, -0.17748641967773438, -0.167999267578125, -0.15851211547851562, -0.14902496337890625, -0.13953781127929688, -0.1300506591796875, -0.12056350708007812, -0.11107635498046875, -0.10158920288085938, -0.09210205078125, -0.08261489868164062, -0.07312774658203125, -0.06364059448242188, -0.0541534423828125, -0.044666290283203125, -0.03517913818359375, -0.025691986083984375, -0.016204833984375, -0.006717681884765625, 0.00276947021484375, 0.012256622314453125, 0.0217437744140625, 0.031230926513671875, 0.04071807861328125, 0.050205230712890625, 0.0596923828125, 0.06917953491210938, 0.07866668701171875, 0.08815383911132812, 0.0976409912109375, 0.10712814331054688, 0.11661529541015625, 0.12610244750976562, 0.135589599609375, 0.14507675170898438, 0.15456390380859375, 0.16405105590820312, 0.1735382080078125, 0.18302536010742188, 0.19251251220703125, 0.20199966430664062, 0.21148681640625, 0.22097396850585938, 0.23046112060546875, 0.23994827270507812, 0.2494354248046875, 0.2589225769042969, 0.26840972900390625, 0.2778968811035156, 0.287384033203125, 0.2968711853027344, 0.30635833740234375, 0.3158454895019531, 0.3253326416015625, 0.3348197937011719, 0.34430694580078125, 0.3537940979003906, 0.36328125]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 3.0, 6.0, 5.0, 5.0, 5.0, 10.0, 12.0, 24.0, 32.0, 51.0, 73.0, 113.0, 118.0, 151.0, 114.0, 83.0, 51.0, 41.0, 29.0, 24.0, 15.0, 12.0, 8.0, 3.0, 7.0, 7.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.09893798828125, -0.0964970588684082, -0.0940561294555664, -0.09161520004272461, -0.08917427062988281, -0.08673334121704102, -0.08429241180419922, -0.08185148239135742, -0.07941055297851562, -0.07696962356567383, -0.07452869415283203, -0.07208776473999023, -0.06964683532714844, -0.06720590591430664, -0.06476497650146484, -0.06232404708862305, -0.05988311767578125, -0.05744218826293945, -0.055001258850097656, -0.05256032943725586, -0.05011940002441406, -0.047678470611572266, -0.04523754119873047, -0.04279661178588867, -0.040355682373046875, -0.03791475296020508, -0.03547382354736328, -0.033032894134521484, -0.030591964721679688, -0.02815103530883789, -0.025710105895996094, -0.023269176483154297, -0.0208282470703125, -0.018387317657470703, -0.015946388244628906, -0.01350545883178711, -0.011064529418945312, -0.008623600006103516, -0.006182670593261719, -0.003741741180419922, -0.001300811767578125, 0.0011401176452636719, 0.0035810470581054688, 0.006021976470947266, 0.008462905883789062, 0.01090383529663086, 0.013344764709472656, 0.015785694122314453, 0.01822662353515625, 0.020667552947998047, 0.023108482360839844, 0.02554941177368164, 0.027990341186523438, 0.030431270599365234, 0.03287220001220703, 0.03531312942504883, 0.037754058837890625, 0.04019498825073242, 0.04263591766357422, 0.045076847076416016, 0.04751777648925781, 0.04995870590209961, 0.052399635314941406, 0.0548405647277832, 0.057281494140625]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 5.0, 7.0, 21.0, 41.0, 82.0, 136.0, 203.0, 216.0, 154.0, 61.0, 35.0, 16.0, 10.0, 6.0, 4.0, 9.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7512412071228027, -1.6998151540756226, -1.6483891010284424, -1.5969631671905518, -1.5455371141433716, -1.4941110610961914, -1.4426850080490112, -1.391258955001831, -1.3398330211639404, -1.2884069681167603, -1.23698091506958, -1.1855549812316895, -1.1341289281845093, -1.082702875137329, -1.031276822090149, -0.9798507690429688, -0.9284247159957886, -0.8769986629486084, -0.825572669506073, -0.7741466164588928, -0.7227206230163574, -0.6712945699691772, -0.6198685169219971, -0.5684424638748169, -0.5170164704322815, -0.4655904471874237, -0.4141644239425659, -0.36273837089538574, -0.31131234765052795, -0.25988632440567017, -0.20846027135849, -0.1570342481136322, -0.10560810565948486, -0.05418207496404648, -0.0027560442686080933, 0.04866999387741089, 0.10009601712226868, 0.15152204036712646, 0.20294809341430664, 0.25437411665916443, 0.3058001399040222, 0.35722616314888, 0.4086521863937378, 0.46007823944091797, 0.5115042924880981, 0.5629302859306335, 0.6143563389778137, 0.6657823324203491, 0.7172083854675293, 0.7686344385147095, 0.8200604319572449, 0.871486485004425, 0.9229124784469604, 0.9743385314941406, 1.0257645845413208, 1.077190637588501, 1.1286165714263916, 1.1800426244735718, 1.231468677520752, 1.2828946113586426, 1.3343206644058228, 1.385746717453003, 1.437172770500183, 1.4885988235473633, 1.5400248765945435]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 4.0, 6.0, 4.0, 5.0, 9.0, 9.0, 8.0, 13.0, 14.0, 15.0, 22.0, 21.0, 20.0, 32.0, 31.0, 41.0, 38.0, 34.0, 55.0, 44.0, 43.0, 44.0, 43.0, 41.0, 39.0, 41.0, 36.0, 35.0, 39.0, 31.0, 27.0, 29.0, 22.0, 19.0, 16.0, 18.0, 12.0, 11.0, 9.0, 1.0, 7.0, 10.0, 4.0, 6.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.851614236831665, -0.8216158151626587, -0.7916174530982971, -0.7616190314292908, -0.7316206097602844, -0.7016222476959229, -0.6716238260269165, -0.6416254043579102, -0.6116269826889038, -0.5816285610198975, -0.5516301989555359, -0.5216317772865295, -0.4916333556175232, -0.46163496375083923, -0.4316365718841553, -0.4016381502151489, -0.37163975834846497, -0.341641366481781, -0.31164294481277466, -0.2816445529460907, -0.25164613127708435, -0.2216477394104004, -0.19164933264255524, -0.16165092587471008, -0.13165251910686493, -0.10165411233901978, -0.07165570557117462, -0.041657306253910065, -0.011658899486064911, 0.018339499831199646, 0.0483379065990448, 0.07833631336688995, 0.10833472013473511, 0.13833312690258026, 0.16833153367042542, 0.19832992553710938, 0.22832834720611572, 0.2583267390727997, 0.28832513093948364, 0.31832355260849, 0.34832197427749634, 0.3783203661441803, 0.40831878781318665, 0.4383171796798706, 0.46831560134887695, 0.4983139932155609, 0.5283123850822449, 0.5583108067512512, 0.5883091688156128, 0.6183075904846191, 0.6483059525489807, 0.6783043742179871, 0.7083027958869934, 0.738301157951355, 0.7682995796203613, 0.7982980012893677, 0.828296422958374, 0.8582948446273804, 0.8882932066917419, 0.9182916283607483, 0.9482900500297546, 0.9782884120941162, 1.0082868337631226, 1.038285255432129, 1.0682836771011353]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 6.0, 4.0, 9.0, 8.0, 12.0, 38.0, 37.0, 68.0, 140.0, 209.0, 455.0, 1006.0, 2891.0, 13682.0, 216715.0, 3650245.0, 287958.0, 15154.0, 3328.0, 1159.0, 528.0, 250.0, 136.0, 89.0, 49.0, 39.0, 24.0, 12.0, 10.0, 7.0, 7.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.79345703125, -0.7646408081054688, -0.7358245849609375, -0.7070083618164062, -0.678192138671875, -0.6493759155273438, -0.6205596923828125, -0.5917434692382812, -0.56292724609375, -0.5341110229492188, -0.5052947998046875, -0.47647857666015625, -0.447662353515625, -0.41884613037109375, -0.3900299072265625, -0.36121368408203125, -0.3323974609375, -0.30358123779296875, -0.2747650146484375, -0.24594879150390625, -0.217132568359375, -0.18831634521484375, -0.1595001220703125, -0.13068389892578125, -0.10186767578125, -0.07305145263671875, -0.0442352294921875, -0.01541900634765625, 0.013397216796875, 0.04221343994140625, 0.0710296630859375, 0.09984588623046875, 0.128662109375, 0.15747833251953125, 0.1862945556640625, 0.21511077880859375, 0.243927001953125, 0.27274322509765625, 0.3015594482421875, 0.33037567138671875, 0.35919189453125, 0.38800811767578125, 0.4168243408203125, 0.44564056396484375, 0.474456787109375, 0.5032730102539062, 0.5320892333984375, 0.5609054565429688, 0.5897216796875, 0.6185379028320312, 0.6473541259765625, 0.6761703491210938, 0.704986572265625, 0.7338027954101562, 0.7626190185546875, 0.7914352416992188, 0.82025146484375, 0.8490676879882812, 0.8778839111328125, 0.9067001342773438, 0.935516357421875, 0.9643325805664062, 0.9931488037109375, 1.0219650268554688, 1.05078125]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 5.0, 11.0, 6.0, 10.0, 5.0, 11.0, 10.0, 21.0, 19.0, 25.0, 32.0, 29.0, 46.0, 39.0, 48.0, 54.0, 71.0, 54.0, 51.0, 54.0, 52.0, 53.0, 42.0, 38.0, 39.0, 32.0, 28.0, 25.0, 20.0, 16.0, 11.0, 10.0, 8.0, 6.0, 5.0, 4.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.34521484375, -0.3338165283203125, -0.322418212890625, -0.3110198974609375, -0.29962158203125, -0.2882232666015625, -0.276824951171875, -0.2654266357421875, -0.2540283203125, -0.2426300048828125, -0.231231689453125, -0.2198333740234375, -0.20843505859375, -0.1970367431640625, -0.185638427734375, -0.1742401123046875, -0.162841796875, -0.1514434814453125, -0.140045166015625, -0.1286468505859375, -0.11724853515625, -0.1058502197265625, -0.094451904296875, -0.0830535888671875, -0.0716552734375, -0.0602569580078125, -0.048858642578125, -0.0374603271484375, -0.02606201171875, -0.0146636962890625, -0.003265380859375, 0.0081329345703125, 0.01953125, 0.0309295654296875, 0.042327880859375, 0.0537261962890625, 0.06512451171875, 0.0765228271484375, 0.087921142578125, 0.0993194580078125, 0.1107177734375, 0.1221160888671875, 0.133514404296875, 0.1449127197265625, 0.15631103515625, 0.1677093505859375, 0.179107666015625, 0.1905059814453125, 0.201904296875, 0.2133026123046875, 0.224700927734375, 0.2360992431640625, 0.24749755859375, 0.2588958740234375, 0.270294189453125, 0.2816925048828125, 0.2930908203125, 0.3044891357421875, 0.315887451171875, 0.3272857666015625, 0.33868408203125, 0.3500823974609375, 0.361480712890625, 0.3728790283203125, 0.38427734375]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 9.0, 12.0, 13.0, 24.0, 31.0, 42.0, 62.0, 113.0, 197.0, 364.0, 681.0, 1651.0, 4769.0, 17766.0, 120057.0, 3204211.0, 782008.0, 47492.0, 9501.0, 2906.0, 1173.0, 558.0, 284.0, 146.0, 84.0, 51.0, 20.0, 14.0, 15.0, 11.0, 4.0, 9.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.66552734375, -0.6479148864746094, -0.6303024291992188, -0.6126899719238281, -0.5950775146484375, -0.5774650573730469, -0.5598526000976562, -0.5422401428222656, -0.524627685546875, -0.5070152282714844, -0.48940277099609375, -0.4717903137207031, -0.4541778564453125, -0.4365653991699219, -0.41895294189453125, -0.4013404846191406, -0.38372802734375, -0.3661155700683594, -0.34850311279296875, -0.3308906555175781, -0.3132781982421875, -0.2956657409667969, -0.27805328369140625, -0.2604408264160156, -0.242828369140625, -0.22521591186523438, -0.20760345458984375, -0.18999099731445312, -0.1723785400390625, -0.15476608276367188, -0.13715362548828125, -0.11954116821289062, -0.1019287109375, -0.08431625366210938, -0.06670379638671875, -0.049091339111328125, -0.0314788818359375, -0.013866424560546875, 0.00374603271484375, 0.021358489990234375, 0.038970947265625, 0.056583404541015625, 0.07419586181640625, 0.09180831909179688, 0.1094207763671875, 0.12703323364257812, 0.14464569091796875, 0.16225814819335938, 0.17987060546875, 0.19748306274414062, 0.21509552001953125, 0.23270797729492188, 0.2503204345703125, 0.2679328918457031, 0.28554534912109375, 0.3031578063964844, 0.320770263671875, 0.3383827209472656, 0.35599517822265625, 0.3736076354980469, 0.3912200927734375, 0.4088325500488281, 0.42644500732421875, 0.4440574645996094, 0.461669921875]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 5.0, 4.0, 6.0, 9.0, 18.0, 30.0, 31.0, 51.0, 65.0, 111.0, 217.0, 311.0, 589.0, 789.0, 720.0, 431.0, 266.0, 139.0, 95.0, 52.0, 37.0, 31.0, 16.0, 15.0, 9.0, 6.0, 10.0, 1.0, 5.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.154052734375, -0.14905357360839844, -0.14405441284179688, -0.1390552520751953, -0.13405609130859375, -0.1290569305419922, -0.12405776977539062, -0.11905860900878906, -0.1140594482421875, -0.10906028747558594, -0.10406112670898438, -0.09906196594238281, -0.09406280517578125, -0.08906364440917969, -0.08406448364257812, -0.07906532287597656, -0.074066162109375, -0.06906700134277344, -0.06406784057617188, -0.05906867980957031, -0.05406951904296875, -0.04907035827636719, -0.044071197509765625, -0.03907203674316406, -0.0340728759765625, -0.029073715209960938, -0.024074554443359375, -0.019075393676757812, -0.01407623291015625, -0.009077072143554688, -0.004077911376953125, 0.0009212493896484375, 0.00592041015625, 0.010919570922851562, 0.015918731689453125, 0.020917892456054688, 0.02591705322265625, 0.030916213989257812, 0.035915374755859375, 0.04091453552246094, 0.0459136962890625, 0.05091285705566406, 0.055912017822265625, 0.06091117858886719, 0.06591033935546875, 0.07090950012207031, 0.07590866088867188, 0.08090782165527344, 0.085906982421875, 0.09090614318847656, 0.09590530395507812, 0.10090446472167969, 0.10590362548828125, 0.11090278625488281, 0.11590194702148438, 0.12090110778808594, 0.1259002685546875, 0.13089942932128906, 0.13589859008789062, 0.1408977508544922, 0.14589691162109375, 0.1508960723876953, 0.15589523315429688, 0.16089439392089844, 0.1658935546875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 9.0, 7.0, 11.0, 19.0, 27.0, 20.0, 34.0, 69.0, 80.0, 98.0, 121.0, 125.0, 83.0, 89.0, 56.0, 37.0, 28.0, 25.0, 18.0, 12.0, 7.0, 5.0, 6.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.45134949684143066, -0.4325771629810333, -0.413804829120636, -0.39503249526023865, -0.3762601613998413, -0.35748782753944397, -0.33871549367904663, -0.3199431598186493, -0.30117082595825195, -0.2823984920978546, -0.2636261582374573, -0.24485382437705994, -0.2260814905166626, -0.20730915665626526, -0.18853682279586792, -0.16976448893547058, -0.15099215507507324, -0.1322198212146759, -0.11344748735427856, -0.09467515349388123, -0.07590281963348389, -0.05713048577308655, -0.03835815191268921, -0.01958581805229187, -0.0008134841918945312, 0.017958849668502808, 0.036731183528900146, 0.055503517389297485, 0.07427585124969482, 0.09304818511009216, 0.1118205189704895, 0.13059285283088684, 0.14936524629592896, 0.1681375801563263, 0.18690991401672363, 0.20568224787712097, 0.2244545817375183, 0.24322691559791565, 0.261999249458313, 0.2807715833187103, 0.29954391717910767, 0.318316251039505, 0.33708858489990234, 0.3558609187602997, 0.374633252620697, 0.39340558648109436, 0.4121779203414917, 0.43095025420188904, 0.4497225880622864, 0.4684949219226837, 0.48726725578308105, 0.5060396194458008, 0.5248119235038757, 0.5435842275619507, 0.5623565912246704, 0.5811289548873901, 0.5999012589454651, 0.61867356300354, 0.6374459266662598, 0.6562182903289795, 0.6749905943870544, 0.6937628984451294, 0.7125352621078491, 0.7313076257705688, 0.7500799298286438]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 2.0, 4.0, 2.0, 6.0, 11.0, 9.0, 9.0, 15.0, 19.0, 15.0, 15.0, 27.0, 35.0, 33.0, 30.0, 30.0, 53.0, 30.0, 47.0, 37.0, 42.0, 48.0, 45.0, 61.0, 46.0, 39.0, 37.0, 31.0, 31.0, 28.0, 28.0, 35.0, 18.0, 17.0, 7.0, 13.0, 11.0, 6.0, 11.0, 5.0, 4.0, 2.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.3310825824737549, -0.32054510712623596, -0.31000766158103943, -0.2994701862335205, -0.288932740688324, -0.27839526534080505, -0.26785778999328613, -0.2573203444480896, -0.24678288400173187, -0.23624542355537415, -0.22570796310901642, -0.2151705026626587, -0.20463302731513977, -0.19409558176994324, -0.18355810642242432, -0.1730206459760666, -0.16248318552970886, -0.15194572508335114, -0.1414082646369934, -0.1308707892894745, -0.12033333629369736, -0.10979587584733963, -0.0992584079504013, -0.08872094750404358, -0.07818348705768585, -0.06764602661132812, -0.0571085624396801, -0.046571098268032074, -0.03603363782167435, -0.02549617737531662, -0.014958709478378296, -0.004421249032020569, 0.006116241216659546, 0.016653703525662422, 0.0271911658346653, 0.037728630006313324, 0.04826609045267105, 0.05880355089902878, 0.0693410187959671, 0.07987847924232483, 0.09041593968868256, 0.10095340013504028, 0.11149086058139801, 0.12202832847833633, 0.13256579637527466, 0.1431032419204712, 0.1536407172679901, 0.16417817771434784, 0.17471563816070557, 0.1852530986070633, 0.19579055905342102, 0.20632803440093994, 0.21686547994613647, 0.2274029552936554, 0.23794041574001312, 0.24847787618637085, 0.2590153217315674, 0.2695527970790863, 0.28009024262428284, 0.29062771797180176, 0.3011651635169983, 0.3117026388645172, 0.32224011421203613, 0.33277755975723267, 0.3433150351047516]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 6.0, 5.0, 6.0, 13.0, 11.0, 24.0, 21.0, 41.0, 82.0, 120.0, 214.0, 378.0, 682.0, 1411.0, 3156.0, 7200.0, 17765.0, 46447.0, 120583.0, 274476.0, 315683.0, 158219.0, 61374.0, 23531.0, 9418.0, 3982.0, 1805.0, 847.0, 430.0, 265.0, 126.0, 93.0, 50.0, 37.0, 13.0, 18.0, 11.0, 10.0, 3.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.05120849609375, -0.04970884323120117, -0.048209190368652344, -0.046709537506103516, -0.04520988464355469, -0.04371023178100586, -0.04221057891845703, -0.0407109260559082, -0.039211273193359375, -0.03771162033081055, -0.03621196746826172, -0.03471231460571289, -0.03321266174316406, -0.031713008880615234, -0.030213356018066406, -0.028713703155517578, -0.02721405029296875, -0.025714397430419922, -0.024214744567871094, -0.022715091705322266, -0.021215438842773438, -0.01971578598022461, -0.01821613311767578, -0.016716480255126953, -0.015216827392578125, -0.013717174530029297, -0.012217521667480469, -0.01071786880493164, -0.009218215942382812, -0.007718563079833984, -0.006218910217285156, -0.004719257354736328, -0.0032196044921875, -0.0017199516296386719, -0.00022029876708984375, 0.0012793540954589844, 0.0027790069580078125, 0.004278659820556641, 0.005778312683105469, 0.007277965545654297, 0.008777618408203125, 0.010277271270751953, 0.011776924133300781, 0.01327657699584961, 0.014776229858398438, 0.016275882720947266, 0.017775535583496094, 0.019275188446044922, 0.02077484130859375, 0.022274494171142578, 0.023774147033691406, 0.025273799896240234, 0.026773452758789062, 0.02827310562133789, 0.02977275848388672, 0.03127241134643555, 0.032772064208984375, 0.0342717170715332, 0.03577136993408203, 0.03727102279663086, 0.03877067565917969, 0.040270328521728516, 0.041769981384277344, 0.04326963424682617, 0.044769287109375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 6.0, 3.0, 8.0, 11.0, 13.0, 12.0, 19.0, 18.0, 22.0, 30.0, 34.0, 35.0, 32.0, 39.0, 50.0, 43.0, 58.0, 43.0, 56.0, 44.0, 64.0, 45.0, 44.0, 40.0, 36.0, 27.0, 29.0, 23.0, 22.0, 23.0, 11.0, 14.0, 13.0, 5.0, 4.0, 12.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.23291015625, -0.22544479370117188, -0.21797943115234375, -0.21051406860351562, -0.2030487060546875, -0.19558334350585938, -0.18811798095703125, -0.18065261840820312, -0.173187255859375, -0.16572189331054688, -0.15825653076171875, -0.15079116821289062, -0.1433258056640625, -0.13586044311523438, -0.12839508056640625, -0.12092971801757812, -0.11346435546875, -0.10599899291992188, -0.09853363037109375, -0.09106826782226562, -0.0836029052734375, -0.07613754272460938, -0.06867218017578125, -0.061206817626953125, -0.053741455078125, -0.046276092529296875, -0.03881072998046875, -0.031345367431640625, -0.0238800048828125, -0.016414642333984375, -0.00894927978515625, -0.001483917236328125, 0.0059814453125, 0.013446807861328125, 0.02091217041015625, 0.028377532958984375, 0.0358428955078125, 0.043308258056640625, 0.05077362060546875, 0.058238983154296875, 0.065704345703125, 0.07316970825195312, 0.08063507080078125, 0.08810043334960938, 0.0955657958984375, 0.10303115844726562, 0.11049652099609375, 0.11796188354492188, 0.12542724609375, 0.13289260864257812, 0.14035797119140625, 0.14782333374023438, 0.1552886962890625, 0.16275405883789062, 0.17021942138671875, 0.17768478393554688, 0.185150146484375, 0.19261550903320312, 0.20008087158203125, 0.20754623413085938, 0.2150115966796875, 0.22247695922851562, 0.22994232177734375, 0.23740768432617188, 0.244873046875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 8.0, 9.0, 7.0, 9.0, 17.0, 26.0, 28.0, 52.0, 70.0, 106.0, 161.0, 245.0, 417.0, 732.0, 1302.0, 2687.0, 5967.0, 14360.0, 39955.0, 117918.0, 300284.0, 336840.0, 146276.0, 49721.0, 17568.0, 7081.0, 3138.0, 1566.0, 799.0, 455.0, 258.0, 154.0, 121.0, 61.0, 35.0, 32.0, 22.0, 23.0, 16.0, 8.0, 4.0, 7.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.047454833984375, -0.04587841033935547, -0.04430198669433594, -0.042725563049316406, -0.041149139404296875, -0.039572715759277344, -0.03799629211425781, -0.03641986846923828, -0.03484344482421875, -0.03326702117919922, -0.03169059753417969, -0.030114173889160156, -0.028537750244140625, -0.026961326599121094, -0.025384902954101562, -0.02380847930908203, -0.0222320556640625, -0.02065563201904297, -0.019079208374023438, -0.017502784729003906, -0.015926361083984375, -0.014349937438964844, -0.012773513793945312, -0.011197090148925781, -0.00962066650390625, -0.008044242858886719, -0.0064678192138671875, -0.004891395568847656, -0.003314971923828125, -0.0017385482788085938, -0.0001621246337890625, 0.0014142990112304688, 0.00299072265625, 0.004567146301269531, 0.0061435699462890625, 0.007719993591308594, 0.009296417236328125, 0.010872840881347656, 0.012449264526367188, 0.014025688171386719, 0.01560211181640625, 0.01717853546142578, 0.018754959106445312, 0.020331382751464844, 0.021907806396484375, 0.023484230041503906, 0.025060653686523438, 0.02663707733154297, 0.0282135009765625, 0.02978992462158203, 0.03136634826660156, 0.032942771911621094, 0.034519195556640625, 0.036095619201660156, 0.03767204284667969, 0.03924846649169922, 0.04082489013671875, 0.04240131378173828, 0.04397773742675781, 0.045554161071777344, 0.047130584716796875, 0.048707008361816406, 0.05028343200683594, 0.05185985565185547, 0.053436279296875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 0.0, 2.0, 4.0, 6.0, 7.0, 7.0, 8.0, 12.0, 8.0, 13.0, 28.0, 26.0, 30.0, 29.0, 33.0, 42.0, 37.0, 36.0, 50.0, 32.0, 55.0, 56.0, 50.0, 61.0, 59.0, 37.0, 44.0, 41.0, 27.0, 21.0, 31.0, 21.0, 15.0, 16.0, 14.0, 13.0, 11.0, 6.0, 9.0, 1.0, 6.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.46044921875, -0.445892333984375, -0.43133544921875, -0.416778564453125, -0.4022216796875, -0.387664794921875, -0.37310791015625, -0.358551025390625, -0.343994140625, -0.329437255859375, -0.31488037109375, -0.300323486328125, -0.2857666015625, -0.271209716796875, -0.25665283203125, -0.242095947265625, -0.2275390625, -0.212982177734375, -0.19842529296875, -0.183868408203125, -0.1693115234375, -0.154754638671875, -0.14019775390625, -0.125640869140625, -0.111083984375, -0.096527099609375, -0.08197021484375, -0.067413330078125, -0.0528564453125, -0.038299560546875, -0.02374267578125, -0.009185791015625, 0.00537109375, 0.019927978515625, 0.03448486328125, 0.049041748046875, 0.0635986328125, 0.078155517578125, 0.09271240234375, 0.107269287109375, 0.121826171875, 0.136383056640625, 0.15093994140625, 0.165496826171875, 0.1800537109375, 0.194610595703125, 0.20916748046875, 0.223724365234375, 0.23828125, 0.252838134765625, 0.26739501953125, 0.281951904296875, 0.2965087890625, 0.311065673828125, 0.32562255859375, 0.340179443359375, 0.354736328125, 0.369293212890625, 0.38385009765625, 0.398406982421875, 0.4129638671875, 0.427520751953125, 0.44207763671875, 0.456634521484375, 0.47119140625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 2.0, 8.0, 8.0, 13.0, 10.0, 14.0, 23.0, 30.0, 49.0, 61.0, 138.0, 176.0, 266.0, 609.0, 1072.0, 2140.0, 5017.0, 13521.0, 48787.0, 234599.0, 525434.0, 162709.0, 35552.0, 10492.0, 4014.0, 1708.0, 898.0, 474.0, 253.0, 152.0, 110.0, 66.0, 54.0, 26.0, 16.0, 14.0, 11.0, 7.0, 8.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 4.0, 2.0, 1.0, 2.0], "bins": [-0.0225677490234375, -0.02192997932434082, -0.02129220962524414, -0.02065443992614746, -0.02001667022705078, -0.0193789005279541, -0.018741130828857422, -0.018103361129760742, -0.017465591430664062, -0.016827821731567383, -0.016190052032470703, -0.015552282333374023, -0.014914512634277344, -0.014276742935180664, -0.013638973236083984, -0.013001203536987305, -0.012363433837890625, -0.011725664138793945, -0.011087894439697266, -0.010450124740600586, -0.009812355041503906, -0.009174585342407227, -0.008536815643310547, -0.007899045944213867, -0.0072612762451171875, -0.006623506546020508, -0.005985736846923828, -0.0053479671478271484, -0.004710197448730469, -0.004072427749633789, -0.0034346580505371094, -0.0027968883514404297, -0.00215911865234375, -0.0015213489532470703, -0.0008835792541503906, -0.00024580955505371094, 0.00039196014404296875, 0.0010297298431396484, 0.0016674995422363281, 0.002305269241333008, 0.0029430389404296875, 0.003580808639526367, 0.004218578338623047, 0.0048563480377197266, 0.005494117736816406, 0.006131887435913086, 0.006769657135009766, 0.007407426834106445, 0.008045196533203125, 0.008682966232299805, 0.009320735931396484, 0.009958505630493164, 0.010596275329589844, 0.011234045028686523, 0.011871814727783203, 0.012509584426879883, 0.013147354125976562, 0.013785123825073242, 0.014422893524169922, 0.015060663223266602, 0.01569843292236328, 0.01633620262145996, 0.01697397232055664, 0.01761174201965332, 0.01824951171875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 8.0, 14.0, 15.0, 16.0, 29.0, 38.0, 53.0, 61.0, 70.0, 100.0, 98.0, 109.0, 85.0, 75.0, 73.0, 39.0, 43.0, 20.0, 19.0, 14.0, 10.0, 6.0, 5.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0192394256591797e-05, -9.768642485141754e-06, -9.344890713691711e-06, -8.921138942241669e-06, -8.497387170791626e-06, -8.073635399341583e-06, -7.64988362789154e-06, -7.226131856441498e-06, -6.802380084991455e-06, -6.378628313541412e-06, -5.95487654209137e-06, -5.531124770641327e-06, -5.107372999191284e-06, -4.6836212277412415e-06, -4.259869456291199e-06, -3.836117684841156e-06, -3.4123659133911133e-06, -2.9886141419410706e-06, -2.564862370491028e-06, -2.141110599040985e-06, -1.7173588275909424e-06, -1.2936070561408997e-06, -8.698552846908569e-07, -4.461035132408142e-07, -2.2351741790771484e-08, 4.0140002965927124e-07, 8.25151801109314e-07, 1.2489035725593567e-06, 1.6726553440093994e-06, 2.096407115459442e-06, 2.520158886909485e-06, 2.9439106583595276e-06, 3.3676624298095703e-06, 3.791414201259613e-06, 4.215165972709656e-06, 4.6389177441596985e-06, 5.062669515609741e-06, 5.486421287059784e-06, 5.910173058509827e-06, 6.333924829959869e-06, 6.757676601409912e-06, 7.181428372859955e-06, 7.6051801443099976e-06, 8.02893191576004e-06, 8.452683687210083e-06, 8.876435458660126e-06, 9.300187230110168e-06, 9.723939001560211e-06, 1.0147690773010254e-05, 1.0571442544460297e-05, 1.099519431591034e-05, 1.1418946087360382e-05, 1.1842697858810425e-05, 1.2266449630260468e-05, 1.269020140171051e-05, 1.3113953173160553e-05, 1.3537704944610596e-05, 1.3961456716060638e-05, 1.4385208487510681e-05, 1.4808960258960724e-05, 1.5232712030410767e-05, 1.565646380186081e-05, 1.6080215573310852e-05, 1.6503967344760895e-05, 1.6927719116210938e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 5.0, 11.0, 17.0, 24.0, 26.0, 42.0, 65.0, 84.0, 175.0, 300.0, 601.0, 1075.0, 2460.0, 6005.0, 16910.0, 55021.0, 191597.0, 401386.0, 256972.0, 78741.0, 23053.0, 7901.0, 3120.0, 1359.0, 658.0, 387.0, 224.0, 123.0, 76.0, 41.0, 31.0, 18.0, 16.0, 10.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0129241943359375, -0.012399673461914062, -0.011875152587890625, -0.011350631713867188, -0.01082611083984375, -0.010301589965820312, -0.009777069091796875, -0.009252548217773438, -0.00872802734375, -0.008203506469726562, -0.007678985595703125, -0.0071544647216796875, -0.00662994384765625, -0.0061054229736328125, -0.005580902099609375, -0.0050563812255859375, -0.0045318603515625, -0.0040073394775390625, -0.003482818603515625, -0.0029582977294921875, -0.00243377685546875, -0.0019092559814453125, -0.001384735107421875, -0.0008602142333984375, -0.000335693359375, 0.0001888275146484375, 0.000713348388671875, 0.0012378692626953125, 0.00176239013671875, 0.0022869110107421875, 0.002811431884765625, 0.0033359527587890625, 0.0038604736328125, 0.0043849945068359375, 0.004909515380859375, 0.0054340362548828125, 0.00595855712890625, 0.0064830780029296875, 0.007007598876953125, 0.0075321197509765625, 0.008056640625, 0.008581161499023438, 0.009105682373046875, 0.009630203247070312, 0.01015472412109375, 0.010679244995117188, 0.011203765869140625, 0.011728286743164062, 0.0122528076171875, 0.012777328491210938, 0.013301849365234375, 0.013826370239257812, 0.01435089111328125, 0.014875411987304688, 0.015399932861328125, 0.015924453735351562, 0.016448974609375, 0.016973495483398438, 0.017498016357421875, 0.018022537231445312, 0.01854705810546875, 0.019071578979492188, 0.019596099853515625, 0.020120620727539062, 0.0206451416015625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 4.0, 4.0, 5.0, 7.0, 6.0, 6.0, 20.0, 20.0, 18.0, 30.0, 39.0, 28.0, 35.0, 35.0, 62.0, 66.0, 61.0, 69.0, 64.0, 69.0, 37.0, 50.0, 45.0, 35.0, 42.0, 22.0, 27.0, 20.0, 19.0, 12.0, 10.0, 10.0, 7.0, 5.0, 7.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004337310791015625, -0.004202008247375488, -0.0040667057037353516, -0.003931403160095215, -0.003796100616455078, -0.0036607980728149414, -0.0035254955291748047, -0.003390192985534668, -0.0032548904418945312, -0.0031195878982543945, -0.002984285354614258, -0.002848982810974121, -0.0027136802673339844, -0.0025783777236938477, -0.002443075180053711, -0.0023077726364135742, -0.0021724700927734375, -0.0020371675491333008, -0.001901865005493164, -0.0017665624618530273, -0.0016312599182128906, -0.001495957374572754, -0.0013606548309326172, -0.0012253522872924805, -0.0010900497436523438, -0.000954747200012207, -0.0008194446563720703, -0.0006841421127319336, -0.0005488395690917969, -0.00041353702545166016, -0.00027823448181152344, -0.00014293193817138672, -7.62939453125e-06, 0.00012767314910888672, 0.00026297569274902344, 0.00039827823638916016, 0.0005335807800292969, 0.0006688833236694336, 0.0008041858673095703, 0.000939488410949707, 0.0010747909545898438, 0.0012100934982299805, 0.0013453960418701172, 0.001480698585510254, 0.0016160011291503906, 0.0017513036727905273, 0.001886606216430664, 0.0020219087600708008, 0.0021572113037109375, 0.0022925138473510742, 0.002427816390991211, 0.0025631189346313477, 0.0026984214782714844, 0.002833724021911621, 0.002969026565551758, 0.0031043291091918945, 0.0032396316528320312, 0.003374934196472168, 0.0035102367401123047, 0.0036455392837524414, 0.003780841827392578, 0.003916144371032715, 0.0040514469146728516, 0.004186749458312988, 0.004322052001953125]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 8.0, 22.0, 52.0, 77.0, 207.0, 274.0, 176.0, 104.0, 43.0, 14.0, 15.0, 8.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0115582942962646, -0.9853016138076782, -0.9590449333190918, -0.9327882528305054, -0.906531572341919, -0.8802748918533325, -0.8540182113647461, -0.8277615308761597, -0.8015048503875732, -0.7752481698989868, -0.7489914894104004, -0.722734808921814, -0.6964781284332275, -0.6702214479446411, -0.6439647674560547, -0.6177080869674683, -0.5914513468742371, -0.5651946663856506, -0.5389379858970642, -0.5126813054084778, -0.48642462491989136, -0.46016794443130493, -0.4339112341403961, -0.4076545536518097, -0.38139787316322327, -0.35514119267463684, -0.3288845121860504, -0.3026278018951416, -0.2763711214065552, -0.25011444091796875, -0.22385776042938232, -0.1976010799407959, -0.1713443398475647, -0.14508765935897827, -0.11883097141981125, -0.09257428348064423, -0.0663176029920578, -0.040060922503471375, -0.013804227113723755, 0.012452453374862671, 0.0387091338634491, 0.06496581435203552, 0.09122250229120255, 0.11747919023036957, 0.143735870718956, 0.16999255120754242, 0.19624924659729004, 0.22250592708587646, 0.2487626075744629, 0.2750192880630493, 0.30127596855163574, 0.32753264904022217, 0.3537893295288086, 0.380046010017395, 0.40630272030830383, 0.43255940079689026, 0.4588160812854767, 0.4850727617740631, 0.5113294720649719, 0.5375861525535583, 0.5638428330421448, 0.5900995135307312, 0.6163561940193176, 0.642612874507904, 0.6688695549964905]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 2.0, 4.0, 7.0, 1.0, 8.0, 10.0, 10.0, 14.0, 14.0, 18.0, 16.0, 22.0, 26.0, 39.0, 38.0, 41.0, 33.0, 45.0, 47.0, 48.0, 46.0, 47.0, 69.0, 49.0, 46.0, 40.0, 40.0, 26.0, 30.0, 27.0, 35.0, 25.0, 16.0, 10.0, 11.0, 4.0, 7.0, 12.0, 7.0, 2.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.216329425573349, -0.20912693440914154, -0.20192444324493408, -0.19472193717956543, -0.18751944601535797, -0.1803169548511505, -0.17311446368694305, -0.1659119725227356, -0.15870948135852814, -0.15150699019432068, -0.14430449903011322, -0.13710200786590576, -0.1298995018005371, -0.12269701063632965, -0.11549451947212219, -0.10829202830791473, -0.10108952969312668, -0.09388703852891922, -0.08668453991413116, -0.0794820487499237, -0.07227955758571625, -0.06507706642150879, -0.057874567806720734, -0.050672076642513275, -0.04346958175301552, -0.03626708686351776, -0.029064595699310303, -0.021862100809812546, -0.014659607782959938, -0.00745711475610733, -0.00025461986660957336, 0.006947871297597885, 0.014150366187095642, 0.02135285921394825, 0.028555352240800858, 0.035757847130298615, 0.04296033829450607, 0.05016283318400383, 0.05736532807350159, 0.06456781923770905, 0.0717703104019165, 0.07897280156612396, 0.08617530018091202, 0.09337779134511948, 0.10058028250932693, 0.10778278112411499, 0.11498527228832245, 0.12218776345252991, 0.12939026951789856, 0.13659276068210602, 0.14379525184631348, 0.15099775791168213, 0.1582002490758896, 0.16540274024009705, 0.1726052314043045, 0.17980772256851196, 0.18701021373271942, 0.19421270489692688, 0.20141519606113434, 0.2086176872253418, 0.21582019329071045, 0.2230226844549179, 0.23022517561912537, 0.23742766678333282, 0.24463015794754028]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 8.0, 12.0, 13.0, 23.0, 25.0, 62.0, 74.0, 101.0, 187.0, 275.0, 515.0, 925.0, 1798.0, 3791.0, 8310.0, 20100.0, 54704.0, 170182.0, 435905.0, 232275.0, 73338.0, 26187.0, 10429.0, 4611.0, 2209.0, 1088.0, 580.0, 314.0, 210.0, 103.0, 58.0, 45.0, 27.0, 18.0, 12.0, 12.0, 9.0, 4.0, 8.0, 2.0, 3.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2418212890625, -0.23392677307128906, -0.22603225708007812, -0.2181377410888672, -0.21024322509765625, -0.2023487091064453, -0.19445419311523438, -0.18655967712402344, -0.1786651611328125, -0.17077064514160156, -0.16287612915039062, -0.1549816131591797, -0.14708709716796875, -0.1391925811767578, -0.13129806518554688, -0.12340354919433594, -0.115509033203125, -0.10761451721191406, -0.09972000122070312, -0.09182548522949219, -0.08393096923828125, -0.07603645324707031, -0.06814193725585938, -0.06024742126464844, -0.0523529052734375, -0.04445838928222656, -0.036563873291015625, -0.028669357299804688, -0.02077484130859375, -0.012880325317382812, -0.004985809326171875, 0.0029087066650390625, 0.01080322265625, 0.018697738647460938, 0.026592254638671875, 0.03448677062988281, 0.04238128662109375, 0.05027580261230469, 0.058170318603515625, 0.06606483459472656, 0.0739593505859375, 0.08185386657714844, 0.08974838256835938, 0.09764289855957031, 0.10553741455078125, 0.11343193054199219, 0.12132644653320312, 0.12922096252441406, 0.137115478515625, 0.14500999450683594, 0.15290451049804688, 0.1607990264892578, 0.16869354248046875, 0.1765880584716797, 0.18448257446289062, 0.19237709045410156, 0.2002716064453125, 0.20816612243652344, 0.21606063842773438, 0.2239551544189453, 0.23184967041015625, 0.2397441864013672, 0.24763870239257812, 0.25553321838378906, 0.263427734375]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 4.0, 3.0, 1.0, 6.0, 6.0, 7.0, 9.0, 22.0, 15.0, 11.0, 24.0, 35.0, 38.0, 38.0, 48.0, 51.0, 60.0, 72.0, 56.0, 58.0, 73.0, 64.0, 48.0, 46.0, 35.0, 37.0, 38.0, 20.0, 21.0, 14.0, 13.0, 7.0, 4.0, 3.0, 6.0, 7.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.467529296875, -0.4495277404785156, -0.43152618408203125, -0.4135246276855469, -0.3955230712890625, -0.3775215148925781, -0.35951995849609375, -0.3415184020996094, -0.323516845703125, -0.3055152893066406, -0.28751373291015625, -0.2695121765136719, -0.2515106201171875, -0.23350906372070312, -0.21550750732421875, -0.19750595092773438, -0.17950439453125, -0.16150283813476562, -0.14350128173828125, -0.12549972534179688, -0.1074981689453125, -0.08949661254882812, -0.07149505615234375, -0.053493499755859375, -0.035491943359375, -0.017490386962890625, 0.00051116943359375, 0.018512725830078125, 0.0365142822265625, 0.054515838623046875, 0.07251739501953125, 0.09051895141601562, 0.1085205078125, 0.12652206420898438, 0.14452362060546875, 0.16252517700195312, 0.1805267333984375, 0.19852828979492188, 0.21652984619140625, 0.23453140258789062, 0.252532958984375, 0.2705345153808594, 0.28853607177734375, 0.3065376281738281, 0.3245391845703125, 0.3425407409667969, 0.36054229736328125, 0.3785438537597656, 0.39654541015625, 0.4145469665527344, 0.43254852294921875, 0.4505500793457031, 0.4685516357421875, 0.4865531921386719, 0.5045547485351562, 0.5225563049316406, 0.540557861328125, 0.5585594177246094, 0.5765609741210938, 0.5945625305175781, 0.6125640869140625, 0.6305656433105469, 0.6485671997070312, 0.6665687561035156, 0.6845703125]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 2.0, 6.0, 1.0, 10.0, 9.0, 9.0, 9.0, 10.0, 16.0, 13.0, 28.0, 26.0, 33.0, 43.0, 62.0, 76.0, 130.0, 242.0, 464.0, 1386.0, 6572.0, 56236.0, 658665.0, 295388.0, 23740.0, 3390.0, 908.0, 354.0, 206.0, 128.0, 95.0, 69.0, 43.0, 35.0, 21.0, 31.0, 25.0, 15.0, 13.0, 19.0, 13.0, 6.0, 6.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.453125, -0.43792724609375, -0.4227294921875, -0.40753173828125, -0.392333984375, -0.37713623046875, -0.3619384765625, -0.34674072265625, -0.33154296875, -0.31634521484375, -0.3011474609375, -0.28594970703125, -0.270751953125, -0.25555419921875, -0.2403564453125, -0.22515869140625, -0.2099609375, -0.19476318359375, -0.1795654296875, -0.16436767578125, -0.149169921875, -0.13397216796875, -0.1187744140625, -0.10357666015625, -0.08837890625, -0.07318115234375, -0.0579833984375, -0.04278564453125, -0.027587890625, -0.01239013671875, 0.0028076171875, 0.01800537109375, 0.033203125, 0.04840087890625, 0.0635986328125, 0.07879638671875, 0.093994140625, 0.10919189453125, 0.1243896484375, 0.13958740234375, 0.15478515625, 0.16998291015625, 0.1851806640625, 0.20037841796875, 0.215576171875, 0.23077392578125, 0.2459716796875, 0.26116943359375, 0.2763671875, 0.29156494140625, 0.3067626953125, 0.32196044921875, 0.337158203125, 0.35235595703125, 0.3675537109375, 0.38275146484375, 0.39794921875, 0.41314697265625, 0.4283447265625, 0.44354248046875, 0.458740234375, 0.47393798828125, 0.4891357421875, 0.50433349609375, 0.51953125]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 4.0, 4.0, 1.0, 4.0, 1.0, 6.0, 7.0, 6.0, 11.0, 7.0, 16.0, 12.0, 13.0, 13.0, 16.0, 19.0, 25.0, 26.0, 29.0, 30.0, 28.0, 35.0, 30.0, 31.0, 36.0, 39.0, 55.0, 39.0, 36.0, 27.0, 31.0, 40.0, 36.0, 31.0, 32.0, 18.0, 30.0, 25.0, 28.0, 22.0, 23.0, 18.0, 9.0, 10.0, 10.0, 7.0, 10.0, 7.0, 9.0, 2.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.50244140625, -0.48804473876953125, -0.4736480712890625, -0.45925140380859375, -0.444854736328125, -0.43045806884765625, -0.4160614013671875, -0.40166473388671875, -0.38726806640625, -0.37287139892578125, -0.3584747314453125, -0.34407806396484375, -0.329681396484375, -0.31528472900390625, -0.3008880615234375, -0.28649139404296875, -0.2720947265625, -0.25769805908203125, -0.2433013916015625, -0.22890472412109375, -0.214508056640625, -0.20011138916015625, -0.1857147216796875, -0.17131805419921875, -0.15692138671875, -0.14252471923828125, -0.1281280517578125, -0.11373138427734375, -0.099334716796875, -0.08493804931640625, -0.0705413818359375, -0.05614471435546875, -0.041748046875, -0.02735137939453125, -0.0129547119140625, 0.00144195556640625, 0.015838623046875, 0.03023529052734375, 0.0446319580078125, 0.05902862548828125, 0.07342529296875, 0.08782196044921875, 0.1022186279296875, 0.11661529541015625, 0.131011962890625, 0.14540863037109375, 0.1598052978515625, 0.17420196533203125, 0.1885986328125, 0.20299530029296875, 0.2173919677734375, 0.23178863525390625, 0.246185302734375, 0.26058197021484375, 0.2749786376953125, 0.28937530517578125, 0.30377197265625, 0.31816864013671875, 0.3325653076171875, 0.34696197509765625, 0.361358642578125, 0.37575531005859375, 0.3901519775390625, 0.40454864501953125, 0.4189453125]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 8.0, 6.0, 10.0, 27.0, 35.0, 96.0, 268.0, 941.0, 4410.0, 131453.0, 895249.0, 13639.0, 1717.0, 435.0, 133.0, 55.0, 35.0, 9.0, 10.0, 2.0, 3.0, 3.0, 1.0, 2.0, 3.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.413818359375, -0.40056610107421875, -0.3873138427734375, -0.37406158447265625, -0.360809326171875, -0.34755706787109375, -0.3343048095703125, -0.32105255126953125, -0.30780029296875, -0.29454803466796875, -0.2812957763671875, -0.26804351806640625, -0.254791259765625, -0.24153900146484375, -0.2282867431640625, -0.21503448486328125, -0.2017822265625, -0.18852996826171875, -0.1752777099609375, -0.16202545166015625, -0.148773193359375, -0.13552093505859375, -0.1222686767578125, -0.10901641845703125, -0.09576416015625, -0.08251190185546875, -0.0692596435546875, -0.05600738525390625, -0.042755126953125, -0.02950286865234375, -0.0162506103515625, -0.00299835205078125, 0.01025390625, 0.02350616455078125, 0.0367584228515625, 0.05001068115234375, 0.063262939453125, 0.07651519775390625, 0.0897674560546875, 0.10301971435546875, 0.11627197265625, 0.12952423095703125, 0.1427764892578125, 0.15602874755859375, 0.169281005859375, 0.18253326416015625, 0.1957855224609375, 0.20903778076171875, 0.2222900390625, 0.23554229736328125, 0.2487945556640625, 0.26204681396484375, 0.275299072265625, 0.28855133056640625, 0.3018035888671875, 0.31505584716796875, 0.32830810546875, 0.34156036376953125, 0.3548126220703125, 0.36806488037109375, 0.381317138671875, 0.39456939697265625, 0.4078216552734375, 0.42107391357421875, 0.434326171875]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 7.0, 5.0, 13.0, 17.0, 15.0, 41.0, 93.0, 139.0, 213.0, 190.0, 123.0, 48.0, 37.0, 27.0, 16.0, 14.0, 2.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.124641418457031e-05, -3.9812177419662476e-05, -3.837794065475464e-05, -3.69437038898468e-05, -3.5509467124938965e-05, -3.407523036003113e-05, -3.264099359512329e-05, -3.1206756830215454e-05, -2.9772520065307617e-05, -2.833828330039978e-05, -2.6904046535491943e-05, -2.5469809770584106e-05, -2.403557300567627e-05, -2.2601336240768433e-05, -2.1167099475860596e-05, -1.973286271095276e-05, -1.8298625946044922e-05, -1.6864389181137085e-05, -1.5430152416229248e-05, -1.3995915651321411e-05, -1.2561678886413574e-05, -1.1127442121505737e-05, -9.6932053565979e-06, -8.258968591690063e-06, -6.8247318267822266e-06, -5.39049506187439e-06, -3.956258296966553e-06, -2.522021532058716e-06, -1.087784767150879e-06, 3.46451997756958e-07, 1.780688762664795e-06, 3.214925527572632e-06, 4.649162292480469e-06, 6.083399057388306e-06, 7.517635822296143e-06, 8.95187258720398e-06, 1.0386109352111816e-05, 1.1820346117019653e-05, 1.325458288192749e-05, 1.4688819646835327e-05, 1.6123056411743164e-05, 1.7557293176651e-05, 1.8991529941558838e-05, 2.0425766706466675e-05, 2.1860003471374512e-05, 2.329424023628235e-05, 2.4728477001190186e-05, 2.6162713766098022e-05, 2.759695053100586e-05, 2.9031187295913696e-05, 3.0465424060821533e-05, 3.189966082572937e-05, 3.333389759063721e-05, 3.4768134355545044e-05, 3.620237112045288e-05, 3.763660788536072e-05, 3.9070844650268555e-05, 4.050508141517639e-05, 4.193931818008423e-05, 4.3373554944992065e-05, 4.48077917098999e-05, 4.624202847480774e-05, 4.7676265239715576e-05, 4.911050200462341e-05, 5.054473876953125e-05]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 6.0, 12.0, 9.0, 28.0, 49.0, 62.0, 125.0, 360.0, 1142.0, 5481.0, 91482.0, 915208.0, 30071.0, 3285.0, 749.0, 240.0, 113.0, 56.0, 32.0, 15.0, 13.0, 5.0, 5.0, 1.0, 4.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.354736328125, -0.34342193603515625, -0.3321075439453125, -0.32079315185546875, -0.309478759765625, -0.29816436767578125, -0.2868499755859375, -0.27553558349609375, -0.26422119140625, -0.25290679931640625, -0.2415924072265625, -0.23027801513671875, -0.218963623046875, -0.20764923095703125, -0.1963348388671875, -0.18502044677734375, -0.1737060546875, -0.16239166259765625, -0.1510772705078125, -0.13976287841796875, -0.128448486328125, -0.11713409423828125, -0.1058197021484375, -0.09450531005859375, -0.08319091796875, -0.07187652587890625, -0.0605621337890625, -0.04924774169921875, -0.037933349609375, -0.02661895751953125, -0.0153045654296875, -0.00399017333984375, 0.00732421875, 0.01863861083984375, 0.0299530029296875, 0.04126739501953125, 0.052581787109375, 0.06389617919921875, 0.0752105712890625, 0.08652496337890625, 0.09783935546875, 0.10915374755859375, 0.1204681396484375, 0.13178253173828125, 0.143096923828125, 0.15441131591796875, 0.1657257080078125, 0.17704010009765625, 0.1883544921875, 0.19966888427734375, 0.2109832763671875, 0.22229766845703125, 0.233612060546875, 0.24492645263671875, 0.2562408447265625, 0.26755523681640625, 0.27886962890625, 0.29018402099609375, 0.3014984130859375, 0.31281280517578125, 0.324127197265625, 0.33544158935546875, 0.3467559814453125, 0.35807037353515625, 0.369384765625]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 4.0, 2.0, 2.0, 15.0, 17.0, 22.0, 29.0, 40.0, 55.0, 83.0, 79.0, 96.0, 130.0, 121.0, 89.0, 45.0, 54.0, 34.0, 23.0, 18.0, 13.0, 7.0, 8.0, 3.0, 4.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08843994140625, -0.08577632904052734, -0.08311271667480469, -0.08044910430908203, -0.07778549194335938, -0.07512187957763672, -0.07245826721191406, -0.0697946548461914, -0.06713104248046875, -0.0644674301147461, -0.06180381774902344, -0.05914020538330078, -0.056476593017578125, -0.05381298065185547, -0.05114936828613281, -0.048485755920410156, -0.0458221435546875, -0.043158531188964844, -0.04049491882324219, -0.03783130645751953, -0.035167694091796875, -0.03250408172607422, -0.029840469360351562, -0.027176856994628906, -0.02451324462890625, -0.021849632263183594, -0.019186019897460938, -0.01652240753173828, -0.013858795166015625, -0.011195182800292969, -0.008531570434570312, -0.005867958068847656, -0.003204345703125, -0.0005407333374023438, 0.0021228790283203125, 0.004786491394042969, 0.007450103759765625, 0.010113716125488281, 0.012777328491210938, 0.015440940856933594, 0.01810455322265625, 0.020768165588378906, 0.023431777954101562, 0.02609539031982422, 0.028759002685546875, 0.03142261505126953, 0.03408622741699219, 0.036749839782714844, 0.0394134521484375, 0.042077064514160156, 0.04474067687988281, 0.04740428924560547, 0.050067901611328125, 0.05273151397705078, 0.05539512634277344, 0.058058738708496094, 0.06072235107421875, 0.0633859634399414, 0.06604957580566406, 0.06871318817138672, 0.07137680053710938, 0.07404041290283203, 0.07670402526855469, 0.07936763763427734, 0.08203125]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 12.0, 9.0, 21.0, 28.0, 52.0, 75.0, 115.0, 147.0, 164.0, 142.0, 81.0, 59.0, 38.0, 22.0, 9.0, 8.0, 6.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7366736531257629, -0.7034744620323181, -0.6702752709388733, -0.6370760798454285, -0.6038768887519836, -0.5706776976585388, -0.5374784469604492, -0.5042792558670044, -0.47108009457588196, -0.43788090348243713, -0.4046817123889923, -0.3714824914932251, -0.3382833003997803, -0.30508410930633545, -0.2718849182128906, -0.2386857271194458, -0.20548653602600098, -0.17228734493255615, -0.13908815383911133, -0.10588894784450531, -0.07268975675106049, -0.03949056565761566, -0.0062913596630096436, 0.02690783143043518, 0.060107022523880005, 0.09330621361732483, 0.12650540471076965, 0.15970461070537567, 0.1929038017988205, 0.22610299289226532, 0.25930219888687134, 0.29250138998031616, 0.3257005214691162, 0.35889971256256104, 0.39209890365600586, 0.4252980947494507, 0.4584972858428955, 0.49169647693634033, 0.5248956680297852, 0.55809485912323, 0.5912940502166748, 0.6244932413101196, 0.6576924324035645, 0.6908916234970093, 0.7240908145904541, 0.7572900056838989, 0.7904891967773438, 0.8236883878707886, 0.8568876385688782, 0.890086829662323, 0.9232860207557678, 0.9564852118492126, 0.9896844029426575, 1.022883653640747, 1.056082844734192, 1.0892820358276367, 1.1224812269210815, 1.1556804180145264, 1.1888796091079712, 1.222078800201416, 1.2552779912948608, 1.2884771823883057, 1.3216763734817505, 1.3548755645751953, 1.3880747556686401]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 2.0, 7.0, 2.0, 10.0, 8.0, 9.0, 14.0, 9.0, 15.0, 16.0, 19.0, 20.0, 19.0, 30.0, 33.0, 34.0, 42.0, 41.0, 38.0, 30.0, 51.0, 53.0, 44.0, 38.0, 42.0, 40.0, 42.0, 32.0, 34.0, 30.0, 28.0, 23.0, 24.0, 19.0, 16.0, 14.0, 18.0, 9.0, 12.0, 8.0, 9.0, 4.0, 4.0, 6.0, 0.0, 2.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8605849742889404, -0.8326851725578308, -0.8047853708267212, -0.7768856287002563, -0.7489858269691467, -0.7210860252380371, -0.6931862831115723, -0.6652864813804626, -0.637386679649353, -0.6094868779182434, -0.5815870761871338, -0.553687334060669, -0.5257875323295593, -0.4978877305984497, -0.4699879586696625, -0.44208818674087524, -0.4141883850097656, -0.386288583278656, -0.3583888113498688, -0.33048903942108154, -0.3025892376899719, -0.2746894359588623, -0.24678966403007507, -0.21888987720012665, -0.19099009037017822, -0.1630903035402298, -0.13519051671028137, -0.10729072988033295, -0.07939094305038452, -0.051491156220436096, -0.02359136939048767, 0.004308417439460754, 0.032208263874053955, 0.06010805070400238, 0.0880078375339508, 0.11590762436389923, 0.14380741119384766, 0.17170719802379608, 0.1996069848537445, 0.22750677168369293, 0.25540655851364136, 0.283306360244751, 0.3112061321735382, 0.33910590410232544, 0.36700570583343506, 0.3949055075645447, 0.4228052794933319, 0.45070505142211914, 0.47860485315322876, 0.5065046548843384, 0.5344043970108032, 0.5623041987419128, 0.5902040004730225, 0.6181038022041321, 0.6460036039352417, 0.6739033460617065, 0.7018031477928162, 0.7297029495239258, 0.7576026916503906, 0.7855024933815002, 0.8134022951126099, 0.8413020968437195, 0.8692018985748291, 0.897101640701294, 0.9250014424324036]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 5.0, 4.0, 7.0, 25.0, 32.0, 44.0, 124.0, 221.0, 667.0, 3152.0, 53934.0, 4018617.0, 111660.0, 4351.0, 865.0, 267.0, 125.0, 75.0, 38.0, 20.0, 16.0, 17.0, 6.0, 2.0, 4.0, 4.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.341796875, -1.2964324951171875, -1.251068115234375, -1.2057037353515625, -1.16033935546875, -1.1149749755859375, -1.069610595703125, -1.0242462158203125, -0.9788818359375, -0.9335174560546875, -0.888153076171875, -0.8427886962890625, -0.79742431640625, -0.7520599365234375, -0.706695556640625, -0.6613311767578125, -0.615966796875, -0.5706024169921875, -0.525238037109375, -0.4798736572265625, -0.43450927734375, -0.3891448974609375, -0.343780517578125, -0.2984161376953125, -0.2530517578125, -0.2076873779296875, -0.162322998046875, -0.1169586181640625, -0.07159423828125, -0.0262298583984375, 0.019134521484375, 0.0644989013671875, 0.10986328125, 0.1552276611328125, 0.200592041015625, 0.2459564208984375, 0.29132080078125, 0.3366851806640625, 0.382049560546875, 0.4274139404296875, 0.4727783203125, 0.5181427001953125, 0.563507080078125, 0.6088714599609375, 0.65423583984375, 0.6996002197265625, 0.744964599609375, 0.7903289794921875, 0.835693359375, 0.8810577392578125, 0.926422119140625, 0.9717864990234375, 1.01715087890625, 1.0625152587890625, 1.107879638671875, 1.1532440185546875, 1.1986083984375, 1.2439727783203125, 1.289337158203125, 1.3347015380859375, 1.38006591796875, 1.4254302978515625, 1.470794677734375, 1.5161590576171875, 1.5615234375]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 7.0, 2.0, 6.0, 6.0, 1.0, 6.0, 10.0, 15.0, 11.0, 30.0, 24.0, 21.0, 22.0, 33.0, 46.0, 46.0, 49.0, 48.0, 41.0, 50.0, 38.0, 65.0, 53.0, 54.0, 48.0, 27.0, 36.0, 33.0, 22.0, 33.0, 30.0, 15.0, 23.0, 15.0, 7.0, 5.0, 2.0, 8.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 5.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.3349609375, -0.32524871826171875, -0.3155364990234375, -0.30582427978515625, -0.296112060546875, -0.28639984130859375, -0.2766876220703125, -0.26697540283203125, -0.25726318359375, -0.24755096435546875, -0.2378387451171875, -0.22812652587890625, -0.218414306640625, -0.20870208740234375, -0.1989898681640625, -0.18927764892578125, -0.1795654296875, -0.16985321044921875, -0.1601409912109375, -0.15042877197265625, -0.140716552734375, -0.13100433349609375, -0.1212921142578125, -0.11157989501953125, -0.10186767578125, -0.09215545654296875, -0.0824432373046875, -0.07273101806640625, -0.063018798828125, -0.05330657958984375, -0.0435943603515625, -0.03388214111328125, -0.024169921875, -0.01445770263671875, -0.0047454833984375, 0.00496673583984375, 0.014678955078125, 0.02439117431640625, 0.0341033935546875, 0.04381561279296875, 0.05352783203125, 0.06324005126953125, 0.0729522705078125, 0.08266448974609375, 0.092376708984375, 0.10208892822265625, 0.1118011474609375, 0.12151336669921875, 0.1312255859375, 0.14093780517578125, 0.1506500244140625, 0.16036224365234375, 0.170074462890625, 0.17978668212890625, 0.1894989013671875, 0.19921112060546875, 0.20892333984375, 0.21863555908203125, 0.2283477783203125, 0.23805999755859375, 0.247772216796875, 0.25748443603515625, 0.2671966552734375, 0.27690887451171875, 0.28662109375]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 1.0, 6.0, 8.0, 13.0, 13.0, 32.0, 37.0, 94.0, 127.0, 240.0, 542.0, 1276.0, 3704.0, 16324.0, 191119.0, 3777443.0, 181941.0, 15656.0, 3446.0, 1177.0, 522.0, 227.0, 142.0, 83.0, 36.0, 28.0, 16.0, 15.0, 6.0, 6.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.88525390625, -0.8639183044433594, -0.8425827026367188, -0.8212471008300781, -0.7999114990234375, -0.7785758972167969, -0.7572402954101562, -0.7359046936035156, -0.714569091796875, -0.6932334899902344, -0.6718978881835938, -0.6505622863769531, -0.6292266845703125, -0.6078910827636719, -0.5865554809570312, -0.5652198791503906, -0.54388427734375, -0.5225486755371094, -0.5012130737304688, -0.4798774719238281, -0.4585418701171875, -0.4372062683105469, -0.41587066650390625, -0.3945350646972656, -0.373199462890625, -0.3518638610839844, -0.33052825927734375, -0.3091926574707031, -0.2878570556640625, -0.2665214538574219, -0.24518585205078125, -0.22385025024414062, -0.2025146484375, -0.18117904663085938, -0.15984344482421875, -0.13850784301757812, -0.1171722412109375, -0.09583663940429688, -0.07450103759765625, -0.053165435791015625, -0.031829833984375, -0.010494232177734375, 0.01084136962890625, 0.032176971435546875, 0.0535125732421875, 0.07484817504882812, 0.09618377685546875, 0.11751937866210938, 0.13885498046875, 0.16019058227539062, 0.18152618408203125, 0.20286178588867188, 0.2241973876953125, 0.24553298950195312, 0.26686859130859375, 0.2882041931152344, 0.309539794921875, 0.3308753967285156, 0.35221099853515625, 0.3735466003417969, 0.3948822021484375, 0.4162178039550781, 0.43755340576171875, 0.4588890075683594, 0.480224609375]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 1.0, 3.0, 1.0, 3.0, 6.0, 8.0, 11.0, 16.0, 28.0, 36.0, 44.0, 87.0, 142.0, 251.0, 437.0, 742.0, 810.0, 591.0, 351.0, 210.0, 105.0, 68.0, 27.0, 26.0, 16.0, 24.0, 11.0, 6.0, 10.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09765625, -0.09261322021484375, -0.0875701904296875, -0.08252716064453125, -0.077484130859375, -0.07244110107421875, -0.0673980712890625, -0.06235504150390625, -0.05731201171875, -0.05226898193359375, -0.0472259521484375, -0.04218292236328125, -0.037139892578125, -0.03209686279296875, -0.0270538330078125, -0.02201080322265625, -0.0169677734375, -0.01192474365234375, -0.0068817138671875, -0.00183868408203125, 0.003204345703125, 0.00824737548828125, 0.0132904052734375, 0.01833343505859375, 0.02337646484375, 0.02841949462890625, 0.0334625244140625, 0.03850555419921875, 0.043548583984375, 0.04859161376953125, 0.0536346435546875, 0.05867767333984375, 0.063720703125, 0.06876373291015625, 0.0738067626953125, 0.07884979248046875, 0.083892822265625, 0.08893585205078125, 0.0939788818359375, 0.09902191162109375, 0.10406494140625, 0.10910797119140625, 0.1141510009765625, 0.11919403076171875, 0.124237060546875, 0.12928009033203125, 0.1343231201171875, 0.13936614990234375, 0.1444091796875, 0.14945220947265625, 0.1544952392578125, 0.15953826904296875, 0.164581298828125, 0.16962432861328125, 0.1746673583984375, 0.17971038818359375, 0.18475341796875, 0.18979644775390625, 0.1948394775390625, 0.19988250732421875, 0.204925537109375, 0.20996856689453125, 0.2150115966796875, 0.22005462646484375, 0.22509765625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 0.0, 4.0, 4.0, 3.0, 4.0, 9.0, 11.0, 12.0, 21.0, 31.0, 35.0, 47.0, 66.0, 78.0, 92.0, 88.0, 93.0, 86.0, 84.0, 70.0, 45.0, 23.0, 30.0, 23.0, 16.0, 6.0, 4.0, 4.0, 3.0, 2.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47583237290382385, -0.4599619209766388, -0.44409146904945374, -0.4282210171222687, -0.412350594997406, -0.39648014307022095, -0.3806096911430359, -0.36473923921585083, -0.34886878728866577, -0.3329983353614807, -0.31712788343429565, -0.3012574315071106, -0.28538697957992554, -0.2695165276527405, -0.2536461055278778, -0.23777565360069275, -0.2219052016735077, -0.20603474974632263, -0.19016429781913757, -0.1742938607931137, -0.15842340886592865, -0.1425529569387436, -0.12668251991271973, -0.11081206798553467, -0.09494161605834961, -0.07907116413116455, -0.06320071965456009, -0.04733027145266533, -0.03145982325077057, -0.01558937132358551, 0.0002810731530189514, 0.016151517629623413, 0.032021939754486084, 0.047892387956380844, 0.0637628361582756, 0.07963328063488007, 0.09550373256206512, 0.11137418448925018, 0.12724462151527405, 0.1431150734424591, 0.15898552536964417, 0.17485597729682922, 0.19072642922401428, 0.20659686625003815, 0.2224673181772232, 0.23833777010440826, 0.25420820713043213, 0.2700786590576172, 0.28594911098480225, 0.3018195629119873, 0.31769001483917236, 0.3335604667663574, 0.3494309186935425, 0.36530137062072754, 0.3811717927455902, 0.39704224467277527, 0.4129126965999603, 0.4287831485271454, 0.44465360045433044, 0.4605240523815155, 0.4763944745063782, 0.49226492643356323, 0.5081353783607483, 0.5240058302879333, 0.5398762822151184]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 3.0, 9.0, 6.0, 4.0, 8.0, 12.0, 13.0, 15.0, 23.0, 17.0, 25.0, 20.0, 30.0, 35.0, 44.0, 31.0, 47.0, 38.0, 52.0, 53.0, 50.0, 50.0, 38.0, 51.0, 40.0, 44.0, 28.0, 30.0, 26.0, 21.0, 28.0, 26.0, 16.0, 12.0, 11.0, 8.0, 14.0, 4.0, 3.0, 8.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.340414822101593, -0.3305853307247162, -0.32075583934783936, -0.31092631816864014, -0.3010968267917633, -0.2912673354148865, -0.28143781423568726, -0.2716083228588104, -0.2617788314819336, -0.25194934010505676, -0.24211983382701874, -0.2322903275489807, -0.22246083617210388, -0.21263134479522705, -0.20280183851718903, -0.192972332239151, -0.18314284086227417, -0.17331334948539734, -0.16348384320735931, -0.1536543369293213, -0.14382484555244446, -0.13399535417556763, -0.1241658478975296, -0.11433634907007217, -0.10450685024261475, -0.09467735141515732, -0.08484785258769989, -0.07501835376024246, -0.06518885493278503, -0.055359356105327606, -0.04552985727787018, -0.03570035845041275, -0.025870829820632935, -0.016041330993175507, -0.006211832165718079, 0.0036176666617393494, 0.013447165489196777, 0.023276664316654205, 0.03310616314411163, 0.04293566197156906, 0.05276516079902649, 0.06259465962648392, 0.07242415845394135, 0.08225365728139877, 0.0920831561088562, 0.10191265493631363, 0.11174215376377106, 0.12157165259122849, 0.1314011514186859, 0.14123064279556274, 0.15106014907360077, 0.1608896553516388, 0.17071914672851562, 0.18054863810539246, 0.19037814438343048, 0.2002076506614685, 0.21003714203834534, 0.21986663341522217, 0.2296961396932602, 0.23952564597129822, 0.24935513734817505, 0.2591846287250519, 0.2690141201019287, 0.27884364128112793, 0.28867313265800476]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 5.0, 5.0, 9.0, 13.0, 13.0, 14.0, 18.0, 31.0, 43.0, 51.0, 100.0, 157.0, 264.0, 416.0, 814.0, 1947.0, 5006.0, 13988.0, 43993.0, 142696.0, 353234.0, 315692.0, 115674.0, 35271.0, 11469.0, 4173.0, 1666.0, 776.0, 372.0, 230.0, 123.0, 94.0, 55.0, 37.0, 31.0, 21.0, 12.0, 9.0, 9.0, 4.0, 5.0, 7.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.05804443359375, -0.05622529983520508, -0.054406166076660156, -0.052587032318115234, -0.05076789855957031, -0.04894876480102539, -0.04712963104248047, -0.04531049728393555, -0.043491363525390625, -0.0416722297668457, -0.03985309600830078, -0.03803396224975586, -0.03621482849121094, -0.034395694732666016, -0.032576560974121094, -0.030757427215576172, -0.02893829345703125, -0.027119159698486328, -0.025300025939941406, -0.023480892181396484, -0.021661758422851562, -0.01984262466430664, -0.01802349090576172, -0.016204357147216797, -0.014385223388671875, -0.012566089630126953, -0.010746955871582031, -0.00892782211303711, -0.0071086883544921875, -0.005289554595947266, -0.0034704208374023438, -0.0016512870788574219, 0.0001678466796875, 0.001986980438232422, 0.0038061141967773438, 0.005625247955322266, 0.0074443817138671875, 0.00926351547241211, 0.011082649230957031, 0.012901782989501953, 0.014720916748046875, 0.016540050506591797, 0.01835918426513672, 0.02017831802368164, 0.021997451782226562, 0.023816585540771484, 0.025635719299316406, 0.027454853057861328, 0.02927398681640625, 0.031093120574951172, 0.032912254333496094, 0.034731388092041016, 0.03655052185058594, 0.03836965560913086, 0.04018878936767578, 0.0420079231262207, 0.043827056884765625, 0.04564619064331055, 0.04746532440185547, 0.04928445816040039, 0.05110359191894531, 0.052922725677490234, 0.054741859436035156, 0.05656099319458008, 0.058380126953125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 6.0, 13.0, 9.0, 14.0, 20.0, 15.0, 15.0, 25.0, 27.0, 47.0, 38.0, 41.0, 39.0, 46.0, 56.0, 60.0, 63.0, 57.0, 40.0, 54.0, 62.0, 31.0, 34.0, 32.0, 23.0, 35.0, 16.0, 20.0, 11.0, 14.0, 12.0, 8.0, 4.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.23876953125, -0.23086929321289062, -0.22296905517578125, -0.21506881713867188, -0.2071685791015625, -0.19926834106445312, -0.19136810302734375, -0.18346786499023438, -0.175567626953125, -0.16766738891601562, -0.15976715087890625, -0.15186691284179688, -0.1439666748046875, -0.13606643676757812, -0.12816619873046875, -0.12026596069335938, -0.11236572265625, -0.10446548461914062, -0.09656524658203125, -0.08866500854492188, -0.0807647705078125, -0.07286453247070312, -0.06496429443359375, -0.057064056396484375, -0.049163818359375, -0.041263580322265625, -0.03336334228515625, -0.025463104248046875, -0.0175628662109375, -0.009662628173828125, -0.00176239013671875, 0.006137847900390625, 0.0140380859375, 0.021938323974609375, 0.02983856201171875, 0.037738800048828125, 0.0456390380859375, 0.053539276123046875, 0.06143951416015625, 0.06933975219726562, 0.077239990234375, 0.08514022827148438, 0.09304046630859375, 0.10094070434570312, 0.1088409423828125, 0.11674118041992188, 0.12464141845703125, 0.13254165649414062, 0.14044189453125, 0.14834213256835938, 0.15624237060546875, 0.16414260864257812, 0.1720428466796875, 0.17994308471679688, 0.18784332275390625, 0.19574356079101562, 0.203643798828125, 0.21154403686523438, 0.21944427490234375, 0.22734451293945312, 0.2352447509765625, 0.24314498901367188, 0.25104522705078125, 0.2589454650878906, 0.266845703125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 1.0, 3.0, 4.0, 9.0, 8.0, 11.0, 22.0, 26.0, 35.0, 67.0, 94.0, 133.0, 190.0, 337.0, 576.0, 957.0, 1959.0, 4180.0, 9258.0, 23123.0, 61428.0, 163118.0, 321806.0, 270676.0, 116374.0, 43401.0, 16714.0, 7148.0, 3124.0, 1569.0, 838.0, 489.0, 314.0, 185.0, 124.0, 69.0, 50.0, 44.0, 28.0, 20.0, 11.0, 10.0, 6.0, 5.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.044097900390625, -0.04271221160888672, -0.04132652282714844, -0.039940834045410156, -0.038555145263671875, -0.037169456481933594, -0.03578376770019531, -0.03439807891845703, -0.03301239013671875, -0.03162670135498047, -0.030241012573242188, -0.028855323791503906, -0.027469635009765625, -0.026083946228027344, -0.024698257446289062, -0.02331256866455078, -0.0219268798828125, -0.02054119110107422, -0.019155502319335938, -0.017769813537597656, -0.016384124755859375, -0.014998435974121094, -0.013612747192382812, -0.012227058410644531, -0.01084136962890625, -0.009455680847167969, -0.008069992065429688, -0.006684303283691406, -0.005298614501953125, -0.003912925720214844, -0.0025272369384765625, -0.0011415481567382812, 0.000244140625, 0.0016298294067382812, 0.0030155181884765625, 0.004401206970214844, 0.005786895751953125, 0.007172584533691406, 0.008558273315429688, 0.009943962097167969, 0.01132965087890625, 0.012715339660644531, 0.014101028442382812, 0.015486717224121094, 0.016872406005859375, 0.018258094787597656, 0.019643783569335938, 0.02102947235107422, 0.0224151611328125, 0.02380084991455078, 0.025186538696289062, 0.026572227478027344, 0.027957916259765625, 0.029343605041503906, 0.030729293823242188, 0.03211498260498047, 0.03350067138671875, 0.03488636016845703, 0.03627204895019531, 0.037657737731933594, 0.039043426513671875, 0.040429115295410156, 0.04181480407714844, 0.04320049285888672, 0.044586181640625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 7.0, 4.0, 6.0, 12.0, 15.0, 14.0, 22.0, 21.0, 18.0, 20.0, 22.0, 26.0, 42.0, 44.0, 38.0, 38.0, 47.0, 49.0, 50.0, 62.0, 41.0, 46.0, 34.0, 47.0, 35.0, 36.0, 29.0, 16.0, 32.0, 25.0, 19.0, 14.0, 11.0, 7.0, 10.0, 16.0, 8.0, 6.0, 3.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.42041015625, -0.40726470947265625, -0.3941192626953125, -0.38097381591796875, -0.367828369140625, -0.35468292236328125, -0.3415374755859375, -0.32839202880859375, -0.31524658203125, -0.30210113525390625, -0.2889556884765625, -0.27581024169921875, -0.262664794921875, -0.24951934814453125, -0.2363739013671875, -0.22322845458984375, -0.2100830078125, -0.19693756103515625, -0.1837921142578125, -0.17064666748046875, -0.157501220703125, -0.14435577392578125, -0.1312103271484375, -0.11806488037109375, -0.10491943359375, -0.09177398681640625, -0.0786285400390625, -0.06548309326171875, -0.052337646484375, -0.03919219970703125, -0.0260467529296875, -0.01290130615234375, 0.000244140625, 0.01338958740234375, 0.0265350341796875, 0.03968048095703125, 0.052825927734375, 0.06597137451171875, 0.0791168212890625, 0.09226226806640625, 0.10540771484375, 0.11855316162109375, 0.1316986083984375, 0.14484405517578125, 0.157989501953125, 0.17113494873046875, 0.1842803955078125, 0.19742584228515625, 0.2105712890625, 0.22371673583984375, 0.2368621826171875, 0.25000762939453125, 0.263153076171875, 0.27629852294921875, 0.2894439697265625, 0.30258941650390625, 0.31573486328125, 0.32888031005859375, 0.3420257568359375, 0.35517120361328125, 0.368316650390625, 0.38146209716796875, 0.3946075439453125, 0.40775299072265625, 0.4208984375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 4.0, 0.0, 4.0, 7.0, 6.0, 5.0, 7.0, 20.0, 28.0, 33.0, 56.0, 89.0, 146.0, 223.0, 385.0, 710.0, 1380.0, 2926.0, 6851.0, 18957.0, 63690.0, 236175.0, 434309.0, 201415.0, 53296.0, 16290.0, 6118.0, 2588.0, 1205.0, 686.0, 362.0, 198.0, 136.0, 70.0, 60.0, 49.0, 25.0, 12.0, 13.0, 7.0, 4.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0147247314453125, -0.014206886291503906, -0.013689041137695312, -0.013171195983886719, -0.012653350830078125, -0.012135505676269531, -0.011617660522460938, -0.011099815368652344, -0.01058197021484375, -0.010064125061035156, -0.009546279907226562, -0.009028434753417969, -0.008510589599609375, -0.007992744445800781, -0.0074748992919921875, -0.006957054138183594, -0.006439208984375, -0.005921363830566406, -0.0054035186767578125, -0.004885673522949219, -0.004367828369140625, -0.0038499832153320312, -0.0033321380615234375, -0.0028142929077148438, -0.00229644775390625, -0.0017786026000976562, -0.0012607574462890625, -0.0007429122924804688, -0.000225067138671875, 0.00029277801513671875, 0.0008106231689453125, 0.0013284683227539062, 0.0018463134765625, 0.0023641586303710938, 0.0028820037841796875, 0.0033998489379882812, 0.003917694091796875, 0.004435539245605469, 0.0049533843994140625, 0.005471229553222656, 0.00598907470703125, 0.006506919860839844, 0.0070247650146484375, 0.007542610168457031, 0.008060455322265625, 0.008578300476074219, 0.009096145629882812, 0.009613990783691406, 0.0101318359375, 0.010649681091308594, 0.011167526245117188, 0.011685371398925781, 0.012203216552734375, 0.012721061706542969, 0.013238906860351562, 0.013756752014160156, 0.01427459716796875, 0.014792442321777344, 0.015310287475585938, 0.01582813262939453, 0.016345977783203125, 0.01686382293701172, 0.017381668090820312, 0.017899513244628906, 0.0184173583984375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 5.0, 2.0, 6.0, 10.0, 7.0, 7.0, 8.0, 16.0, 12.0, 34.0, 45.0, 36.0, 58.0, 55.0, 67.0, 89.0, 80.0, 76.0, 69.0, 47.0, 61.0, 36.0, 36.0, 36.0, 26.0, 24.0, 12.0, 18.0, 5.0, 7.0, 7.0, 2.0, 4.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.569789886474609e-06, -7.247552275657654e-06, -6.925314664840698e-06, -6.603077054023743e-06, -6.280839443206787e-06, -5.9586018323898315e-06, -5.636364221572876e-06, -5.31412661075592e-06, -4.991888999938965e-06, -4.669651389122009e-06, -4.347413778305054e-06, -4.025176167488098e-06, -3.7029385566711426e-06, -3.380700945854187e-06, -3.0584633350372314e-06, -2.736225724220276e-06, -2.4139881134033203e-06, -2.0917505025863647e-06, -1.7695128917694092e-06, -1.4472752809524536e-06, -1.125037670135498e-06, -8.028000593185425e-07, -4.805624485015869e-07, -1.5832483768463135e-07, 1.6391277313232422e-07, 4.861503839492798e-07, 8.083879947662354e-07, 1.130625605583191e-06, 1.4528632164001465e-06, 1.775100827217102e-06, 2.0973384380340576e-06, 2.419576048851013e-06, 2.7418136596679688e-06, 3.0640512704849243e-06, 3.38628888130188e-06, 3.7085264921188354e-06, 4.030764102935791e-06, 4.353001713752747e-06, 4.675239324569702e-06, 4.997476935386658e-06, 5.319714546203613e-06, 5.641952157020569e-06, 5.964189767837524e-06, 6.28642737865448e-06, 6.6086649894714355e-06, 6.930902600288391e-06, 7.253140211105347e-06, 7.575377821922302e-06, 7.897615432739258e-06, 8.219853043556213e-06, 8.542090654373169e-06, 8.864328265190125e-06, 9.18656587600708e-06, 9.508803486824036e-06, 9.831041097640991e-06, 1.0153278708457947e-05, 1.0475516319274902e-05, 1.0797753930091858e-05, 1.1119991540908813e-05, 1.1442229151725769e-05, 1.1764466762542725e-05, 1.208670437335968e-05, 1.2408941984176636e-05, 1.2731179594993591e-05, 1.3053417205810547e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 6.0, 6.0, 5.0, 10.0, 13.0, 19.0, 25.0, 26.0, 33.0, 56.0, 74.0, 111.0, 188.0, 281.0, 466.0, 751.0, 1318.0, 2489.0, 4898.0, 10547.0, 23684.0, 57218.0, 137131.0, 258329.0, 275089.0, 156501.0, 67446.0, 27970.0, 12122.0, 5389.0, 2773.0, 1447.0, 814.0, 464.0, 258.0, 182.0, 121.0, 79.0, 54.0, 40.0, 31.0, 28.0, 19.0, 17.0, 8.0, 8.0, 4.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0], "bins": [-0.0122833251953125, -0.011922955513000488, -0.011562585830688477, -0.011202216148376465, -0.010841846466064453, -0.010481476783752441, -0.01012110710144043, -0.009760737419128418, -0.009400367736816406, -0.009039998054504395, -0.008679628372192383, -0.008319258689880371, -0.00795888900756836, -0.007598519325256348, -0.007238149642944336, -0.006877779960632324, -0.0065174102783203125, -0.006157040596008301, -0.005796670913696289, -0.005436301231384277, -0.005075931549072266, -0.004715561866760254, -0.004355192184448242, -0.0039948225021362305, -0.0036344528198242188, -0.003274083137512207, -0.0029137134552001953, -0.0025533437728881836, -0.002192974090576172, -0.0018326044082641602, -0.0014722347259521484, -0.0011118650436401367, -0.000751495361328125, -0.0003911256790161133, -3.075599670410156e-05, 0.00032961368560791016, 0.0006899833679199219, 0.0010503530502319336, 0.0014107227325439453, 0.001771092414855957, 0.0021314620971679688, 0.0024918317794799805, 0.002852201461791992, 0.003212571144104004, 0.0035729408264160156, 0.003933310508728027, 0.004293680191040039, 0.004654049873352051, 0.0050144195556640625, 0.005374789237976074, 0.005735158920288086, 0.006095528602600098, 0.006455898284912109, 0.006816267967224121, 0.007176637649536133, 0.0075370073318481445, 0.007897377014160156, 0.008257746696472168, 0.00861811637878418, 0.008978486061096191, 0.009338855743408203, 0.009699225425720215, 0.010059595108032227, 0.010419964790344238, 0.01078033447265625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 6.0, 2.0, 8.0, 5.0, 14.0, 7.0, 12.0, 13.0, 21.0, 25.0, 31.0, 37.0, 29.0, 38.0, 51.0, 59.0, 53.0, 63.0, 50.0, 48.0, 50.0, 52.0, 53.0, 42.0, 46.0, 30.0, 30.0, 30.0, 21.0, 18.0, 10.0, 17.0, 8.0, 6.0, 9.0, 5.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0036411285400390625, -0.003518432378768921, -0.0033957362174987793, -0.0032730400562286377, -0.003150343894958496, -0.0030276477336883545, -0.002904951572418213, -0.0027822554111480713, -0.0026595592498779297, -0.002536863088607788, -0.0024141669273376465, -0.002291470766067505, -0.0021687746047973633, -0.0020460784435272217, -0.00192338228225708, -0.0018006861209869385, -0.0016779899597167969, -0.0015552937984466553, -0.0014325976371765137, -0.001309901475906372, -0.0011872053146362305, -0.0010645091533660889, -0.0009418129920959473, -0.0008191168308258057, -0.0006964206695556641, -0.0005737245082855225, -0.00045102834701538086, -0.00032833218574523926, -0.00020563602447509766, -8.293986320495605e-05, 3.975629806518555e-05, 0.00016245245933532715, 0.00028514862060546875, 0.00040784478187561035, 0.000530540943145752, 0.0006532371044158936, 0.0007759332656860352, 0.0008986294269561768, 0.0010213255882263184, 0.00114402174949646, 0.0012667179107666016, 0.0013894140720367432, 0.0015121102333068848, 0.0016348063945770264, 0.001757502555847168, 0.0018801987171173096, 0.002002894878387451, 0.0021255910396575928, 0.0022482872009277344, 0.002370983362197876, 0.0024936795234680176, 0.002616375684738159, 0.0027390718460083008, 0.0028617680072784424, 0.002984464168548584, 0.0031071603298187256, 0.003229856491088867, 0.003352552652359009, 0.0034752488136291504, 0.003597944974899292, 0.0037206411361694336, 0.003843337297439575, 0.003966033458709717, 0.004088729619979858, 0.00421142578125]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 5.0, 15.0, 26.0, 74.0, 133.0, 244.0, 254.0, 147.0, 52.0, 33.0, 14.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1874045133590698, -1.1610171794891357, -1.1346298456192017, -1.1082426309585571, -1.081855297088623, -1.055467963218689, -1.0290806293487549, -1.0026934146881104, -0.9763060808181763, -0.9499187469482422, -0.9235314726829529, -0.8971441388130188, -0.8707568645477295, -0.8443695306777954, -0.8179821968078613, -0.791594922542572, -0.7652075886726379, -0.7388202548027039, -0.7124329805374146, -0.6860456466674805, -0.6596583724021912, -0.6332710385322571, -0.6068837642669678, -0.5804964303970337, -0.5541090965270996, -0.5277217626571655, -0.5013344883918762, -0.47494715452194214, -0.44855988025665283, -0.42217254638671875, -0.39578524231910706, -0.36939793825149536, -0.3430106043815613, -0.3166233003139496, -0.2902359962463379, -0.2638486623764038, -0.2374613732099533, -0.2110740691423416, -0.18468675017356873, -0.15829944610595703, -0.13191214203834534, -0.10552483797073364, -0.07913752645254135, -0.05275021493434906, -0.026362910866737366, 2.4393200874328613e-05, 0.026411712169647217, 0.05279901623725891, 0.0791863203048706, 0.1055736243724823, 0.131960928440094, 0.15834824740886688, 0.18473555147647858, 0.21112285554409027, 0.23751017451286316, 0.26389747858047485, 0.29028478264808655, 0.31667208671569824, 0.34305939078330994, 0.36944669485092163, 0.3958340287208557, 0.422221302986145, 0.4486086368560791, 0.4749959409236908, 0.5013832449913025]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 4.0, 1.0, 6.0, 4.0, 11.0, 7.0, 9.0, 9.0, 15.0, 23.0, 22.0, 23.0, 22.0, 28.0, 36.0, 41.0, 43.0, 35.0, 54.0, 54.0, 50.0, 62.0, 47.0, 48.0, 41.0, 46.0, 34.0, 38.0, 25.0, 25.0, 25.0, 27.0, 20.0, 11.0, 10.0, 15.0, 9.0, 3.0, 5.0, 5.0, 0.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.21879008412361145, -0.21172401309013367, -0.20465795695781708, -0.1975918859243393, -0.1905258148908615, -0.18345975875854492, -0.17639368772506714, -0.16932761669158936, -0.16226154565811157, -0.1551954746246338, -0.1481294184923172, -0.14106334745883942, -0.13399727642536163, -0.12693122029304504, -0.11986514925956726, -0.11279907822608948, -0.10573301464319229, -0.0986669510602951, -0.09160088002681732, -0.08453481644392014, -0.07746874541044235, -0.07040268182754517, -0.06333661079406738, -0.0562705472111702, -0.04920447990298271, -0.04213841259479523, -0.03507234528660774, -0.028006279841065407, -0.020940212532877922, -0.013874147087335587, -0.006808079779148102, 0.00025798752903938293, 0.007324054837226868, 0.014390122145414352, 0.021456189453601837, 0.028522254899144173, 0.03558832406997681, 0.04265438765287399, 0.04972045496106148, 0.05678652226924896, 0.06385259330272675, 0.07091865688562393, 0.07798472791910172, 0.0850507915019989, 0.09211686253547668, 0.09918292611837387, 0.10624898970127106, 0.11331506073474884, 0.12038112431764603, 0.1274471879005432, 0.134513258934021, 0.14157932996749878, 0.14864538609981537, 0.15571145713329315, 0.16277752816677094, 0.16984358429908752, 0.1769096553325653, 0.1839757263660431, 0.19104178249835968, 0.19810785353183746, 0.20517392456531525, 0.21223998069763184, 0.21930605173110962, 0.2263721227645874, 0.23343819379806519]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 6.0, 2.0, 7.0, 11.0, 13.0, 23.0, 29.0, 45.0, 63.0, 111.0, 157.0, 286.0, 472.0, 896.0, 1761.0, 4201.0, 12495.0, 75405.0, 754829.0, 168170.0, 19243.0, 5522.0, 2237.0, 1183.0, 533.0, 332.0, 200.0, 106.0, 80.0, 45.0, 40.0, 19.0, 10.0, 7.0, 7.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.290771484375, -0.2798614501953125, -0.268951416015625, -0.2580413818359375, -0.24713134765625, -0.2362213134765625, -0.225311279296875, -0.2144012451171875, -0.2034912109375, -0.1925811767578125, -0.181671142578125, -0.1707611083984375, -0.15985107421875, -0.1489410400390625, -0.138031005859375, -0.1271209716796875, -0.1162109375, -0.1053009033203125, -0.094390869140625, -0.0834808349609375, -0.07257080078125, -0.0616607666015625, -0.050750732421875, -0.0398406982421875, -0.0289306640625, -0.0180206298828125, -0.007110595703125, 0.0037994384765625, 0.01470947265625, 0.0256195068359375, 0.036529541015625, 0.0474395751953125, 0.058349609375, 0.0692596435546875, 0.080169677734375, 0.0910797119140625, 0.10198974609375, 0.1128997802734375, 0.123809814453125, 0.1347198486328125, 0.1456298828125, 0.1565399169921875, 0.167449951171875, 0.1783599853515625, 0.18927001953125, 0.2001800537109375, 0.211090087890625, 0.2220001220703125, 0.23291015625, 0.2438201904296875, 0.254730224609375, 0.2656402587890625, 0.27655029296875, 0.2874603271484375, 0.298370361328125, 0.3092803955078125, 0.3201904296875, 0.3311004638671875, 0.342010498046875, 0.3529205322265625, 0.36383056640625, 0.3747406005859375, 0.385650634765625, 0.3965606689453125, 0.407470703125]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 5.0, 3.0, 3.0, 7.0, 8.0, 10.0, 11.0, 9.0, 16.0, 19.0, 26.0, 29.0, 34.0, 43.0, 45.0, 41.0, 45.0, 60.0, 67.0, 69.0, 62.0, 55.0, 52.0, 39.0, 49.0, 30.0, 37.0, 21.0, 31.0, 11.0, 16.0, 10.0, 14.0, 8.0, 6.0, 4.0, 2.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50537109375, -0.4887237548828125, -0.472076416015625, -0.4554290771484375, -0.43878173828125, -0.4221343994140625, -0.405487060546875, -0.3888397216796875, -0.3721923828125, -0.3555450439453125, -0.338897705078125, -0.3222503662109375, -0.30560302734375, -0.2889556884765625, -0.272308349609375, -0.2556610107421875, -0.239013671875, -0.2223663330078125, -0.205718994140625, -0.1890716552734375, -0.17242431640625, -0.1557769775390625, -0.139129638671875, -0.1224822998046875, -0.1058349609375, -0.0891876220703125, -0.072540283203125, -0.0558929443359375, -0.03924560546875, -0.0225982666015625, -0.005950927734375, 0.0106964111328125, 0.02734375, 0.0439910888671875, 0.060638427734375, 0.0772857666015625, 0.09393310546875, 0.1105804443359375, 0.127227783203125, 0.1438751220703125, 0.1605224609375, 0.1771697998046875, 0.193817138671875, 0.2104644775390625, 0.22711181640625, 0.2437591552734375, 0.260406494140625, 0.2770538330078125, 0.293701171875, 0.3103485107421875, 0.326995849609375, 0.3436431884765625, 0.36029052734375, 0.3769378662109375, 0.393585205078125, 0.4102325439453125, 0.4268798828125, 0.4435272216796875, 0.460174560546875, 0.4768218994140625, 0.49346923828125, 0.5101165771484375, 0.526763916015625, 0.5434112548828125, 0.56005859375]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 3.0, 10.0, 4.0, 10.0, 9.0, 10.0, 23.0, 33.0, 47.0, 65.0, 140.0, 233.0, 513.0, 1142.0, 3180.0, 15049.0, 681066.0, 331150.0, 11196.0, 2645.0, 1056.0, 407.0, 243.0, 137.0, 58.0, 35.0, 26.0, 14.0, 9.0, 6.0, 9.0, 1.0, 6.0, 5.0, 5.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5078125, -0.49025726318359375, -0.4727020263671875, -0.45514678955078125, -0.437591552734375, -0.42003631591796875, -0.4024810791015625, -0.38492584228515625, -0.36737060546875, -0.34981536865234375, -0.3322601318359375, -0.31470489501953125, -0.297149658203125, -0.27959442138671875, -0.2620391845703125, -0.24448394775390625, -0.2269287109375, -0.20937347412109375, -0.1918182373046875, -0.17426300048828125, -0.156707763671875, -0.13915252685546875, -0.1215972900390625, -0.10404205322265625, -0.08648681640625, -0.06893157958984375, -0.0513763427734375, -0.03382110595703125, -0.016265869140625, 0.00128936767578125, 0.0188446044921875, 0.03639984130859375, 0.053955078125, 0.07151031494140625, 0.0890655517578125, 0.10662078857421875, 0.124176025390625, 0.14173126220703125, 0.1592864990234375, 0.17684173583984375, 0.19439697265625, 0.21195220947265625, 0.2295074462890625, 0.24706268310546875, 0.264617919921875, 0.28217315673828125, 0.2997283935546875, 0.31728363037109375, 0.3348388671875, 0.35239410400390625, 0.3699493408203125, 0.38750457763671875, 0.405059814453125, 0.42261505126953125, 0.4401702880859375, 0.45772552490234375, 0.47528076171875, 0.49283599853515625, 0.5103912353515625, 0.5279464721679688, 0.545501708984375, 0.5630569458007812, 0.5806121826171875, 0.5981674194335938, 0.61572265625]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 6.0, 3.0, 8.0, 16.0, 9.0, 10.0, 21.0, 15.0, 27.0, 30.0, 32.0, 29.0, 27.0, 43.0, 43.0, 50.0, 47.0, 40.0, 47.0, 44.0, 55.0, 49.0, 50.0, 35.0, 29.0, 38.0, 35.0, 26.0, 21.0, 17.0, 14.0, 20.0, 14.0, 12.0, 10.0, 6.0, 2.0, 5.0, 3.0, 5.0, 8.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50341796875, -0.4857025146484375, -0.467987060546875, -0.4502716064453125, -0.43255615234375, -0.4148406982421875, -0.397125244140625, -0.3794097900390625, -0.3616943359375, -0.3439788818359375, -0.326263427734375, -0.3085479736328125, -0.29083251953125, -0.2731170654296875, -0.255401611328125, -0.2376861572265625, -0.219970703125, -0.2022552490234375, -0.184539794921875, -0.1668243408203125, -0.14910888671875, -0.1313934326171875, -0.113677978515625, -0.0959625244140625, -0.0782470703125, -0.0605316162109375, -0.042816162109375, -0.0251007080078125, -0.00738525390625, 0.0103302001953125, 0.028045654296875, 0.0457611083984375, 0.0634765625, 0.0811920166015625, 0.098907470703125, 0.1166229248046875, 0.13433837890625, 0.1520538330078125, 0.169769287109375, 0.1874847412109375, 0.2052001953125, 0.2229156494140625, 0.240631103515625, 0.2583465576171875, 0.27606201171875, 0.2937774658203125, 0.311492919921875, 0.3292083740234375, 0.346923828125, 0.3646392822265625, 0.382354736328125, 0.4000701904296875, 0.41778564453125, 0.4355010986328125, 0.453216552734375, 0.4709320068359375, 0.4886474609375, 0.5063629150390625, 0.524078369140625, 0.5417938232421875, 0.55950927734375, 0.5772247314453125, 0.594940185546875, 0.6126556396484375, 0.63037109375]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 2.0, 6.0, 11.0, 24.0, 60.0, 147.0, 491.0, 2308.0, 699253.0, 343662.0, 1957.0, 400.0, 144.0, 53.0, 18.0, 7.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1973876953125, -0.18216514587402344, -0.16694259643554688, -0.1517200469970703, -0.13649749755859375, -0.12127494812011719, -0.10605239868164062, -0.09082984924316406, -0.0756072998046875, -0.06038475036621094, -0.045162200927734375, -0.029939651489257812, -0.01471710205078125, 0.0005054473876953125, 0.015727996826171875, 0.030950546264648438, 0.046173095703125, 0.06139564514160156, 0.07661819458007812, 0.09184074401855469, 0.10706329345703125, 0.12228584289550781, 0.13750839233398438, 0.15273094177246094, 0.1679534912109375, 0.18317604064941406, 0.19839859008789062, 0.2136211395263672, 0.22884368896484375, 0.2440662384033203, 0.2592887878417969, 0.27451133728027344, 0.28973388671875, 0.30495643615722656, 0.3201789855957031, 0.3354015350341797, 0.35062408447265625, 0.3658466339111328, 0.3810691833496094, 0.39629173278808594, 0.4115142822265625, 0.42673683166503906, 0.4419593811035156, 0.4571819305419922, 0.47240447998046875, 0.4876270294189453, 0.5028495788574219, 0.5180721282958984, 0.533294677734375, 0.5485172271728516, 0.5637397766113281, 0.5789623260498047, 0.5941848754882812, 0.6094074249267578, 0.6246299743652344, 0.6398525238037109, 0.6550750732421875, 0.6702976226806641, 0.6855201721191406, 0.7007427215576172, 0.7159652709960938, 0.7311878204345703, 0.7464103698730469, 0.7616329193115234, 0.77685546875]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 7.0, 8.0, 20.0, 41.0, 58.0, 159.0, 271.0, 229.0, 106.0, 57.0, 22.0, 12.0, 4.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.561113357543945e-05, -5.442090332508087e-05, -5.323067307472229e-05, -5.204044282436371e-05, -5.085021257400513e-05, -4.9659982323646545e-05, -4.8469752073287964e-05, -4.727952182292938e-05, -4.60892915725708e-05, -4.489906132221222e-05, -4.370883107185364e-05, -4.2518600821495056e-05, -4.1328370571136475e-05, -4.013814032077789e-05, -3.894791007041931e-05, -3.775767982006073e-05, -3.656744956970215e-05, -3.537721931934357e-05, -3.4186989068984985e-05, -3.2996758818626404e-05, -3.180652856826782e-05, -3.061629831790924e-05, -2.942606806755066e-05, -2.8235837817192078e-05, -2.7045607566833496e-05, -2.5855377316474915e-05, -2.4665147066116333e-05, -2.347491681575775e-05, -2.228468656539917e-05, -2.109445631504059e-05, -1.9904226064682007e-05, -1.8713995814323425e-05, -1.7523765563964844e-05, -1.6333535313606262e-05, -1.514330506324768e-05, -1.3953074812889099e-05, -1.2762844562530518e-05, -1.1572614312171936e-05, -1.0382384061813354e-05, -9.192153811454773e-06, -8.001923561096191e-06, -6.81169331073761e-06, -5.621463060379028e-06, -4.431232810020447e-06, -3.2410025596618652e-06, -2.0507723093032837e-06, -8.605420589447021e-07, 3.296881914138794e-07, 1.519918441772461e-06, 2.7101486921310425e-06, 3.900378942489624e-06, 5.0906091928482056e-06, 6.280839443206787e-06, 7.471069693565369e-06, 8.66129994392395e-06, 9.851530194282532e-06, 1.1041760444641113e-05, 1.2231990694999695e-05, 1.3422220945358276e-05, 1.4612451195716858e-05, 1.580268144607544e-05, 1.699291169643402e-05, 1.8183141946792603e-05, 1.9373372197151184e-05, 2.0563602447509766e-05]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 6.0, 7.0, 15.0, 18.0, 65.0, 169.0, 509.0, 1890.0, 31966.0, 1001294.0, 10795.0, 1226.0, 404.0, 119.0, 44.0, 19.0, 7.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.469482421875, -0.4558219909667969, -0.44216156005859375, -0.4285011291503906, -0.4148406982421875, -0.4011802673339844, -0.38751983642578125, -0.3738594055175781, -0.360198974609375, -0.3465385437011719, -0.33287811279296875, -0.3192176818847656, -0.3055572509765625, -0.2918968200683594, -0.27823638916015625, -0.2645759582519531, -0.25091552734375, -0.23725509643554688, -0.22359466552734375, -0.20993423461914062, -0.1962738037109375, -0.18261337280273438, -0.16895294189453125, -0.15529251098632812, -0.141632080078125, -0.12797164916992188, -0.11431121826171875, -0.10065078735351562, -0.0869903564453125, -0.07332992553710938, -0.05966949462890625, -0.046009063720703125, -0.0323486328125, -0.018688201904296875, -0.00502777099609375, 0.008632659912109375, 0.0222930908203125, 0.035953521728515625, 0.04961395263671875, 0.06327438354492188, 0.076934814453125, 0.09059524536132812, 0.10425567626953125, 0.11791610717773438, 0.1315765380859375, 0.14523696899414062, 0.15889739990234375, 0.17255783081054688, 0.18621826171875, 0.19987869262695312, 0.21353912353515625, 0.22719955444335938, 0.2408599853515625, 0.2545204162597656, 0.26818084716796875, 0.2818412780761719, 0.295501708984375, 0.3091621398925781, 0.32282257080078125, 0.3364830017089844, 0.3501434326171875, 0.3638038635253906, 0.37746429443359375, 0.3911247253417969, 0.40478515625]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 2.0, 19.0, 15.0, 41.0, 78.0, 140.0, 300.0, 179.0, 97.0, 49.0, 31.0, 17.0, 11.0, 5.0, 7.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09576416015625, -0.09264278411865234, -0.08952140808105469, -0.08640003204345703, -0.08327865600585938, -0.08015727996826172, -0.07703590393066406, -0.0739145278930664, -0.07079315185546875, -0.0676717758178711, -0.06455039978027344, -0.06142902374267578, -0.058307647705078125, -0.05518627166748047, -0.05206489562988281, -0.048943519592285156, -0.0458221435546875, -0.042700767517089844, -0.03957939147949219, -0.03645801544189453, -0.033336639404296875, -0.03021526336669922, -0.027093887329101562, -0.023972511291503906, -0.02085113525390625, -0.017729759216308594, -0.014608383178710938, -0.011487007141113281, -0.008365631103515625, -0.005244255065917969, -0.0021228790283203125, 0.0009984970092773438, 0.004119873046875, 0.007241249084472656, 0.010362625122070312, 0.013484001159667969, 0.016605377197265625, 0.01972675323486328, 0.022848129272460938, 0.025969505310058594, 0.02909088134765625, 0.032212257385253906, 0.03533363342285156, 0.03845500946044922, 0.041576385498046875, 0.04469776153564453, 0.04781913757324219, 0.050940513610839844, 0.0540618896484375, 0.057183265686035156, 0.06030464172363281, 0.06342601776123047, 0.06654739379882812, 0.06966876983642578, 0.07279014587402344, 0.0759115219116211, 0.07903289794921875, 0.0821542739868164, 0.08527565002441406, 0.08839702606201172, 0.09151840209960938, 0.09463977813720703, 0.09776115417480469, 0.10088253021240234, 0.10400390625]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 5.0, 9.0, 28.0, 34.0, 112.0, 232.0, 246.0, 186.0, 81.0, 41.0, 16.0, 8.0, 2.0, 3.0, 1.0, 0.0, 1.0, 3.0], "bins": [-2.714205026626587, -2.6623690128326416, -2.610532760620117, -2.558696746826172, -2.5068604946136475, -2.455024480819702, -2.4031882286071777, -2.3513522148132324, -2.299515962600708, -2.2476799488067627, -2.1958436965942383, -2.144007682800293, -2.0921714305877686, -2.0403354167938232, -1.9884991645812988, -1.9366631507873535, -1.8848271369934082, -1.8329910039901733, -1.7811548709869385, -1.7293187379837036, -1.6774826049804688, -1.6256465911865234, -1.573810338973999, -1.5219743251800537, -1.4701380729675293, -1.4183019399642944, -1.3664658069610596, -1.3146296739578247, -1.2627935409545898, -1.2109575271606445, -1.1591212749481201, -1.1072852611541748, -1.05544912815094, -1.003612995147705, -0.9517768621444702, -0.8999407291412354, -0.8481046557426453, -0.7962685227394104, -0.7444323897361755, -0.6925963163375854, -0.6407601833343506, -0.5889240503311157, -0.5370879173278809, -0.4852518141269684, -0.4334157109260559, -0.38157957792282104, -0.3297434449195862, -0.2779073417186737, -0.22607117891311646, -0.17423506081104279, -0.12239893525838852, -0.07056280970573425, -0.018726691603660583, 0.033109426498413086, 0.08494555950164795, 0.13678166270256042, 0.1886177957057953, 0.24045391380786896, 0.2922900319099426, 0.3441261649131775, 0.39596229791641235, 0.44779840111732483, 0.4996345341205597, 0.5514706373214722, 0.603306770324707]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 3.0, 6.0, 8.0, 13.0, 7.0, 7.0, 6.0, 14.0, 15.0, 27.0, 25.0, 17.0, 30.0, 34.0, 32.0, 26.0, 34.0, 49.0, 42.0, 40.0, 38.0, 41.0, 34.0, 44.0, 29.0, 35.0, 31.0, 22.0, 28.0, 32.0, 31.0, 30.0, 27.0, 20.0, 28.0, 17.0, 13.0, 14.0, 9.0, 13.0, 11.0, 3.0, 3.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.7800319790840149, -0.753801167011261, -0.7275702953338623, -0.7013394832611084, -0.6751086711883545, -0.6488778591156006, -0.6226469874382019, -0.596416175365448, -0.5701853036880493, -0.5439544916152954, -0.5177236199378967, -0.4914928078651428, -0.4652619957923889, -0.4390311539173126, -0.41280031204223633, -0.3865694999694824, -0.3603386878967285, -0.3341078460216522, -0.3078770339488983, -0.281646192073822, -0.2554153800010681, -0.22918453812599182, -0.20295369625091553, -0.17672286927700043, -0.15049204230308533, -0.12426121532917023, -0.09803038090467453, -0.07179954648017883, -0.04556871950626373, -0.019337892532348633, 0.006892949342727661, 0.03312377631664276, 0.05935460329055786, 0.08558543026447296, 0.11181626468896866, 0.13804709911346436, 0.16427792608737946, 0.19050875306129456, 0.21673959493637085, 0.24297042191028595, 0.26920124888420105, 0.29543209075927734, 0.32166290283203125, 0.34789374470710754, 0.37412458658218384, 0.40035539865493774, 0.42658624053001404, 0.45281708240509033, 0.47904789447784424, 0.5052787065505981, 0.5315095782279968, 0.5577403903007507, 0.5839712023735046, 0.6102020740509033, 0.6364328861236572, 0.6626636981964111, 0.688894510269165, 0.715125322341919, 0.7413561940193176, 0.7675870060920715, 0.7938178181648254, 0.8200486898422241, 0.846279501914978, 0.8725103139877319, 0.8987411856651306]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 10.0, 15.0, 28.0, 28.0, 63.0, 132.0, 280.0, 657.0, 1768.0, 6791.0, 59978.0, 3467785.0, 635820.0, 16070.0, 3022.0, 1028.0, 392.0, 177.0, 104.0, 59.0, 29.0, 20.0, 5.0, 6.0, 3.0, 7.0, 3.0, 0.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.833984375, -0.803955078125, -0.77392578125, -0.743896484375, -0.7138671875, -0.683837890625, -0.65380859375, -0.623779296875, -0.59375, -0.563720703125, -0.53369140625, -0.503662109375, -0.4736328125, -0.443603515625, -0.41357421875, -0.383544921875, -0.353515625, -0.323486328125, -0.29345703125, -0.263427734375, -0.2333984375, -0.203369140625, -0.17333984375, -0.143310546875, -0.11328125, -0.083251953125, -0.05322265625, -0.023193359375, 0.0068359375, 0.036865234375, 0.06689453125, 0.096923828125, 0.126953125, 0.156982421875, 0.18701171875, 0.217041015625, 0.2470703125, 0.277099609375, 0.30712890625, 0.337158203125, 0.3671875, 0.397216796875, 0.42724609375, 0.457275390625, 0.4873046875, 0.517333984375, 0.54736328125, 0.577392578125, 0.607421875, 0.637451171875, 0.66748046875, 0.697509765625, 0.7275390625, 0.757568359375, 0.78759765625, 0.817626953125, 0.84765625, 0.877685546875, 0.90771484375, 0.937744140625, 0.9677734375, 0.997802734375, 1.02783203125, 1.057861328125, 1.087890625]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 5.0, 8.0, 13.0, 9.0, 9.0, 17.0, 22.0, 33.0, 36.0, 48.0, 55.0, 45.0, 47.0, 63.0, 70.0, 71.0, 71.0, 54.0, 56.0, 47.0, 36.0, 29.0, 28.0, 24.0, 26.0, 22.0, 14.0, 12.0, 10.0, 9.0, 6.0, 3.0, 1.0, 2.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2469482421875, -0.2368335723876953, -0.22671890258789062, -0.21660423278808594, -0.20648956298828125, -0.19637489318847656, -0.18626022338867188, -0.1761455535888672, -0.1660308837890625, -0.1559162139892578, -0.14580154418945312, -0.13568687438964844, -0.12557220458984375, -0.11545753479003906, -0.10534286499023438, -0.09522819519042969, -0.085113525390625, -0.07499885559082031, -0.06488418579101562, -0.05476951599121094, -0.04465484619140625, -0.03454017639160156, -0.024425506591796875, -0.014310836791992188, -0.0041961669921875, 0.0059185028076171875, 0.016033172607421875, 0.026147842407226562, 0.03626251220703125, 0.04637718200683594, 0.056491851806640625, 0.06660652160644531, 0.07672119140625, 0.08683586120605469, 0.09695053100585938, 0.10706520080566406, 0.11717987060546875, 0.12729454040527344, 0.13740921020507812, 0.1475238800048828, 0.1576385498046875, 0.1677532196044922, 0.17786788940429688, 0.18798255920410156, 0.19809722900390625, 0.20821189880371094, 0.21832656860351562, 0.2284412384033203, 0.238555908203125, 0.2486705780029297, 0.2587852478027344, 0.26889991760253906, 0.27901458740234375, 0.28912925720214844, 0.2992439270019531, 0.3093585968017578, 0.3194732666015625, 0.3295879364013672, 0.3397026062011719, 0.34981727600097656, 0.35993194580078125, 0.37004661560058594, 0.3801612854003906, 0.3902759552001953, 0.400390625]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 2.0, 2.0, 7.0, 5.0, 14.0, 13.0, 20.0, 25.0, 51.0, 95.0, 143.0, 256.0, 500.0, 1069.0, 2911.0, 9244.0, 46608.0, 965284.0, 3055170.0, 92013.0, 14056.0, 4031.0, 1425.0, 592.0, 288.0, 175.0, 102.0, 53.0, 52.0, 22.0, 21.0, 8.0, 9.0, 4.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.65625, -0.6385879516601562, -0.6209259033203125, -0.6032638549804688, -0.585601806640625, -0.5679397583007812, -0.5502777099609375, -0.5326156616210938, -0.51495361328125, -0.49729156494140625, -0.4796295166015625, -0.46196746826171875, -0.444305419921875, -0.42664337158203125, -0.4089813232421875, -0.39131927490234375, -0.3736572265625, -0.35599517822265625, -0.3383331298828125, -0.32067108154296875, -0.303009033203125, -0.28534698486328125, -0.2676849365234375, -0.25002288818359375, -0.23236083984375, -0.21469879150390625, -0.1970367431640625, -0.17937469482421875, -0.161712646484375, -0.14405059814453125, -0.1263885498046875, -0.10872650146484375, -0.091064453125, -0.07340240478515625, -0.0557403564453125, -0.03807830810546875, -0.020416259765625, -0.00275421142578125, 0.0149078369140625, 0.03256988525390625, 0.05023193359375, 0.06789398193359375, 0.0855560302734375, 0.10321807861328125, 0.120880126953125, 0.13854217529296875, 0.1562042236328125, 0.17386627197265625, 0.1915283203125, 0.20919036865234375, 0.2268524169921875, 0.24451446533203125, 0.262176513671875, 0.27983856201171875, 0.2975006103515625, 0.31516265869140625, 0.33282470703125, 0.35048675537109375, 0.3681488037109375, 0.38581085205078125, 0.403472900390625, 0.42113494873046875, 0.4387969970703125, 0.45645904541015625, 0.47412109375]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 0.0, 3.0, 2.0, 6.0, 5.0, 5.0, 11.0, 15.0, 17.0, 30.0, 34.0, 56.0, 88.0, 121.0, 197.0, 371.0, 569.0, 717.0, 587.0, 457.0, 256.0, 175.0, 104.0, 73.0, 50.0, 37.0, 18.0, 21.0, 12.0, 8.0, 10.0, 4.0, 2.0, 8.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1341552734375, -0.1299266815185547, -0.12569808959960938, -0.12146949768066406, -0.11724090576171875, -0.11301231384277344, -0.10878372192382812, -0.10455513000488281, -0.1003265380859375, -0.09609794616699219, -0.09186935424804688, -0.08764076232910156, -0.08341217041015625, -0.07918357849121094, -0.07495498657226562, -0.07072639465332031, -0.066497802734375, -0.06226921081542969, -0.058040618896484375, -0.05381202697753906, -0.04958343505859375, -0.04535484313964844, -0.041126251220703125, -0.03689765930175781, -0.0326690673828125, -0.028440475463867188, -0.024211883544921875, -0.019983291625976562, -0.01575469970703125, -0.011526107788085938, -0.007297515869140625, -0.0030689239501953125, 0.00115966796875, 0.0053882598876953125, 0.009616851806640625, 0.013845443725585938, 0.01807403564453125, 0.022302627563476562, 0.026531219482421875, 0.030759811401367188, 0.0349884033203125, 0.03921699523925781, 0.043445587158203125, 0.04767417907714844, 0.05190277099609375, 0.05613136291503906, 0.060359954833984375, 0.06458854675292969, 0.068817138671875, 0.07304573059082031, 0.07727432250976562, 0.08150291442871094, 0.08573150634765625, 0.08996009826660156, 0.09418869018554688, 0.09841728210449219, 0.1026458740234375, 0.10687446594238281, 0.11110305786132812, 0.11533164978027344, 0.11956024169921875, 0.12378883361816406, 0.12801742553710938, 0.1322460174560547, 0.136474609375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 9.0, 11.0, 19.0, 10.0, 31.0, 45.0, 67.0, 101.0, 115.0, 123.0, 141.0, 107.0, 83.0, 37.0, 40.0, 26.0, 13.0, 9.0, 11.0, 6.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8029218316078186, -0.7826358079910278, -0.7623497247695923, -0.7420637011528015, -0.7217776775360107, -0.7014915943145752, -0.6812055706977844, -0.6609195470809937, -0.6406334638595581, -0.6203474402427673, -0.6000613570213318, -0.579775333404541, -0.5594892501831055, -0.5392032265663147, -0.5189172029495239, -0.49863114953041077, -0.4783450961112976, -0.45805904269218445, -0.4377729892730713, -0.4174869656562805, -0.39720091223716736, -0.3769148588180542, -0.3566288352012634, -0.33634278178215027, -0.3160567283630371, -0.29577067494392395, -0.2754846215248108, -0.25519859790802, -0.23491254448890686, -0.2146264910697937, -0.19434045255184174, -0.17405441403388977, -0.15376833081245422, -0.13348227739334106, -0.1131962388753891, -0.09291019290685654, -0.07262414693832397, -0.05233810096979141, -0.03205205500125885, -0.011766016483306885, 0.008520036935806274, 0.028806082904338837, 0.0490921288728714, 0.06937817484140396, 0.08966422080993652, 0.10995026677846909, 0.13023631274700165, 0.1505223512649536, 0.17080840468406677, 0.19109445810317993, 0.2113804966211319, 0.23166653513908386, 0.251952588558197, 0.2722386419773102, 0.29252469539642334, 0.3128107190132141, 0.33309677243232727, 0.35338282585144043, 0.3736688494682312, 0.39395490288734436, 0.4142409563064575, 0.4345270097255707, 0.45481306314468384, 0.4750990867614746, 0.49538514018058777]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 6.0, 3.0, 3.0, 7.0, 6.0, 11.0, 7.0, 19.0, 11.0, 24.0, 23.0, 23.0, 42.0, 39.0, 39.0, 46.0, 53.0, 55.0, 48.0, 50.0, 51.0, 50.0, 50.0, 40.0, 60.0, 47.0, 37.0, 34.0, 29.0, 30.0, 14.0, 11.0, 13.0, 10.0, 8.0, 5.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2911028563976288, -0.279893696308136, -0.2686845362186432, -0.2574753761291504, -0.2462662160396576, -0.2350570559501648, -0.223847895860672, -0.2126387357711792, -0.2014295756816864, -0.1902204155921936, -0.1790112555027008, -0.167802095413208, -0.1565929353237152, -0.1453837752342224, -0.13417461514472961, -0.12296546250581741, -0.11175630986690521, -0.10054714977741241, -0.08933798968791962, -0.07812882959842682, -0.06691966950893402, -0.05571051314473152, -0.04450135678052902, -0.033292196691036224, -0.022083036601543427, -0.010873877443373203, 0.00033528171479701996, 0.011544439941644669, 0.022753600031137466, 0.033962760120630264, 0.045171916484832764, 0.05638107657432556, 0.06759023666381836, 0.07879939675331116, 0.09000855684280396, 0.10121771693229675, 0.11242687702178955, 0.12363603711128235, 0.13484519720077515, 0.14605435729026794, 0.15726351737976074, 0.16847267746925354, 0.17968183755874634, 0.19089099764823914, 0.20210015773773193, 0.21330931782722473, 0.22451847791671753, 0.23572763800621033, 0.24693678319454193, 0.25814592838287354, 0.26935508847236633, 0.28056424856185913, 0.29177340865135193, 0.3029825687408447, 0.3141917288303375, 0.3254008889198303, 0.3366100490093231, 0.3478192090988159, 0.3590283691883087, 0.3702375292778015, 0.3814466893672943, 0.3926558494567871, 0.4038650095462799, 0.4150741696357727, 0.4262833297252655]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 9.0, 16.0, 39.0, 136.0, 494.0, 2125.0, 12375.0, 634467.0, 386968.0, 9512.0, 1820.0, 415.0, 104.0, 35.0, 20.0, 6.0, 8.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.27392578125, -0.2650718688964844, -0.25621795654296875, -0.24736404418945312, -0.2385101318359375, -0.22965621948242188, -0.22080230712890625, -0.21194839477539062, -0.203094482421875, -0.19424057006835938, -0.18538665771484375, -0.17653274536132812, -0.1676788330078125, -0.15882492065429688, -0.14997100830078125, -0.14111709594726562, -0.13226318359375, -0.12340927124023438, -0.11455535888671875, -0.10570144653320312, -0.0968475341796875, -0.08799362182617188, -0.07913970947265625, -0.07028579711914062, -0.061431884765625, -0.052577972412109375, -0.04372406005859375, -0.034870147705078125, -0.0260162353515625, -0.017162322998046875, -0.00830841064453125, 0.000545501708984375, 0.0093994140625, 0.018253326416015625, 0.02710723876953125, 0.035961151123046875, 0.0448150634765625, 0.053668975830078125, 0.06252288818359375, 0.07137680053710938, 0.080230712890625, 0.08908462524414062, 0.09793853759765625, 0.10679244995117188, 0.1156463623046875, 0.12450027465820312, 0.13335418701171875, 0.14220809936523438, 0.15106201171875, 0.15991592407226562, 0.16876983642578125, 0.17762374877929688, 0.1864776611328125, 0.19533157348632812, 0.20418548583984375, 0.21303939819335938, 0.221893310546875, 0.23074722290039062, 0.23960113525390625, 0.24845504760742188, 0.2573089599609375, 0.2661628723144531, 0.27501678466796875, 0.2838706970214844, 0.292724609375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 5.0, 3.0, 4.0, 4.0, 8.0, 8.0, 10.0, 19.0, 22.0, 27.0, 31.0, 42.0, 42.0, 36.0, 38.0, 64.0, 61.0, 75.0, 52.0, 55.0, 58.0, 41.0, 52.0, 41.0, 47.0, 41.0, 28.0, 29.0, 16.0, 3.0, 13.0, 12.0, 5.0, 3.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.212646484375, -0.20487594604492188, -0.19710540771484375, -0.18933486938476562, -0.1815643310546875, -0.17379379272460938, -0.16602325439453125, -0.15825271606445312, -0.150482177734375, -0.14271163940429688, -0.13494110107421875, -0.12717056274414062, -0.1194000244140625, -0.11162948608398438, -0.10385894775390625, -0.09608840942382812, -0.08831787109375, -0.08054733276367188, -0.07277679443359375, -0.06500625610351562, -0.0572357177734375, -0.049465179443359375, -0.04169464111328125, -0.033924102783203125, -0.026153564453125, -0.018383026123046875, -0.01061248779296875, -0.002841949462890625, 0.0049285888671875, 0.012699127197265625, 0.02046966552734375, 0.028240203857421875, 0.0360107421875, 0.043781280517578125, 0.05155181884765625, 0.059322357177734375, 0.0670928955078125, 0.07486343383789062, 0.08263397216796875, 0.09040451049804688, 0.098175048828125, 0.10594558715820312, 0.11371612548828125, 0.12148666381835938, 0.1292572021484375, 0.13702774047851562, 0.14479827880859375, 0.15256881713867188, 0.16033935546875, 0.16810989379882812, 0.17588043212890625, 0.18365097045898438, 0.1914215087890625, 0.19919204711914062, 0.20696258544921875, 0.21473312377929688, 0.222503662109375, 0.23027420043945312, 0.23804473876953125, 0.24581527709960938, 0.2535858154296875, 0.2613563537597656, 0.26912689208984375, 0.2768974304199219, 0.28466796875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 1.0, 5.0, 3.0, 7.0, 6.0, 10.0, 13.0, 12.0, 22.0, 22.0, 44.0, 94.0, 138.0, 298.0, 450.0, 1024.0, 1890.0, 4124.0, 10557.0, 46350.0, 369678.0, 519733.0, 71115.0, 13597.0, 4850.0, 2185.0, 1089.0, 525.0, 296.0, 170.0, 89.0, 44.0, 29.0, 30.0, 18.0, 17.0, 6.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10198974609375, -0.0989999771118164, -0.09601020812988281, -0.09302043914794922, -0.09003067016601562, -0.08704090118408203, -0.08405113220214844, -0.08106136322021484, -0.07807159423828125, -0.07508182525634766, -0.07209205627441406, -0.06910228729248047, -0.06611251831054688, -0.06312274932861328, -0.06013298034667969, -0.057143211364746094, -0.0541534423828125, -0.051163673400878906, -0.04817390441894531, -0.04518413543701172, -0.042194366455078125, -0.03920459747314453, -0.03621482849121094, -0.033225059509277344, -0.03023529052734375, -0.027245521545410156, -0.024255752563476562, -0.02126598358154297, -0.018276214599609375, -0.015286445617675781, -0.012296676635742188, -0.009306907653808594, -0.006317138671875, -0.0033273696899414062, -0.0003376007080078125, 0.0026521682739257812, 0.005641937255859375, 0.008631706237792969, 0.011621475219726562, 0.014611244201660156, 0.01760101318359375, 0.020590782165527344, 0.023580551147460938, 0.02657032012939453, 0.029560089111328125, 0.03254985809326172, 0.03553962707519531, 0.038529396057128906, 0.0415191650390625, 0.044508934020996094, 0.04749870300292969, 0.05048847198486328, 0.053478240966796875, 0.05646800994873047, 0.05945777893066406, 0.062447547912597656, 0.06543731689453125, 0.06842708587646484, 0.07141685485839844, 0.07440662384033203, 0.07739639282226562, 0.08038616180419922, 0.08337593078613281, 0.0863656997680664, 0.08935546875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 4.0, 6.0, 10.0, 5.0, 14.0, 16.0, 13.0, 18.0, 25.0, 22.0, 27.0, 42.0, 36.0, 34.0, 55.0, 44.0, 45.0, 49.0, 40.0, 58.0, 50.0, 61.0, 43.0, 40.0, 38.0, 35.0, 24.0, 33.0, 24.0, 22.0, 12.0, 13.0, 10.0, 9.0, 5.0, 7.0, 2.0, 3.0, 5.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.448486328125, -0.4352684020996094, -0.42205047607421875, -0.4088325500488281, -0.3956146240234375, -0.3823966979980469, -0.36917877197265625, -0.3559608459472656, -0.342742919921875, -0.3295249938964844, -0.31630706787109375, -0.3030891418457031, -0.2898712158203125, -0.2766532897949219, -0.26343536376953125, -0.2502174377441406, -0.23699951171875, -0.22378158569335938, -0.21056365966796875, -0.19734573364257812, -0.1841278076171875, -0.17090988159179688, -0.15769195556640625, -0.14447402954101562, -0.131256103515625, -0.11803817749023438, -0.10482025146484375, -0.09160232543945312, -0.0783843994140625, -0.06516647338867188, -0.05194854736328125, -0.038730621337890625, -0.0255126953125, -0.012294769287109375, 0.00092315673828125, 0.014141082763671875, 0.0273590087890625, 0.040576934814453125, 0.05379486083984375, 0.06701278686523438, 0.080230712890625, 0.09344863891601562, 0.10666656494140625, 0.11988449096679688, 0.1331024169921875, 0.14632034301757812, 0.15953826904296875, 0.17275619506835938, 0.18597412109375, 0.19919204711914062, 0.21240997314453125, 0.22562789916992188, 0.2388458251953125, 0.2520637512207031, 0.26528167724609375, 0.2784996032714844, 0.291717529296875, 0.3049354553222656, 0.31815338134765625, 0.3313713073730469, 0.3445892333984375, 0.3578071594238281, 0.37102508544921875, 0.3842430114746094, 0.3974609375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 11.0, 4.0, 17.0, 20.0, 39.0, 69.0, 98.0, 187.0, 336.0, 720.0, 1429.0, 3546.0, 9546.0, 32287.0, 148293.0, 519038.0, 257746.0, 52569.0, 13973.0, 4816.0, 1940.0, 882.0, 433.0, 225.0, 133.0, 78.0, 42.0, 21.0, 11.0, 13.0, 9.0, 8.0, 7.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.0270233154296875, -0.02632451057434082, -0.02562570571899414, -0.02492690086364746, -0.02422809600830078, -0.0235292911529541, -0.022830486297607422, -0.022131681442260742, -0.021432876586914062, -0.020734071731567383, -0.020035266876220703, -0.019336462020874023, -0.018637657165527344, -0.017938852310180664, -0.017240047454833984, -0.016541242599487305, -0.015842437744140625, -0.015143632888793945, -0.014444828033447266, -0.013746023178100586, -0.013047218322753906, -0.012348413467407227, -0.011649608612060547, -0.010950803756713867, -0.010251998901367188, -0.009553194046020508, -0.008854389190673828, -0.008155584335327148, -0.007456779479980469, -0.006757974624633789, -0.006059169769287109, -0.00536036491394043, -0.00466156005859375, -0.00396275520324707, -0.0032639503479003906, -0.002565145492553711, -0.0018663406372070312, -0.0011675357818603516, -0.0004687309265136719, 0.0002300739288330078, 0.0009288787841796875, 0.0016276836395263672, 0.002326488494873047, 0.0030252933502197266, 0.0037240982055664062, 0.004422903060913086, 0.005121707916259766, 0.005820512771606445, 0.006519317626953125, 0.007218122482299805, 0.007916927337646484, 0.008615732192993164, 0.009314537048339844, 0.010013341903686523, 0.010712146759033203, 0.011410951614379883, 0.012109756469726562, 0.012808561325073242, 0.013507366180419922, 0.014206171035766602, 0.014904975891113281, 0.015603780746459961, 0.01630258560180664, 0.01700139045715332, 0.0177001953125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 8.0, 5.0, 5.0, 7.0, 11.0, 11.0, 20.0, 32.0, 35.0, 40.0, 65.0, 75.0, 82.0, 72.0, 90.0, 69.0, 80.0, 55.0, 43.0, 56.0, 36.0, 24.0, 21.0, 13.0, 9.0, 10.0, 8.0, 1.0, 3.0, 1.0, 10.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.233816146850586e-05, -1.1992640793323517e-05, -1.1647120118141174e-05, -1.1301599442958832e-05, -1.095607876777649e-05, -1.0610558092594147e-05, -1.0265037417411804e-05, -9.919516742229462e-06, -9.573996067047119e-06, -9.228475391864777e-06, -8.882954716682434e-06, -8.537434041500092e-06, -8.191913366317749e-06, -7.846392691135406e-06, -7.500872015953064e-06, -7.1553513407707214e-06, -6.809830665588379e-06, -6.464309990406036e-06, -6.118789315223694e-06, -5.773268640041351e-06, -5.427747964859009e-06, -5.082227289676666e-06, -4.736706614494324e-06, -4.391185939311981e-06, -4.045665264129639e-06, -3.700144588947296e-06, -3.3546239137649536e-06, -3.009103238582611e-06, -2.6635825634002686e-06, -2.318061888217926e-06, -1.9725412130355835e-06, -1.627020537853241e-06, -1.2814998626708984e-06, -9.359791874885559e-07, -5.904585123062134e-07, -2.4493783712387085e-07, 1.0058283805847168e-07, 4.461035132408142e-07, 7.916241884231567e-07, 1.1371448636054993e-06, 1.4826655387878418e-06, 1.8281862139701843e-06, 2.173706889152527e-06, 2.5192275643348694e-06, 2.864748239517212e-06, 3.2102689146995544e-06, 3.555789589881897e-06, 3.9013102650642395e-06, 4.246830940246582e-06, 4.5923516154289246e-06, 4.937872290611267e-06, 5.28339296579361e-06, 5.628913640975952e-06, 5.974434316158295e-06, 6.319954991340637e-06, 6.66547566652298e-06, 7.010996341705322e-06, 7.356517016887665e-06, 7.702037692070007e-06, 8.04755836725235e-06, 8.393079042434692e-06, 8.738599717617035e-06, 9.084120392799377e-06, 9.42964106798172e-06, 9.775161743164062e-06]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 4.0, 4.0, 10.0, 17.0, 21.0, 29.0, 55.0, 74.0, 105.0, 214.0, 307.0, 569.0, 992.0, 2034.0, 4311.0, 10650.0, 31472.0, 112457.0, 357098.0, 361025.0, 115289.0, 31996.0, 11024.0, 4392.0, 1942.0, 1045.0, 553.0, 323.0, 182.0, 116.0, 68.0, 45.0, 31.0, 31.0, 20.0, 16.0, 13.0, 2.0, 3.0, 7.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0190887451171875, -0.018473148345947266, -0.01785755157470703, -0.017241954803466797, -0.016626358032226562, -0.016010761260986328, -0.015395164489746094, -0.01477956771850586, -0.014163970947265625, -0.01354837417602539, -0.012932777404785156, -0.012317180633544922, -0.011701583862304688, -0.011085987091064453, -0.010470390319824219, -0.009854793548583984, -0.00923919677734375, -0.008623600006103516, -0.008008003234863281, -0.007392406463623047, -0.0067768096923828125, -0.006161212921142578, -0.005545616149902344, -0.004930019378662109, -0.004314422607421875, -0.0036988258361816406, -0.0030832290649414062, -0.002467632293701172, -0.0018520355224609375, -0.0012364387512207031, -0.0006208419799804688, -5.245208740234375e-06, 0.0006103515625, 0.0012259483337402344, 0.0018415451049804688, 0.002457141876220703, 0.0030727386474609375, 0.003688335418701172, 0.004303932189941406, 0.004919528961181641, 0.005535125732421875, 0.006150722503662109, 0.006766319274902344, 0.007381916046142578, 0.007997512817382812, 0.008613109588623047, 0.009228706359863281, 0.009844303131103516, 0.01045989990234375, 0.011075496673583984, 0.011691093444824219, 0.012306690216064453, 0.012922286987304688, 0.013537883758544922, 0.014153480529785156, 0.01476907730102539, 0.015384674072265625, 0.01600027084350586, 0.016615867614746094, 0.017231464385986328, 0.017847061157226562, 0.018462657928466797, 0.01907825469970703, 0.019693851470947266, 0.0203094482421875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 1.0, 6.0, 5.0, 7.0, 11.0, 13.0, 17.0, 23.0, 18.0, 45.0, 51.0, 78.0, 80.0, 94.0, 82.0, 86.0, 69.0, 71.0, 64.0, 49.0, 47.0, 23.0, 14.0, 15.0, 9.0, 5.0, 5.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00616455078125, -0.005955398082733154, -0.005746245384216309, -0.005537092685699463, -0.005327939987182617, -0.0051187872886657715, -0.004909634590148926, -0.00470048189163208, -0.004491329193115234, -0.004282176494598389, -0.004073023796081543, -0.0038638710975646973, -0.0036547183990478516, -0.003445565700531006, -0.00323641300201416, -0.0030272603034973145, -0.0028181076049804688, -0.002608954906463623, -0.0023998022079467773, -0.0021906495094299316, -0.001981496810913086, -0.0017723441123962402, -0.0015631914138793945, -0.0013540387153625488, -0.0011448860168457031, -0.0009357333183288574, -0.0007265806198120117, -0.000517427921295166, -0.0003082752227783203, -9.912252426147461e-05, 0.0001100301742553711, 0.0003191828727722168, 0.0005283355712890625, 0.0007374882698059082, 0.0009466409683227539, 0.0011557936668395996, 0.0013649463653564453, 0.001574099063873291, 0.0017832517623901367, 0.0019924044609069824, 0.002201557159423828, 0.002410709857940674, 0.0026198625564575195, 0.0028290152549743652, 0.003038167953491211, 0.0032473206520080566, 0.0034564733505249023, 0.003665626049041748, 0.0038747787475585938, 0.0040839314460754395, 0.004293084144592285, 0.004502236843109131, 0.0047113895416259766, 0.004920542240142822, 0.005129694938659668, 0.005338847637176514, 0.005548000335693359, 0.005757153034210205, 0.005966305732727051, 0.0061754584312438965, 0.006384611129760742, 0.006593763828277588, 0.006802916526794434, 0.007012069225311279, 0.007221221923828125]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 8.0, 21.0, 66.0, 157.0, 303.0, 266.0, 110.0, 47.0, 21.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.535526156425476, -1.505895972251892, -1.4762659072875977, -1.4466357231140137, -1.4170055389404297, -1.3873753547668457, -1.3577452898025513, -1.3281151056289673, -1.2984849214553833, -1.2688547372817993, -1.2392246723175049, -1.209594488143921, -1.179964303970337, -1.150334119796753, -1.1207040548324585, -1.0910738706588745, -1.0614436864852905, -1.0318135023117065, -1.002183437347412, -0.9725532531738281, -0.9429230690002441, -0.9132929444313049, -0.883662760257721, -0.8540326356887817, -0.8244025111198425, -0.7947723865509033, -0.7651422023773193, -0.7355120778083801, -0.7058818936347961, -0.6762517690658569, -0.646621584892273, -0.6169914603233337, -0.5873612761497498, -0.5577311515808105, -0.5281009674072266, -0.49847081303596497, -0.46884065866470337, -0.43921053409576416, -0.4095803499221802, -0.37995022535324097, -0.350320041179657, -0.3206898868083954, -0.2910597324371338, -0.2614295780658722, -0.2317994236946106, -0.2021692842245102, -0.1725391298532486, -0.142908975481987, -0.1132788360118866, -0.083648681640625, -0.0540185309946537, -0.024388380348682404, 0.005241774022579193, 0.03487192094326019, 0.06450207531452179, 0.09413222968578339, 0.12376238405704498, 0.15339253842830658, 0.18302269279956818, 0.21265283226966858, 0.24228298664093018, 0.2719131410121918, 0.30154329538345337, 0.33117344975471497, 0.36080360412597656]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 8.0, 4.0, 7.0, 7.0, 15.0, 20.0, 13.0, 38.0, 25.0, 45.0, 40.0, 42.0, 46.0, 79.0, 65.0, 43.0, 62.0, 60.0, 51.0, 66.0, 53.0, 48.0, 34.0, 44.0, 27.0, 14.0, 13.0, 12.0, 10.0, 0.0, 5.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2019055187702179, -0.19379085302352905, -0.1856761872768402, -0.17756153643131256, -0.16944687068462372, -0.16133220493793488, -0.15321755409240723, -0.14510288834571838, -0.13698822259902954, -0.1288735568523407, -0.12075889855623245, -0.1126442402601242, -0.10452957451343536, -0.09641490876674652, -0.08830025047063828, -0.08018559217453003, -0.07207092642784119, -0.06395626068115234, -0.0558416023850441, -0.047726940363645554, -0.03961227834224701, -0.031497616320848465, -0.02338295429944992, -0.015268292278051376, -0.007153630256652832, 0.0009610317647457123, 0.009075693786144257, 0.0171903558075428, 0.025305017828941345, 0.03341967985033989, 0.041534341871738434, 0.04964900389313698, 0.057763636112213135, 0.06587830185890198, 0.07399296015501022, 0.08210761845111847, 0.09022228419780731, 0.09833694994449615, 0.1064516082406044, 0.11456626653671265, 0.12268093228340149, 0.13079559803009033, 0.13891026377677917, 0.14702491462230682, 0.15513958036899567, 0.1632542461156845, 0.17136889696121216, 0.179483562707901, 0.18759822845458984, 0.1957128942012787, 0.20382755994796753, 0.21194221079349518, 0.22005687654018402, 0.22817154228687286, 0.2362861931324005, 0.24440085887908936, 0.2525155246257782, 0.26063019037246704, 0.2687448561191559, 0.2768595218658447, 0.2849741578102112, 0.2930888235569, 0.30120348930358887, 0.3093181550502777, 0.31743282079696655]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 7.0, 5.0, 1.0, 8.0, 14.0, 26.0, 27.0, 54.0, 88.0, 120.0, 226.0, 402.0, 795.0, 1746.0, 4364.0, 14299.0, 68547.0, 712619.0, 202424.0, 30038.0, 7713.0, 2616.0, 1113.0, 610.0, 270.0, 149.0, 101.0, 61.0, 39.0, 20.0, 18.0, 13.0, 9.0, 5.0, 5.0, 5.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.293212890625, -0.2856464385986328, -0.2780799865722656, -0.27051353454589844, -0.26294708251953125, -0.25538063049316406, -0.24781417846679688, -0.2402477264404297, -0.2326812744140625, -0.2251148223876953, -0.21754837036132812, -0.20998191833496094, -0.20241546630859375, -0.19484901428222656, -0.18728256225585938, -0.1797161102294922, -0.172149658203125, -0.1645832061767578, -0.15701675415039062, -0.14945030212402344, -0.14188385009765625, -0.13431739807128906, -0.12675094604492188, -0.11918449401855469, -0.1116180419921875, -0.10405158996582031, -0.09648513793945312, -0.08891868591308594, -0.08135223388671875, -0.07378578186035156, -0.06621932983398438, -0.05865287780761719, -0.05108642578125, -0.04351997375488281, -0.035953521728515625, -0.028387069702148438, -0.02082061767578125, -0.013254165649414062, -0.005687713623046875, 0.0018787384033203125, 0.0094451904296875, 0.017011642456054688, 0.024578094482421875, 0.03214454650878906, 0.03971099853515625, 0.04727745056152344, 0.054843902587890625, 0.06241035461425781, 0.069976806640625, 0.07754325866699219, 0.08510971069335938, 0.09267616271972656, 0.10024261474609375, 0.10780906677246094, 0.11537551879882812, 0.12294197082519531, 0.1305084228515625, 0.1380748748779297, 0.14564132690429688, 0.15320777893066406, 0.16077423095703125, 0.16834068298339844, 0.17590713500976562, 0.1834735870361328, 0.1910400390625]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 7.0, 4.0, 4.0, 8.0, 9.0, 9.0, 14.0, 29.0, 19.0, 41.0, 44.0, 43.0, 50.0, 56.0, 54.0, 71.0, 52.0, 71.0, 69.0, 68.0, 47.0, 55.0, 44.0, 35.0, 28.0, 25.0, 12.0, 10.0, 9.0, 7.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.483642578125, -0.4661293029785156, -0.44861602783203125, -0.4311027526855469, -0.4135894775390625, -0.3960762023925781, -0.37856292724609375, -0.3610496520996094, -0.343536376953125, -0.3260231018066406, -0.30850982666015625, -0.2909965515136719, -0.2734832763671875, -0.2559700012207031, -0.23845672607421875, -0.22094345092773438, -0.20343017578125, -0.18591690063476562, -0.16840362548828125, -0.15089035034179688, -0.1333770751953125, -0.11586380004882812, -0.09835052490234375, -0.08083724975585938, -0.063323974609375, -0.045810699462890625, -0.02829742431640625, -0.010784149169921875, 0.0067291259765625, 0.024242401123046875, 0.04175567626953125, 0.059268951416015625, 0.0767822265625, 0.09429550170898438, 0.11180877685546875, 0.12932205200195312, 0.1468353271484375, 0.16434860229492188, 0.18186187744140625, 0.19937515258789062, 0.216888427734375, 0.23440170288085938, 0.25191497802734375, 0.2694282531738281, 0.2869415283203125, 0.3044548034667969, 0.32196807861328125, 0.3394813537597656, 0.35699462890625, 0.3745079040527344, 0.39202117919921875, 0.4095344543457031, 0.4270477294921875, 0.4445610046386719, 0.46207427978515625, 0.4795875549316406, 0.497100830078125, 0.5146141052246094, 0.5321273803710938, 0.5496406555175781, 0.5671539306640625, 0.5846672058105469, 0.6021804809570312, 0.6196937561035156, 0.63720703125]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 8.0, 1.0, 1.0, 5.0, 7.0, 9.0, 7.0, 9.0, 17.0, 12.0, 20.0, 27.0, 26.0, 34.0, 51.0, 74.0, 104.0, 198.0, 467.0, 2140.0, 49428.0, 981140.0, 12774.0, 1154.0, 345.0, 153.0, 98.0, 60.0, 33.0, 34.0, 31.0, 13.0, 17.0, 22.0, 8.0, 3.0, 8.0, 6.0, 5.0, 4.0, 4.0, 1.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.84912109375, -0.8257522583007812, -0.8023834228515625, -0.7790145874023438, -0.755645751953125, -0.7322769165039062, -0.7089080810546875, -0.6855392456054688, -0.66217041015625, -0.6388015747070312, -0.6154327392578125, -0.5920639038085938, -0.568695068359375, -0.5453262329101562, -0.5219573974609375, -0.49858856201171875, -0.4752197265625, -0.45185089111328125, -0.4284820556640625, -0.40511322021484375, -0.381744384765625, -0.35837554931640625, -0.3350067138671875, -0.31163787841796875, -0.28826904296875, -0.26490020751953125, -0.2415313720703125, -0.21816253662109375, -0.194793701171875, -0.17142486572265625, -0.1480560302734375, -0.12468719482421875, -0.101318359375, -0.07794952392578125, -0.0545806884765625, -0.03121185302734375, -0.007843017578125, 0.01552581787109375, 0.0388946533203125, 0.06226348876953125, 0.08563232421875, 0.10900115966796875, 0.1323699951171875, 0.15573883056640625, 0.179107666015625, 0.20247650146484375, 0.2258453369140625, 0.24921417236328125, 0.2725830078125, 0.29595184326171875, 0.3193206787109375, 0.34268951416015625, 0.366058349609375, 0.38942718505859375, 0.4127960205078125, 0.43616485595703125, 0.45953369140625, 0.48290252685546875, 0.5062713623046875, 0.5296401977539062, 0.553009033203125, 0.5763778686523438, 0.5997467041015625, 0.6231155395507812, 0.646484375]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 0.0, 2.0, 5.0, 7.0, 5.0, 5.0, 11.0, 7.0, 9.0, 15.0, 13.0, 15.0, 25.0, 21.0, 23.0, 34.0, 38.0, 36.0, 35.0, 45.0, 47.0, 41.0, 45.0, 48.0, 49.0, 38.0, 57.0, 45.0, 44.0, 30.0, 26.0, 30.0, 24.0, 18.0, 26.0, 16.0, 13.0, 18.0, 8.0, 7.0, 5.0, 2.0, 7.0, 6.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.56396484375, -0.5485496520996094, -0.5331344604492188, -0.5177192687988281, -0.5023040771484375, -0.4868888854980469, -0.47147369384765625, -0.4560585021972656, -0.440643310546875, -0.4252281188964844, -0.40981292724609375, -0.3943977355957031, -0.3789825439453125, -0.3635673522949219, -0.34815216064453125, -0.3327369689941406, -0.31732177734375, -0.3019065856933594, -0.28649139404296875, -0.2710762023925781, -0.2556610107421875, -0.24024581909179688, -0.22483062744140625, -0.20941543579101562, -0.194000244140625, -0.17858505249023438, -0.16316986083984375, -0.14775466918945312, -0.1323394775390625, -0.11692428588867188, -0.10150909423828125, -0.08609390258789062, -0.0706787109375, -0.055263519287109375, -0.03984832763671875, -0.024433135986328125, -0.0090179443359375, 0.006397247314453125, 0.02181243896484375, 0.037227630615234375, 0.052642822265625, 0.06805801391601562, 0.08347320556640625, 0.09888839721679688, 0.1143035888671875, 0.12971878051757812, 0.14513397216796875, 0.16054916381835938, 0.17596435546875, 0.19137954711914062, 0.20679473876953125, 0.22220993041992188, 0.2376251220703125, 0.2530403137207031, 0.26845550537109375, 0.2838706970214844, 0.299285888671875, 0.3147010803222656, 0.33011627197265625, 0.3455314636230469, 0.3609466552734375, 0.3763618469238281, 0.39177703857421875, 0.4071922302246094, 0.422607421875]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 9.0, 6.0, 6.0, 28.0, 37.0, 70.0, 134.0, 321.0, 865.0, 4222.0, 686244.0, 351539.0, 3815.0, 786.0, 270.0, 109.0, 52.0, 28.0, 9.0, 5.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.188720703125, -0.17927169799804688, -0.16982269287109375, -0.16037368774414062, -0.1509246826171875, -0.14147567749023438, -0.13202667236328125, -0.12257766723632812, -0.113128662109375, -0.10367965698242188, -0.09423065185546875, -0.08478164672851562, -0.0753326416015625, -0.06588363647460938, -0.05643463134765625, -0.046985626220703125, -0.03753662109375, -0.028087615966796875, -0.01863861083984375, -0.009189605712890625, 0.0002593994140625, 0.009708404541015625, 0.01915740966796875, 0.028606414794921875, 0.038055419921875, 0.047504425048828125, 0.05695343017578125, 0.06640243530273438, 0.0758514404296875, 0.08530044555664062, 0.09474945068359375, 0.10419845581054688, 0.1136474609375, 0.12309646606445312, 0.13254547119140625, 0.14199447631835938, 0.1514434814453125, 0.16089248657226562, 0.17034149169921875, 0.17979049682617188, 0.189239501953125, 0.19868850708007812, 0.20813751220703125, 0.21758651733398438, 0.2270355224609375, 0.23648452758789062, 0.24593353271484375, 0.2553825378417969, 0.26483154296875, 0.2742805480957031, 0.28372955322265625, 0.2931785583496094, 0.3026275634765625, 0.3120765686035156, 0.32152557373046875, 0.3309745788574219, 0.340423583984375, 0.3498725891113281, 0.35932159423828125, 0.3687705993652344, 0.3782196044921875, 0.3876686096191406, 0.39711761474609375, 0.4065666198730469, 0.416015625]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 7.0, 4.0, 17.0, 11.0, 28.0, 50.0, 72.0, 152.0, 320.0, 162.0, 73.0, 39.0, 13.0, 16.0, 18.0, 8.0, 7.0, 2.0, 5.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3530254364013672e-05, -1.271069049835205e-05, -1.189112663269043e-05, -1.1071562767028809e-05, -1.0251998901367188e-05, -9.432435035705566e-06, -8.612871170043945e-06, -7.793307304382324e-06, -6.973743438720703e-06, -6.154179573059082e-06, -5.334615707397461e-06, -4.51505184173584e-06, -3.6954879760742188e-06, -2.8759241104125977e-06, -2.0563602447509766e-06, -1.2367963790893555e-06, -4.172325134277344e-07, 4.023313522338867e-07, 1.2218952178955078e-06, 2.041459083557129e-06, 2.86102294921875e-06, 3.680586814880371e-06, 4.500150680541992e-06, 5.319714546203613e-06, 6.139278411865234e-06, 6.9588422775268555e-06, 7.778406143188477e-06, 8.597970008850098e-06, 9.417533874511719e-06, 1.023709774017334e-05, 1.1056661605834961e-05, 1.1876225471496582e-05, 1.2695789337158203e-05, 1.3515353202819824e-05, 1.4334917068481445e-05, 1.5154480934143066e-05, 1.5974044799804688e-05, 1.679360866546631e-05, 1.761317253112793e-05, 1.843273639678955e-05, 1.9252300262451172e-05, 2.0071864128112793e-05, 2.0891427993774414e-05, 2.1710991859436035e-05, 2.2530555725097656e-05, 2.3350119590759277e-05, 2.41696834564209e-05, 2.498924732208252e-05, 2.580881118774414e-05, 2.6628375053405762e-05, 2.7447938919067383e-05, 2.8267502784729004e-05, 2.9087066650390625e-05, 2.9906630516052246e-05, 3.072619438171387e-05, 3.154575824737549e-05, 3.236532211303711e-05, 3.318488597869873e-05, 3.400444984436035e-05, 3.482401371002197e-05, 3.5643577575683594e-05, 3.6463141441345215e-05, 3.7282705307006836e-05, 3.810226917266846e-05, 3.892183303833008e-05]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 8.0, 4.0, 15.0, 22.0, 21.0, 60.0, 98.0, 168.0, 453.0, 1758.0, 96398.0, 944620.0, 3799.0, 606.0, 235.0, 120.0, 77.0, 41.0, 28.0, 13.0, 7.0, 5.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.51953125, -0.5059165954589844, -0.49230194091796875, -0.4786872863769531, -0.4650726318359375, -0.4514579772949219, -0.43784332275390625, -0.4242286682128906, -0.410614013671875, -0.3969993591308594, -0.38338470458984375, -0.3697700500488281, -0.3561553955078125, -0.3425407409667969, -0.32892608642578125, -0.3153114318847656, -0.30169677734375, -0.2880821228027344, -0.27446746826171875, -0.2608528137207031, -0.2472381591796875, -0.23362350463867188, -0.22000885009765625, -0.20639419555664062, -0.192779541015625, -0.17916488647460938, -0.16555023193359375, -0.15193557739257812, -0.1383209228515625, -0.12470626831054688, -0.11109161376953125, -0.09747695922851562, -0.0838623046875, -0.07024765014648438, -0.05663299560546875, -0.043018341064453125, -0.0294036865234375, -0.015789031982421875, -0.00217437744140625, 0.011440277099609375, 0.025054931640625, 0.038669586181640625, 0.05228424072265625, 0.06589889526367188, 0.0795135498046875, 0.09312820434570312, 0.10674285888671875, 0.12035751342773438, 0.13397216796875, 0.14758682250976562, 0.16120147705078125, 0.17481613159179688, 0.1884307861328125, 0.20204544067382812, 0.21566009521484375, 0.22927474975585938, 0.242889404296875, 0.2565040588378906, 0.27011871337890625, 0.2837333679199219, 0.2973480224609375, 0.3109626770019531, 0.32457733154296875, 0.3381919860839844, 0.351806640625]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 6.0, 16.0, 32.0, 48.0, 122.0, 420.0, 212.0, 81.0, 37.0, 25.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0919189453125, -0.08847808837890625, -0.0850372314453125, -0.08159637451171875, -0.078155517578125, -0.07471466064453125, -0.0712738037109375, -0.06783294677734375, -0.06439208984375, -0.06095123291015625, -0.0575103759765625, -0.05406951904296875, -0.050628662109375, -0.04718780517578125, -0.0437469482421875, -0.04030609130859375, -0.036865234375, -0.03342437744140625, -0.0299835205078125, -0.02654266357421875, -0.023101806640625, -0.01966094970703125, -0.0162200927734375, -0.01277923583984375, -0.00933837890625, -0.00589752197265625, -0.0024566650390625, 0.00098419189453125, 0.004425048828125, 0.00786590576171875, 0.0113067626953125, 0.01474761962890625, 0.0181884765625, 0.02162933349609375, 0.0250701904296875, 0.02851104736328125, 0.031951904296875, 0.03539276123046875, 0.0388336181640625, 0.04227447509765625, 0.04571533203125, 0.04915618896484375, 0.0525970458984375, 0.05603790283203125, 0.059478759765625, 0.06291961669921875, 0.0663604736328125, 0.06980133056640625, 0.0732421875, 0.07668304443359375, 0.0801239013671875, 0.08356475830078125, 0.087005615234375, 0.09044647216796875, 0.0938873291015625, 0.09732818603515625, 0.10076904296875, 0.10420989990234375, 0.1076507568359375, 0.11109161376953125, 0.114532470703125, 0.11797332763671875, 0.1214141845703125, 0.12485504150390625, 0.1282958984375]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 10.0, 9.0, 12.0, 20.0, 29.0, 48.0, 72.0, 93.0, 105.0, 133.0, 118.0, 111.0, 73.0, 48.0, 43.0, 23.0, 15.0, 16.0, 10.0, 4.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6792455315589905, -0.6547520756721497, -0.6302586197853088, -0.605765163898468, -0.5812717080116272, -0.5567782521247864, -0.5322847366333008, -0.50779128074646, -0.48329785466194153, -0.4588043987751007, -0.4343109428882599, -0.4098174571990967, -0.38532400131225586, -0.36083054542541504, -0.3363370895385742, -0.3118436336517334, -0.2873501777648926, -0.26285672187805176, -0.23836326599121094, -0.21386979520320892, -0.1893763393163681, -0.16488288342952728, -0.14038941264152527, -0.11589595675468445, -0.09140250086784363, -0.06690904498100281, -0.04241558164358139, -0.017922118306159973, 0.006571337580680847, 0.031064793467521667, 0.05555826425552368, 0.0800517201423645, 0.10454511642456055, 0.12903857231140137, 0.1535320281982422, 0.1780254989862442, 0.20251895487308502, 0.22701241075992584, 0.25150588154792786, 0.2759993374347687, 0.3004927933216095, 0.3249862492084503, 0.34947970509529114, 0.37397319078445435, 0.39846664667129517, 0.422960102558136, 0.4474535584449768, 0.4719470143318176, 0.49644047021865845, 0.5209339261054993, 0.5454273819923401, 0.5699208378791809, 0.5944142937660217, 0.6189077496528625, 0.6434012651443481, 0.667894721031189, 0.6923881769180298, 0.7168816328048706, 0.7413750886917114, 0.7658685445785522, 0.7903620004653931, 0.8148554563522339, 0.8393489122390747, 0.8638423681259155, 0.8883358240127563]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 4.0, 7.0, 4.0, 4.0, 4.0, 7.0, 11.0, 13.0, 18.0, 16.0, 24.0, 26.0, 24.0, 22.0, 35.0, 41.0, 44.0, 46.0, 45.0, 51.0, 40.0, 54.0, 40.0, 43.0, 39.0, 34.0, 30.0, 33.0, 34.0, 24.0, 37.0, 27.0, 23.0, 11.0, 20.0, 16.0, 17.0, 6.0, 8.0, 8.0, 6.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.7886910438537598, -0.7644833326339722, -0.7402756214141846, -0.716067910194397, -0.6918601989746094, -0.6676525473594666, -0.643444836139679, -0.6192371249198914, -0.5950294137001038, -0.5708217024803162, -0.5466139912605286, -0.522406280040741, -0.49819859862327576, -0.47399088740348816, -0.44978320598602295, -0.42557549476623535, -0.40136778354644775, -0.37716007232666016, -0.35295236110687256, -0.32874467968940735, -0.30453696846961975, -0.28032925724983215, -0.25612157583236694, -0.23191386461257935, -0.20770615339279175, -0.18349844217300415, -0.15929074585437775, -0.13508304953575134, -0.11087533831596375, -0.08666763454675674, -0.062459930777549744, -0.03825223445892334, -0.014044463634490967, 0.010163240134716034, 0.034370943903923035, 0.058578647673130035, 0.08278635144233704, 0.10699405521154404, 0.13120175898075104, 0.15540945529937744, 0.17961716651916504, 0.20382487773895264, 0.22803257405757904, 0.25224027037620544, 0.27644798159599304, 0.30065569281578064, 0.32486337423324585, 0.34907108545303345, 0.37327879667282104, 0.39748650789260864, 0.42169421911239624, 0.44590190052986145, 0.47010961174964905, 0.49431732296943665, 0.5185250043869019, 0.5427327156066895, 0.566940426826477, 0.5911481380462646, 0.6153558492660522, 0.6395635604858398, 0.6637712717056274, 0.6879789233207703, 0.7121866345405579, 0.7363943457603455, 0.7606020569801331]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 8.0, 13.0, 18.0, 31.0, 69.0, 129.0, 297.0, 733.0, 5725.0, 1763183.0, 2416608.0, 6117.0, 821.0, 303.0, 124.0, 64.0, 26.0, 11.0, 7.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.833984375, -2.7784347534179688, -2.7228851318359375, -2.6673355102539062, -2.611785888671875, -2.5562362670898438, -2.5006866455078125, -2.4451370239257812, -2.38958740234375, -2.3340377807617188, -2.2784881591796875, -2.2229385375976562, -2.167388916015625, -2.1118392944335938, -2.0562896728515625, -2.0007400512695312, -1.9451904296875, -1.8896408081054688, -1.8340911865234375, -1.7785415649414062, -1.722991943359375, -1.6674423217773438, -1.6118927001953125, -1.5563430786132812, -1.50079345703125, -1.4452438354492188, -1.3896942138671875, -1.3341445922851562, -1.278594970703125, -1.2230453491210938, -1.1674957275390625, -1.1119461059570312, -1.056396484375, -1.0008468627929688, -0.9452972412109375, -0.8897476196289062, -0.834197998046875, -0.7786483764648438, -0.7230987548828125, -0.6675491333007812, -0.61199951171875, -0.5564498901367188, -0.5009002685546875, -0.44535064697265625, -0.389801025390625, -0.33425140380859375, -0.2787017822265625, -0.22315216064453125, -0.1676025390625, -0.11205291748046875, -0.0565032958984375, -0.00095367431640625, 0.054595947265625, 0.11014556884765625, 0.1656951904296875, 0.22124481201171875, 0.27679443359375, 0.33234405517578125, 0.3878936767578125, 0.44344329833984375, 0.498992919921875, 0.5545425415039062, 0.6100921630859375, 0.6656417846679688, 0.72119140625]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 3.0, 4.0, 6.0, 6.0, 6.0, 12.0, 8.0, 22.0, 20.0, 24.0, 33.0, 51.0, 52.0, 63.0, 63.0, 55.0, 75.0, 68.0, 72.0, 65.0, 61.0, 51.0, 41.0, 41.0, 26.0, 25.0, 13.0, 16.0, 9.0, 7.0, 2.0, 5.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2705078125, -0.2605018615722656, -0.25049591064453125, -0.24048995971679688, -0.2304840087890625, -0.22047805786132812, -0.21047210693359375, -0.20046615600585938, -0.190460205078125, -0.18045425415039062, -0.17044830322265625, -0.16044235229492188, -0.1504364013671875, -0.14043045043945312, -0.13042449951171875, -0.12041854858398438, -0.11041259765625, -0.10040664672851562, -0.09040069580078125, -0.08039474487304688, -0.0703887939453125, -0.060382843017578125, -0.05037689208984375, -0.040370941162109375, -0.030364990234375, -0.020359039306640625, -0.01035308837890625, -0.000347137451171875, 0.0096588134765625, 0.019664764404296875, 0.02967071533203125, 0.039676666259765625, 0.0496826171875, 0.059688568115234375, 0.06969451904296875, 0.07970046997070312, 0.0897064208984375, 0.09971237182617188, 0.10971832275390625, 0.11972427368164062, 0.129730224609375, 0.13973617553710938, 0.14974212646484375, 0.15974807739257812, 0.1697540283203125, 0.17975997924804688, 0.18976593017578125, 0.19977188110351562, 0.20977783203125, 0.21978378295898438, 0.22978973388671875, 0.23979568481445312, 0.2498016357421875, 0.2598075866699219, 0.26981353759765625, 0.2798194885253906, 0.289825439453125, 0.2998313903808594, 0.30983734130859375, 0.3198432922363281, 0.3298492431640625, 0.3398551940917969, 0.34986114501953125, 0.3598670959472656, 0.369873046875]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 5.0, 4.0, 11.0, 23.0, 36.0, 69.0, 178.0, 460.0, 1570.0, 7138.0, 69682.0, 3868926.0, 229697.0, 12979.0, 2441.0, 614.0, 251.0, 104.0, 58.0, 19.0, 8.0, 6.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.767578125, -0.7387847900390625, -0.709991455078125, -0.6811981201171875, -0.65240478515625, -0.6236114501953125, -0.594818115234375, -0.5660247802734375, -0.5372314453125, -0.5084381103515625, -0.479644775390625, -0.4508514404296875, -0.42205810546875, -0.3932647705078125, -0.364471435546875, -0.3356781005859375, -0.306884765625, -0.2780914306640625, -0.249298095703125, -0.2205047607421875, -0.19171142578125, -0.1629180908203125, -0.134124755859375, -0.1053314208984375, -0.0765380859375, -0.0477447509765625, -0.018951416015625, 0.0098419189453125, 0.03863525390625, 0.0674285888671875, 0.096221923828125, 0.1250152587890625, 0.15380859375, 0.1826019287109375, 0.211395263671875, 0.2401885986328125, 0.26898193359375, 0.2977752685546875, 0.326568603515625, 0.3553619384765625, 0.3841552734375, 0.4129486083984375, 0.441741943359375, 0.4705352783203125, 0.49932861328125, 0.5281219482421875, 0.556915283203125, 0.5857086181640625, 0.614501953125, 0.6432952880859375, 0.672088623046875, 0.7008819580078125, 0.72967529296875, 0.7584686279296875, 0.787261962890625, 0.8160552978515625, 0.8448486328125, 0.8736419677734375, 0.902435302734375, 0.9312286376953125, 0.96002197265625, 0.9888153076171875, 1.017608642578125, 1.0464019775390625, 1.0751953125]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 0.0, 10.0, 4.0, 5.0, 8.0, 12.0, 20.0, 26.0, 30.0, 47.0, 78.0, 142.0, 240.0, 395.0, 723.0, 856.0, 645.0, 339.0, 193.0, 101.0, 57.0, 39.0, 28.0, 20.0, 16.0, 11.0, 8.0, 4.0, 6.0, 7.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16357421875, -0.15850448608398438, -0.15343475341796875, -0.14836502075195312, -0.1432952880859375, -0.13822555541992188, -0.13315582275390625, -0.12808609008789062, -0.123016357421875, -0.11794662475585938, -0.11287689208984375, -0.10780715942382812, -0.1027374267578125, -0.09766769409179688, -0.09259796142578125, -0.08752822875976562, -0.08245849609375, -0.07738876342773438, -0.07231903076171875, -0.06724929809570312, -0.0621795654296875, -0.057109832763671875, -0.05204010009765625, -0.046970367431640625, -0.041900634765625, -0.036830902099609375, -0.03176116943359375, -0.026691436767578125, -0.0216217041015625, -0.016551971435546875, -0.01148223876953125, -0.006412506103515625, -0.0013427734375, 0.003726959228515625, 0.00879669189453125, 0.013866424560546875, 0.0189361572265625, 0.024005889892578125, 0.02907562255859375, 0.034145355224609375, 0.039215087890625, 0.044284820556640625, 0.04935455322265625, 0.054424285888671875, 0.0594940185546875, 0.06456375122070312, 0.06963348388671875, 0.07470321655273438, 0.07977294921875, 0.08484268188476562, 0.08991241455078125, 0.09498214721679688, 0.1000518798828125, 0.10512161254882812, 0.11019134521484375, 0.11526107788085938, 0.120330810546875, 0.12540054321289062, 0.13047027587890625, 0.13554000854492188, 0.1406097412109375, 0.14567947387695312, 0.15074920654296875, 0.15581893920898438, 0.160888671875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 6.0, 3.0, 8.0, 14.0, 14.0, 24.0, 38.0, 65.0, 76.0, 99.0, 117.0, 143.0, 122.0, 86.0, 67.0, 49.0, 25.0, 19.0, 10.0, 17.0, 7.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6090251207351685, -0.5889208316802979, -0.5688165426254272, -0.5487122535705566, -0.5286079049110413, -0.5085036158561707, -0.48839932680130005, -0.46829503774642944, -0.44819074869155884, -0.42808645963668823, -0.40798214077949524, -0.38787785172462463, -0.36777356266975403, -0.34766924381256104, -0.32756495475769043, -0.3074606657028198, -0.28735634684562683, -0.2672520577907562, -0.24714775383472443, -0.22704344987869263, -0.20693916082382202, -0.18683485686779022, -0.16673055291175842, -0.14662626385688782, -0.12652195990085602, -0.10641766339540482, -0.08631336688995361, -0.06620906293392181, -0.04610476642847061, -0.02600046992301941, -0.00589616596698761, 0.014208123087882996, 0.034312427043914795, 0.054416723549366, 0.0745210200548172, 0.094625324010849, 0.1147296205163002, 0.1348339170217514, 0.1549382209777832, 0.1750425100326538, 0.1951468139886856, 0.2152511179447174, 0.235355406999588, 0.255459725856781, 0.2755640149116516, 0.2956683039665222, 0.3157725930213928, 0.3358768820762634, 0.3559812009334564, 0.376085489988327, 0.39618980884552, 0.4162940979003906, 0.43639838695526123, 0.45650267601013184, 0.47660699486732483, 0.49671128392219543, 0.5168156027793884, 0.536919891834259, 0.5570241808891296, 0.577128529548645, 0.5972328186035156, 0.6173371076583862, 0.6374413967132568, 0.6575456857681274, 0.677649974822998]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 4.0, 3.0, 2.0, 6.0, 6.0, 11.0, 5.0, 9.0, 9.0, 14.0, 7.0, 17.0, 14.0, 29.0, 32.0, 37.0, 43.0, 42.0, 38.0, 34.0, 33.0, 37.0, 49.0, 48.0, 50.0, 37.0, 34.0, 47.0, 30.0, 48.0, 24.0, 27.0, 28.0, 19.0, 21.0, 16.0, 22.0, 24.0, 17.0, 9.0, 3.0, 7.0, 7.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2784426212310791, -0.269459992647171, -0.2604773938655853, -0.25149476528167725, -0.24251215159893036, -0.23352953791618347, -0.22454692423343658, -0.2155643105506897, -0.20658168196678162, -0.19759906828403473, -0.18861645460128784, -0.17963382601737976, -0.17065121233463287, -0.161668598651886, -0.1526859849691391, -0.1437033712863922, -0.13472075760364532, -0.12573814392089844, -0.11675552278757095, -0.10777290910482407, -0.09879028797149658, -0.0898076742887497, -0.08082506060600281, -0.07184243947267532, -0.06285982578992844, -0.05387720838189125, -0.044894590973854065, -0.03591197729110718, -0.026929359883069992, -0.017946742475032806, -0.00896412879228592, 1.849234104156494e-05, 0.009001106023788452, 0.017983723431825638, 0.026966338977217674, 0.03594895452260971, 0.044931571930646896, 0.05391418933868408, 0.06289680302143097, 0.07187942415475845, 0.08086203783750534, 0.08984465152025223, 0.09882727265357971, 0.1078098863363266, 0.11679250001907349, 0.12577512860298157, 0.13475772738456726, 0.14374035596847534, 0.15272296965122223, 0.16170558333396912, 0.170688197016716, 0.1796708106994629, 0.18865343928337097, 0.19763605296611786, 0.20661866664886475, 0.21560129523277283, 0.22458389401435852, 0.2335665076971054, 0.2425491213798523, 0.2515317499637604, 0.26051434874534607, 0.26949697732925415, 0.27847957611083984, 0.2874622046947479, 0.296444833278656]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 0.0, 4.0, 0.0, 4.0, 3.0, 6.0, 11.0, 23.0, 35.0, 80.0, 193.0, 417.0, 912.0, 2310.0, 6146.0, 18760.0, 151137.0, 772076.0, 74851.0, 13883.0, 4520.0, 1839.0, 741.0, 302.0, 119.0, 67.0, 33.0, 19.0, 17.0, 13.0, 6.0, 9.0, 6.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.195068359375, -0.1879425048828125, -0.180816650390625, -0.1736907958984375, -0.16656494140625, -0.1594390869140625, -0.152313232421875, -0.1451873779296875, -0.1380615234375, -0.1309356689453125, -0.123809814453125, -0.1166839599609375, -0.10955810546875, -0.1024322509765625, -0.095306396484375, -0.0881805419921875, -0.0810546875, -0.0739288330078125, -0.066802978515625, -0.0596771240234375, -0.05255126953125, -0.0454254150390625, -0.038299560546875, -0.0311737060546875, -0.0240478515625, -0.0169219970703125, -0.009796142578125, -0.0026702880859375, 0.00445556640625, 0.0115814208984375, 0.018707275390625, 0.0258331298828125, 0.032958984375, 0.0400848388671875, 0.047210693359375, 0.0543365478515625, 0.06146240234375, 0.0685882568359375, 0.075714111328125, 0.0828399658203125, 0.0899658203125, 0.0970916748046875, 0.104217529296875, 0.1113433837890625, 0.11846923828125, 0.1255950927734375, 0.132720947265625, 0.1398468017578125, 0.14697265625, 0.1540985107421875, 0.161224365234375, 0.1683502197265625, 0.17547607421875, 0.1826019287109375, 0.189727783203125, 0.1968536376953125, 0.2039794921875, 0.2111053466796875, 0.218231201171875, 0.2253570556640625, 0.23248291015625, 0.2396087646484375, 0.246734619140625, 0.2538604736328125, 0.260986328125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 4.0, 4.0, 4.0, 7.0, 7.0, 8.0, 11.0, 12.0, 18.0, 19.0, 24.0, 23.0, 35.0, 20.0, 37.0, 35.0, 39.0, 33.0, 39.0, 51.0, 36.0, 54.0, 42.0, 44.0, 35.0, 33.0, 36.0, 39.0, 38.0, 24.0, 27.0, 23.0, 12.0, 21.0, 23.0, 13.0, 18.0, 13.0, 13.0, 6.0, 7.0, 3.0, 5.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.201416015625, -0.1954364776611328, -0.18945693969726562, -0.18347740173339844, -0.17749786376953125, -0.17151832580566406, -0.16553878784179688, -0.1595592498779297, -0.1535797119140625, -0.1476001739501953, -0.14162063598632812, -0.13564109802246094, -0.12966156005859375, -0.12368202209472656, -0.11770248413085938, -0.11172294616699219, -0.105743408203125, -0.09976387023925781, -0.09378433227539062, -0.08780479431152344, -0.08182525634765625, -0.07584571838378906, -0.06986618041992188, -0.06388664245605469, -0.0579071044921875, -0.05192756652832031, -0.045948028564453125, -0.03996849060058594, -0.03398895263671875, -0.028009414672851562, -0.022029876708984375, -0.016050338745117188, -0.01007080078125, -0.0040912628173828125, 0.001888275146484375, 0.007867813110351562, 0.01384735107421875, 0.019826889038085938, 0.025806427001953125, 0.03178596496582031, 0.0377655029296875, 0.04374504089355469, 0.049724578857421875, 0.05570411682128906, 0.06168365478515625, 0.06766319274902344, 0.07364273071289062, 0.07962226867675781, 0.085601806640625, 0.09158134460449219, 0.09756088256835938, 0.10354042053222656, 0.10951995849609375, 0.11549949645996094, 0.12147903442382812, 0.1274585723876953, 0.1334381103515625, 0.1394176483154297, 0.14539718627929688, 0.15137672424316406, 0.15735626220703125, 0.16333580017089844, 0.16931533813476562, 0.1752948760986328, 0.1812744140625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 6.0, 7.0, 8.0, 6.0, 11.0, 14.0, 16.0, 23.0, 45.0, 62.0, 75.0, 171.0, 322.0, 512.0, 1057.0, 2142.0, 4782.0, 13296.0, 50742.0, 293577.0, 539950.0, 105667.0, 22613.0, 7417.0, 2937.0, 1428.0, 721.0, 415.0, 201.0, 113.0, 68.0, 42.0, 35.0, 24.0, 12.0, 7.0, 11.0, 8.0, 7.0, 4.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10296630859375, -0.0994424819946289, -0.09591865539550781, -0.09239482879638672, -0.08887100219726562, -0.08534717559814453, -0.08182334899902344, -0.07829952239990234, -0.07477569580078125, -0.07125186920166016, -0.06772804260253906, -0.06420421600341797, -0.060680389404296875, -0.05715656280517578, -0.05363273620605469, -0.050108909606933594, -0.0465850830078125, -0.043061256408691406, -0.03953742980957031, -0.03601360321044922, -0.032489776611328125, -0.02896595001220703, -0.025442123413085938, -0.021918296813964844, -0.01839447021484375, -0.014870643615722656, -0.011346817016601562, -0.007822990417480469, -0.004299163818359375, -0.0007753372192382812, 0.0027484893798828125, 0.006272315979003906, 0.009796142578125, 0.013319969177246094, 0.016843795776367188, 0.02036762237548828, 0.023891448974609375, 0.02741527557373047, 0.030939102172851562, 0.034462928771972656, 0.03798675537109375, 0.041510581970214844, 0.04503440856933594, 0.04855823516845703, 0.052082061767578125, 0.05560588836669922, 0.05912971496582031, 0.0626535415649414, 0.0661773681640625, 0.0697011947631836, 0.07322502136230469, 0.07674884796142578, 0.08027267456054688, 0.08379650115966797, 0.08732032775878906, 0.09084415435791016, 0.09436798095703125, 0.09789180755615234, 0.10141563415527344, 0.10493946075439453, 0.10846328735351562, 0.11198711395263672, 0.11551094055175781, 0.1190347671508789, 0.12255859375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 4.0, 4.0, 5.0, 9.0, 5.0, 7.0, 9.0, 27.0, 10.0, 13.0, 10.0, 20.0, 32.0, 29.0, 23.0, 28.0, 37.0, 36.0, 30.0, 43.0, 43.0, 46.0, 49.0, 44.0, 57.0, 57.0, 46.0, 30.0, 31.0, 31.0, 40.0, 30.0, 21.0, 17.0, 16.0, 6.0, 11.0, 10.0, 9.0, 11.0, 8.0, 6.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.39453125, -0.38111114501953125, -0.3676910400390625, -0.35427093505859375, -0.340850830078125, -0.32743072509765625, -0.3140106201171875, -0.30059051513671875, -0.28717041015625, -0.27375030517578125, -0.2603302001953125, -0.24691009521484375, -0.233489990234375, -0.22006988525390625, -0.2066497802734375, -0.19322967529296875, -0.1798095703125, -0.16638946533203125, -0.1529693603515625, -0.13954925537109375, -0.126129150390625, -0.11270904541015625, -0.0992889404296875, -0.08586883544921875, -0.07244873046875, -0.05902862548828125, -0.0456085205078125, -0.03218841552734375, -0.018768310546875, -0.00534820556640625, 0.0080718994140625, 0.02149200439453125, 0.034912109375, 0.04833221435546875, 0.0617523193359375, 0.07517242431640625, 0.088592529296875, 0.10201263427734375, 0.1154327392578125, 0.12885284423828125, 0.14227294921875, 0.15569305419921875, 0.1691131591796875, 0.18253326416015625, 0.195953369140625, 0.20937347412109375, 0.2227935791015625, 0.23621368408203125, 0.2496337890625, 0.26305389404296875, 0.2764739990234375, 0.28989410400390625, 0.303314208984375, 0.31673431396484375, 0.3301544189453125, 0.34357452392578125, 0.35699462890625, 0.37041473388671875, 0.3838348388671875, 0.39725494384765625, 0.410675048828125, 0.42409515380859375, 0.4375152587890625, 0.45093536376953125, 0.46435546875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 5.0, 3.0, 5.0, 6.0, 8.0, 12.0, 19.0, 21.0, 33.0, 53.0, 68.0, 127.0, 173.0, 310.0, 544.0, 982.0, 1843.0, 4011.0, 9834.0, 28022.0, 98273.0, 337933.0, 387472.0, 123245.0, 34361.0, 11721.0, 4630.0, 2194.0, 1130.0, 568.0, 350.0, 203.0, 151.0, 74.0, 50.0, 30.0, 27.0, 17.0, 15.0, 13.0, 6.0, 10.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0], "bins": [-0.0233154296875, -0.022669315338134766, -0.02202320098876953, -0.021377086639404297, -0.020730972290039062, -0.020084857940673828, -0.019438743591308594, -0.01879262924194336, -0.018146514892578125, -0.01750040054321289, -0.016854286193847656, -0.016208171844482422, -0.015562057495117188, -0.014915943145751953, -0.014269828796386719, -0.013623714447021484, -0.01297760009765625, -0.012331485748291016, -0.011685371398925781, -0.011039257049560547, -0.010393142700195312, -0.009747028350830078, -0.009100914001464844, -0.00845479965209961, -0.007808685302734375, -0.007162570953369141, -0.006516456604003906, -0.005870342254638672, -0.0052242279052734375, -0.004578113555908203, -0.003931999206542969, -0.0032858848571777344, -0.0026397705078125, -0.0019936561584472656, -0.0013475418090820312, -0.0007014274597167969, -5.53131103515625e-05, 0.0005908012390136719, 0.0012369155883789062, 0.0018830299377441406, 0.002529144287109375, 0.0031752586364746094, 0.0038213729858398438, 0.004467487335205078, 0.0051136016845703125, 0.005759716033935547, 0.006405830383300781, 0.007051944732666016, 0.00769805908203125, 0.008344173431396484, 0.008990287780761719, 0.009636402130126953, 0.010282516479492188, 0.010928630828857422, 0.011574745178222656, 0.01222085952758789, 0.012866973876953125, 0.01351308822631836, 0.014159202575683594, 0.014805316925048828, 0.015451431274414062, 0.016097545623779297, 0.01674365997314453, 0.017389774322509766, 0.018035888671875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 0.0, 3.0, 10.0, 6.0, 6.0, 11.0, 16.0, 19.0, 23.0, 33.0, 43.0, 58.0, 55.0, 63.0, 82.0, 66.0, 73.0, 54.0, 79.0, 59.0, 54.0, 50.0, 27.0, 31.0, 16.0, 22.0, 7.0, 6.0, 7.0, 7.0, 7.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.049041748046875e-05, -1.0115094482898712e-05, -9.739771485328674e-06, -9.364448487758636e-06, -8.989125490188599e-06, -8.61380249261856e-06, -8.238479495048523e-06, -7.863156497478485e-06, -7.487833499908447e-06, -7.1125105023384094e-06, -6.737187504768372e-06, -6.361864507198334e-06, -5.986541509628296e-06, -5.611218512058258e-06, -5.23589551448822e-06, -4.860572516918182e-06, -4.4852495193481445e-06, -4.109926521778107e-06, -3.734603524208069e-06, -3.359280526638031e-06, -2.983957529067993e-06, -2.6086345314979553e-06, -2.2333115339279175e-06, -1.8579885363578796e-06, -1.4826655387878418e-06, -1.107342541217804e-06, -7.320195436477661e-07, -3.5669654607772827e-07, 1.862645149230957e-08, 3.939494490623474e-07, 7.692724466323853e-07, 1.144595444202423e-06, 1.519918441772461e-06, 1.8952414393424988e-06, 2.2705644369125366e-06, 2.6458874344825745e-06, 3.0212104320526123e-06, 3.39653342962265e-06, 3.771856427192688e-06, 4.147179424762726e-06, 4.522502422332764e-06, 4.8978254199028015e-06, 5.273148417472839e-06, 5.648471415042877e-06, 6.023794412612915e-06, 6.399117410182953e-06, 6.774440407752991e-06, 7.1497634053230286e-06, 7.525086402893066e-06, 7.900409400463104e-06, 8.275732398033142e-06, 8.65105539560318e-06, 9.026378393173218e-06, 9.401701390743256e-06, 9.777024388313293e-06, 1.0152347385883331e-05, 1.0527670383453369e-05, 1.0902993381023407e-05, 1.1278316378593445e-05, 1.1653639376163483e-05, 1.202896237373352e-05, 1.2404285371303558e-05, 1.2779608368873596e-05, 1.3154931366443634e-05, 1.3530254364013672e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 1.0, 1.0, 6.0, 7.0, 9.0, 18.0, 22.0, 41.0, 52.0, 71.0, 109.0, 202.0, 296.0, 460.0, 739.0, 1373.0, 2569.0, 4967.0, 9932.0, 22353.0, 54748.0, 137879.0, 283123.0, 288107.0, 141375.0, 55995.0, 22811.0, 10292.0, 5018.0, 2539.0, 1414.0, 730.0, 431.0, 289.0, 181.0, 128.0, 94.0, 55.0, 22.0, 26.0, 16.0, 11.0, 14.0, 10.0, 4.0, 8.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.016815185546875, -0.016289949417114258, -0.015764713287353516, -0.015239477157592773, -0.014714241027832031, -0.014189004898071289, -0.013663768768310547, -0.013138532638549805, -0.012613296508789062, -0.01208806037902832, -0.011562824249267578, -0.011037588119506836, -0.010512351989746094, -0.009987115859985352, -0.00946187973022461, -0.008936643600463867, -0.008411407470703125, -0.007886171340942383, -0.007360935211181641, -0.0068356990814208984, -0.006310462951660156, -0.005785226821899414, -0.005259990692138672, -0.00473475456237793, -0.0042095184326171875, -0.0036842823028564453, -0.003159046173095703, -0.002633810043334961, -0.0021085739135742188, -0.0015833377838134766, -0.0010581016540527344, -0.0005328655242919922, -7.62939453125e-06, 0.0005176067352294922, 0.0010428428649902344, 0.0015680789947509766, 0.0020933151245117188, 0.002618551254272461, 0.003143787384033203, 0.0036690235137939453, 0.0041942596435546875, 0.00471949577331543, 0.005244731903076172, 0.005769968032836914, 0.006295204162597656, 0.0068204402923583984, 0.007345676422119141, 0.007870912551879883, 0.008396148681640625, 0.008921384811401367, 0.00944662094116211, 0.009971857070922852, 0.010497093200683594, 0.011022329330444336, 0.011547565460205078, 0.01207280158996582, 0.012598037719726562, 0.013123273849487305, 0.013648509979248047, 0.014173746109008789, 0.014698982238769531, 0.015224218368530273, 0.015749454498291016, 0.016274690628051758, 0.0167999267578125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 1.0, 3.0, 4.0, 1.0, 2.0, 6.0, 7.0, 4.0, 5.0, 19.0, 8.0, 11.0, 16.0, 14.0, 22.0, 36.0, 31.0, 36.0, 41.0, 62.0, 53.0, 57.0, 64.0, 63.0, 53.0, 48.0, 40.0, 54.0, 43.0, 42.0, 29.0, 16.0, 19.0, 17.0, 24.0, 13.0, 9.0, 8.0, 7.0, 6.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.00594329833984375, -0.005764663219451904, -0.005586028099060059, -0.005407392978668213, -0.005228757858276367, -0.0050501227378845215, -0.004871487617492676, -0.00469285249710083, -0.004514217376708984, -0.004335582256317139, -0.004156947135925293, -0.003978312015533447, -0.0037996768951416016, -0.003621041774749756, -0.00344240665435791, -0.0032637715339660645, -0.0030851364135742188, -0.002906501293182373, -0.0027278661727905273, -0.0025492310523986816, -0.002370595932006836, -0.0021919608116149902, -0.0020133256912231445, -0.0018346905708312988, -0.0016560554504394531, -0.0014774203300476074, -0.0012987852096557617, -0.001120150089263916, -0.0009415149688720703, -0.0007628798484802246, -0.0005842447280883789, -0.0004056096076965332, -0.0002269744873046875, -4.83393669128418e-05, 0.0001302957534790039, 0.0003089308738708496, 0.0004875659942626953, 0.000666201114654541, 0.0008448362350463867, 0.0010234713554382324, 0.0012021064758300781, 0.0013807415962219238, 0.0015593767166137695, 0.0017380118370056152, 0.001916646957397461, 0.0020952820777893066, 0.0022739171981811523, 0.002452552318572998, 0.0026311874389648438, 0.0028098225593566895, 0.002988457679748535, 0.003167092800140381, 0.0033457279205322266, 0.0035243630409240723, 0.003702998161315918, 0.0038816332817077637, 0.004060268402099609, 0.004238903522491455, 0.004417538642883301, 0.0045961737632751465, 0.004774808883666992, 0.004953444004058838, 0.005132079124450684, 0.005310714244842529, 0.005489349365234375]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 6.0, 21.0, 26.0, 50.0, 117.0, 182.0, 202.0, 171.0, 96.0, 70.0, 35.0, 16.0, 10.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.921451210975647, -0.9012219309806824, -0.8809926509857178, -0.860763430595398, -0.8405341506004333, -0.8203048706054688, -0.8000755906105042, -0.7798463106155396, -0.7596170902252197, -0.7393878102302551, -0.7191585302352905, -0.6989293098449707, -0.6787000298500061, -0.6584707498550415, -0.6382414698600769, -0.6180121898651123, -0.5977829098701477, -0.5775536298751831, -0.5573243498802185, -0.5370951294898987, -0.5168658494949341, -0.4966365694999695, -0.4764072895050049, -0.4561780095100403, -0.43594875931739807, -0.41571947932243347, -0.39549022912979126, -0.37526094913482666, -0.35503166913986206, -0.33480241894721985, -0.31457313895225525, -0.29434388875961304, -0.2741146385669708, -0.2538853585720062, -0.233656108379364, -0.21342682838439941, -0.193197563290596, -0.1729682981967926, -0.152739018201828, -0.1325097531080246, -0.11228048801422119, -0.09205122292041779, -0.07182195037603378, -0.05159268155694008, -0.031363412737846375, -0.011134147644042969, 0.009095124900341034, 0.029324397444725037, 0.04955366253852844, 0.06978292763233185, 0.09001220017671585, 0.11024147272109985, 0.13047073781490326, 0.15070000290870667, 0.17092928290367126, 0.19115854799747467, 0.21138781309127808, 0.23161707818508148, 0.2518463432788849, 0.2720756232738495, 0.2923048734664917, 0.3125341534614563, 0.3327634334564209, 0.3529927134513855, 0.3732219636440277]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 6.0, 6.0, 9.0, 7.0, 10.0, 12.0, 4.0, 10.0, 13.0, 13.0, 24.0, 38.0, 38.0, 42.0, 49.0, 32.0, 41.0, 36.0, 35.0, 52.0, 49.0, 45.0, 41.0, 50.0, 45.0, 38.0, 37.0, 26.0, 28.0, 26.0, 19.0, 21.0, 25.0, 19.0, 14.0, 15.0, 11.0, 4.0, 4.0, 1.0, 6.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.19252769649028778, -0.18620455265045166, -0.17988139390945435, -0.17355825006961823, -0.1672350913286209, -0.1609119474887848, -0.15458878874778748, -0.14826564490795135, -0.14194248616695404, -0.13561934232711792, -0.1292961835861206, -0.12297303229570389, -0.11664988100528717, -0.11032673716545105, -0.10400357842445374, -0.09768043458461761, -0.0913572832942009, -0.08503413200378418, -0.07871098071336746, -0.07238782942295074, -0.06606467813253403, -0.05974153056740761, -0.05341837927699089, -0.04709522798657417, -0.040772076696157455, -0.03444892540574074, -0.02812577411532402, -0.021802624687552452, -0.015479473397135735, -0.009156323969364166, -0.0028331726789474487, 0.003489978611469269, 0.009813129901885986, 0.016136281192302704, 0.02245943248271942, 0.02878258191049099, 0.035105735063552856, 0.041428882628679276, 0.04775203391909599, 0.05407518520951271, 0.06039833649992943, 0.06672148406505585, 0.07304463535547256, 0.07936778664588928, 0.085690937936306, 0.09201408922672272, 0.09833724051713943, 0.10466039180755615, 0.11098354309797287, 0.11730669438838959, 0.1236298456788063, 0.12995299696922302, 0.13627614080905914, 0.14259929955005646, 0.14892244338989258, 0.1552456021308899, 0.161568745970726, 0.16789188981056213, 0.17421504855155945, 0.18053819239139557, 0.18686135113239288, 0.193184494972229, 0.19950765371322632, 0.20583079755306244, 0.21215395629405975]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 3.0, 5.0, 5.0, 8.0, 7.0, 13.0, 11.0, 28.0, 26.0, 39.0, 54.0, 87.0, 112.0, 213.0, 279.0, 472.0, 785.0, 1328.0, 2389.0, 4289.0, 8585.0, 18899.0, 47369.0, 151385.0, 562541.0, 161808.0, 48904.0, 19415.0, 9019.0, 4439.0, 2402.0, 1436.0, 831.0, 461.0, 310.0, 214.0, 126.0, 90.0, 53.0, 33.0, 22.0, 17.0, 17.0, 9.0, 3.0, 5.0, 5.0, 0.0, 3.0, 1.0, 3.0, 0.0, 3.0], "bins": [-0.2900390625, -0.2818737030029297, -0.2737083435058594, -0.26554298400878906, -0.25737762451171875, -0.24921226501464844, -0.24104690551757812, -0.2328815460205078, -0.2247161865234375, -0.2165508270263672, -0.20838546752929688, -0.20022010803222656, -0.19205474853515625, -0.18388938903808594, -0.17572402954101562, -0.1675586700439453, -0.159393310546875, -0.1512279510498047, -0.14306259155273438, -0.13489723205566406, -0.12673187255859375, -0.11856651306152344, -0.11040115356445312, -0.10223579406738281, -0.0940704345703125, -0.08590507507324219, -0.07773971557617188, -0.06957435607910156, -0.06140899658203125, -0.05324363708496094, -0.045078277587890625, -0.03691291809082031, -0.02874755859375, -0.020582199096679688, -0.012416839599609375, -0.0042514801025390625, 0.00391387939453125, 0.012079238891601562, 0.020244598388671875, 0.028409957885742188, 0.0365753173828125, 0.04474067687988281, 0.052906036376953125, 0.06107139587402344, 0.06923675537109375, 0.07740211486816406, 0.08556747436523438, 0.09373283386230469, 0.101898193359375, 0.11006355285644531, 0.11822891235351562, 0.12639427185058594, 0.13455963134765625, 0.14272499084472656, 0.15089035034179688, 0.1590557098388672, 0.1672210693359375, 0.1753864288330078, 0.18355178833007812, 0.19171714782714844, 0.19988250732421875, 0.20804786682128906, 0.21621322631835938, 0.2243785858154297, 0.2325439453125]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 0.0, 2.0, 3.0, 6.0, 9.0, 5.0, 6.0, 9.0, 13.0, 8.0, 10.0, 19.0, 26.0, 29.0, 33.0, 46.0, 43.0, 33.0, 48.0, 67.0, 55.0, 45.0, 49.0, 53.0, 45.0, 55.0, 42.0, 38.0, 26.0, 29.0, 24.0, 24.0, 30.0, 24.0, 13.0, 14.0, 9.0, 3.0, 6.0, 6.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.36962890625, -0.3563995361328125, -0.343170166015625, -0.3299407958984375, -0.31671142578125, -0.3034820556640625, -0.290252685546875, -0.2770233154296875, -0.2637939453125, -0.2505645751953125, -0.237335205078125, -0.2241058349609375, -0.21087646484375, -0.1976470947265625, -0.184417724609375, -0.1711883544921875, -0.157958984375, -0.1447296142578125, -0.131500244140625, -0.1182708740234375, -0.10504150390625, -0.0918121337890625, -0.078582763671875, -0.0653533935546875, -0.0521240234375, -0.0388946533203125, -0.025665283203125, -0.0124359130859375, 0.00079345703125, 0.0140228271484375, 0.027252197265625, 0.0404815673828125, 0.0537109375, 0.0669403076171875, 0.080169677734375, 0.0933990478515625, 0.10662841796875, 0.1198577880859375, 0.133087158203125, 0.1463165283203125, 0.1595458984375, 0.1727752685546875, 0.186004638671875, 0.1992340087890625, 0.21246337890625, 0.2256927490234375, 0.238922119140625, 0.2521514892578125, 0.265380859375, 0.2786102294921875, 0.291839599609375, 0.3050689697265625, 0.31829833984375, 0.3315277099609375, 0.344757080078125, 0.3579864501953125, 0.3712158203125, 0.3844451904296875, 0.397674560546875, 0.4109039306640625, 0.42413330078125, 0.4373626708984375, 0.450592041015625, 0.4638214111328125, 0.47705078125]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 3.0, 3.0, 5.0, 9.0, 10.0, 8.0, 19.0, 30.0, 34.0, 39.0, 84.0, 106.0, 201.0, 520.0, 1700.0, 9241.0, 104896.0, 876359.0, 47907.0, 5381.0, 1111.0, 373.0, 191.0, 88.0, 65.0, 33.0, 33.0, 23.0, 17.0, 16.0, 14.0, 7.0, 8.0, 5.0, 1.0, 3.0, 0.0, 4.0, 1.0, 0.0, 2.0, 0.0, 7.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.71728515625, -0.6928558349609375, -0.668426513671875, -0.6439971923828125, -0.61956787109375, -0.5951385498046875, -0.570709228515625, -0.5462799072265625, -0.5218505859375, -0.4974212646484375, -0.472991943359375, -0.4485626220703125, -0.42413330078125, -0.3997039794921875, -0.375274658203125, -0.3508453369140625, -0.326416015625, -0.3019866943359375, -0.277557373046875, -0.2531280517578125, -0.22869873046875, -0.2042694091796875, -0.179840087890625, -0.1554107666015625, -0.1309814453125, -0.1065521240234375, -0.082122802734375, -0.0576934814453125, -0.03326416015625, -0.0088348388671875, 0.015594482421875, 0.0400238037109375, 0.064453125, 0.0888824462890625, 0.113311767578125, 0.1377410888671875, 0.16217041015625, 0.1865997314453125, 0.211029052734375, 0.2354583740234375, 0.2598876953125, 0.2843170166015625, 0.308746337890625, 0.3331756591796875, 0.35760498046875, 0.3820343017578125, 0.406463623046875, 0.4308929443359375, 0.455322265625, 0.4797515869140625, 0.504180908203125, 0.5286102294921875, 0.55303955078125, 0.5774688720703125, 0.601898193359375, 0.6263275146484375, 0.6507568359375, 0.6751861572265625, 0.699615478515625, 0.7240447998046875, 0.74847412109375, 0.7729034423828125, 0.797332763671875, 0.8217620849609375, 0.84619140625]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 5.0, 4.0, 2.0, 4.0, 10.0, 14.0, 10.0, 15.0, 15.0, 32.0, 32.0, 40.0, 42.0, 43.0, 52.0, 51.0, 45.0, 51.0, 50.0, 53.0, 52.0, 60.0, 52.0, 36.0, 42.0, 39.0, 28.0, 16.0, 18.0, 12.0, 17.0, 10.0, 7.0, 13.0, 5.0, 7.0, 3.0, 5.0, 1.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53076171875, -0.5149078369140625, -0.499053955078125, -0.4832000732421875, -0.46734619140625, -0.4514923095703125, -0.435638427734375, -0.4197845458984375, -0.4039306640625, -0.3880767822265625, -0.372222900390625, -0.3563690185546875, -0.34051513671875, -0.3246612548828125, -0.308807373046875, -0.2929534912109375, -0.277099609375, -0.2612457275390625, -0.245391845703125, -0.2295379638671875, -0.21368408203125, -0.1978302001953125, -0.181976318359375, -0.1661224365234375, -0.1502685546875, -0.1344146728515625, -0.118560791015625, -0.1027069091796875, -0.08685302734375, -0.0709991455078125, -0.055145263671875, -0.0392913818359375, -0.0234375, -0.0075836181640625, 0.008270263671875, 0.0241241455078125, 0.03997802734375, 0.0558319091796875, 0.071685791015625, 0.0875396728515625, 0.1033935546875, 0.1192474365234375, 0.135101318359375, 0.1509552001953125, 0.16680908203125, 0.1826629638671875, 0.198516845703125, 0.2143707275390625, 0.230224609375, 0.2460784912109375, 0.261932373046875, 0.2777862548828125, 0.29364013671875, 0.3094940185546875, 0.325347900390625, 0.3412017822265625, 0.3570556640625, 0.3729095458984375, 0.388763427734375, 0.4046173095703125, 0.42047119140625, 0.4363250732421875, 0.452178955078125, 0.4680328369140625, 0.48388671875]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 6.0, 9.0, 9.0, 8.0, 23.0, 26.0, 42.0, 100.0, 159.0, 292.0, 668.0, 1948.0, 9618.0, 140991.0, 850555.0, 37049.0, 4739.0, 1236.0, 477.0, 251.0, 143.0, 63.0, 53.0, 33.0, 27.0, 4.0, 7.0, 6.0, 7.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.251953125, -0.24570083618164062, -0.23944854736328125, -0.23319625854492188, -0.2269439697265625, -0.22069168090820312, -0.21443939208984375, -0.20818710327148438, -0.201934814453125, -0.19568252563476562, -0.18943023681640625, -0.18317794799804688, -0.1769256591796875, -0.17067337036132812, -0.16442108154296875, -0.15816879272460938, -0.15191650390625, -0.14566421508789062, -0.13941192626953125, -0.13315963745117188, -0.1269073486328125, -0.12065505981445312, -0.11440277099609375, -0.10815048217773438, -0.101898193359375, -0.09564590454101562, -0.08939361572265625, -0.08314132690429688, -0.0768890380859375, -0.07063674926757812, -0.06438446044921875, -0.058132171630859375, -0.0518798828125, -0.045627593994140625, -0.03937530517578125, -0.033123016357421875, -0.0268707275390625, -0.020618438720703125, -0.01436614990234375, -0.008113861083984375, -0.001861572265625, 0.004390716552734375, 0.01064300537109375, 0.016895294189453125, 0.0231475830078125, 0.029399871826171875, 0.03565216064453125, 0.041904449462890625, 0.04815673828125, 0.054409027099609375, 0.06066131591796875, 0.06691360473632812, 0.0731658935546875, 0.07941818237304688, 0.08567047119140625, 0.09192276000976562, 0.098175048828125, 0.10442733764648438, 0.11067962646484375, 0.11693191528320312, 0.1231842041015625, 0.12943649291992188, 0.13568878173828125, 0.14194107055664062, 0.148193359375]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 3.0, 6.0, 3.0, 6.0, 18.0, 31.0, 40.0, 65.0, 147.0, 260.0, 180.0, 103.0, 68.0, 35.0, 10.0, 13.0, 10.0, 6.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6524066925048828e-05, -2.540554851293564e-05, -2.428703010082245e-05, -2.316851168870926e-05, -2.204999327659607e-05, -2.093147486448288e-05, -1.981295645236969e-05, -1.86944380402565e-05, -1.757591962814331e-05, -1.645740121603012e-05, -1.533888280391693e-05, -1.4220364391803741e-05, -1.3101845979690552e-05, -1.1983327567577362e-05, -1.0864809155464172e-05, -9.746290743350983e-06, -8.627772331237793e-06, -7.509253919124603e-06, -6.3907355070114136e-06, -5.272217094898224e-06, -4.153698682785034e-06, -3.0351802706718445e-06, -1.9166618585586548e-06, -7.981434464454651e-07, 3.203749656677246e-07, 1.4388933777809143e-06, 2.557411789894104e-06, 3.6759302020072937e-06, 4.794448614120483e-06, 5.912967026233673e-06, 7.031485438346863e-06, 8.150003850460052e-06, 9.268522262573242e-06, 1.0387040674686432e-05, 1.1505559086799622e-05, 1.2624077498912811e-05, 1.3742595911026001e-05, 1.486111432313919e-05, 1.597963273525238e-05, 1.709815114736557e-05, 1.821666955947876e-05, 1.933518797159195e-05, 2.045370638370514e-05, 2.157222479581833e-05, 2.269074320793152e-05, 2.3809261620044708e-05, 2.4927780032157898e-05, 2.6046298444271088e-05, 2.7164816856384277e-05, 2.8283335268497467e-05, 2.9401853680610657e-05, 3.0520372092723846e-05, 3.1638890504837036e-05, 3.2757408916950226e-05, 3.3875927329063416e-05, 3.4994445741176605e-05, 3.6112964153289795e-05, 3.7231482565402985e-05, 3.8350000977516174e-05, 3.9468519389629364e-05, 4.0587037801742554e-05, 4.1705556213855743e-05, 4.282407462596893e-05, 4.394259303808212e-05, 4.506111145019531e-05]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 5.0, 8.0, 8.0, 9.0, 26.0, 30.0, 54.0, 58.0, 104.0, 175.0, 330.0, 591.0, 1347.0, 3167.0, 9994.0, 47971.0, 676198.0, 271569.0, 25964.0, 6513.0, 2325.0, 1019.0, 463.0, 238.0, 139.0, 104.0, 49.0, 30.0, 27.0, 12.0, 7.0, 10.0, 5.0, 2.0, 3.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12548828125, -0.12063026428222656, -0.11577224731445312, -0.11091423034667969, -0.10605621337890625, -0.10119819641113281, -0.09634017944335938, -0.09148216247558594, -0.0866241455078125, -0.08176612854003906, -0.07690811157226562, -0.07205009460449219, -0.06719207763671875, -0.06233406066894531, -0.057476043701171875, -0.05261802673339844, -0.047760009765625, -0.04290199279785156, -0.038043975830078125, -0.03318595886230469, -0.02832794189453125, -0.023469924926757812, -0.018611907958984375, -0.013753890991210938, -0.0088958740234375, -0.0040378570556640625, 0.000820159912109375, 0.0056781768798828125, 0.01053619384765625, 0.015394210815429688, 0.020252227783203125, 0.025110244750976562, 0.02996826171875, 0.03482627868652344, 0.039684295654296875, 0.04454231262207031, 0.04940032958984375, 0.05425834655761719, 0.059116363525390625, 0.06397438049316406, 0.0688323974609375, 0.07369041442871094, 0.07854843139648438, 0.08340644836425781, 0.08826446533203125, 0.09312248229980469, 0.09798049926757812, 0.10283851623535156, 0.107696533203125, 0.11255455017089844, 0.11741256713867188, 0.12227058410644531, 0.12712860107421875, 0.1319866180419922, 0.13684463500976562, 0.14170265197753906, 0.1465606689453125, 0.15141868591308594, 0.15627670288085938, 0.1611347198486328, 0.16599273681640625, 0.1708507537841797, 0.17570877075195312, 0.18056678771972656, 0.1854248046875]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 7.0, 4.0, 0.0, 5.0, 4.0, 12.0, 4.0, 14.0, 19.0, 28.0, 47.0, 79.0, 106.0, 144.0, 164.0, 135.0, 68.0, 41.0, 38.0, 18.0, 12.0, 10.0, 13.0, 9.0, 1.0, 3.0, 4.0, 5.0, 3.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.07879638671875, -0.07688093185424805, -0.0749654769897461, -0.07305002212524414, -0.07113456726074219, -0.06921911239624023, -0.06730365753173828, -0.06538820266723633, -0.06347274780273438, -0.06155729293823242, -0.05964183807373047, -0.057726383209228516, -0.05581092834472656, -0.05389547348022461, -0.051980018615722656, -0.0500645637512207, -0.04814910888671875, -0.0462336540222168, -0.044318199157714844, -0.04240274429321289, -0.04048728942871094, -0.038571834564208984, -0.03665637969970703, -0.03474092483520508, -0.032825469970703125, -0.030910015106201172, -0.02899456024169922, -0.027079105377197266, -0.025163650512695312, -0.02324819564819336, -0.021332740783691406, -0.019417285919189453, -0.0175018310546875, -0.015586376190185547, -0.013670921325683594, -0.01175546646118164, -0.009840011596679688, -0.007924556732177734, -0.006009101867675781, -0.004093647003173828, -0.002178192138671875, -0.0002627372741699219, 0.0016527175903320312, 0.0035681724548339844, 0.0054836273193359375, 0.007399082183837891, 0.009314537048339844, 0.011229991912841797, 0.01314544677734375, 0.015060901641845703, 0.016976356506347656, 0.01889181137084961, 0.020807266235351562, 0.022722721099853516, 0.02463817596435547, 0.026553630828857422, 0.028469085693359375, 0.030384540557861328, 0.03229999542236328, 0.034215450286865234, 0.03613090515136719, 0.03804636001586914, 0.039961814880371094, 0.04187726974487305, 0.043792724609375]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 9.0, 4.0, 14.0, 20.0, 27.0, 43.0, 49.0, 65.0, 67.0, 90.0, 102.0, 105.0, 80.0, 78.0, 67.0, 45.0, 30.0, 27.0, 19.0, 19.0, 10.0, 9.0, 6.0, 5.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.6882760524749756, -0.6679914593696594, -0.6477068662643433, -0.6274223327636719, -0.6071377396583557, -0.5868531465530396, -0.5665686130523682, -0.546284019947052, -0.5259994268417358, -0.5057148337364197, -0.4854302704334259, -0.46514570713043213, -0.44486111402511597, -0.4245765209197998, -0.40429195761680603, -0.38400739431381226, -0.3637228012084961, -0.34343820810317993, -0.32315364480018616, -0.3028690814971924, -0.2825844883918762, -0.26229989528656006, -0.24201533198356628, -0.22173075377941132, -0.20144617557525635, -0.18116159737110138, -0.1608770191669464, -0.14059244096279144, -0.12030786275863647, -0.1000232845544815, -0.07973870635032654, -0.05945412814617157, -0.03916960954666138, -0.01888503134250641, 0.0013995468616485596, 0.021684125065803528, 0.041968703269958496, 0.062253281474113464, 0.08253785967826843, 0.1028224378824234, 0.12310701608657837, 0.14339159429073334, 0.1636761724948883, 0.18396075069904327, 0.20424532890319824, 0.2245299071073532, 0.24481448531150818, 0.26509904861450195, 0.2853836417198181, 0.3056682348251343, 0.32595279812812805, 0.3462373614311218, 0.366521954536438, 0.38680654764175415, 0.4070911109447479, 0.4273756742477417, 0.44766026735305786, 0.467944860458374, 0.4882294237613678, 0.5085139870643616, 0.5287985801696777, 0.5490831732749939, 0.5693677663803101, 0.5896522998809814, 0.6099368929862976]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 5.0, 5.0, 10.0, 6.0, 19.0, 11.0, 17.0, 16.0, 21.0, 21.0, 25.0, 24.0, 42.0, 31.0, 31.0, 30.0, 38.0, 39.0, 34.0, 30.0, 24.0, 48.0, 44.0, 26.0, 35.0, 42.0, 40.0, 34.0, 32.0, 24.0, 32.0, 26.0, 28.0, 18.0, 18.0, 12.0, 13.0, 14.0, 11.0, 7.0, 3.0, 11.0, 2.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.5604451298713684, -0.5396989583969116, -0.5189528465270996, -0.4982066750526428, -0.47746050357818604, -0.45671436190605164, -0.43596822023391724, -0.41522204875946045, -0.39447587728500366, -0.37372973561286926, -0.3529835641384125, -0.3322374224662781, -0.3114912509918213, -0.2907451093196869, -0.2699989676475525, -0.2492527961730957, -0.2285066545009613, -0.2077604979276657, -0.18701434135437012, -0.16626819968223572, -0.14552202820777893, -0.12477587908506393, -0.10402972996234894, -0.08328357338905334, -0.06253741681575775, -0.04179126024246216, -0.021045107394456863, -0.0002989545464515686, 0.020447202026844025, 0.04119335860013962, 0.061939507722854614, 0.08268566429615021, 0.1034318208694458, 0.1241779774427414, 0.144924134016037, 0.1656702756881714, 0.18641644716262817, 0.20716258883476257, 0.22790874540805817, 0.24865490198135376, 0.26940107345581055, 0.29014721512794495, 0.31089338660240173, 0.33163952827453613, 0.3523856997489929, 0.3731318414211273, 0.3938779830932617, 0.4146241545677185, 0.4353702962398529, 0.4561164379119873, 0.4768626093864441, 0.4976087510585785, 0.5183548927307129, 0.5391010642051697, 0.5598472356796265, 0.5805933475494385, 0.6013395190238953, 0.622085690498352, 0.6428318023681641, 0.6635779738426208, 0.6843241453170776, 0.7050703167915344, 0.7258164286613464, 0.7465626001358032, 0.76730877161026]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 3.0, 11.0, 11.0, 12.0, 27.0, 50.0, 69.0, 144.0, 247.0, 412.0, 923.0, 2208.0, 6132.0, 25602.0, 432019.0, 3496197.0, 202254.0, 19453.0, 5003.0, 1787.0, 784.0, 402.0, 226.0, 126.0, 78.0, 44.0, 23.0, 14.0, 8.0, 7.0, 3.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.8486328125, -0.8281364440917969, -0.8076400756835938, -0.7871437072753906, -0.7666473388671875, -0.7461509704589844, -0.7256546020507812, -0.7051582336425781, -0.684661865234375, -0.6641654968261719, -0.6436691284179688, -0.6231727600097656, -0.6026763916015625, -0.5821800231933594, -0.5616836547851562, -0.5411872863769531, -0.52069091796875, -0.5001945495605469, -0.47969818115234375, -0.4592018127441406, -0.4387054443359375, -0.4182090759277344, -0.39771270751953125, -0.3772163391113281, -0.356719970703125, -0.3362236022949219, -0.31572723388671875, -0.2952308654785156, -0.2747344970703125, -0.2542381286621094, -0.23374176025390625, -0.21324539184570312, -0.1927490234375, -0.17225265502929688, -0.15175628662109375, -0.13125991821289062, -0.1107635498046875, -0.09026718139648438, -0.06977081298828125, -0.049274444580078125, -0.028778076171875, -0.008281707763671875, 0.01221466064453125, 0.032711029052734375, 0.0532073974609375, 0.07370376586914062, 0.09420013427734375, 0.11469650268554688, 0.13519287109375, 0.15568923950195312, 0.17618560791015625, 0.19668197631835938, 0.2171783447265625, 0.23767471313476562, 0.25817108154296875, 0.2786674499511719, 0.299163818359375, 0.3196601867675781, 0.34015655517578125, 0.3606529235839844, 0.3811492919921875, 0.4016456604003906, 0.42214202880859375, 0.4426383972167969, 0.463134765625]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 7.0, 7.0, 7.0, 13.0, 18.0, 18.0, 19.0, 29.0, 19.0, 39.0, 36.0, 54.0, 42.0, 37.0, 52.0, 44.0, 59.0, 55.0, 42.0, 39.0, 54.0, 45.0, 33.0, 34.0, 27.0, 23.0, 24.0, 30.0, 19.0, 20.0, 17.0, 10.0, 10.0, 5.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2467041015625, -0.23917388916015625, -0.2316436767578125, -0.22411346435546875, -0.216583251953125, -0.20905303955078125, -0.2015228271484375, -0.19399261474609375, -0.18646240234375, -0.17893218994140625, -0.1714019775390625, -0.16387176513671875, -0.156341552734375, -0.14881134033203125, -0.1412811279296875, -0.13375091552734375, -0.126220703125, -0.11869049072265625, -0.1111602783203125, -0.10363006591796875, -0.096099853515625, -0.08856964111328125, -0.0810394287109375, -0.07350921630859375, -0.06597900390625, -0.05844879150390625, -0.0509185791015625, -0.04338836669921875, -0.035858154296875, -0.02832794189453125, -0.0207977294921875, -0.01326751708984375, -0.0057373046875, 0.00179290771484375, 0.0093231201171875, 0.01685333251953125, 0.024383544921875, 0.03191375732421875, 0.0394439697265625, 0.04697418212890625, 0.05450439453125, 0.06203460693359375, 0.0695648193359375, 0.07709503173828125, 0.084625244140625, 0.09215545654296875, 0.0996856689453125, 0.10721588134765625, 0.11474609375, 0.12227630615234375, 0.1298065185546875, 0.13733673095703125, 0.144866943359375, 0.15239715576171875, 0.1599273681640625, 0.16745758056640625, 0.17498779296875, 0.18251800537109375, 0.1900482177734375, 0.19757843017578125, 0.205108642578125, 0.21263885498046875, 0.2201690673828125, 0.22769927978515625, 0.2352294921875]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 5.0, 6.0, 12.0, 16.0, 14.0, 31.0, 54.0, 113.0, 223.0, 557.0, 1630.0, 6472.0, 41585.0, 2168253.0, 1926158.0, 40285.0, 6371.0, 1543.0, 496.0, 221.0, 88.0, 51.0, 38.0, 14.0, 20.0, 8.0, 7.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 2.0], "bins": [-1.0341796875, -1.0089492797851562, -0.9837188720703125, -0.9584884643554688, -0.933258056640625, -0.9080276489257812, -0.8827972412109375, -0.8575668334960938, -0.83233642578125, -0.8071060180664062, -0.7818756103515625, -0.7566452026367188, -0.731414794921875, -0.7061843872070312, -0.6809539794921875, -0.6557235717773438, -0.6304931640625, -0.6052627563476562, -0.5800323486328125, -0.5548019409179688, -0.529571533203125, -0.5043411254882812, -0.4791107177734375, -0.45388031005859375, -0.42864990234375, -0.40341949462890625, -0.3781890869140625, -0.35295867919921875, -0.327728271484375, -0.30249786376953125, -0.2772674560546875, -0.25203704833984375, -0.226806640625, -0.20157623291015625, -0.1763458251953125, -0.15111541748046875, -0.125885009765625, -0.10065460205078125, -0.0754241943359375, -0.05019378662109375, -0.02496337890625, 0.00026702880859375, 0.0254974365234375, 0.05072784423828125, 0.075958251953125, 0.10118865966796875, 0.1264190673828125, 0.15164947509765625, 0.1768798828125, 0.20211029052734375, 0.2273406982421875, 0.25257110595703125, 0.277801513671875, 0.30303192138671875, 0.3282623291015625, 0.35349273681640625, 0.37872314453125, 0.40395355224609375, 0.4291839599609375, 0.45441436767578125, 0.479644775390625, 0.5048751831054688, 0.5301055908203125, 0.5553359985351562, 0.58056640625]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 8.0, 5.0, 8.0, 14.0, 12.0, 31.0, 27.0, 38.0, 49.0, 70.0, 78.0, 150.0, 290.0, 461.0, 716.0, 700.0, 516.0, 316.0, 194.0, 119.0, 64.0, 44.0, 34.0, 26.0, 24.0, 17.0, 13.0, 10.0, 9.0, 7.0, 4.0, 3.0, 0.0, 5.0, 0.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1470947265625, -0.1425151824951172, -0.13793563842773438, -0.13335609436035156, -0.12877655029296875, -0.12419700622558594, -0.11961746215820312, -0.11503791809082031, -0.1104583740234375, -0.10587882995605469, -0.10129928588867188, -0.09671974182128906, -0.09214019775390625, -0.08756065368652344, -0.08298110961914062, -0.07840156555175781, -0.073822021484375, -0.06924247741699219, -0.06466293334960938, -0.06008338928222656, -0.05550384521484375, -0.05092430114746094, -0.046344757080078125, -0.04176521301269531, -0.0371856689453125, -0.03260612487792969, -0.028026580810546875, -0.023447036743164062, -0.01886749267578125, -0.014287948608398438, -0.009708404541015625, -0.0051288604736328125, -0.00054931640625, 0.0040302276611328125, 0.008609771728515625, 0.013189315795898438, 0.01776885986328125, 0.022348403930664062, 0.026927947998046875, 0.03150749206542969, 0.0360870361328125, 0.04066658020019531, 0.045246124267578125, 0.04982566833496094, 0.05440521240234375, 0.05898475646972656, 0.06356430053710938, 0.06814384460449219, 0.072723388671875, 0.07730293273925781, 0.08188247680664062, 0.08646202087402344, 0.09104156494140625, 0.09562110900878906, 0.10020065307617188, 0.10478019714355469, 0.1093597412109375, 0.11393928527832031, 0.11851882934570312, 0.12309837341308594, 0.12767791748046875, 0.13225746154785156, 0.13683700561523438, 0.1414165496826172, 0.14599609375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 1.0, 1.0, 4.0, 4.0, 6.0, 8.0, 5.0, 14.0, 13.0, 27.0, 35.0, 29.0, 37.0, 67.0, 67.0, 78.0, 87.0, 73.0, 79.0, 72.0, 65.0, 44.0, 38.0, 46.0, 21.0, 22.0, 22.0, 11.0, 8.0, 5.0, 10.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32633230090141296, -0.313091903924942, -0.29985153675079346, -0.2866111397743225, -0.27337074279785156, -0.2601303458213806, -0.24688997864723206, -0.2336495816707611, -0.22040919959545135, -0.2071688175201416, -0.19392842054367065, -0.1806880384683609, -0.16744765639305115, -0.1542072594165802, -0.14096687734127045, -0.1277264952659607, -0.11448609828948975, -0.1012457087635994, -0.08800531923770905, -0.07476493716239929, -0.06152454763650894, -0.04828415811061859, -0.03504377603530884, -0.021803386509418488, -0.008562996983528137, 0.004677390679717064, 0.017917778342962265, 0.031158164143562317, 0.04439855366945267, 0.05763894319534302, 0.07087932527065277, 0.08411971479654312, 0.09736013412475586, 0.11060052365064621, 0.12384091317653656, 0.1370812952518463, 0.15032169222831726, 0.16356207430362701, 0.17680245637893677, 0.19004285335540771, 0.20328323543071747, 0.21652361750602722, 0.22976401448249817, 0.24300439655780792, 0.2562447786331177, 0.2694851756095886, 0.28272557258605957, 0.29596593976020813, 0.3092063367366791, 0.32244673371315, 0.3356871008872986, 0.34892749786376953, 0.3621678948402405, 0.3754082918167114, 0.38864865899086, 0.40188905596733093, 0.4151294231414795, 0.42836982011795044, 0.441610187292099, 0.45485058426856995, 0.4680909812450409, 0.48133134841918945, 0.4945717453956604, 0.5078121423721313, 0.5210525393486023]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 4.0, 6.0, 8.0, 7.0, 8.0, 9.0, 10.0, 10.0, 18.0, 21.0, 19.0, 16.0, 34.0, 25.0, 37.0, 38.0, 36.0, 42.0, 33.0, 46.0, 42.0, 41.0, 45.0, 41.0, 47.0, 48.0, 36.0, 49.0, 34.0, 22.0, 27.0, 24.0, 16.0, 22.0, 17.0, 19.0, 19.0, 11.0, 5.0, 3.0, 4.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2926609516143799, -0.2831651270389557, -0.2736692726612091, -0.2641734480857849, -0.2546776235103607, -0.24518176913261414, -0.23568594455718994, -0.22619010508060455, -0.21669426560401917, -0.20719842612743378, -0.19770260155200958, -0.1882067620754242, -0.1787109225988388, -0.16921508312225342, -0.15971925854682922, -0.15022341907024384, -0.14072759449481964, -0.13123175501823425, -0.12173592299222946, -0.11224009096622467, -0.10274425148963928, -0.09324841946363449, -0.0837525874376297, -0.07425674796104431, -0.06476091593503952, -0.05526508018374443, -0.04576924443244934, -0.03627341240644455, -0.02677757665514946, -0.01728174090385437, -0.007785908877849579, 0.0017099305987358093, 0.0112057626247406, 0.02070159837603569, 0.03019743226468563, 0.03969326615333557, 0.04918910190463066, 0.05868493765592575, 0.06818076968193054, 0.07767660915851593, 0.08717244118452072, 0.09666827321052551, 0.1061641126871109, 0.11565994471311569, 0.12515577673912048, 0.13465161621570587, 0.14414745569229126, 0.15364328026771545, 0.16313911974430084, 0.17263495922088623, 0.18213078379631042, 0.1916266232728958, 0.2011224627494812, 0.2106182873249054, 0.22011412680149078, 0.22960996627807617, 0.23910579085350037, 0.24860163033008575, 0.25809746980667114, 0.26759329438209534, 0.27708911895751953, 0.2865849733352661, 0.2960807979106903, 0.3055766224861145, 0.3150724768638611]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 7.0, 3.0, 10.0, 10.0, 17.0, 27.0, 48.0, 70.0, 93.0, 147.0, 240.0, 390.0, 684.0, 1195.0, 1922.0, 3691.0, 6871.0, 14471.0, 46654.0, 313117.0, 534630.0, 84487.0, 20526.0, 8642.0, 4496.0, 2509.0, 1457.0, 806.0, 514.0, 312.0, 202.0, 125.0, 62.0, 38.0, 31.0, 21.0, 16.0, 12.0, 4.0, 2.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.150390625, -0.14611530303955078, -0.14183998107910156, -0.13756465911865234, -0.13328933715820312, -0.1290140151977539, -0.12473869323730469, -0.12046337127685547, -0.11618804931640625, -0.11191272735595703, -0.10763740539550781, -0.1033620834350586, -0.09908676147460938, -0.09481143951416016, -0.09053611755371094, -0.08626079559326172, -0.0819854736328125, -0.07771015167236328, -0.07343482971191406, -0.06915950775146484, -0.06488418579101562, -0.060608863830566406, -0.05633354187011719, -0.05205821990966797, -0.04778289794921875, -0.04350757598876953, -0.03923225402832031, -0.034956932067871094, -0.030681610107421875, -0.026406288146972656, -0.022130966186523438, -0.01785564422607422, -0.013580322265625, -0.009305000305175781, -0.0050296783447265625, -0.0007543563842773438, 0.003520965576171875, 0.007796287536621094, 0.012071609497070312, 0.01634693145751953, 0.02062225341796875, 0.02489757537841797, 0.029172897338867188, 0.033448219299316406, 0.037723541259765625, 0.041998863220214844, 0.04627418518066406, 0.05054950714111328, 0.0548248291015625, 0.05910015106201172, 0.06337547302246094, 0.06765079498291016, 0.07192611694335938, 0.0762014389038086, 0.08047676086425781, 0.08475208282470703, 0.08902740478515625, 0.09330272674560547, 0.09757804870605469, 0.1018533706665039, 0.10612869262695312, 0.11040401458740234, 0.11467933654785156, 0.11895465850830078, 0.12322998046875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 0.0, 5.0, 1.0, 7.0, 14.0, 9.0, 13.0, 9.0, 10.0, 15.0, 22.0, 17.0, 28.0, 26.0, 32.0, 32.0, 40.0, 43.0, 31.0, 44.0, 40.0, 51.0, 48.0, 40.0, 46.0, 43.0, 38.0, 38.0, 43.0, 32.0, 22.0, 23.0, 22.0, 16.0, 12.0, 24.0, 24.0, 8.0, 8.0, 10.0, 8.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17578125, -0.17033004760742188, -0.16487884521484375, -0.15942764282226562, -0.1539764404296875, -0.14852523803710938, -0.14307403564453125, -0.13762283325195312, -0.132171630859375, -0.12672042846679688, -0.12126922607421875, -0.11581802368164062, -0.1103668212890625, -0.10491561889648438, -0.09946441650390625, -0.09401321411132812, -0.08856201171875, -0.08311080932617188, -0.07765960693359375, -0.07220840454101562, -0.0667572021484375, -0.061305999755859375, -0.05585479736328125, -0.050403594970703125, -0.044952392578125, -0.039501190185546875, -0.03404998779296875, -0.028598785400390625, -0.0231475830078125, -0.017696380615234375, -0.01224517822265625, -0.006793975830078125, -0.0013427734375, 0.004108428955078125, 0.00955963134765625, 0.015010833740234375, 0.0204620361328125, 0.025913238525390625, 0.03136444091796875, 0.036815643310546875, 0.042266845703125, 0.047718048095703125, 0.05316925048828125, 0.058620452880859375, 0.0640716552734375, 0.06952285766601562, 0.07497406005859375, 0.08042526245117188, 0.08587646484375, 0.09132766723632812, 0.09677886962890625, 0.10223007202148438, 0.1076812744140625, 0.11313247680664062, 0.11858367919921875, 0.12403488159179688, 0.129486083984375, 0.13493728637695312, 0.14038848876953125, 0.14583969116210938, 0.1512908935546875, 0.15674209594726562, 0.16219329833984375, 0.16764450073242188, 0.173095703125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 7.0, 11.0, 8.0, 19.0, 23.0, 42.0, 55.0, 91.0, 131.0, 255.0, 413.0, 824.0, 1707.0, 3847.0, 9015.0, 26274.0, 102509.0, 434719.0, 354597.0, 78392.0, 21453.0, 7587.0, 3273.0, 1537.0, 806.0, 400.0, 227.0, 113.0, 74.0, 47.0, 35.0, 21.0, 18.0, 8.0, 5.0, 7.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0640869140625, -0.06151390075683594, -0.058940887451171875, -0.05636787414550781, -0.05379486083984375, -0.05122184753417969, -0.048648834228515625, -0.04607582092285156, -0.0435028076171875, -0.04092979431152344, -0.038356781005859375, -0.03578376770019531, -0.03321075439453125, -0.030637741088867188, -0.028064727783203125, -0.025491714477539062, -0.022918701171875, -0.020345687866210938, -0.017772674560546875, -0.015199661254882812, -0.01262664794921875, -0.010053634643554688, -0.007480621337890625, -0.0049076080322265625, -0.0023345947265625, 0.0002384185791015625, 0.002811431884765625, 0.0053844451904296875, 0.00795745849609375, 0.010530471801757812, 0.013103485107421875, 0.015676498413085938, 0.01824951171875, 0.020822525024414062, 0.023395538330078125, 0.025968551635742188, 0.02854156494140625, 0.031114578247070312, 0.033687591552734375, 0.03626060485839844, 0.0388336181640625, 0.04140663146972656, 0.043979644775390625, 0.04655265808105469, 0.04912567138671875, 0.05169868469238281, 0.054271697998046875, 0.05684471130371094, 0.059417724609375, 0.06199073791503906, 0.06456375122070312, 0.06713676452636719, 0.06970977783203125, 0.07228279113769531, 0.07485580444335938, 0.07742881774902344, 0.0800018310546875, 0.08257484436035156, 0.08514785766601562, 0.08772087097167969, 0.09029388427734375, 0.09286689758300781, 0.09543991088867188, 0.09801292419433594, 0.1005859375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 0.0, 2.0, 4.0, 6.0, 8.0, 5.0, 9.0, 9.0, 13.0, 14.0, 19.0, 16.0, 30.0, 30.0, 43.0, 35.0, 55.0, 43.0, 45.0, 55.0, 49.0, 44.0, 57.0, 47.0, 37.0, 55.0, 39.0, 38.0, 30.0, 30.0, 22.0, 19.0, 20.0, 14.0, 8.0, 16.0, 14.0, 3.0, 5.0, 3.0, 4.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.361572265625, -0.3499603271484375, -0.338348388671875, -0.3267364501953125, -0.31512451171875, -0.3035125732421875, -0.291900634765625, -0.2802886962890625, -0.2686767578125, -0.2570648193359375, -0.245452880859375, -0.2338409423828125, -0.22222900390625, -0.2106170654296875, -0.199005126953125, -0.1873931884765625, -0.17578125, -0.1641693115234375, -0.152557373046875, -0.1409454345703125, -0.12933349609375, -0.1177215576171875, -0.106109619140625, -0.0944976806640625, -0.0828857421875, -0.0712738037109375, -0.059661865234375, -0.0480499267578125, -0.03643798828125, -0.0248260498046875, -0.013214111328125, -0.0016021728515625, 0.010009765625, 0.0216217041015625, 0.033233642578125, 0.0448455810546875, 0.05645751953125, 0.0680694580078125, 0.079681396484375, 0.0912933349609375, 0.1029052734375, 0.1145172119140625, 0.126129150390625, 0.1377410888671875, 0.14935302734375, 0.1609649658203125, 0.172576904296875, 0.1841888427734375, 0.19580078125, 0.2074127197265625, 0.219024658203125, 0.2306365966796875, 0.24224853515625, 0.2538604736328125, 0.265472412109375, 0.2770843505859375, 0.2886962890625, 0.3003082275390625, 0.311920166015625, 0.3235321044921875, 0.33514404296875, 0.3467559814453125, 0.358367919921875, 0.3699798583984375, 0.381591796875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 2.0, 6.0, 1.0, 8.0, 18.0, 14.0, 13.0, 24.0, 23.0, 46.0, 65.0, 91.0, 89.0, 180.0, 275.0, 436.0, 778.0, 1291.0, 2468.0, 5347.0, 13364.0, 42558.0, 178553.0, 509923.0, 214874.0, 50496.0, 15148.0, 5950.0, 2805.0, 1455.0, 798.0, 486.0, 350.0, 200.0, 128.0, 79.0, 61.0, 47.0, 24.0, 21.0, 18.0, 15.0, 11.0, 7.0, 3.0, 4.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.028106689453125, -0.02731633186340332, -0.02652597427368164, -0.02573561668395996, -0.02494525909423828, -0.0241549015045166, -0.023364543914794922, -0.022574186325073242, -0.021783828735351562, -0.020993471145629883, -0.020203113555908203, -0.019412755966186523, -0.018622398376464844, -0.017832040786743164, -0.017041683197021484, -0.016251325607299805, -0.015460968017578125, -0.014670610427856445, -0.013880252838134766, -0.013089895248413086, -0.012299537658691406, -0.011509180068969727, -0.010718822479248047, -0.009928464889526367, -0.009138107299804688, -0.008347749710083008, -0.007557392120361328, -0.0067670345306396484, -0.005976676940917969, -0.005186319351196289, -0.004395961761474609, -0.0036056041717529297, -0.00281524658203125, -0.0020248889923095703, -0.0012345314025878906, -0.00044417381286621094, 0.00034618377685546875, 0.0011365413665771484, 0.0019268989562988281, 0.002717256546020508, 0.0035076141357421875, 0.004297971725463867, 0.005088329315185547, 0.0058786869049072266, 0.006669044494628906, 0.007459402084350586, 0.008249759674072266, 0.009040117263793945, 0.009830474853515625, 0.010620832443237305, 0.011411190032958984, 0.012201547622680664, 0.012991905212402344, 0.013782262802124023, 0.014572620391845703, 0.015362977981567383, 0.016153335571289062, 0.016943693161010742, 0.017734050750732422, 0.0185244083404541, 0.01931476593017578, 0.02010512351989746, 0.02089548110961914, 0.02168583869934082, 0.0224761962890625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 1.0, 2.0, 3.0, 6.0, 5.0, 16.0, 13.0, 9.0, 26.0, 36.0, 39.0, 65.0, 48.0, 55.0, 75.0, 83.0, 67.0, 87.0, 81.0, 54.0, 44.0, 41.0, 33.0, 23.0, 23.0, 13.0, 16.0, 6.0, 5.0, 6.0, 6.0, 5.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.2814998626708984e-05, -1.2401491403579712e-05, -1.198798418045044e-05, -1.1574476957321167e-05, -1.1160969734191895e-05, -1.0747462511062622e-05, -1.033395528793335e-05, -9.920448064804077e-06, -9.506940841674805e-06, -9.093433618545532e-06, -8.67992639541626e-06, -8.266419172286987e-06, -7.852911949157715e-06, -7.439404726028442e-06, -7.02589750289917e-06, -6.6123902797698975e-06, -6.198883056640625e-06, -5.7853758335113525e-06, -5.37186861038208e-06, -4.958361387252808e-06, -4.544854164123535e-06, -4.131346940994263e-06, -3.7178397178649902e-06, -3.3043324947357178e-06, -2.8908252716064453e-06, -2.477318048477173e-06, -2.0638108253479004e-06, -1.650303602218628e-06, -1.2367963790893555e-06, -8.23289155960083e-07, -4.0978193283081055e-07, 3.725290298461914e-09, 4.172325134277344e-07, 8.307397365570068e-07, 1.2442469596862793e-06, 1.6577541828155518e-06, 2.0712614059448242e-06, 2.4847686290740967e-06, 2.898275852203369e-06, 3.3117830753326416e-06, 3.725290298461914e-06, 4.1387975215911865e-06, 4.552304744720459e-06, 4.9658119678497314e-06, 5.379319190979004e-06, 5.792826414108276e-06, 6.206333637237549e-06, 6.619840860366821e-06, 7.033348083496094e-06, 7.446855306625366e-06, 7.860362529754639e-06, 8.273869752883911e-06, 8.687376976013184e-06, 9.100884199142456e-06, 9.514391422271729e-06, 9.927898645401001e-06, 1.0341405868530273e-05, 1.0754913091659546e-05, 1.1168420314788818e-05, 1.158192753791809e-05, 1.1995434761047363e-05, 1.2408941984176636e-05, 1.2822449207305908e-05, 1.323595643043518e-05, 1.3649463653564453e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 8.0, 11.0, 9.0, 12.0, 16.0, 29.0, 48.0, 92.0, 140.0, 302.0, 547.0, 1091.0, 2500.0, 5714.0, 16578.0, 52568.0, 183045.0, 460809.0, 227976.0, 64904.0, 20045.0, 6893.0, 2614.0, 1249.0, 609.0, 326.0, 167.0, 87.0, 55.0, 35.0, 20.0, 11.0, 11.0, 4.0, 6.0, 7.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.0306243896484375, -0.029738903045654297, -0.028853416442871094, -0.02796792984008789, -0.027082443237304688, -0.026196956634521484, -0.02531147003173828, -0.024425983428955078, -0.023540496826171875, -0.022655010223388672, -0.02176952362060547, -0.020884037017822266, -0.019998550415039062, -0.01911306381225586, -0.018227577209472656, -0.017342090606689453, -0.01645660400390625, -0.015571117401123047, -0.014685630798339844, -0.01380014419555664, -0.012914657592773438, -0.012029170989990234, -0.011143684387207031, -0.010258197784423828, -0.009372711181640625, -0.008487224578857422, -0.007601737976074219, -0.006716251373291016, -0.0058307647705078125, -0.004945278167724609, -0.004059791564941406, -0.003174304962158203, -0.002288818359375, -0.0014033317565917969, -0.0005178451538085938, 0.0003676414489746094, 0.0012531280517578125, 0.0021386146545410156, 0.0030241012573242188, 0.003909587860107422, 0.004795074462890625, 0.005680561065673828, 0.006566047668457031, 0.007451534271240234, 0.008337020874023438, 0.00922250747680664, 0.010107994079589844, 0.010993480682373047, 0.01187896728515625, 0.012764453887939453, 0.013649940490722656, 0.01453542709350586, 0.015420913696289062, 0.016306400299072266, 0.01719188690185547, 0.018077373504638672, 0.018962860107421875, 0.019848346710205078, 0.02073383331298828, 0.021619319915771484, 0.022504806518554688, 0.02339029312133789, 0.024275779724121094, 0.025161266326904297, 0.0260467529296875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 3.0, 4.0, 10.0, 14.0, 12.0, 16.0, 30.0, 29.0, 40.0, 53.0, 65.0, 94.0, 112.0, 103.0, 91.0, 77.0, 63.0, 44.0, 47.0, 21.0, 14.0, 14.0, 15.0, 10.0, 6.0, 1.0, 4.0, 1.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.007549285888671875, -0.0072920918464660645, -0.007034897804260254, -0.006777703762054443, -0.006520509719848633, -0.006263315677642822, -0.006006121635437012, -0.005748927593231201, -0.005491733551025391, -0.00523453950881958, -0.0049773454666137695, -0.004720151424407959, -0.0044629573822021484, -0.004205763339996338, -0.003948569297790527, -0.003691375255584717, -0.0034341812133789062, -0.0031769871711730957, -0.002919793128967285, -0.0026625990867614746, -0.002405405044555664, -0.0021482110023498535, -0.001891016960144043, -0.0016338229179382324, -0.0013766288757324219, -0.0011194348335266113, -0.0008622407913208008, -0.0006050467491149902, -0.0003478527069091797, -9.065866470336914e-05, 0.0001665353775024414, 0.00042372941970825195, 0.0006809234619140625, 0.000938117504119873, 0.0011953115463256836, 0.0014525055885314941, 0.0017096996307373047, 0.0019668936729431152, 0.0022240877151489258, 0.0024812817573547363, 0.002738475799560547, 0.0029956698417663574, 0.003252863883972168, 0.0035100579261779785, 0.003767251968383789, 0.0040244460105896, 0.00428164005279541, 0.004538834095001221, 0.004796028137207031, 0.005053222179412842, 0.005310416221618652, 0.005567610263824463, 0.0058248043060302734, 0.006081998348236084, 0.0063391923904418945, 0.006596386432647705, 0.006853580474853516, 0.007110774517059326, 0.007367968559265137, 0.007625162601470947, 0.007882356643676758, 0.008139550685882568, 0.008396744728088379, 0.00865393877029419, 0.0089111328125]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 3.0, 8.0, 12.0, 8.0, 18.0, 27.0, 30.0, 52.0, 83.0, 80.0, 89.0, 120.0, 104.0, 80.0, 74.0, 59.0, 31.0, 36.0, 29.0, 19.0, 11.0, 7.0, 11.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31619158387184143, -0.30709975957870483, -0.29800793528556824, -0.28891611099243164, -0.27982431650161743, -0.27073249220848083, -0.26164066791534424, -0.25254884362220764, -0.24345701932907104, -0.23436519503593445, -0.22527338564395905, -0.21618156135082245, -0.20708973705768585, -0.19799792766571045, -0.18890610337257385, -0.17981427907943726, -0.17072246968746185, -0.16163064539432526, -0.15253883600234985, -0.14344701170921326, -0.13435518741607666, -0.12526336312294006, -0.11617155373096466, -0.10707972943782806, -0.09798791259527206, -0.08889609575271606, -0.07980427145957947, -0.07071245461702347, -0.06162063404917717, -0.05252881348133087, -0.04343699663877487, -0.034345172345638275, -0.025253355503082275, -0.016161534935235977, -0.007069716230034828, 0.002022102475166321, 0.011113923043012619, 0.020205743610858917, 0.029297560453414917, 0.038389384746551514, 0.04748120158910751, 0.05657302215695381, 0.06566484272480011, 0.07475665956735611, 0.08384847640991211, 0.0929403007030487, 0.1020321175456047, 0.1111239418387413, 0.1202157586812973, 0.1293075829744339, 0.1383993923664093, 0.1474912166595459, 0.1565830409526825, 0.1656748652458191, 0.1747666746377945, 0.1838584989309311, 0.1929503083229065, 0.2020421326160431, 0.2111339420080185, 0.2202257663011551, 0.2293175905942917, 0.2384093999862671, 0.2475012242794037, 0.2565930485725403, 0.2656848728656769]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 6.0, 8.0, 10.0, 5.0, 8.0, 10.0, 9.0, 13.0, 18.0, 14.0, 29.0, 25.0, 32.0, 22.0, 47.0, 29.0, 48.0, 30.0, 37.0, 38.0, 39.0, 50.0, 50.0, 46.0, 44.0, 48.0, 40.0, 38.0, 29.0, 24.0, 20.0, 21.0, 17.0, 17.0, 24.0, 18.0, 18.0, 7.0, 4.0, 6.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15941950678825378, -0.15409605205059052, -0.14877258241176605, -0.14344912767410278, -0.13812565803527832, -0.13280220329761505, -0.12747874855995178, -0.12215527892112732, -0.11683181673288345, -0.11150835454463959, -0.10618489235639572, -0.10086143016815186, -0.09553797543048859, -0.09021450579166412, -0.08489105105400085, -0.07956758886575699, -0.07424412667751312, -0.06892066448926926, -0.06359720230102539, -0.05827374383807182, -0.05295028164982796, -0.04762681946158409, -0.042303360998630524, -0.03697989881038666, -0.03165643662214279, -0.026332974433898926, -0.02100951410830021, -0.015686053782701492, -0.010362591594457626, -0.00503912940621376, 0.00028432905673980713, 0.005607791244983673, 0.010931238532066345, 0.01625470072031021, 0.021578161045908928, 0.026901621371507645, 0.03222508355975151, 0.03754854574799538, 0.042872004210948944, 0.04819546639919281, 0.053518928587436676, 0.05884239077568054, 0.06416585296392441, 0.06948931515216827, 0.07481276988983154, 0.080136239528656, 0.08545969426631927, 0.09078315645456314, 0.096106618642807, 0.10143008083105087, 0.10675354301929474, 0.11207699775695801, 0.11740046739578247, 0.12272392213344574, 0.128047376871109, 0.13337084650993347, 0.13869431614875793, 0.1440177708864212, 0.14934124052524567, 0.15466469526290894, 0.1599881649017334, 0.16531161963939667, 0.17063507437705994, 0.1759585440158844, 0.18128199875354767]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 2.0, 4.0, 3.0, 5.0, 8.0, 10.0, 21.0, 26.0, 31.0, 38.0, 67.0, 92.0, 126.0, 192.0, 279.0, 412.0, 559.0, 955.0, 1229.0, 2072.0, 3285.0, 5434.0, 9539.0, 17843.0, 37756.0, 98952.0, 332636.0, 350769.0, 103498.0, 39110.0, 18481.0, 9695.0, 5733.0, 3393.0, 2126.0, 1373.0, 892.0, 611.0, 396.0, 297.0, 196.0, 139.0, 80.0, 66.0, 41.0, 33.0, 14.0, 8.0, 7.0, 9.0, 7.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 2.0], "bins": [-0.2291259765625, -0.2214946746826172, -0.21386337280273438, -0.20623207092285156, -0.19860076904296875, -0.19096946716308594, -0.18333816528320312, -0.1757068634033203, -0.1680755615234375, -0.1604442596435547, -0.15281295776367188, -0.14518165588378906, -0.13755035400390625, -0.12991905212402344, -0.12228775024414062, -0.11465644836425781, -0.107025146484375, -0.09939384460449219, -0.09176254272460938, -0.08413124084472656, -0.07649993896484375, -0.06886863708496094, -0.061237335205078125, -0.05360603332519531, -0.0459747314453125, -0.03834342956542969, -0.030712127685546875, -0.023080825805664062, -0.01544952392578125, -0.007818222045898438, -0.000186920166015625, 0.0074443817138671875, 0.01507568359375, 0.022706985473632812, 0.030338287353515625, 0.03796958923339844, 0.04560089111328125, 0.05323219299316406, 0.060863494873046875, 0.06849479675292969, 0.0761260986328125, 0.08375740051269531, 0.09138870239257812, 0.09902000427246094, 0.10665130615234375, 0.11428260803222656, 0.12191390991210938, 0.1295452117919922, 0.137176513671875, 0.1448078155517578, 0.15243911743164062, 0.16007041931152344, 0.16770172119140625, 0.17533302307128906, 0.18296432495117188, 0.1905956268310547, 0.1982269287109375, 0.2058582305908203, 0.21348953247070312, 0.22112083435058594, 0.22875213623046875, 0.23638343811035156, 0.24401473999023438, 0.2516460418701172, 0.25927734375]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 6.0, 3.0, 7.0, 6.0, 7.0, 9.0, 8.0, 11.0, 8.0, 10.0, 17.0, 19.0, 28.0, 25.0, 28.0, 34.0, 27.0, 38.0, 36.0, 38.0, 42.0, 49.0, 44.0, 43.0, 35.0, 50.0, 43.0, 33.0, 28.0, 40.0, 26.0, 27.0, 24.0, 17.0, 27.0, 18.0, 17.0, 14.0, 17.0, 13.0, 13.0, 8.0, 3.0, 4.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29150390625, -0.28211212158203125, -0.2727203369140625, -0.26332855224609375, -0.253936767578125, -0.24454498291015625, -0.2351531982421875, -0.22576141357421875, -0.21636962890625, -0.20697784423828125, -0.1975860595703125, -0.18819427490234375, -0.178802490234375, -0.16941070556640625, -0.1600189208984375, -0.15062713623046875, -0.1412353515625, -0.13184356689453125, -0.1224517822265625, -0.11305999755859375, -0.103668212890625, -0.09427642822265625, -0.0848846435546875, -0.07549285888671875, -0.06610107421875, -0.05670928955078125, -0.0473175048828125, -0.03792572021484375, -0.028533935546875, -0.01914215087890625, -0.0097503662109375, -0.00035858154296875, 0.009033203125, 0.01842498779296875, 0.0278167724609375, 0.03720855712890625, 0.046600341796875, 0.05599212646484375, 0.0653839111328125, 0.07477569580078125, 0.08416748046875, 0.09355926513671875, 0.1029510498046875, 0.11234283447265625, 0.121734619140625, 0.13112640380859375, 0.1405181884765625, 0.14990997314453125, 0.1593017578125, 0.16869354248046875, 0.1780853271484375, 0.18747711181640625, 0.196868896484375, 0.20626068115234375, 0.2156524658203125, 0.22504425048828125, 0.23443603515625, 0.24382781982421875, 0.2532196044921875, 0.26261138916015625, 0.272003173828125, 0.28139495849609375, 0.2907867431640625, 0.30017852783203125, 0.3095703125]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 8.0, 9.0, 13.0, 9.0, 30.0, 41.0, 47.0, 80.0, 209.0, 374.0, 986.0, 2769.0, 10725.0, 59047.0, 738203.0, 204538.0, 23325.0, 5326.0, 1625.0, 590.0, 270.0, 131.0, 78.0, 44.0, 33.0, 15.0, 13.0, 5.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0], "bins": [-0.7890625, -0.7706031799316406, -0.7521438598632812, -0.7336845397949219, -0.7152252197265625, -0.6967658996582031, -0.6783065795898438, -0.6598472595214844, -0.641387939453125, -0.6229286193847656, -0.6044692993164062, -0.5860099792480469, -0.5675506591796875, -0.5490913391113281, -0.5306320190429688, -0.5121726989746094, -0.49371337890625, -0.4752540588378906, -0.45679473876953125, -0.4383354187011719, -0.4198760986328125, -0.4014167785644531, -0.38295745849609375, -0.3644981384277344, -0.346038818359375, -0.3275794982910156, -0.30912017822265625, -0.2906608581542969, -0.2722015380859375, -0.2537422180175781, -0.23528289794921875, -0.21682357788085938, -0.1983642578125, -0.17990493774414062, -0.16144561767578125, -0.14298629760742188, -0.1245269775390625, -0.10606765747070312, -0.08760833740234375, -0.06914901733398438, -0.050689697265625, -0.032230377197265625, -0.01377105712890625, 0.004688262939453125, 0.0231475830078125, 0.041606903076171875, 0.06006622314453125, 0.07852554321289062, 0.09698486328125, 0.11544418334960938, 0.13390350341796875, 0.15236282348632812, 0.1708221435546875, 0.18928146362304688, 0.20774078369140625, 0.22620010375976562, 0.244659423828125, 0.2631187438964844, 0.28157806396484375, 0.3000373840332031, 0.3184967041015625, 0.3369560241699219, 0.35541534423828125, 0.3738746643066406, 0.392333984375]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 5.0, 7.0, 5.0, 10.0, 5.0, 12.0, 12.0, 18.0, 20.0, 24.0, 34.0, 35.0, 37.0, 50.0, 49.0, 49.0, 51.0, 62.0, 62.0, 58.0, 44.0, 56.0, 41.0, 39.0, 29.0, 42.0, 22.0, 24.0, 28.0, 17.0, 8.0, 8.0, 7.0, 8.0, 2.0, 9.0, 3.0, 3.0, 5.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.447021484375, -0.4337730407714844, -0.42052459716796875, -0.4072761535644531, -0.3940277099609375, -0.3807792663574219, -0.36753082275390625, -0.3542823791503906, -0.341033935546875, -0.3277854919433594, -0.31453704833984375, -0.3012886047363281, -0.2880401611328125, -0.2747917175292969, -0.26154327392578125, -0.24829483032226562, -0.23504638671875, -0.22179794311523438, -0.20854949951171875, -0.19530105590820312, -0.1820526123046875, -0.16880416870117188, -0.15555572509765625, -0.14230728149414062, -0.129058837890625, -0.11581039428710938, -0.10256195068359375, -0.08931350708007812, -0.0760650634765625, -0.06281661987304688, -0.04956817626953125, -0.036319732666015625, -0.0230712890625, -0.009822845458984375, 0.00342559814453125, 0.016674041748046875, 0.0299224853515625, 0.043170928955078125, 0.05641937255859375, 0.06966781616210938, 0.082916259765625, 0.09616470336914062, 0.10941314697265625, 0.12266159057617188, 0.1359100341796875, 0.14915847778320312, 0.16240692138671875, 0.17565536499023438, 0.18890380859375, 0.20215225219726562, 0.21540069580078125, 0.22864913940429688, 0.2418975830078125, 0.2551460266113281, 0.26839447021484375, 0.2816429138183594, 0.294891357421875, 0.3081398010253906, 0.32138824462890625, 0.3346366882324219, 0.3478851318359375, 0.3611335754394531, 0.37438201904296875, 0.3876304626464844, 0.40087890625]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 0.0, 2.0, 3.0, 7.0, 8.0, 18.0, 22.0, 42.0, 101.0, 313.0, 1078.0, 4737.0, 44120.0, 875103.0, 113020.0, 7707.0, 1562.0, 434.0, 149.0, 42.0, 23.0, 19.0, 6.0, 6.0, 7.0, 2.0, 6.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.2685546875, -0.26141929626464844, -0.2542839050292969, -0.2471485137939453, -0.24001312255859375, -0.2328777313232422, -0.22574234008789062, -0.21860694885253906, -0.2114715576171875, -0.20433616638183594, -0.19720077514648438, -0.1900653839111328, -0.18292999267578125, -0.1757946014404297, -0.16865921020507812, -0.16152381896972656, -0.154388427734375, -0.14725303649902344, -0.14011764526367188, -0.1329822540283203, -0.12584686279296875, -0.11871147155761719, -0.11157608032226562, -0.10444068908691406, -0.0973052978515625, -0.09016990661621094, -0.08303451538085938, -0.07589912414550781, -0.06876373291015625, -0.06162834167480469, -0.054492950439453125, -0.04735755920410156, -0.04022216796875, -0.03308677673339844, -0.025951385498046875, -0.018815994262695312, -0.01168060302734375, -0.0045452117919921875, 0.002590179443359375, 0.009725570678710938, 0.0168609619140625, 0.023996353149414062, 0.031131744384765625, 0.03826713562011719, 0.04540252685546875, 0.05253791809082031, 0.059673309326171875, 0.06680870056152344, 0.073944091796875, 0.08107948303222656, 0.08821487426757812, 0.09535026550292969, 0.10248565673828125, 0.10962104797363281, 0.11675643920898438, 0.12389183044433594, 0.1310272216796875, 0.13816261291503906, 0.14529800415039062, 0.1524333953857422, 0.15956878662109375, 0.1667041778564453, 0.17383956909179688, 0.18097496032714844, 0.1881103515625]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 5.0, 12.0, 7.0, 17.0, 24.0, 27.0, 38.0, 39.0, 46.0, 85.0, 97.0, 100.0, 109.0, 92.0, 71.0, 47.0, 48.0, 37.0, 25.0, 16.0, 12.0, 10.0, 2.0, 4.0, 8.0, 6.0, 1.0, 4.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6689300537109375e-05, -1.621432602405548e-05, -1.5739351511001587e-05, -1.5264376997947693e-05, -1.4789402484893799e-05, -1.4314427971839905e-05, -1.383945345878601e-05, -1.3364478945732117e-05, -1.2889504432678223e-05, -1.2414529919624329e-05, -1.1939555406570435e-05, -1.146458089351654e-05, -1.0989606380462646e-05, -1.0514631867408752e-05, -1.0039657354354858e-05, -9.564682841300964e-06, -9.08970832824707e-06, -8.614733815193176e-06, -8.139759302139282e-06, -7.664784789085388e-06, -7.189810276031494e-06, -6.7148357629776e-06, -6.239861249923706e-06, -5.764886736869812e-06, -5.289912223815918e-06, -4.814937710762024e-06, -4.33996319770813e-06, -3.864988684654236e-06, -3.390014171600342e-06, -2.9150396585464478e-06, -2.4400651454925537e-06, -1.9650906324386597e-06, -1.4901161193847656e-06, -1.0151416063308716e-06, -5.401670932769775e-07, -6.51925802230835e-08, 4.0978193283081055e-07, 8.847564458847046e-07, 1.3597309589385986e-06, 1.8347054719924927e-06, 2.3096799850463867e-06, 2.7846544981002808e-06, 3.259629011154175e-06, 3.734603524208069e-06, 4.209578037261963e-06, 4.684552550315857e-06, 5.159527063369751e-06, 5.634501576423645e-06, 6.109476089477539e-06, 6.584450602531433e-06, 7.059425115585327e-06, 7.534399628639221e-06, 8.009374141693115e-06, 8.48434865474701e-06, 8.959323167800903e-06, 9.434297680854797e-06, 9.909272193908691e-06, 1.0384246706962585e-05, 1.085922122001648e-05, 1.1334195733070374e-05, 1.1809170246124268e-05, 1.2284144759178162e-05, 1.2759119272232056e-05, 1.323409378528595e-05, 1.3709068298339844e-05]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 3.0, 4.0, 0.0, 2.0, 3.0, 1.0, 9.0, 12.0, 16.0, 19.0, 23.0, 47.0, 111.0, 207.0, 578.0, 1586.0, 4970.0, 24939.0, 241600.0, 683829.0, 75427.0, 10838.0, 2697.0, 953.0, 339.0, 162.0, 71.0, 38.0, 23.0, 20.0, 12.0, 11.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.158447265625, -0.1532115936279297, -0.14797592163085938, -0.14274024963378906, -0.13750457763671875, -0.13226890563964844, -0.12703323364257812, -0.12179756164550781, -0.1165618896484375, -0.11132621765136719, -0.10609054565429688, -0.10085487365722656, -0.09561920166015625, -0.09038352966308594, -0.08514785766601562, -0.07991218566894531, -0.074676513671875, -0.06944084167480469, -0.06420516967773438, -0.05896949768066406, -0.05373382568359375, -0.04849815368652344, -0.043262481689453125, -0.03802680969238281, -0.0327911376953125, -0.027555465698242188, -0.022319793701171875, -0.017084121704101562, -0.01184844970703125, -0.0066127777099609375, -0.001377105712890625, 0.0038585662841796875, 0.00909423828125, 0.014329910278320312, 0.019565582275390625, 0.024801254272460938, 0.03003692626953125, 0.03527259826660156, 0.040508270263671875, 0.04574394226074219, 0.0509796142578125, 0.05621528625488281, 0.061450958251953125, 0.06668663024902344, 0.07192230224609375, 0.07715797424316406, 0.08239364624023438, 0.08762931823730469, 0.092864990234375, 0.09810066223144531, 0.10333633422851562, 0.10857200622558594, 0.11380767822265625, 0.11904335021972656, 0.12427902221679688, 0.1295146942138672, 0.1347503662109375, 0.1399860382080078, 0.14522171020507812, 0.15045738220214844, 0.15569305419921875, 0.16092872619628906, 0.16616439819335938, 0.1714000701904297, 0.1766357421875]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 4.0, 9.0, 10.0, 16.0, 22.0, 34.0, 37.0, 60.0, 75.0, 89.0, 133.0, 136.0, 109.0, 72.0, 54.0, 45.0, 23.0, 22.0, 16.0, 9.0, 8.0, 7.0, 7.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.078369140625, -0.07599067687988281, -0.07361221313476562, -0.07123374938964844, -0.06885528564453125, -0.06647682189941406, -0.06409835815429688, -0.06171989440917969, -0.0593414306640625, -0.05696296691894531, -0.054584503173828125, -0.05220603942871094, -0.04982757568359375, -0.04744911193847656, -0.045070648193359375, -0.04269218444824219, -0.040313720703125, -0.03793525695800781, -0.035556793212890625, -0.03317832946777344, -0.03079986572265625, -0.028421401977539062, -0.026042938232421875, -0.023664474487304688, -0.0212860107421875, -0.018907546997070312, -0.016529083251953125, -0.014150619506835938, -0.01177215576171875, -0.009393692016601562, -0.007015228271484375, -0.0046367645263671875, -0.00225830078125, 0.0001201629638671875, 0.002498626708984375, 0.0048770904541015625, 0.00725555419921875, 0.009634017944335938, 0.012012481689453125, 0.014390945434570312, 0.0167694091796875, 0.019147872924804688, 0.021526336669921875, 0.023904800415039062, 0.02628326416015625, 0.028661727905273438, 0.031040191650390625, 0.03341865539550781, 0.035797119140625, 0.03817558288574219, 0.040554046630859375, 0.04293251037597656, 0.04531097412109375, 0.04768943786621094, 0.050067901611328125, 0.05244636535644531, 0.0548248291015625, 0.05720329284667969, 0.059581756591796875, 0.06196022033691406, 0.06433868408203125, 0.06671714782714844, 0.06909561157226562, 0.07147407531738281, 0.0738525390625]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 5.0, 6.0, 16.0, 27.0, 64.0, 93.0, 156.0, 198.0, 170.0, 121.0, 84.0, 40.0, 21.0, 10.0, 2.0, 0.0, 1.0], "bins": [-1.9552181959152222, -1.9194824695587158, -1.8837467432022095, -1.8480111360549927, -1.8122754096984863, -1.77653968334198, -1.7408039569854736, -1.7050682306289673, -1.669332504272461, -1.6335967779159546, -1.5978610515594482, -1.5621254444122314, -1.526389718055725, -1.4906539916992188, -1.4549182653427124, -1.419182538986206, -1.3834469318389893, -1.347711205482483, -1.3119754791259766, -1.2762398719787598, -1.2405041456222534, -1.204768419265747, -1.1690326929092407, -1.1332969665527344, -1.0975613594055176, -1.0618256330490112, -1.0260899066925049, -0.9903542399406433, -0.9546185731887817, -0.9188828468322754, -0.883147120475769, -0.8474113941192627, -0.8116756081581116, -0.7759398818016052, -0.7402042150497437, -0.7044684886932373, -0.668732762336731, -0.6329970955848694, -0.597261369228363, -0.5615257024765015, -0.5257899761199951, -0.49005427956581116, -0.4543185830116272, -0.41858285665512085, -0.3828471601009369, -0.34711146354675293, -0.3113757371902466, -0.2756400406360626, -0.23990434408187866, -0.2041686475276947, -0.16843293607234955, -0.1326972246170044, -0.09696152806282043, -0.061225831508636475, -0.02549012005329132, 0.010245591402053833, 0.04598128795623779, 0.08171699196100235, 0.1174526959657669, 0.15318840742111206, 0.18892410397529602, 0.22465980052947998, 0.26039552688598633, 0.2961312234401703, 0.33186691999435425]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 2.0, 2.0, 8.0, 7.0, 5.0, 11.0, 9.0, 9.0, 14.0, 9.0, 24.0, 32.0, 30.0, 27.0, 37.0, 29.0, 34.0, 33.0, 43.0, 33.0, 45.0, 51.0, 41.0, 43.0, 34.0, 41.0, 40.0, 41.0, 36.0, 31.0, 31.0, 28.0, 26.0, 20.0, 20.0, 13.0, 7.0, 11.0, 14.0, 8.0, 8.0, 2.0, 6.0, 6.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.5767304301261902, -0.5587364435195923, -0.5407424569129944, -0.5227484703063965, -0.5047544836997986, -0.48676052689552307, -0.46876654028892517, -0.45077258348464966, -0.43277859687805176, -0.41478461027145386, -0.39679062366485596, -0.37879663705825806, -0.36080268025398254, -0.34280869364738464, -0.32481470704078674, -0.30682075023651123, -0.28882673382759094, -0.27083274722099304, -0.25283876061439514, -0.23484478890895844, -0.21685081720352173, -0.19885683059692383, -0.18086284399032593, -0.16286887228488922, -0.14487488567829132, -0.12688089907169342, -0.10888692736625671, -0.09089294075965881, -0.07289896160364151, -0.05490498244762421, -0.036910995841026306, -0.0189170241355896, -0.0009230375289916992, 0.017070943489670753, 0.035064924508333206, 0.05305890738964081, 0.07105288654565811, 0.08904686570167542, 0.10704085230827332, 0.12503482401371002, 0.14302881062030792, 0.16102279722690582, 0.17901676893234253, 0.19701075553894043, 0.21500474214553833, 0.23299871385097504, 0.25099271535873413, 0.26898667216300964, 0.28698065876960754, 0.30497464537620544, 0.32296863198280334, 0.34096258878707886, 0.35895657539367676, 0.37695056200027466, 0.39494454860687256, 0.41293853521347046, 0.43093252182006836, 0.44892650842666626, 0.46692049503326416, 0.48491448163986206, 0.50290846824646, 0.5209023952484131, 0.5388964414596558, 0.5568903684616089, 0.5748843550682068]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 5.0, 11.0, 7.0, 9.0, 21.0, 19.0, 27.0, 46.0, 59.0, 80.0, 130.0, 187.0, 304.0, 498.0, 863.0, 1676.0, 3321.0, 7120.0, 18196.0, 87809.0, 971998.0, 2654493.0, 381211.0, 42885.0, 12190.0, 5097.0, 2583.0, 1400.0, 745.0, 417.0, 291.0, 175.0, 135.0, 106.0, 51.0, 36.0, 24.0, 14.0, 13.0, 9.0, 9.0, 9.0, 5.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.403076171875, -0.39166259765625, -0.3802490234375, -0.36883544921875, -0.357421875, -0.34600830078125, -0.3345947265625, -0.32318115234375, -0.311767578125, -0.30035400390625, -0.2889404296875, -0.27752685546875, -0.26611328125, -0.25469970703125, -0.2432861328125, -0.23187255859375, -0.220458984375, -0.20904541015625, -0.1976318359375, -0.18621826171875, -0.1748046875, -0.16339111328125, -0.1519775390625, -0.14056396484375, -0.129150390625, -0.11773681640625, -0.1063232421875, -0.09490966796875, -0.08349609375, -0.07208251953125, -0.0606689453125, -0.04925537109375, -0.037841796875, -0.02642822265625, -0.0150146484375, -0.00360107421875, 0.0078125, 0.01922607421875, 0.0306396484375, 0.04205322265625, 0.053466796875, 0.06488037109375, 0.0762939453125, 0.08770751953125, 0.09912109375, 0.11053466796875, 0.1219482421875, 0.13336181640625, 0.144775390625, 0.15618896484375, 0.1676025390625, 0.17901611328125, 0.1904296875, 0.20184326171875, 0.2132568359375, 0.22467041015625, 0.236083984375, 0.24749755859375, 0.2589111328125, 0.27032470703125, 0.28173828125, 0.29315185546875, 0.3045654296875, 0.31597900390625, 0.327392578125]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 3.0, 6.0, 2.0, 4.0, 7.0, 6.0, 8.0, 22.0, 11.0, 15.0, 19.0, 25.0, 30.0, 23.0, 32.0, 37.0, 34.0, 34.0, 34.0, 41.0, 48.0, 43.0, 38.0, 45.0, 45.0, 31.0, 29.0, 42.0, 33.0, 35.0, 32.0, 24.0, 28.0, 19.0, 22.0, 12.0, 16.0, 10.0, 11.0, 10.0, 8.0, 8.0, 8.0, 3.0, 3.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.1927490234375, -0.18700408935546875, -0.1812591552734375, -0.17551422119140625, -0.169769287109375, -0.16402435302734375, -0.1582794189453125, -0.15253448486328125, -0.14678955078125, -0.14104461669921875, -0.1352996826171875, -0.12955474853515625, -0.123809814453125, -0.11806488037109375, -0.1123199462890625, -0.10657501220703125, -0.100830078125, -0.09508514404296875, -0.0893402099609375, -0.08359527587890625, -0.077850341796875, -0.07210540771484375, -0.0663604736328125, -0.06061553955078125, -0.05487060546875, -0.04912567138671875, -0.0433807373046875, -0.03763580322265625, -0.031890869140625, -0.02614593505859375, -0.0204010009765625, -0.01465606689453125, -0.0089111328125, -0.00316619873046875, 0.0025787353515625, 0.00832366943359375, 0.014068603515625, 0.01981353759765625, 0.0255584716796875, 0.03130340576171875, 0.03704833984375, 0.04279327392578125, 0.0485382080078125, 0.05428314208984375, 0.060028076171875, 0.06577301025390625, 0.0715179443359375, 0.07726287841796875, 0.0830078125, 0.08875274658203125, 0.0944976806640625, 0.10024261474609375, 0.105987548828125, 0.11173248291015625, 0.1174774169921875, 0.12322235107421875, 0.12896728515625, 0.13471221923828125, 0.1404571533203125, 0.14620208740234375, 0.151947021484375, 0.15769195556640625, 0.1634368896484375, 0.16918182373046875, 0.1749267578125]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 0.0, 3.0, 9.0, 5.0, 10.0, 9.0, 12.0, 21.0, 39.0, 65.0, 97.0, 185.0, 500.0, 1943.0, 10580.0, 150557.0, 3920113.0, 98988.0, 8557.0, 1668.0, 488.0, 191.0, 100.0, 44.0, 33.0, 26.0, 12.0, 7.0, 6.0, 1.0, 5.0, 1.0, 3.0, 2.0, 1.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.708984375, -0.6821746826171875, -0.655364990234375, -0.6285552978515625, -0.60174560546875, -0.5749359130859375, -0.548126220703125, -0.5213165283203125, -0.4945068359375, -0.4676971435546875, -0.440887451171875, -0.4140777587890625, -0.38726806640625, -0.3604583740234375, -0.333648681640625, -0.3068389892578125, -0.280029296875, -0.2532196044921875, -0.226409912109375, -0.1996002197265625, -0.17279052734375, -0.1459808349609375, -0.119171142578125, -0.0923614501953125, -0.0655517578125, -0.0387420654296875, -0.011932373046875, 0.0148773193359375, 0.04168701171875, 0.0684967041015625, 0.095306396484375, 0.1221160888671875, 0.14892578125, 0.1757354736328125, 0.202545166015625, 0.2293548583984375, 0.25616455078125, 0.2829742431640625, 0.309783935546875, 0.3365936279296875, 0.3634033203125, 0.3902130126953125, 0.417022705078125, 0.4438323974609375, 0.47064208984375, 0.4974517822265625, 0.524261474609375, 0.5510711669921875, 0.577880859375, 0.6046905517578125, 0.631500244140625, 0.6583099365234375, 0.68511962890625, 0.7119293212890625, 0.738739013671875, 0.7655487060546875, 0.7923583984375, 0.8191680908203125, 0.845977783203125, 0.8727874755859375, 0.89959716796875, 0.9264068603515625, 0.953216552734375, 0.9800262451171875, 1.0068359375]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 6.0, 2.0, 7.0, 14.0, 11.0, 15.0, 30.0, 40.0, 71.0, 108.0, 214.0, 417.0, 621.0, 831.0, 695.0, 416.0, 258.0, 122.0, 62.0, 31.0, 34.0, 19.0, 16.0, 12.0, 11.0, 4.0, 3.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.231201171875, -0.22589588165283203, -0.22059059143066406, -0.2152853012084961, -0.20998001098632812, -0.20467472076416016, -0.1993694305419922, -0.19406414031982422, -0.18875885009765625, -0.18345355987548828, -0.1781482696533203, -0.17284297943115234, -0.16753768920898438, -0.1622323989868164, -0.15692710876464844, -0.15162181854248047, -0.1463165283203125, -0.14101123809814453, -0.13570594787597656, -0.1304006576538086, -0.12509536743164062, -0.11979007720947266, -0.11448478698730469, -0.10917949676513672, -0.10387420654296875, -0.09856891632080078, -0.09326362609863281, -0.08795833587646484, -0.08265304565429688, -0.0773477554321289, -0.07204246520996094, -0.06673717498779297, -0.061431884765625, -0.05612659454345703, -0.05082130432128906, -0.045516014099121094, -0.040210723876953125, -0.034905433654785156, -0.029600143432617188, -0.02429485321044922, -0.01898956298828125, -0.013684272766113281, -0.008378982543945312, -0.0030736923217773438, 0.002231597900390625, 0.007536888122558594, 0.012842178344726562, 0.01814746856689453, 0.0234527587890625, 0.02875804901123047, 0.03406333923339844, 0.039368629455566406, 0.044673919677734375, 0.049979209899902344, 0.05528450012207031, 0.06058979034423828, 0.06589508056640625, 0.07120037078857422, 0.07650566101074219, 0.08181095123291016, 0.08711624145507812, 0.0924215316772461, 0.09772682189941406, 0.10303211212158203, 0.10833740234375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 5.0, 2.0, 6.0, 6.0, 6.0, 11.0, 14.0, 20.0, 27.0, 20.0, 24.0, 22.0, 31.0, 48.0, 43.0, 46.0, 58.0, 54.0, 45.0, 65.0, 59.0, 58.0, 41.0, 42.0, 33.0, 43.0, 26.0, 32.0, 24.0, 18.0, 11.0, 10.0, 6.0, 9.0, 5.0, 5.0, 5.0, 4.0, 8.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.2459697276353836, -0.23741993308067322, -0.22887013852596283, -0.22032034397125244, -0.21177054941654205, -0.20322075486183167, -0.19467097520828247, -0.1861211657524109, -0.1775713860988617, -0.1690215915441513, -0.16047179698944092, -0.15192200243473053, -0.14337220788002014, -0.13482241332530975, -0.12627261877059937, -0.11772283166646957, -0.10917302966117859, -0.1006232351064682, -0.09207344055175781, -0.08352364599704742, -0.07497385144233704, -0.06642405688762665, -0.05787426978349686, -0.04932447522878647, -0.04077468067407608, -0.03222488611936569, -0.023675093427300453, -0.015125300735235214, -0.006575506180524826, 0.001974288374185562, 0.010524079203605652, 0.01907387375831604, 0.027623653411865234, 0.03617344796657562, 0.04472324252128601, 0.0532730333507061, 0.06182282790541649, 0.07037262618541718, 0.07892241328954697, 0.08747220784425735, 0.09602200239896774, 0.10457179695367813, 0.11312159150838852, 0.12167137861251831, 0.1302211731672287, 0.1387709677219391, 0.14732076227664948, 0.15587055683135986, 0.16442035138607025, 0.17297014594078064, 0.18151994049549103, 0.19006973505020142, 0.1986195296049118, 0.2071693241596222, 0.2157191038131714, 0.22426891326904297, 0.23281869292259216, 0.24136848747730255, 0.24991828203201294, 0.25846806168556213, 0.2670178711414337, 0.2755676507949829, 0.2841174602508545, 0.2926672399044037, 0.30121704936027527]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 7.0, 3.0, 1.0, 4.0, 4.0, 15.0, 7.0, 13.0, 13.0, 8.0, 19.0, 17.0, 23.0, 30.0, 26.0, 31.0, 30.0, 23.0, 37.0, 33.0, 36.0, 46.0, 44.0, 43.0, 40.0, 28.0, 37.0, 31.0, 40.0, 32.0, 29.0, 32.0, 29.0, 25.0, 32.0, 27.0, 14.0, 21.0, 14.0, 15.0, 8.0, 14.0, 6.0, 7.0, 1.0, 7.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.22759267687797546, -0.2201193869113922, -0.21264611184597015, -0.2051728218793869, -0.19769954681396484, -0.1902262568473816, -0.18275296688079834, -0.17527969181537628, -0.16780640184879303, -0.16033311188220978, -0.15285983681678772, -0.14538654685020447, -0.1379132717847824, -0.13043998181819916, -0.1229666993021965, -0.11549341678619385, -0.10802013427019119, -0.10054685175418854, -0.09307356923818588, -0.08560028672218323, -0.07812699675559998, -0.07065371423959732, -0.06318043172359467, -0.05570714548230171, -0.04823386296629906, -0.0407605804502964, -0.03328729420900345, -0.025814011693000793, -0.01834072731435299, -0.010867442935705185, -0.00339416041970253, 0.004079125821590424, 0.011552408337593079, 0.019025692716240883, 0.026498977094888687, 0.03397225961089134, 0.041445545852184296, 0.04891882836818695, 0.056392110884189606, 0.06386539340019226, 0.07133868336677551, 0.07881196588277817, 0.08628524839878082, 0.09375853836536407, 0.10123182088136673, 0.10870510339736938, 0.11617838591337204, 0.1236516684293747, 0.13112494349479675, 0.13859823346138, 0.14607150852680206, 0.15354479849338531, 0.16101807355880737, 0.16849136352539062, 0.17596465349197388, 0.18343792855739594, 0.1909112185239792, 0.19838450849056244, 0.2058577835559845, 0.21333107352256775, 0.2208043485879898, 0.22827763855457306, 0.23575091361999512, 0.24322420358657837, 0.2506974935531616]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 7.0, 5.0, 9.0, 11.0, 23.0, 28.0, 46.0, 65.0, 90.0, 147.0, 232.0, 347.0, 663.0, 1262.0, 2546.0, 5343.0, 12261.0, 34561.0, 224337.0, 626466.0, 100073.0, 22697.0, 8991.0, 4005.0, 1941.0, 987.0, 551.0, 313.0, 191.0, 99.0, 95.0, 42.0, 30.0, 30.0, 17.0, 11.0, 20.0, 6.0, 3.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1143798828125, -0.1108407974243164, -0.10730171203613281, -0.10376262664794922, -0.10022354125976562, -0.09668445587158203, -0.09314537048339844, -0.08960628509521484, -0.08606719970703125, -0.08252811431884766, -0.07898902893066406, -0.07544994354248047, -0.07191085815429688, -0.06837177276611328, -0.06483268737792969, -0.061293601989746094, -0.0577545166015625, -0.054215431213378906, -0.05067634582519531, -0.04713726043701172, -0.043598175048828125, -0.04005908966064453, -0.03652000427246094, -0.032980918884277344, -0.02944183349609375, -0.025902748107910156, -0.022363662719726562, -0.01882457733154297, -0.015285491943359375, -0.011746406555175781, -0.008207321166992188, -0.004668235778808594, -0.001129150390625, 0.0024099349975585938, 0.0059490203857421875, 0.009488105773925781, 0.013027191162109375, 0.01656627655029297, 0.020105361938476562, 0.023644447326660156, 0.02718353271484375, 0.030722618103027344, 0.03426170349121094, 0.03780078887939453, 0.041339874267578125, 0.04487895965576172, 0.04841804504394531, 0.051957130432128906, 0.0554962158203125, 0.059035301208496094, 0.06257438659667969, 0.06611347198486328, 0.06965255737304688, 0.07319164276123047, 0.07673072814941406, 0.08026981353759766, 0.08380889892578125, 0.08734798431396484, 0.09088706970214844, 0.09442615509033203, 0.09796524047851562, 0.10150432586669922, 0.10504341125488281, 0.1085824966430664, 0.11212158203125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 3.0, 7.0, 3.0, 5.0, 1.0, 6.0, 7.0, 7.0, 10.0, 14.0, 11.0, 23.0, 18.0, 21.0, 28.0, 26.0, 28.0, 26.0, 33.0, 41.0, 36.0, 47.0, 47.0, 35.0, 55.0, 33.0, 50.0, 27.0, 41.0, 31.0, 37.0, 42.0, 22.0, 25.0, 20.0, 23.0, 26.0, 19.0, 18.0, 13.0, 10.0, 12.0, 5.0, 4.0, 9.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1492919921875, -0.14422607421875, -0.13916015625, -0.13409423828125, -0.1290283203125, -0.12396240234375, -0.118896484375, -0.11383056640625, -0.1087646484375, -0.10369873046875, -0.0986328125, -0.09356689453125, -0.0885009765625, -0.08343505859375, -0.078369140625, -0.07330322265625, -0.0682373046875, -0.06317138671875, -0.05810546875, -0.05303955078125, -0.0479736328125, -0.04290771484375, -0.037841796875, -0.03277587890625, -0.0277099609375, -0.02264404296875, -0.017578125, -0.01251220703125, -0.0074462890625, -0.00238037109375, 0.002685546875, 0.00775146484375, 0.0128173828125, 0.01788330078125, 0.02294921875, 0.02801513671875, 0.0330810546875, 0.03814697265625, 0.043212890625, 0.04827880859375, 0.0533447265625, 0.05841064453125, 0.0634765625, 0.06854248046875, 0.0736083984375, 0.07867431640625, 0.083740234375, 0.08880615234375, 0.0938720703125, 0.09893798828125, 0.10400390625, 0.10906982421875, 0.1141357421875, 0.11920166015625, 0.124267578125, 0.12933349609375, 0.1343994140625, 0.13946533203125, 0.14453125, 0.14959716796875, 0.1546630859375, 0.15972900390625, 0.164794921875, 0.16986083984375, 0.1749267578125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 6.0, 6.0, 11.0, 24.0, 51.0, 79.0, 108.0, 223.0, 426.0, 908.0, 2020.0, 5163.0, 15052.0, 53327.0, 279342.0, 530729.0, 118949.0, 27317.0, 8724.0, 3340.0, 1414.0, 639.0, 316.0, 161.0, 96.0, 36.0, 32.0, 28.0, 12.0, 5.0, 5.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09014892578125, -0.0876626968383789, -0.08517646789550781, -0.08269023895263672, -0.08020401000976562, -0.07771778106689453, -0.07523155212402344, -0.07274532318115234, -0.07025909423828125, -0.06777286529541016, -0.06528663635253906, -0.06280040740966797, -0.060314178466796875, -0.05782794952392578, -0.05534172058105469, -0.052855491638183594, -0.0503692626953125, -0.047883033752441406, -0.04539680480957031, -0.04291057586669922, -0.040424346923828125, -0.03793811798095703, -0.03545188903808594, -0.032965660095214844, -0.03047943115234375, -0.027993202209472656, -0.025506973266601562, -0.02302074432373047, -0.020534515380859375, -0.01804828643798828, -0.015562057495117188, -0.013075828552246094, -0.010589599609375, -0.008103370666503906, -0.0056171417236328125, -0.0031309127807617188, -0.000644683837890625, 0.0018415451049804688, 0.0043277740478515625, 0.006814002990722656, 0.00930023193359375, 0.011786460876464844, 0.014272689819335938, 0.01675891876220703, 0.019245147705078125, 0.02173137664794922, 0.024217605590820312, 0.026703834533691406, 0.0291900634765625, 0.031676292419433594, 0.03416252136230469, 0.03664875030517578, 0.039134979248046875, 0.04162120819091797, 0.04410743713378906, 0.046593666076660156, 0.04907989501953125, 0.051566123962402344, 0.05405235290527344, 0.05653858184814453, 0.059024810791015625, 0.06151103973388672, 0.06399726867675781, 0.0664834976196289, 0.0689697265625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 6.0, 5.0, 4.0, 4.0, 5.0, 9.0, 3.0, 7.0, 12.0, 18.0, 6.0, 25.0, 20.0, 27.0, 36.0, 35.0, 35.0, 42.0, 38.0, 39.0, 50.0, 39.0, 47.0, 41.0, 47.0, 41.0, 38.0, 34.0, 57.0, 38.0, 25.0, 31.0, 31.0, 21.0, 19.0, 13.0, 14.0, 12.0, 10.0, 6.0, 5.0, 7.0, 4.0, 1.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.380615234375, -0.3675994873046875, -0.354583740234375, -0.3415679931640625, -0.32855224609375, -0.3155364990234375, -0.302520751953125, -0.2895050048828125, -0.2764892578125, -0.2634735107421875, -0.250457763671875, -0.2374420166015625, -0.22442626953125, -0.2114105224609375, -0.198394775390625, -0.1853790283203125, -0.17236328125, -0.1593475341796875, -0.146331787109375, -0.1333160400390625, -0.12030029296875, -0.1072845458984375, -0.094268798828125, -0.0812530517578125, -0.0682373046875, -0.0552215576171875, -0.042205810546875, -0.0291900634765625, -0.01617431640625, -0.0031585693359375, 0.009857177734375, 0.0228729248046875, 0.035888671875, 0.0489044189453125, 0.061920166015625, 0.0749359130859375, 0.08795166015625, 0.1009674072265625, 0.113983154296875, 0.1269989013671875, 0.1400146484375, 0.1530303955078125, 0.166046142578125, 0.1790618896484375, 0.19207763671875, 0.2050933837890625, 0.218109130859375, 0.2311248779296875, 0.244140625, 0.2571563720703125, 0.270172119140625, 0.2831878662109375, 0.29620361328125, 0.3092193603515625, 0.322235107421875, 0.3352508544921875, 0.3482666015625, 0.3612823486328125, 0.374298095703125, 0.3873138427734375, 0.40032958984375, 0.4133453369140625, 0.426361083984375, 0.4393768310546875, 0.452392578125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 6.0, 7.0, 10.0, 20.0, 23.0, 29.0, 47.0, 55.0, 101.0, 197.0, 367.0, 729.0, 1407.0, 3486.0, 9508.0, 34141.0, 223523.0, 614259.0, 125113.0, 23083.0, 7032.0, 2767.0, 1267.0, 589.0, 330.0, 198.0, 75.0, 66.0, 30.0, 31.0, 18.0, 14.0, 3.0, 7.0, 3.0, 2.0, 8.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03271484375, -0.031703948974609375, -0.03069305419921875, -0.029682159423828125, -0.0286712646484375, -0.027660369873046875, -0.02664947509765625, -0.025638580322265625, -0.024627685546875, -0.023616790771484375, -0.02260589599609375, -0.021595001220703125, -0.0205841064453125, -0.019573211669921875, -0.01856231689453125, -0.017551422119140625, -0.01654052734375, -0.015529632568359375, -0.01451873779296875, -0.013507843017578125, -0.0124969482421875, -0.011486053466796875, -0.01047515869140625, -0.009464263916015625, -0.008453369140625, -0.007442474365234375, -0.00643157958984375, -0.005420684814453125, -0.0044097900390625, -0.003398895263671875, -0.00238800048828125, -0.001377105712890625, -0.0003662109375, 0.000644683837890625, 0.00165557861328125, 0.002666473388671875, 0.0036773681640625, 0.004688262939453125, 0.00569915771484375, 0.006710052490234375, 0.007720947265625, 0.008731842041015625, 0.00974273681640625, 0.010753631591796875, 0.0117645263671875, 0.012775421142578125, 0.01378631591796875, 0.014797210693359375, 0.01580810546875, 0.016819000244140625, 0.01782989501953125, 0.018840789794921875, 0.0198516845703125, 0.020862579345703125, 0.02187347412109375, 0.022884368896484375, 0.023895263671875, 0.024906158447265625, 0.02591705322265625, 0.026927947998046875, 0.0279388427734375, 0.028949737548828125, 0.02996063232421875, 0.030971527099609375, 0.031982421875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 3.0, 8.0, 6.0, 4.0, 10.0, 16.0, 15.0, 26.0, 40.0, 61.0, 89.0, 98.0, 87.0, 116.0, 111.0, 73.0, 72.0, 49.0, 35.0, 26.0, 7.0, 11.0, 7.0, 4.0, 4.0, 6.0, 4.0, 0.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6033649444580078e-05, -1.552049070596695e-05, -1.500733196735382e-05, -1.4494173228740692e-05, -1.3981014490127563e-05, -1.3467855751514435e-05, -1.2954697012901306e-05, -1.2441538274288177e-05, -1.1928379535675049e-05, -1.141522079706192e-05, -1.0902062058448792e-05, -1.0388903319835663e-05, -9.875744581222534e-06, -9.362585842609406e-06, -8.849427103996277e-06, -8.336268365383148e-06, -7.82310962677002e-06, -7.309950888156891e-06, -6.796792149543762e-06, -6.2836334109306335e-06, -5.770474672317505e-06, -5.257315933704376e-06, -4.7441571950912476e-06, -4.230998456478119e-06, -3.7178397178649902e-06, -3.2046809792518616e-06, -2.691522240638733e-06, -2.1783635020256042e-06, -1.6652047634124756e-06, -1.152046024799347e-06, -6.388872861862183e-07, -1.257285475730896e-07, 3.8743019104003906e-07, 9.005889296531677e-07, 1.4137476682662964e-06, 1.926906406879425e-06, 2.4400651454925537e-06, 2.9532238841056824e-06, 3.466382622718811e-06, 3.97954136133194e-06, 4.492700099945068e-06, 5.005858838558197e-06, 5.519017577171326e-06, 6.032176315784454e-06, 6.545335054397583e-06, 7.058493793010712e-06, 7.57165253162384e-06, 8.084811270236969e-06, 8.597970008850098e-06, 9.111128747463226e-06, 9.624287486076355e-06, 1.0137446224689484e-05, 1.0650604963302612e-05, 1.1163763701915741e-05, 1.167692244052887e-05, 1.2190081179141998e-05, 1.2703239917755127e-05, 1.3216398656368256e-05, 1.3729557394981384e-05, 1.4242716133594513e-05, 1.4755874872207642e-05, 1.526903361082077e-05, 1.57821923494339e-05, 1.6295351088047028e-05, 1.6808509826660156e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 7.0, 9.0, 11.0, 18.0, 37.0, 69.0, 117.0, 252.0, 503.0, 936.0, 1931.0, 3714.0, 7989.0, 17652.0, 41108.0, 103835.0, 242630.0, 319404.0, 180565.0, 72736.0, 29847.0, 13258.0, 5980.0, 2973.0, 1386.0, 734.0, 358.0, 228.0, 121.0, 57.0, 30.0, 28.0, 14.0, 10.0, 8.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0200653076171875, -0.019496917724609375, -0.01892852783203125, -0.018360137939453125, -0.017791748046875, -0.017223358154296875, -0.01665496826171875, -0.016086578369140625, -0.0155181884765625, -0.014949798583984375, -0.01438140869140625, -0.013813018798828125, -0.01324462890625, -0.012676239013671875, -0.01210784912109375, -0.011539459228515625, -0.0109710693359375, -0.010402679443359375, -0.00983428955078125, -0.009265899658203125, -0.008697509765625, -0.008129119873046875, -0.00756072998046875, -0.006992340087890625, -0.0064239501953125, -0.005855560302734375, -0.00528717041015625, -0.004718780517578125, -0.004150390625, -0.003582000732421875, -0.00301361083984375, -0.002445220947265625, -0.0018768310546875, -0.001308441162109375, -0.00074005126953125, -0.000171661376953125, 0.000396728515625, 0.000965118408203125, 0.00153350830078125, 0.002101898193359375, 0.0026702880859375, 0.003238677978515625, 0.00380706787109375, 0.004375457763671875, 0.00494384765625, 0.005512237548828125, 0.00608062744140625, 0.006649017333984375, 0.0072174072265625, 0.007785797119140625, 0.00835418701171875, 0.008922576904296875, 0.009490966796875, 0.010059356689453125, 0.01062774658203125, 0.011196136474609375, 0.0117645263671875, 0.012332916259765625, 0.01290130615234375, 0.013469696044921875, 0.0140380859375, 0.014606475830078125, 0.01517486572265625, 0.015743255615234375, 0.0163116455078125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 4.0, 5.0, 9.0, 8.0, 10.0, 15.0, 15.0, 10.0, 18.0, 30.0, 33.0, 42.0, 56.0, 58.0, 80.0, 96.0, 65.0, 52.0, 60.0, 80.0, 59.0, 45.0, 39.0, 24.0, 20.0, 16.0, 13.0, 13.0, 3.0, 9.0, 4.0, 4.0, 4.0, 5.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006076812744140625, -0.00585407018661499, -0.0056313276290893555, -0.005408585071563721, -0.005185842514038086, -0.004963099956512451, -0.004740357398986816, -0.004517614841461182, -0.004294872283935547, -0.004072129726409912, -0.0038493871688842773, -0.0036266446113586426, -0.003403902053833008, -0.003181159496307373, -0.0029584169387817383, -0.0027356743812561035, -0.0025129318237304688, -0.002290189266204834, -0.0020674467086791992, -0.0018447041511535645, -0.0016219615936279297, -0.001399219036102295, -0.0011764764785766602, -0.0009537339210510254, -0.0007309913635253906, -0.0005082488059997559, -0.0002855062484741211, -6.276369094848633e-05, 0.00015997886657714844, 0.0003827214241027832, 0.000605463981628418, 0.0008282065391540527, 0.0010509490966796875, 0.0012736916542053223, 0.001496434211730957, 0.0017191767692565918, 0.0019419193267822266, 0.0021646618843078613, 0.002387404441833496, 0.002610146999359131, 0.0028328895568847656, 0.0030556321144104004, 0.003278374671936035, 0.00350111722946167, 0.0037238597869873047, 0.0039466023445129395, 0.004169344902038574, 0.004392087459564209, 0.004614830017089844, 0.0048375725746154785, 0.005060315132141113, 0.005283057689666748, 0.005505800247192383, 0.005728542804718018, 0.005951285362243652, 0.006174027919769287, 0.006396770477294922, 0.006619513034820557, 0.006842255592346191, 0.007064998149871826, 0.007287740707397461, 0.007510483264923096, 0.0077332258224487305, 0.007955968379974365, 0.0081787109375]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 5.0, 5.0, 3.0, 2.0, 9.0, 3.0, 9.0, 6.0, 14.0, 18.0, 21.0, 12.0, 19.0, 24.0, 30.0, 45.0, 54.0, 34.0, 48.0, 55.0, 55.0, 64.0, 58.0, 57.0, 58.0, 49.0, 46.0, 33.0, 29.0, 31.0, 23.0, 24.0, 12.0, 5.0, 8.0, 9.0, 8.0, 2.0, 3.0, 3.0, 4.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0], "bins": [-0.1713239848613739, -0.16605545580387115, -0.1607869267463684, -0.15551838278770447, -0.15024985373020172, -0.14498132467269897, -0.13971279561519623, -0.13444426655769348, -0.12917572259902954, -0.1239071935415268, -0.11863865703344345, -0.1133701279759407, -0.10810159146785736, -0.10283306241035461, -0.09756453335285187, -0.09229599684476852, -0.08702746778726578, -0.08175893872976303, -0.07649040222167969, -0.07122187316417694, -0.0659533366560936, -0.06068480759859085, -0.055416274815797806, -0.05014774203300476, -0.044879209250211716, -0.03961067646741867, -0.034342143684625626, -0.02907361276447773, -0.023805079981684685, -0.01853654719889164, -0.013268016278743744, -0.007999483495950699, -0.002730950713157654, 0.002537581603974104, 0.007806113921105862, 0.013074645772576332, 0.018343178555369377, 0.023611711338162422, 0.028880242258310318, 0.03414877504110336, 0.03941730782389641, 0.04468584060668945, 0.0499543733894825, 0.05522290617227554, 0.06049143522977829, 0.06575997173786163, 0.07102850079536438, 0.07629702985286713, 0.08156556636095047, 0.08683409541845322, 0.09210263192653656, 0.0973711609840393, 0.10263969749212265, 0.1079082265496254, 0.11317676305770874, 0.11844529211521149, 0.12371382117271423, 0.12898235023021698, 0.13425087928771973, 0.13951942324638367, 0.1447879523038864, 0.15005648136138916, 0.1553250104188919, 0.16059353947639465, 0.1658620834350586]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 5.0, 4.0, 1.0, 5.0, 12.0, 13.0, 13.0, 6.0, 7.0, 15.0, 28.0, 18.0, 25.0, 28.0, 36.0, 33.0, 21.0, 37.0, 41.0, 40.0, 33.0, 35.0, 53.0, 41.0, 37.0, 33.0, 33.0, 33.0, 38.0, 23.0, 30.0, 42.0, 27.0, 26.0, 18.0, 17.0, 22.0, 16.0, 12.0, 15.0, 5.0, 9.0, 4.0, 7.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14219404757022858, -0.13759928941726685, -0.13300453126430511, -0.12840977311134338, -0.12381501495838165, -0.11922025680541992, -0.11462550610303879, -0.11003074795007706, -0.10543598979711533, -0.1008412316441536, -0.09624647349119186, -0.09165171533823013, -0.087056964635849, -0.08246220648288727, -0.07786744832992554, -0.0732726901769638, -0.06867793202400208, -0.06408317387104034, -0.05948841571807861, -0.05489366129040718, -0.05029890313744545, -0.04570414498448372, -0.041109390556812286, -0.036514632403850555, -0.031919874250888824, -0.027325116097927094, -0.022730359807610512, -0.01813560351729393, -0.013540845364332199, -0.008946087211370468, -0.004351330921053886, 0.0002434253692626953, 0.004838183522224426, 0.009432940743863583, 0.014027697965502739, 0.01862245425581932, 0.02321721240878105, 0.027811970561742783, 0.032406724989414215, 0.037001483142375946, 0.04159624129533768, 0.04619099944829941, 0.05078575760126114, 0.05538051202893257, 0.0599752701818943, 0.06457002460956573, 0.06916478276252747, 0.0737595409154892, 0.07835429906845093, 0.08294905722141266, 0.08754381537437439, 0.09213857352733612, 0.09673333168029785, 0.10132808983325958, 0.10592284053564072, 0.11051759868860245, 0.11511235684156418, 0.11970711499452591, 0.12430187314748764, 0.12889662384986877, 0.1334913820028305, 0.13808614015579224, 0.14268089830875397, 0.1472756564617157, 0.15187041461467743]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 6.0, 4.0, 4.0, 6.0, 13.0, 10.0, 25.0, 31.0, 52.0, 76.0, 88.0, 160.0, 271.0, 438.0, 739.0, 1307.0, 2248.0, 4033.0, 7852.0, 16061.0, 36350.0, 90822.0, 237976.0, 359422.0, 171881.0, 65307.0, 27059.0, 12416.0, 6030.0, 3259.0, 1831.0, 1072.0, 662.0, 401.0, 237.0, 152.0, 101.0, 55.0, 39.0, 25.0, 11.0, 12.0, 11.0, 6.0, 3.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.291259765625, -0.2825202941894531, -0.27378082275390625, -0.2650413513183594, -0.2563018798828125, -0.24756240844726562, -0.23882293701171875, -0.23008346557617188, -0.221343994140625, -0.21260452270507812, -0.20386505126953125, -0.19512557983398438, -0.1863861083984375, -0.17764663696289062, -0.16890716552734375, -0.16016769409179688, -0.15142822265625, -0.14268875122070312, -0.13394927978515625, -0.12520980834960938, -0.1164703369140625, -0.10773086547851562, -0.09899139404296875, -0.09025192260742188, -0.081512451171875, -0.07277297973632812, -0.06403350830078125, -0.055294036865234375, -0.0465545654296875, -0.037815093994140625, -0.02907562255859375, -0.020336151123046875, -0.0115966796875, -0.002857208251953125, 0.00588226318359375, 0.014621734619140625, 0.0233612060546875, 0.032100677490234375, 0.04084014892578125, 0.049579620361328125, 0.058319091796875, 0.06705856323242188, 0.07579803466796875, 0.08453750610351562, 0.0932769775390625, 0.10201644897460938, 0.11075592041015625, 0.11949539184570312, 0.12823486328125, 0.13697433471679688, 0.14571380615234375, 0.15445327758789062, 0.1631927490234375, 0.17193222045898438, 0.18067169189453125, 0.18941116333007812, 0.198150634765625, 0.20689010620117188, 0.21562957763671875, 0.22436904907226562, 0.2331085205078125, 0.24184799194335938, 0.25058746337890625, 0.2593269348144531, 0.26806640625]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 3.0, 4.0, 9.0, 6.0, 9.0, 6.0, 14.0, 8.0, 12.0, 17.0, 17.0, 18.0, 34.0, 27.0, 22.0, 46.0, 39.0, 37.0, 38.0, 35.0, 41.0, 47.0, 38.0, 45.0, 43.0, 30.0, 41.0, 40.0, 38.0, 23.0, 25.0, 25.0, 21.0, 28.0, 26.0, 15.0, 12.0, 16.0, 11.0, 9.0, 9.0, 5.0, 5.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2440185546875, -0.23641014099121094, -0.22880172729492188, -0.2211933135986328, -0.21358489990234375, -0.2059764862060547, -0.19836807250976562, -0.19075965881347656, -0.1831512451171875, -0.17554283142089844, -0.16793441772460938, -0.1603260040283203, -0.15271759033203125, -0.1451091766357422, -0.13750076293945312, -0.12989234924316406, -0.122283935546875, -0.11467552185058594, -0.10706710815429688, -0.09945869445800781, -0.09185028076171875, -0.08424186706542969, -0.07663345336914062, -0.06902503967285156, -0.0614166259765625, -0.05380821228027344, -0.046199798583984375, -0.03859138488769531, -0.03098297119140625, -0.023374557495117188, -0.015766143798828125, -0.008157730102539062, -0.00054931640625, 0.0070590972900390625, 0.014667510986328125, 0.022275924682617188, 0.02988433837890625, 0.03749275207519531, 0.045101165771484375, 0.05270957946777344, 0.0603179931640625, 0.06792640686035156, 0.07553482055664062, 0.08314323425292969, 0.09075164794921875, 0.09836006164550781, 0.10596847534179688, 0.11357688903808594, 0.121185302734375, 0.12879371643066406, 0.13640213012695312, 0.1440105438232422, 0.15161895751953125, 0.1592273712158203, 0.16683578491210938, 0.17444419860839844, 0.1820526123046875, 0.18966102600097656, 0.19726943969726562, 0.2048778533935547, 0.21248626708984375, 0.2200946807861328, 0.22770309448242188, 0.23531150817871094, 0.242919921875]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 5.0, 3.0, 5.0, 12.0, 16.0, 16.0, 14.0, 23.0, 34.0, 62.0, 74.0, 115.0, 193.0, 272.0, 490.0, 827.0, 1431.0, 2558.0, 4904.0, 9846.0, 20159.0, 45411.0, 105537.0, 246106.0, 319434.0, 163595.0, 68535.0, 29944.0, 13819.0, 6804.0, 3577.0, 1930.0, 1093.0, 623.0, 378.0, 251.0, 140.0, 91.0, 66.0, 47.0, 34.0, 25.0, 15.0, 14.0, 12.0, 9.0, 3.0, 5.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26953125, -0.2611732482910156, -0.25281524658203125, -0.24445724487304688, -0.2360992431640625, -0.22774124145507812, -0.21938323974609375, -0.21102523803710938, -0.202667236328125, -0.19430923461914062, -0.18595123291015625, -0.17759323120117188, -0.1692352294921875, -0.16087722778320312, -0.15251922607421875, -0.14416122436523438, -0.13580322265625, -0.12744522094726562, -0.11908721923828125, -0.11072921752929688, -0.1023712158203125, -0.09401321411132812, -0.08565521240234375, -0.07729721069335938, -0.068939208984375, -0.060581207275390625, -0.05222320556640625, -0.043865203857421875, -0.0355072021484375, -0.027149200439453125, -0.01879119873046875, -0.010433197021484375, -0.0020751953125, 0.006282806396484375, 0.01464080810546875, 0.022998809814453125, 0.0313568115234375, 0.039714813232421875, 0.04807281494140625, 0.056430816650390625, 0.064788818359375, 0.07314682006835938, 0.08150482177734375, 0.08986282348632812, 0.0982208251953125, 0.10657882690429688, 0.11493682861328125, 0.12329483032226562, 0.13165283203125, 0.14001083374023438, 0.14836883544921875, 0.15672683715820312, 0.1650848388671875, 0.17344284057617188, 0.18180084228515625, 0.19015884399414062, 0.198516845703125, 0.20687484741210938, 0.21523284912109375, 0.22359085083007812, 0.2319488525390625, 0.24030685424804688, 0.24866485595703125, 0.2570228576660156, 0.265380859375]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 4.0, 3.0, 6.0, 4.0, 3.0, 5.0, 15.0, 5.0, 9.0, 12.0, 11.0, 19.0, 15.0, 19.0, 27.0, 25.0, 24.0, 28.0, 25.0, 33.0, 36.0, 37.0, 29.0, 44.0, 35.0, 42.0, 41.0, 31.0, 43.0, 33.0, 36.0, 28.0, 29.0, 38.0, 22.0, 25.0, 19.0, 23.0, 23.0, 11.0, 14.0, 3.0, 8.0, 10.0, 3.0, 9.0, 10.0, 7.0, 7.0, 1.0, 4.0, 3.0, 2.0, 4.0, 5.0, 2.0, 1.0], "bins": [-0.251708984375, -0.2440032958984375, -0.236297607421875, -0.2285919189453125, -0.22088623046875, -0.2131805419921875, -0.205474853515625, -0.1977691650390625, -0.1900634765625, -0.1823577880859375, -0.174652099609375, -0.1669464111328125, -0.15924072265625, -0.1515350341796875, -0.143829345703125, -0.1361236572265625, -0.12841796875, -0.1207122802734375, -0.113006591796875, -0.1053009033203125, -0.09759521484375, -0.0898895263671875, -0.082183837890625, -0.0744781494140625, -0.0667724609375, -0.0590667724609375, -0.051361083984375, -0.0436553955078125, -0.03594970703125, -0.0282440185546875, -0.020538330078125, -0.0128326416015625, -0.005126953125, 0.0025787353515625, 0.010284423828125, 0.0179901123046875, 0.02569580078125, 0.0334014892578125, 0.041107177734375, 0.0488128662109375, 0.0565185546875, 0.0642242431640625, 0.071929931640625, 0.0796356201171875, 0.08734130859375, 0.0950469970703125, 0.102752685546875, 0.1104583740234375, 0.1181640625, 0.1258697509765625, 0.133575439453125, 0.1412811279296875, 0.14898681640625, 0.1566925048828125, 0.164398193359375, 0.1721038818359375, 0.1798095703125, 0.1875152587890625, 0.195220947265625, 0.2029266357421875, 0.21063232421875, 0.2183380126953125, 0.226043701171875, 0.2337493896484375, 0.241455078125]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [5.0, 1.0, 1.0, 4.0, 0.0, 4.0, 8.0, 5.0, 9.0, 13.0, 22.0, 26.0, 53.0, 79.0, 102.0, 153.0, 213.0, 295.0, 476.0, 662.0, 1028.0, 1715.0, 2911.0, 5338.0, 10445.0, 20609.0, 48942.0, 141468.0, 426160.0, 246271.0, 79359.0, 30776.0, 14028.0, 7365.0, 3975.0, 2217.0, 1309.0, 894.0, 517.0, 332.0, 232.0, 176.0, 101.0, 98.0, 48.0, 46.0, 33.0, 11.0, 12.0, 9.0, 7.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07135009765625, -0.06886768341064453, -0.06638526916503906, -0.0639028549194336, -0.061420440673828125, -0.058938026428222656, -0.05645561218261719, -0.05397319793701172, -0.05149078369140625, -0.04900836944580078, -0.04652595520019531, -0.044043540954589844, -0.041561126708984375, -0.039078712463378906, -0.03659629821777344, -0.03411388397216797, -0.0316314697265625, -0.02914905548095703, -0.026666641235351562, -0.024184226989746094, -0.021701812744140625, -0.019219398498535156, -0.016736984252929688, -0.014254570007324219, -0.01177215576171875, -0.009289741516113281, -0.0068073272705078125, -0.004324913024902344, -0.001842498779296875, 0.0006399154663085938, 0.0031223297119140625, 0.005604743957519531, 0.008087158203125, 0.010569572448730469, 0.013051986694335938, 0.015534400939941406, 0.018016815185546875, 0.020499229431152344, 0.022981643676757812, 0.02546405792236328, 0.02794647216796875, 0.03042888641357422, 0.03291130065917969, 0.035393714904785156, 0.037876129150390625, 0.040358543395996094, 0.04284095764160156, 0.04532337188720703, 0.0478057861328125, 0.05028820037841797, 0.05277061462402344, 0.055253028869628906, 0.057735443115234375, 0.060217857360839844, 0.06270027160644531, 0.06518268585205078, 0.06766510009765625, 0.07014751434326172, 0.07262992858886719, 0.07511234283447266, 0.07759475708007812, 0.0800771713256836, 0.08255958557128906, 0.08504199981689453, 0.0875244140625]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 6.0, 6.0, 10.0, 14.0, 25.0, 27.0, 43.0, 52.0, 78.0, 92.0, 131.0, 147.0, 100.0, 81.0, 45.0, 36.0, 22.0, 19.0, 13.0, 12.0, 10.0, 6.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.806020736694336e-05, -1.7415732145309448e-05, -1.6771256923675537e-05, -1.6126781702041626e-05, -1.5482306480407715e-05, -1.4837831258773804e-05, -1.4193356037139893e-05, -1.3548880815505981e-05, -1.290440559387207e-05, -1.225993037223816e-05, -1.1615455150604248e-05, -1.0970979928970337e-05, -1.0326504707336426e-05, -9.682029485702515e-06, -9.037554264068604e-06, -8.393079042434692e-06, -7.748603820800781e-06, -7.10412859916687e-06, -6.459653377532959e-06, -5.815178155899048e-06, -5.170702934265137e-06, -4.526227712631226e-06, -3.8817524909973145e-06, -3.2372772693634033e-06, -2.592802047729492e-06, -1.948326826095581e-06, -1.30385160446167e-06, -6.593763828277588e-07, -1.4901161193847656e-08, 6.295740604400635e-07, 1.2740492820739746e-06, 1.9185245037078857e-06, 2.562999725341797e-06, 3.207474946975708e-06, 3.851950168609619e-06, 4.49642539024353e-06, 5.140900611877441e-06, 5.7853758335113525e-06, 6.429851055145264e-06, 7.074326276779175e-06, 7.718801498413086e-06, 8.363276720046997e-06, 9.007751941680908e-06, 9.65222716331482e-06, 1.029670238494873e-05, 1.0941177606582642e-05, 1.1585652828216553e-05, 1.2230128049850464e-05, 1.2874603271484375e-05, 1.3519078493118286e-05, 1.4163553714752197e-05, 1.4808028936386108e-05, 1.545250415802002e-05, 1.609697937965393e-05, 1.6741454601287842e-05, 1.7385929822921753e-05, 1.8030405044555664e-05, 1.8674880266189575e-05, 1.9319355487823486e-05, 1.9963830709457397e-05, 2.060830593109131e-05, 2.125278115272522e-05, 2.189725637435913e-05, 2.2541731595993042e-05, 2.3186206817626953e-05]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 9.0, 6.0, 9.0, 5.0, 7.0, 15.0, 21.0, 16.0, 19.0, 38.0, 54.0, 81.0, 77.0, 104.0, 176.0, 245.0, 350.0, 508.0, 731.0, 1064.0, 1753.0, 2913.0, 5272.0, 9274.0, 18874.0, 44418.0, 125960.0, 404254.0, 274645.0, 89580.0, 33609.0, 15102.0, 7853.0, 4294.0, 2486.0, 1564.0, 1009.0, 638.0, 414.0, 313.0, 208.0, 159.0, 117.0, 83.0, 66.0, 32.0, 34.0, 25.0, 30.0, 12.0, 17.0, 2.0, 8.0, 3.0, 5.0, 8.0, 2.0, 0.0, 2.0], "bins": [-0.08746337890625, -0.08480072021484375, -0.0821380615234375, -0.07947540283203125, -0.076812744140625, -0.07415008544921875, -0.0714874267578125, -0.06882476806640625, -0.066162109375, -0.06349945068359375, -0.0608367919921875, -0.05817413330078125, -0.055511474609375, -0.05284881591796875, -0.0501861572265625, -0.04752349853515625, -0.04486083984375, -0.04219818115234375, -0.0395355224609375, -0.03687286376953125, -0.034210205078125, -0.03154754638671875, -0.0288848876953125, -0.02622222900390625, -0.0235595703125, -0.02089691162109375, -0.0182342529296875, -0.01557159423828125, -0.012908935546875, -0.01024627685546875, -0.0075836181640625, -0.00492095947265625, -0.00225830078125, 0.00040435791015625, 0.0030670166015625, 0.00572967529296875, 0.008392333984375, 0.01105499267578125, 0.0137176513671875, 0.01638031005859375, 0.01904296875, 0.02170562744140625, 0.0243682861328125, 0.02703094482421875, 0.029693603515625, 0.03235626220703125, 0.0350189208984375, 0.03768157958984375, 0.04034423828125, 0.04300689697265625, 0.0456695556640625, 0.04833221435546875, 0.050994873046875, 0.05365753173828125, 0.0563201904296875, 0.05898284912109375, 0.0616455078125, 0.06430816650390625, 0.0669708251953125, 0.06963348388671875, 0.072296142578125, 0.07495880126953125, 0.0776214599609375, 0.08028411865234375, 0.08294677734375]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 7.0, 3.0, 3.0, 7.0, 8.0, 17.0, 19.0, 23.0, 29.0, 41.0, 52.0, 62.0, 83.0, 138.0, 147.0, 82.0, 74.0, 53.0, 26.0, 34.0, 23.0, 21.0, 11.0, 10.0, 4.0, 5.0, 6.0, 7.0, 2.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08447265625, -0.08225774765014648, -0.08004283905029297, -0.07782793045043945, -0.07561302185058594, -0.07339811325073242, -0.0711832046508789, -0.06896829605102539, -0.06675338745117188, -0.06453847885131836, -0.062323570251464844, -0.06010866165161133, -0.05789375305175781, -0.0556788444519043, -0.05346393585205078, -0.051249027252197266, -0.04903411865234375, -0.046819210052490234, -0.04460430145263672, -0.0423893928527832, -0.04017448425292969, -0.03795957565307617, -0.035744667053222656, -0.03352975845336914, -0.031314849853515625, -0.02909994125366211, -0.026885032653808594, -0.024670124053955078, -0.022455215454101562, -0.020240306854248047, -0.01802539825439453, -0.015810489654541016, -0.0135955810546875, -0.011380672454833984, -0.009165763854980469, -0.006950855255126953, -0.0047359466552734375, -0.002521038055419922, -0.00030612945556640625, 0.0019087791442871094, 0.004123687744140625, 0.006338596343994141, 0.008553504943847656, 0.010768413543701172, 0.012983322143554688, 0.015198230743408203, 0.01741313934326172, 0.019628047943115234, 0.02184295654296875, 0.024057865142822266, 0.02627277374267578, 0.028487682342529297, 0.030702590942382812, 0.03291749954223633, 0.035132408142089844, 0.03734731674194336, 0.039562225341796875, 0.04177713394165039, 0.043992042541503906, 0.04620695114135742, 0.04842185974121094, 0.05063676834106445, 0.05285167694091797, 0.055066585540771484, 0.057281494140625]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 4.0, 4.0, 9.0, 11.0, 21.0, 42.0, 50.0, 99.0, 99.0, 127.0, 130.0, 115.0, 90.0, 73.0, 43.0, 38.0, 19.0, 8.0, 6.0, 9.0, 8.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5518237352371216, -0.5261011719703674, -0.5003785490989685, -0.47465598583221436, -0.4489334225654602, -0.42321082949638367, -0.39748823642730713, -0.371765673160553, -0.34604308009147644, -0.3203204870223999, -0.29459792375564575, -0.2688753306865692, -0.24315275251865387, -0.21743017435073853, -0.191707581281662, -0.16598500311374664, -0.1402624249458313, -0.11453984677791595, -0.08881726115942001, -0.06309467554092407, -0.03737209737300873, -0.011649519205093384, 0.014073073863983154, 0.0397956520318985, 0.06551823019981384, 0.09124080836772919, 0.11696339398622513, 0.14268597960472107, 0.1684085577726364, 0.19413113594055176, 0.2198537290096283, 0.24557630717754364, 0.271298885345459, 0.2970214784145355, 0.3227440416812897, 0.3484666347503662, 0.37418919801712036, 0.3999117910861969, 0.42563438415527344, 0.4513569474220276, 0.4770795404911041, 0.5028021335601807, 0.5285246968269348, 0.554247260093689, 0.5799698829650879, 0.605692446231842, 0.6314150094985962, 0.6571376323699951, 0.6828601956367493, 0.7085827589035034, 0.7343053817749023, 0.7600279450416565, 0.7857505083084106, 0.8114731311798096, 0.8371956944465637, 0.8629182577133179, 0.8886408805847168, 0.914363443851471, 0.9400860667228699, 0.965808629989624, 0.9915311932563782, 1.0172537565231323, 1.0429763793945312, 1.0686990022659302, 1.0944215059280396]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 0.0, 3.0, 5.0, 5.0, 5.0, 19.0, 15.0, 14.0, 12.0, 16.0, 24.0, 25.0, 22.0, 15.0, 29.0, 27.0, 40.0, 41.0, 44.0, 35.0, 42.0, 39.0, 48.0, 41.0, 39.0, 34.0, 40.0, 27.0, 48.0, 25.0, 31.0, 35.0, 28.0, 22.0, 18.0, 12.0, 12.0, 13.0, 11.0, 11.0, 9.0, 9.0, 7.0, 5.0, 3.0, 2.0, 1.0, 4.0, 3.0], "bins": [-0.5624467730522156, -0.5475205183029175, -0.5325942635536194, -0.5176680088043213, -0.5027417540550232, -0.4878154993057251, -0.472889244556427, -0.4579629898071289, -0.4430367350578308, -0.4281104803085327, -0.4131842255592346, -0.3982579708099365, -0.3833317160606384, -0.36840546131134033, -0.35347920656204224, -0.33855295181274414, -0.32362669706344604, -0.30870044231414795, -0.29377418756484985, -0.27884793281555176, -0.26392167806625366, -0.24899542331695557, -0.23406916856765747, -0.21914291381835938, -0.20421665906906128, -0.18929040431976318, -0.1743641495704651, -0.159437894821167, -0.1445116400718689, -0.1295853853225708, -0.1146591305732727, -0.09973287582397461, -0.08480659127235413, -0.06988033652305603, -0.054954081773757935, -0.04002782702445984, -0.025101572275161743, -0.010175317525863647, 0.004750937223434448, 0.019677191972732544, 0.03460344672203064, 0.049529701471328735, 0.06445595622062683, 0.07938221096992493, 0.09430846571922302, 0.10923472046852112, 0.12416097521781921, 0.1390872299671173, 0.1540134847164154, 0.1689397394657135, 0.1838659942150116, 0.1987922489643097, 0.2137185037136078, 0.22864475846290588, 0.24357101321220398, 0.2584972679615021, 0.27342352271080017, 0.28834977746009827, 0.30327603220939636, 0.31820228695869446, 0.33312854170799255, 0.34805479645729065, 0.36298105120658875, 0.37790730595588684, 0.39283356070518494]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 3.0, 7.0, 4.0, 14.0, 10.0, 14.0, 17.0, 26.0, 28.0, 30.0, 40.0, 55.0, 58.0, 79.0, 103.0, 169.0, 230.0, 320.0, 479.0, 835.0, 1651.0, 3147.0, 6804.0, 1021340.0, 7499.0, 3361.0, 1639.0, 916.0, 472.0, 336.0, 237.0, 144.0, 118.0, 81.0, 75.0, 54.0, 47.0, 24.0, 31.0, 27.0, 20.0, 15.0, 14.0, 8.0, 10.0, 3.0, 7.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.7393447756767273, -0.7179401516914368, -0.6965355277061462, -0.6751309037208557, -0.6537262797355652, -0.6323216557502747, -0.6109169721603394, -0.5895123481750488, -0.5681077241897583, -0.5467031002044678, -0.5252984762191772, -0.5038938522338867, -0.4824892282485962, -0.46108460426330566, -0.43967995047569275, -0.4182753264904022, -0.3968707323074341, -0.37546610832214355, -0.354061484336853, -0.3326568603515625, -0.311252236366272, -0.28984761238098145, -0.26844295859336853, -0.247038334608078, -0.22563371062278748, -0.20422908663749695, -0.18282446265220642, -0.1614198237657547, -0.14001519978046417, -0.11861057579517365, -0.09720593690872192, -0.0758013129234314, -0.05439668893814087, -0.03299206122756004, -0.011587433516979218, 0.009817197918891907, 0.031221821904182434, 0.05262644588947296, 0.07403108477592468, 0.09543570876121521, 0.11684033274650574, 0.13824495673179626, 0.1596495807170868, 0.1810542196035385, 0.20245884358882904, 0.22386346757411957, 0.2452681064605713, 0.2666727304458618, 0.28807735443115234, 0.30948197841644287, 0.3308866024017334, 0.3522912263870239, 0.37369585037231445, 0.395100474357605, 0.4165051281452179, 0.4379097521305084, 0.45931437611579895, 0.4807190001010895, 0.5021236538887024, 0.5235282778739929, 0.5449329018592834, 0.566337525844574, 0.5877421498298645, 0.609146773815155, 0.6305513978004456]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 10.0, 10.0, 41.0, 41.0, 87.0, 130.0, 239.0, 378.0, 630.0, 1125.0, 3881.0, 51451648.0, 8589.0, 1608.0, 755.0, 447.0, 260.0, 190.0, 112.0, 55.0, 40.0, 16.0, 15.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5, -4.309838771820068, -4.119677543640137, -3.929516077041626, -3.7393546104431152, -3.5491933822631836, -3.359032154083252, -3.168870687484741, -2.9787092208862305, -2.788547992706299, -2.598386526107788, -2.4082252979278564, -2.2180638313293457, -2.027902603149414, -1.8377412557601929, -1.6475799083709717, -1.45741868019104, -1.2672573328018188, -1.0770959854125977, -0.8869346976280212, -0.6967733502388, -0.5066120028495789, -0.31645071506500244, -0.12628936767578125, 0.06387197971343994, 0.25403332710266113, 0.44419464468955994, 0.6343559622764587, 0.8245173096656799, 1.014678716659546, 1.2048399448394775, 1.3950012922286987, 1.58516263961792, 1.7753239870071411, 1.9654853343963623, 2.155646562576294, 2.3458080291748047, 2.5359692573547363, 2.726130485534668, 2.9162919521331787, 3.1064534187316895, 3.296614646911621, 3.486776113510132, 3.6769373416900635, 3.867098808288574, 4.057260036468506, 4.2474212646484375, 4.437582969665527, 4.627743721008301, 4.817904949188232, 5.008066177368164, 5.198227882385254, 5.3883891105651855, 5.578550338745117, 5.768711566925049, 5.9588727951049805, 6.14903450012207, 6.339195728302002, 6.529356956481934, 6.719518661499023, 6.909679889678955, 7.099841117858887, 7.290002346038818, 7.48016357421875, 7.67032527923584]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 10.0, 16.0, 23.0, 46.0, 83.0, 85.0, 161.0, 258.0, 463.0, 698.0, 1070.0, 2000.0, 3093.0, 5156.0, 8390.0, 14619.0, 25111.0, 41820.0, 71433.0, 118773.0, 189112.0, 284971.0, 409641.0, 2283907.0, 1700085.0, 393287.0, 274886.0, 181194.0, 113696.0, 68504.0, 40463.0, 24000.0, 14025.0, 8158.0, 4862.0, 2962.0, 1738.0, 1084.0, 583.0, 383.0, 232.0, 132.0, 86.0, 52.0, 39.0, 27.0, 6.0, 5.0, 7.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.349609375, -0.3390007019042969, -0.32839202880859375, -0.3177833557128906, -0.3071746826171875, -0.2965660095214844, -0.28595733642578125, -0.2753486633300781, -0.264739990234375, -0.2541313171386719, -0.24352264404296875, -0.23291397094726562, -0.2223052978515625, -0.21169662475585938, -0.20108795166015625, -0.19047927856445312, -0.17987060546875, -0.16926193237304688, -0.15865325927734375, -0.14804458618164062, -0.1374359130859375, -0.12682723999023438, -0.11621856689453125, -0.10560989379882812, -0.095001220703125, -0.08439254760742188, -0.07378387451171875, -0.06317520141601562, -0.0525665283203125, -0.041957855224609375, -0.03134918212890625, -0.020740509033203125, -0.0101318359375, 0.000476837158203125, 0.01108551025390625, 0.021694183349609375, 0.0323028564453125, 0.042911529541015625, 0.05352020263671875, 0.06412887573242188, 0.074737548828125, 0.08534622192382812, 0.09595489501953125, 0.10656356811523438, 0.1171722412109375, 0.12778091430664062, 0.13838958740234375, 0.14899826049804688, 0.15960693359375, 0.17021560668945312, 0.18082427978515625, 0.19143295288085938, 0.2020416259765625, 0.21265029907226562, 0.22325897216796875, 0.23386764526367188, 0.244476318359375, 0.2550849914550781, 0.26569366455078125, 0.2763023376464844, 0.2869110107421875, 0.2975196838378906, 0.30812835693359375, 0.3187370300292969, 0.329345703125]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 9.0, 6.0, 2.0, 15.0, 13.0, 20.0, 24.0, 19.0, 36.0, 43.0, 43.0, 55.0, 59.0, 53.0, 115.0, 783.0, 273.0, 70.0, 57.0, 48.0, 47.0, 44.0, 39.0, 32.0, 23.0, 16.0, 22.0, 11.0, 11.0, 10.0, 7.0, 5.0, 2.0, 7.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.400390625, -3.30242919921875, -3.2044677734375, -3.10650634765625, -3.008544921875, -2.91058349609375, -2.8126220703125, -2.71466064453125, -2.61669921875, -2.51873779296875, -2.4207763671875, -2.32281494140625, -2.224853515625, -2.12689208984375, -2.0289306640625, -1.93096923828125, -1.8330078125, -1.73504638671875, -1.6370849609375, -1.53912353515625, -1.441162109375, -1.34320068359375, -1.2452392578125, -1.14727783203125, -1.04931640625, -0.95135498046875, -0.8533935546875, -0.75543212890625, -0.657470703125, -0.55950927734375, -0.4615478515625, -0.36358642578125, -0.265625, -0.16766357421875, -0.0697021484375, 0.02825927734375, 0.126220703125, 0.22418212890625, 0.3221435546875, 0.42010498046875, 0.51806640625, 0.61602783203125, 0.7139892578125, 0.81195068359375, 0.909912109375, 1.00787353515625, 1.1058349609375, 1.20379638671875, 1.3017578125, 1.39971923828125, 1.4976806640625, 1.59564208984375, 1.693603515625, 1.79156494140625, 1.8895263671875, 1.98748779296875, 2.08544921875, 2.18341064453125, 2.2813720703125, 2.37933349609375, 2.477294921875, 2.57525634765625, 2.6732177734375, 2.77117919921875, 2.869140625]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 3.0, 4.0, 4.0, 4.0, 11.0, 35.0, 33.0, 52.0, 85.0, 139.0, 201.0, 348.0, 502.0, 840.0, 1354.0, 2086.0, 3209.0, 4944.0, 7981.0, 12655.0, 19163.0, 29413.0, 44906.0, 67330.0, 97364.0, 136869.0, 183505.0, 237034.0, 285939.0, 556295.0, 3156300.0, 379149.0, 273559.0, 223757.0, 172477.0, 127462.0, 88908.0, 61594.0, 40542.0, 27048.0, 17443.0, 11372.0, 7048.0, 4533.0, 2922.0, 1821.0, 1152.0, 795.0, 455.0, 305.0, 192.0, 122.0, 72.0, 40.0, 39.0, 18.0, 4.0, 7.0, 4.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.19677734375, -0.1905059814453125, -0.184234619140625, -0.1779632568359375, -0.17169189453125, -0.1654205322265625, -0.159149169921875, -0.1528778076171875, -0.1466064453125, -0.1403350830078125, -0.134063720703125, -0.1277923583984375, -0.12152099609375, -0.1152496337890625, -0.108978271484375, -0.1027069091796875, -0.096435546875, -0.0901641845703125, -0.083892822265625, -0.0776214599609375, -0.07135009765625, -0.0650787353515625, -0.058807373046875, -0.0525360107421875, -0.0462646484375, -0.0399932861328125, -0.033721923828125, -0.0274505615234375, -0.02117919921875, -0.0149078369140625, -0.008636474609375, -0.0023651123046875, 0.00390625, 0.0101776123046875, 0.016448974609375, 0.0227203369140625, 0.02899169921875, 0.0352630615234375, 0.041534423828125, 0.0478057861328125, 0.0540771484375, 0.0603485107421875, 0.066619873046875, 0.0728912353515625, 0.07916259765625, 0.0854339599609375, 0.091705322265625, 0.0979766845703125, 0.104248046875, 0.1105194091796875, 0.116790771484375, 0.1230621337890625, 0.12933349609375, 0.1356048583984375, 0.141876220703125, 0.1481475830078125, 0.1544189453125, 0.1606903076171875, 0.166961669921875, 0.1732330322265625, 0.17950439453125, 0.1857757568359375, 0.192047119140625, 0.1983184814453125, 0.20458984375]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 6.0, 16.0, 8.0, 10.0, 12.0, 16.0, 23.0, 19.0, 20.0, 25.0, 23.0, 37.0, 27.0, 44.0, 49.0, 47.0, 37.0, 59.0, 402.0, 641.0, 95.0, 36.0, 39.0, 41.0, 37.0, 33.0, 18.0, 29.0, 28.0, 28.0, 27.0, 25.0, 12.0, 16.0, 10.0, 3.0, 6.0, 3.0, 3.0, 2.0, 5.0, 7.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.29296875, -2.225830078125, -2.15869140625, -2.091552734375, -2.0244140625, -1.957275390625, -1.89013671875, -1.822998046875, -1.755859375, -1.688720703125, -1.62158203125, -1.554443359375, -1.4873046875, -1.420166015625, -1.35302734375, -1.285888671875, -1.21875, -1.151611328125, -1.08447265625, -1.017333984375, -0.9501953125, -0.883056640625, -0.81591796875, -0.748779296875, -0.681640625, -0.614501953125, -0.54736328125, -0.480224609375, -0.4130859375, -0.345947265625, -0.27880859375, -0.211669921875, -0.14453125, -0.077392578125, -0.01025390625, 0.056884765625, 0.1240234375, 0.191162109375, 0.25830078125, 0.325439453125, 0.392578125, 0.459716796875, 0.52685546875, 0.593994140625, 0.6611328125, 0.728271484375, 0.79541015625, 0.862548828125, 0.9296875, 0.996826171875, 1.06396484375, 1.131103515625, 1.1982421875, 1.265380859375, 1.33251953125, 1.399658203125, 1.466796875, 1.533935546875, 1.60107421875, 1.668212890625, 1.7353515625, 1.802490234375, 1.86962890625, 1.936767578125, 2.00390625]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 3.0, 3.0, 4.0, 8.0, 13.0, 6.0, 17.0, 38.0, 66.0, 68.0, 82.0, 119.0, 180.0, 221.0, 381.0, 481.0, 638.0, 916.0, 1327.0, 2060.0, 3291.0, 5768.0, 11103.0, 22930.0, 49991.0, 103331.0, 484754.0, 5350355.0, 128662.0, 62872.0, 29700.0, 13641.0, 6973.0, 3859.0, 2343.0, 1574.0, 1035.0, 698.0, 533.0, 379.0, 283.0, 182.0, 147.0, 114.0, 82.0, 63.0, 41.0, 36.0, 28.0, 14.0, 12.0, 8.0, 5.0, 4.0, 2.0, 1.0], "bins": [-0.9755859375, -0.9478302001953125, -0.920074462890625, -0.8923187255859375, -0.86456298828125, -0.8368072509765625, -0.809051513671875, -0.7812957763671875, -0.7535400390625, -0.7257843017578125, -0.698028564453125, -0.6702728271484375, -0.64251708984375, -0.6147613525390625, -0.587005615234375, -0.5592498779296875, -0.531494140625, -0.5037384033203125, -0.475982666015625, -0.4482269287109375, -0.42047119140625, -0.3927154541015625, -0.364959716796875, -0.3372039794921875, -0.3094482421875, -0.2816925048828125, -0.253936767578125, -0.2261810302734375, -0.19842529296875, -0.1706695556640625, -0.142913818359375, -0.1151580810546875, -0.08740234375, -0.0596466064453125, -0.031890869140625, -0.0041351318359375, 0.02362060546875, 0.0513763427734375, 0.079132080078125, 0.1068878173828125, 0.1346435546875, 0.1623992919921875, 0.190155029296875, 0.2179107666015625, 0.24566650390625, 0.2734222412109375, 0.301177978515625, 0.3289337158203125, 0.356689453125, 0.3844451904296875, 0.412200927734375, 0.4399566650390625, 0.46771240234375, 0.4954681396484375, 0.523223876953125, 0.5509796142578125, 0.5787353515625, 0.6064910888671875, 0.634246826171875, 0.6620025634765625, 0.68975830078125, 0.7175140380859375, 0.745269775390625, 0.7730255126953125, 0.80078125]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 2.0, 6.0, 7.0, 4.0, 7.0, 15.0, 11.0, 15.0, 15.0, 19.0, 19.0, 33.0, 41.0, 27.0, 34.0, 38.0, 40.0, 36.0, 48.0, 47.0, 268.0, 795.0, 85.0, 48.0, 40.0, 47.0, 31.0, 44.0, 23.0, 27.0, 23.0, 27.0, 22.0, 10.0, 11.0, 15.0, 6.0, 6.0, 12.0, 10.0, 1.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.275390625, -2.202728271484375, -2.13006591796875, -2.057403564453125, -1.9847412109375, -1.912078857421875, -1.83941650390625, -1.766754150390625, -1.694091796875, -1.621429443359375, -1.54876708984375, -1.476104736328125, -1.4034423828125, -1.330780029296875, -1.25811767578125, -1.185455322265625, -1.11279296875, -1.040130615234375, -0.96746826171875, -0.894805908203125, -0.8221435546875, -0.749481201171875, -0.67681884765625, -0.604156494140625, -0.531494140625, -0.458831787109375, -0.38616943359375, -0.313507080078125, -0.2408447265625, -0.168182373046875, -0.09552001953125, -0.022857666015625, 0.0498046875, 0.122467041015625, 0.19512939453125, 0.267791748046875, 0.3404541015625, 0.413116455078125, 0.48577880859375, 0.558441162109375, 0.631103515625, 0.703765869140625, 0.77642822265625, 0.849090576171875, 0.9217529296875, 0.994415283203125, 1.06707763671875, 1.139739990234375, 1.21240234375, 1.285064697265625, 1.35772705078125, 1.430389404296875, 1.5030517578125, 1.575714111328125, 1.64837646484375, 1.721038818359375, 1.793701171875, 1.866363525390625, 1.93902587890625, 2.011688232421875, 2.0843505859375, 2.157012939453125, 2.22967529296875, 2.302337646484375, 2.375]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 2.0, 5.0, 19.0, 14.0, 24.0, 45.0, 69.0, 129.0, 176.0, 197.0, 121.0, 70.0, 47.0, 33.0, 13.0, 10.0, 13.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.672354698181152, -8.374412536621094, -8.076471328735352, -7.778529167175293, -7.480587005615234, -7.182644844055176, -6.884703159332275, -6.586761474609375, -6.288819313049316, -5.990877151489258, -5.692935466766357, -5.394993782043457, -5.097051620483398, -4.79910945892334, -4.5011677742004395, -4.203226089477539, -3.9052839279174805, -3.607342004776001, -3.3094000816345215, -3.011458158493042, -2.7135162353515625, -2.415574312210083, -2.1176323890686035, -1.819690465927124, -1.5217485427856445, -1.223806619644165, -0.9258646965026855, -0.627922773361206, -0.32998085021972656, -0.03203892707824707, 0.2659029960632324, 0.5638449192047119, 0.861785888671875, 1.1597278118133545, 1.457669734954834, 1.7556116580963135, 2.053553581237793, 2.3514955043792725, 2.649437427520752, 2.9473793506622314, 3.245321273803711, 3.5432631969451904, 3.84120512008667, 4.13914680480957, 4.437088966369629, 4.7350311279296875, 5.032972812652588, 5.330914497375488, 5.628856658935547, 5.9267988204956055, 6.224740505218506, 6.522682189941406, 6.820624351501465, 7.118566513061523, 7.416508197784424, 7.714449882507324, 8.012392044067383, 8.310334205627441, 8.6082763671875, 8.906217575073242, 9.2041597366333, 9.50210189819336, 9.800043106079102, 10.09798526763916, 10.395927429199219]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 5.0, 4.0, 5.0, 7.0, 10.0, 10.0, 12.0, 11.0, 21.0, 23.0, 27.0, 38.0, 44.0, 55.0, 43.0, 58.0, 72.0, 78.0, 81.0, 68.0, 59.0, 65.0, 43.0, 19.0, 34.0, 19.0, 14.0, 16.0, 13.0, 7.0, 9.0, 6.0, 5.0, 7.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.362794876098633, -9.073747634887695, -8.784699440002441, -8.495652198791504, -8.20660400390625, -7.9175567626953125, -7.628509044647217, -7.339461326599121, -7.050414085388184, -6.761366367340088, -6.472318649291992, -6.183271408081055, -5.894223690032959, -5.605175971984863, -5.316128253936768, -5.027080535888672, -4.738032817840576, -4.4489850997924805, -4.159937381744385, -3.870889902114868, -3.5818424224853516, -3.292794704437256, -3.00374698638916, -2.7146995067596436, -2.425651788711548, -2.136604070663452, -1.8475565910339355, -1.5585088729858398, -1.2694612741470337, -0.9804136753082275, -0.6913659572601318, -0.40231847763061523, -0.11327075958251953, 0.175776869058609, 0.46482449769973755, 0.7538721561431885, 1.0429197549819946, 1.3319673538208008, 1.6210150718688965, 1.910062551498413, 2.199110269546509, 2.4881579875946045, 2.777205467224121, 3.066253185272217, 3.3553009033203125, 3.644348382949829, 3.933396100997925, 4.222443580627441, 4.511491298675537, 4.800539016723633, 5.0895867347717285, 5.378634452819824, 5.667681694030762, 5.956729412078857, 6.245777130126953, 6.534824371337891, 6.8238725662231445, 7.11292028427124, 7.401968002319336, 7.691015243530273, 7.980062961578369, 8.269110679626465, 8.558158874511719, 8.847206115722656, 9.136253356933594]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 3.0, 5.0, 6.0, 5.0, 8.0, 11.0, 13.0, 19.0, 23.0, 32.0, 39.0, 75.0, 106.0, 130.0, 230.0, 344.0, 585.0, 902.0, 1606.0, 2652.0, 4872.0, 9797.0, 22791.0, 82327.0, 3859514.0, 156094.0, 29304.0, 11189.0, 5345.0, 2657.0, 1452.0, 821.0, 510.0, 293.0, 180.0, 105.0, 81.0, 48.0, 34.0, 17.0, 21.0, 18.0, 10.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0772705078125, -0.07503890991210938, -0.07280731201171875, -0.07057571411132812, -0.0683441162109375, -0.06611251831054688, -0.06388092041015625, -0.061649322509765625, -0.059417724609375, -0.057186126708984375, -0.05495452880859375, -0.052722930908203125, -0.0504913330078125, -0.048259735107421875, -0.04602813720703125, -0.043796539306640625, -0.04156494140625, -0.039333343505859375, -0.03710174560546875, -0.034870147705078125, -0.0326385498046875, -0.030406951904296875, -0.02817535400390625, -0.025943756103515625, -0.023712158203125, -0.021480560302734375, -0.01924896240234375, -0.017017364501953125, -0.0147857666015625, -0.012554168701171875, -0.01032257080078125, -0.008090972900390625, -0.005859375, -0.003627777099609375, -0.00139617919921875, 0.000835418701171875, 0.0030670166015625, 0.005298614501953125, 0.00753021240234375, 0.009761810302734375, 0.011993408203125, 0.014225006103515625, 0.01645660400390625, 0.018688201904296875, 0.0209197998046875, 0.023151397705078125, 0.02538299560546875, 0.027614593505859375, 0.02984619140625, 0.032077789306640625, 0.03430938720703125, 0.036540985107421875, 0.0387725830078125, 0.041004180908203125, 0.04323577880859375, 0.045467376708984375, 0.047698974609375, 0.049930572509765625, 0.05216217041015625, 0.054393768310546875, 0.0566253662109375, 0.058856964111328125, 0.06108856201171875, 0.06332015991210938, 0.0655517578125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 6.0, 6.0, 9.0, 8.0, 6.0, 1.0, 9.0, 10.0, 17.0, 15.0, 25.0, 43.0, 142.0, 488.0, 66.0, 34.0, 14.0, 17.0, 8.0, 10.0, 7.0, 7.0, 6.0, 9.0, 10.0, 2.0, 0.0, 5.0, 6.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.025177001953125, -0.024495840072631836, -0.023814678192138672, -0.023133516311645508, -0.022452354431152344, -0.02177119255065918, -0.021090030670166016, -0.02040886878967285, -0.019727706909179688, -0.019046545028686523, -0.01836538314819336, -0.017684221267700195, -0.01700305938720703, -0.016321897506713867, -0.015640735626220703, -0.014959573745727539, -0.014278411865234375, -0.013597249984741211, -0.012916088104248047, -0.012234926223754883, -0.011553764343261719, -0.010872602462768555, -0.01019144058227539, -0.009510278701782227, -0.008829116821289062, -0.008147954940795898, -0.007466793060302734, -0.00678563117980957, -0.006104469299316406, -0.005423307418823242, -0.004742145538330078, -0.004060983657836914, -0.00337982177734375, -0.002698659896850586, -0.002017498016357422, -0.0013363361358642578, -0.0006551742553710938, 2.5987625122070312e-05, 0.0007071495056152344, 0.0013883113861083984, 0.0020694732666015625, 0.0027506351470947266, 0.0034317970275878906, 0.004112958908081055, 0.004794120788574219, 0.005475282669067383, 0.006156444549560547, 0.006837606430053711, 0.007518768310546875, 0.008199930191040039, 0.008881092071533203, 0.009562253952026367, 0.010243415832519531, 0.010924577713012695, 0.01160573959350586, 0.012286901473999023, 0.012968063354492188, 0.013649225234985352, 0.014330387115478516, 0.01501154899597168, 0.015692710876464844, 0.016373872756958008, 0.017055034637451172, 0.017736196517944336, 0.0184173583984375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 0.0, 7.0, 7.0, 6.0, 13.0, 10.0, 24.0, 32.0, 45.0, 84.0, 126.0, 290.0, 587.0, 1397.0, 3650.0, 11020.0, 41302.0, 250020.0, 3405564.0, 403938.0, 56312.0, 13266.0, 4047.0, 1384.0, 554.0, 282.0, 115.0, 84.0, 41.0, 21.0, 23.0, 15.0, 7.0, 4.0, 2.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.09906005859375, -0.09635353088378906, -0.09364700317382812, -0.09094047546386719, -0.08823394775390625, -0.08552742004394531, -0.08282089233398438, -0.08011436462402344, -0.0774078369140625, -0.07470130920410156, -0.07199478149414062, -0.06928825378417969, -0.06658172607421875, -0.06387519836425781, -0.061168670654296875, -0.05846214294433594, -0.055755615234375, -0.05304908752441406, -0.050342559814453125, -0.04763603210449219, -0.04492950439453125, -0.04222297668457031, -0.039516448974609375, -0.03680992126464844, -0.0341033935546875, -0.03139686584472656, -0.028690338134765625, -0.025983810424804688, -0.02327728271484375, -0.020570755004882812, -0.017864227294921875, -0.015157699584960938, -0.012451171875, -0.009744644165039062, -0.007038116455078125, -0.0043315887451171875, -0.00162506103515625, 0.0010814666748046875, 0.003787994384765625, 0.0064945220947265625, 0.0092010498046875, 0.011907577514648438, 0.014614105224609375, 0.017320632934570312, 0.02002716064453125, 0.022733688354492188, 0.025440216064453125, 0.028146743774414062, 0.030853271484375, 0.03355979919433594, 0.036266326904296875, 0.03897285461425781, 0.04167938232421875, 0.04438591003417969, 0.047092437744140625, 0.04979896545410156, 0.0525054931640625, 0.05521202087402344, 0.057918548583984375, 0.06062507629394531, 0.06333160400390625, 0.06603813171386719, 0.06874465942382812, 0.07145118713378906, 0.07415771484375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 6.0, 5.0, 2.0, 7.0, 4.0, 13.0, 13.0, 17.0, 20.0, 16.0, 44.0, 53.0, 62.0, 131.0, 171.0, 291.0, 764.0, 1313.0, 482.0, 220.0, 122.0, 94.0, 80.0, 39.0, 34.0, 22.0, 16.0, 15.0, 4.0, 9.0, 6.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.042510986328125, -0.0414280891418457, -0.040345191955566406, -0.03926229476928711, -0.03817939758300781, -0.037096500396728516, -0.03601360321044922, -0.03493070602416992, -0.033847808837890625, -0.03276491165161133, -0.03168201446533203, -0.030599117279052734, -0.029516220092773438, -0.02843332290649414, -0.027350425720214844, -0.026267528533935547, -0.02518463134765625, -0.024101734161376953, -0.023018836975097656, -0.02193593978881836, -0.020853042602539062, -0.019770145416259766, -0.01868724822998047, -0.017604351043701172, -0.016521453857421875, -0.015438556671142578, -0.014355659484863281, -0.013272762298583984, -0.012189865112304688, -0.01110696792602539, -0.010024070739746094, -0.008941173553466797, -0.0078582763671875, -0.006775379180908203, -0.005692481994628906, -0.004609584808349609, -0.0035266876220703125, -0.0024437904357910156, -0.0013608932495117188, -0.0002779960632324219, 0.000804901123046875, 0.0018877983093261719, 0.0029706954956054688, 0.004053592681884766, 0.0051364898681640625, 0.006219387054443359, 0.007302284240722656, 0.008385181427001953, 0.00946807861328125, 0.010550975799560547, 0.011633872985839844, 0.01271677017211914, 0.013799667358398438, 0.014882564544677734, 0.01596546173095703, 0.017048358917236328, 0.018131256103515625, 0.019214153289794922, 0.02029705047607422, 0.021379947662353516, 0.022462844848632812, 0.02354574203491211, 0.024628639221191406, 0.025711536407470703, 0.02679443359375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 5.0, 4.0, 7.0, 13.0, 31.0, 99.0, 296.0, 338.0, 146.0, 44.0, 17.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6040018200874329, -0.5917332172393799, -0.5794646143913269, -0.5671959519386292, -0.5549273490905762, -0.5426587462425232, -0.5303901433944702, -0.5181215405464172, -0.5058529376983643, -0.4935843348503113, -0.4813157021999359, -0.46904709935188293, -0.45677846670150757, -0.4445098638534546, -0.4322412610054016, -0.41997265815734863, -0.4077039957046509, -0.3954353928565979, -0.38316676020622253, -0.37089815735816956, -0.3586295247077942, -0.3463609218597412, -0.33409231901168823, -0.32182371616363525, -0.3095550835132599, -0.2972864806652069, -0.28501784801483154, -0.27274924516677856, -0.2604806423187256, -0.24821200966835022, -0.23594340682029724, -0.22367478907108307, -0.2114061564207077, -0.19913753867149353, -0.18686893582344055, -0.17460031807422638, -0.1623317003250122, -0.15006308257579803, -0.13779446482658386, -0.12552586197853088, -0.11325724422931671, -0.10098862648010254, -0.08872001618146896, -0.07645140588283539, -0.06418278813362122, -0.05191417410969734, -0.03964556008577347, -0.027376949787139893, -0.01510833203792572, -0.0028397180140018463, 0.009428896009922028, 0.0216975100338459, 0.033966124057769775, 0.04623473808169365, 0.05850335210561752, 0.0707719624042511, 0.08304058015346527, 0.09530919790267944, 0.10757780820131302, 0.1198464184999466, 0.13211503624916077, 0.14438365399837494, 0.1566522717475891, 0.1689208745956421, 0.18118949234485626]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 6.0, 3.0, 6.0, 12.0, 9.0, 14.0, 18.0, 18.0, 27.0, 37.0, 29.0, 35.0, 40.0, 51.0, 60.0, 47.0, 61.0, 65.0, 68.0, 48.0, 62.0, 47.0, 37.0, 34.0, 28.0, 24.0, 25.0, 18.0, 14.0, 15.0, 10.0, 9.0, 7.0, 5.0, 1.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1080290675163269, -0.10402168333530426, -0.10001429170370102, -0.09600690007209778, -0.09199951589107513, -0.08799213171005249, -0.08398474007844925, -0.07997734844684601, -0.07596996426582336, -0.07196258008480072, -0.06795518845319748, -0.06394779682159424, -0.059940412640571594, -0.05593302473425865, -0.05192563682794571, -0.04791824892163277, -0.043910861015319824, -0.03990347310900688, -0.03589608520269394, -0.031888697296381, -0.027881309390068054, -0.02387392148375511, -0.01986653357744217, -0.015859145671129227, -0.011851757764816284, -0.007844369858503342, -0.003836981952190399, 0.00017040595412254333, 0.004177793860435486, 0.008185181766748428, 0.01219256967306137, 0.016199957579374313, 0.020207345485687256, 0.0242147333920002, 0.02822212129831314, 0.03222950920462608, 0.036236897110939026, 0.04024428501725197, 0.04425167292356491, 0.04825906082987785, 0.052266448736190796, 0.05627383664250374, 0.06028122454881668, 0.06428861618041992, 0.06829600036144257, 0.07230338454246521, 0.07631077617406845, 0.08031816780567169, 0.08432555198669434, 0.08833293616771698, 0.09234032779932022, 0.09634771943092346, 0.1003551036119461, 0.10436248779296875, 0.10836987942457199, 0.11237727105617523, 0.11638465523719788, 0.12039203941822052, 0.12439943104982376, 0.128406822681427, 0.13241420686244965, 0.1364215910434723, 0.14042899012565613, 0.14443637430667877, 0.14844375848770142]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 14.0, 10.0, 14.0, 10.0, 19.0, 33.0, 45.0, 74.0, 86.0, 119.0, 186.0, 275.0, 384.0, 566.0, 863.0, 1297.0, 2005.0, 3140.0, 5082.0, 8393.0, 14586.0, 27413.0, 69570.0, 744651.0, 97704.0, 31321.0, 16278.0, 9090.0, 5518.0, 3457.0, 2137.0, 1363.0, 915.0, 601.0, 433.0, 286.0, 174.0, 120.0, 100.0, 69.0, 56.0, 32.0, 26.0, 12.0, 10.0, 11.0, 6.0, 4.0, 2.0, 4.0, 1.0, 1.0], "bins": [-0.08380126953125, -0.08144664764404297, -0.07909202575683594, -0.0767374038696289, -0.07438278198242188, -0.07202816009521484, -0.06967353820800781, -0.06731891632080078, -0.06496429443359375, -0.06260967254638672, -0.06025505065917969, -0.057900428771972656, -0.055545806884765625, -0.053191184997558594, -0.05083656311035156, -0.04848194122314453, -0.0461273193359375, -0.04377269744873047, -0.04141807556152344, -0.039063453674316406, -0.036708831787109375, -0.034354209899902344, -0.03199958801269531, -0.02964496612548828, -0.02729034423828125, -0.02493572235107422, -0.022581100463867188, -0.020226478576660156, -0.017871856689453125, -0.015517234802246094, -0.013162612915039062, -0.010807991027832031, -0.008453369140625, -0.006098747253417969, -0.0037441253662109375, -0.0013895034790039062, 0.000965118408203125, 0.0033197402954101562, 0.0056743621826171875, 0.008028984069824219, 0.01038360595703125, 0.012738227844238281, 0.015092849731445312, 0.017447471618652344, 0.019802093505859375, 0.022156715393066406, 0.024511337280273438, 0.02686595916748047, 0.0292205810546875, 0.03157520294189453, 0.03392982482910156, 0.036284446716308594, 0.038639068603515625, 0.040993690490722656, 0.04334831237792969, 0.04570293426513672, 0.04805755615234375, 0.05041217803955078, 0.05276679992675781, 0.055121421813964844, 0.057476043701171875, 0.059830665588378906, 0.06218528747558594, 0.06453990936279297, 0.06689453125]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 7.0, 4.0, 8.0, 6.0, 5.0, 3.0, 11.0, 8.0, 5.0, 9.0, 14.0, 15.0, 24.0, 47.0, 179.0, 367.0, 131.0, 29.0, 23.0, 19.0, 11.0, 12.0, 7.0, 3.0, 15.0, 3.0, 7.0, 7.0, 1.0, 3.0, 3.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.022796630859375, -0.022165298461914062, -0.021533966064453125, -0.020902633666992188, -0.02027130126953125, -0.019639968872070312, -0.019008636474609375, -0.018377304077148438, -0.0177459716796875, -0.017114639282226562, -0.016483306884765625, -0.015851974487304688, -0.01522064208984375, -0.014589309692382812, -0.013957977294921875, -0.013326644897460938, -0.0126953125, -0.012063980102539062, -0.011432647705078125, -0.010801315307617188, -0.01016998291015625, -0.009538650512695312, -0.008907318115234375, -0.008275985717773438, -0.0076446533203125, -0.0070133209228515625, -0.006381988525390625, -0.0057506561279296875, -0.00511932373046875, -0.0044879913330078125, -0.003856658935546875, -0.0032253265380859375, -0.002593994140625, -0.0019626617431640625, -0.001331329345703125, -0.0006999969482421875, -6.866455078125e-05, 0.0005626678466796875, 0.001194000244140625, 0.0018253326416015625, 0.0024566650390625, 0.0030879974365234375, 0.003719329833984375, 0.0043506622314453125, 0.00498199462890625, 0.0056133270263671875, 0.006244659423828125, 0.0068759918212890625, 0.00750732421875, 0.008138656616210938, 0.008769989013671875, 0.009401321411132812, 0.01003265380859375, 0.010663986206054688, 0.011295318603515625, 0.011926651000976562, 0.0125579833984375, 0.013189315795898438, 0.013820648193359375, 0.014451980590820312, 0.01508331298828125, 0.015714645385742188, 0.016345977783203125, 0.016977310180664062, 0.017608642578125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 5.0, 0.0, 3.0, 5.0, 8.0, 8.0, 9.0, 13.0, 16.0, 15.0, 29.0, 40.0, 48.0, 54.0, 92.0, 123.0, 165.0, 305.0, 447.0, 789.0, 1604.0, 3238.0, 7281.0, 16734.0, 44041.0, 131910.0, 371828.0, 307184.0, 101804.0, 35253.0, 13726.0, 5880.0, 2700.0, 1297.0, 693.0, 384.0, 238.0, 167.0, 104.0, 82.0, 64.0, 47.0, 33.0, 32.0, 14.0, 15.0, 9.0, 7.0, 7.0, 3.0, 6.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0440673828125, -0.04264068603515625, -0.0412139892578125, -0.03978729248046875, -0.038360595703125, -0.03693389892578125, -0.0355072021484375, -0.03408050537109375, -0.03265380859375, -0.03122711181640625, -0.0298004150390625, -0.02837371826171875, -0.026947021484375, -0.02552032470703125, -0.0240936279296875, -0.02266693115234375, -0.021240234375, -0.01981353759765625, -0.0183868408203125, -0.01696014404296875, -0.015533447265625, -0.01410675048828125, -0.0126800537109375, -0.01125335693359375, -0.00982666015625, -0.00839996337890625, -0.0069732666015625, -0.00554656982421875, -0.004119873046875, -0.00269317626953125, -0.0012664794921875, 0.00016021728515625, 0.0015869140625, 0.00301361083984375, 0.0044403076171875, 0.00586700439453125, 0.007293701171875, 0.00872039794921875, 0.0101470947265625, 0.01157379150390625, 0.01300048828125, 0.01442718505859375, 0.0158538818359375, 0.01728057861328125, 0.018707275390625, 0.02013397216796875, 0.0215606689453125, 0.02298736572265625, 0.0244140625, 0.02584075927734375, 0.0272674560546875, 0.02869415283203125, 0.030120849609375, 0.03154754638671875, 0.0329742431640625, 0.03440093994140625, 0.03582763671875, 0.03725433349609375, 0.0386810302734375, 0.04010772705078125, 0.041534423828125, 0.04296112060546875, 0.0443878173828125, 0.04581451416015625, 0.0472412109375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 4.0, 8.0, 4.0, 12.0, 14.0, 7.0, 13.0, 19.0, 22.0, 20.0, 15.0, 33.0, 30.0, 38.0, 34.0, 39.0, 44.0, 34.0, 39.0, 52.0, 49.0, 43.0, 40.0, 48.0, 41.0, 38.0, 34.0, 20.0, 32.0, 22.0, 21.0, 31.0, 12.0, 15.0, 17.0, 15.0, 9.0, 9.0, 4.0, 8.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0643310546875, -0.06215476989746094, -0.059978485107421875, -0.05780220031738281, -0.05562591552734375, -0.05344963073730469, -0.051273345947265625, -0.04909706115722656, -0.0469207763671875, -0.04474449157714844, -0.042568206787109375, -0.04039192199707031, -0.03821563720703125, -0.03603935241699219, -0.033863067626953125, -0.03168678283691406, -0.029510498046875, -0.027334213256835938, -0.025157928466796875, -0.022981643676757812, -0.02080535888671875, -0.018629074096679688, -0.016452789306640625, -0.014276504516601562, -0.0121002197265625, -0.009923934936523438, -0.007747650146484375, -0.0055713653564453125, -0.00339508056640625, -0.0012187957763671875, 0.000957489013671875, 0.0031337738037109375, 0.00531005859375, 0.0074863433837890625, 0.009662628173828125, 0.011838912963867188, 0.01401519775390625, 0.016191482543945312, 0.018367767333984375, 0.020544052124023438, 0.0227203369140625, 0.024896621704101562, 0.027072906494140625, 0.029249191284179688, 0.03142547607421875, 0.03360176086425781, 0.035778045654296875, 0.03795433044433594, 0.040130615234375, 0.04230690002441406, 0.044483184814453125, 0.04665946960449219, 0.04883575439453125, 0.05101203918457031, 0.053188323974609375, 0.05536460876464844, 0.0575408935546875, 0.05971717834472656, 0.061893463134765625, 0.06406974792480469, 0.06624603271484375, 0.06842231750488281, 0.07059860229492188, 0.07277488708496094, 0.074951171875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 7.0, 6.0, 4.0, 6.0, 21.0, 18.0, 29.0, 42.0, 72.0, 88.0, 169.0, 232.0, 484.0, 809.0, 1695.0, 3712.0, 9789.0, 34590.0, 219834.0, 628305.0, 113367.0, 22425.0, 6997.0, 2884.0, 1273.0, 682.0, 373.0, 226.0, 129.0, 94.0, 65.0, 38.0, 30.0, 16.0, 8.0, 14.0, 12.0, 4.0, 3.0, 1.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05615234375, -0.05441617965698242, -0.052680015563964844, -0.050943851470947266, -0.04920768737792969, -0.04747152328491211, -0.04573535919189453, -0.04399919509887695, -0.042263031005859375, -0.0405268669128418, -0.03879070281982422, -0.03705453872680664, -0.03531837463378906, -0.033582210540771484, -0.031846046447753906, -0.030109882354736328, -0.02837371826171875, -0.026637554168701172, -0.024901390075683594, -0.023165225982666016, -0.021429061889648438, -0.01969289779663086, -0.01795673370361328, -0.016220569610595703, -0.014484405517578125, -0.012748241424560547, -0.011012077331542969, -0.00927591323852539, -0.0075397491455078125, -0.005803585052490234, -0.004067420959472656, -0.002331256866455078, -0.0005950927734375, 0.0011410713195800781, 0.0028772354125976562, 0.004613399505615234, 0.0063495635986328125, 0.00808572769165039, 0.009821891784667969, 0.011558055877685547, 0.013294219970703125, 0.015030384063720703, 0.01676654815673828, 0.01850271224975586, 0.020238876342773438, 0.021975040435791016, 0.023711204528808594, 0.025447368621826172, 0.02718353271484375, 0.028919696807861328, 0.030655860900878906, 0.032392024993896484, 0.03412818908691406, 0.03586435317993164, 0.03760051727294922, 0.0393366813659668, 0.041072845458984375, 0.04280900955200195, 0.04454517364501953, 0.04628133773803711, 0.04801750183105469, 0.049753665924072266, 0.051489830017089844, 0.05322599411010742, 0.054962158203125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 11.0, 9.0, 28.0, 19.0, 20.0, 33.0, 30.0, 48.0, 64.0, 71.0, 76.0, 85.0, 66.0, 82.0, 67.0, 69.0, 38.0, 42.0, 28.0, 28.0, 19.0, 13.0, 10.0, 5.0, 9.0, 5.0, 5.0, 3.0, 2.0, 5.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.6743621826171875e-05, -5.486421287059784e-05, -5.2984803915023804e-05, -5.110539495944977e-05, -4.922598600387573e-05, -4.73465770483017e-05, -4.546716809272766e-05, -4.3587759137153625e-05, -4.170835018157959e-05, -3.9828941226005554e-05, -3.794953227043152e-05, -3.607012331485748e-05, -3.419071435928345e-05, -3.231130540370941e-05, -3.0431896448135376e-05, -2.855248749256134e-05, -2.6673078536987305e-05, -2.479366958141327e-05, -2.2914260625839233e-05, -2.1034851670265198e-05, -1.9155442714691162e-05, -1.7276033759117126e-05, -1.539662480354309e-05, -1.3517215847969055e-05, -1.163780689239502e-05, -9.758397936820984e-06, -7.878988981246948e-06, -5.999580025672913e-06, -4.120171070098877e-06, -2.2407621145248413e-06, -3.6135315895080566e-07, 1.51805579662323e-06, 3.3974647521972656e-06, 5.276873707771301e-06, 7.156282663345337e-06, 9.035691618919373e-06, 1.0915100574493408e-05, 1.2794509530067444e-05, 1.467391848564148e-05, 1.6553327441215515e-05, 1.843273639678955e-05, 2.0312145352363586e-05, 2.2191554307937622e-05, 2.4070963263511658e-05, 2.5950372219085693e-05, 2.782978117465973e-05, 2.9709190130233765e-05, 3.15885990858078e-05, 3.3468008041381836e-05, 3.534741699695587e-05, 3.722682595252991e-05, 3.910623490810394e-05, 4.098564386367798e-05, 4.2865052819252014e-05, 4.474446177482605e-05, 4.6623870730400085e-05, 4.850327968597412e-05, 5.038268864154816e-05, 5.226209759712219e-05, 5.414150655269623e-05, 5.6020915508270264e-05, 5.79003244638443e-05, 5.9779733419418335e-05, 6.165914237499237e-05, 6.35385513305664e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 9.0, 7.0, 4.0, 7.0, 19.0, 19.0, 33.0, 52.0, 84.0, 107.0, 190.0, 310.0, 483.0, 891.0, 1568.0, 3369.0, 7386.0, 19566.0, 64704.0, 289127.0, 481104.0, 125726.0, 32874.0, 11302.0, 4666.0, 2167.0, 1125.0, 639.0, 378.0, 201.0, 153.0, 92.0, 65.0, 36.0, 23.0, 20.0, 20.0, 11.0, 7.0, 4.0, 4.0, 1.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.043060302734375, -0.041724205017089844, -0.04038810729980469, -0.03905200958251953, -0.037715911865234375, -0.03637981414794922, -0.03504371643066406, -0.033707618713378906, -0.03237152099609375, -0.031035423278808594, -0.029699325561523438, -0.02836322784423828, -0.027027130126953125, -0.02569103240966797, -0.024354934692382812, -0.023018836975097656, -0.0216827392578125, -0.020346641540527344, -0.019010543823242188, -0.01767444610595703, -0.016338348388671875, -0.015002250671386719, -0.013666152954101562, -0.012330055236816406, -0.01099395751953125, -0.009657859802246094, -0.008321762084960938, -0.006985664367675781, -0.005649566650390625, -0.004313468933105469, -0.0029773712158203125, -0.0016412734985351562, -0.00030517578125, 0.0010309219360351562, 0.0023670196533203125, 0.0037031173706054688, 0.005039215087890625, 0.006375312805175781, 0.0077114105224609375, 0.009047508239746094, 0.01038360595703125, 0.011719703674316406, 0.013055801391601562, 0.014391899108886719, 0.015727996826171875, 0.01706409454345703, 0.018400192260742188, 0.019736289978027344, 0.0210723876953125, 0.022408485412597656, 0.023744583129882812, 0.02508068084716797, 0.026416778564453125, 0.02775287628173828, 0.029088973999023438, 0.030425071716308594, 0.03176116943359375, 0.033097267150878906, 0.03443336486816406, 0.03576946258544922, 0.037105560302734375, 0.03844165802001953, 0.03977775573730469, 0.041113853454589844, 0.042449951171875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 5.0, 3.0, 14.0, 14.0, 15.0, 17.0, 28.0, 17.0, 40.0, 42.0, 42.0, 44.0, 51.0, 81.0, 76.0, 70.0, 70.0, 58.0, 54.0, 37.0, 53.0, 39.0, 32.0, 21.0, 16.0, 16.0, 9.0, 12.0, 2.0, 3.0, 6.0, 8.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0297698974609375, -0.02862095832824707, -0.02747201919555664, -0.02632308006286621, -0.02517414093017578, -0.02402520179748535, -0.022876262664794922, -0.021727323532104492, -0.020578384399414062, -0.019429445266723633, -0.018280506134033203, -0.017131567001342773, -0.015982627868652344, -0.014833688735961914, -0.013684749603271484, -0.012535810470581055, -0.011386871337890625, -0.010237932205200195, -0.009088993072509766, -0.007940053939819336, -0.006791114807128906, -0.0056421756744384766, -0.004493236541748047, -0.003344297409057617, -0.0021953582763671875, -0.0010464191436767578, 0.00010251998901367188, 0.0012514591217041016, 0.0024003982543945312, 0.003549337387084961, 0.004698276519775391, 0.00584721565246582, 0.00699615478515625, 0.00814509391784668, 0.00929403305053711, 0.010442972183227539, 0.011591911315917969, 0.012740850448608398, 0.013889789581298828, 0.015038728713989258, 0.016187667846679688, 0.017336606979370117, 0.018485546112060547, 0.019634485244750977, 0.020783424377441406, 0.021932363510131836, 0.023081302642822266, 0.024230241775512695, 0.025379180908203125, 0.026528120040893555, 0.027677059173583984, 0.028825998306274414, 0.029974937438964844, 0.031123876571655273, 0.0322728157043457, 0.03342175483703613, 0.03457069396972656, 0.03571963310241699, 0.03686857223510742, 0.03801751136779785, 0.03916645050048828, 0.04031538963317871, 0.04146432876586914, 0.04261326789855957, 0.04376220703125]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 8.0, 8.0, 15.0, 24.0, 66.0, 263.0, 362.0, 149.0, 60.0, 24.0, 10.0, 4.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2281635999679565, -1.192326545715332, -1.156489610671997, -1.1206525564193726, -1.084815502166748, -1.048978567123413, -1.0131415128707886, -0.9773044586181641, -0.9414674639701843, -0.9056304693222046, -0.8697934150695801, -0.8339564204216003, -0.7981194257736206, -0.7622823715209961, -0.7264453768730164, -0.6906083822250366, -0.6547713279724121, -0.6189343333244324, -0.5830972790718079, -0.5472602844238281, -0.5114232301712036, -0.4755862355232239, -0.43974924087524414, -0.403912216424942, -0.3680751919746399, -0.33223816752433777, -0.29640114307403564, -0.2605641484260559, -0.22472712397575378, -0.18889009952545166, -0.15305308997631073, -0.1172160804271698, -0.08137917518615723, -0.0455421581864357, -0.009705141186714172, 0.026131875813007355, 0.06196889281272888, 0.097805917263031, 0.13364292681217194, 0.16947993636131287, 0.205316960811615, 0.24115398526191711, 0.27699100971221924, 0.312828004360199, 0.3486650288105011, 0.3845020532608032, 0.42033904790878296, 0.4561760723590851, 0.4920130968093872, 0.5278500914573669, 0.5636871457099915, 0.5995241403579712, 0.6353611946105957, 0.6711981892585754, 0.7070351839065552, 0.7428722381591797, 0.7787092328071594, 0.8145462274551392, 0.8503832817077637, 0.8862202763557434, 0.9220572710037231, 0.9578943252563477, 0.9937313199043274, 1.0295683145523071, 1.0654053688049316]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 4.0, 5.0, 3.0, 8.0, 8.0, 9.0, 3.0, 7.0, 11.0, 25.0, 51.0, 95.0, 163.0, 182.0, 168.0, 89.0, 57.0, 27.0, 27.0, 12.0, 10.0, 12.0, 7.0, 4.0, 4.0, 6.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3230986595153809, -1.271431803703308, -1.2197649478912354, -1.1680982112884521, -1.1164313554763794, -1.0647644996643066, -1.0130977630615234, -0.9614309072494507, -0.9097640514373779, -0.8580971956253052, -0.8064303994178772, -0.7547636032104492, -0.7030967473983765, -0.6514298915863037, -0.5997630953788757, -0.5480962991714478, -0.496429443359375, -0.44476261734962463, -0.39309579133987427, -0.3414289653301239, -0.28976213932037354, -0.23809531331062317, -0.1864284873008728, -0.13476166129112244, -0.08309483528137207, -0.031428009271621704, 0.020238816738128662, 0.07190564274787903, 0.1235724687576294, 0.17523929476737976, 0.22690612077713013, 0.2785729467868805, 0.3302396535873413, 0.3819064795970917, 0.43357330560684204, 0.4852401316165924, 0.5369069576263428, 0.5885738134384155, 0.6402406096458435, 0.6919074058532715, 0.7435742616653442, 0.795241117477417, 0.846907913684845, 0.898574709892273, 0.9502415657043457, 1.0019084215164185, 1.0535752773284912, 1.1052420139312744, 1.1569088697433472, 1.20857572555542, 1.2602424621582031, 1.3119093179702759, 1.3635761737823486, 1.4152430295944214, 1.4669098854064941, 1.5185766220092773, 1.57024347782135, 1.6219103336334229, 1.673577070236206, 1.7252439260482788, 1.7769107818603516, 1.8285776376724243, 1.880244493484497, 1.9319112300872803, 1.983578085899353]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 7.0, 10.0, 6.0, 6.0, 8.0, 12.0, 10.0, 16.0, 26.0, 42.0, 69.0, 99.0, 135.0, 230.0, 331.0, 548.0, 872.0, 1397.0, 2420.0, 4384.0, 8460.0, 19031.0, 59998.0, 3353257.0, 663326.0, 48319.0, 16044.0, 6925.0, 3460.0, 1920.0, 1125.0, 666.0, 392.0, 237.0, 168.0, 111.0, 78.0, 44.0, 30.0, 29.0, 14.0, 6.0, 5.0, 5.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1697998046875, -0.164794921875, -0.1597900390625, -0.15478515625, -0.1497802734375, -0.144775390625, -0.1397705078125, -0.134765625, -0.1297607421875, -0.124755859375, -0.1197509765625, -0.11474609375, -0.1097412109375, -0.104736328125, -0.0997314453125, -0.0947265625, -0.0897216796875, -0.084716796875, -0.0797119140625, -0.07470703125, -0.0697021484375, -0.064697265625, -0.0596923828125, -0.0546875, -0.0496826171875, -0.044677734375, -0.0396728515625, -0.03466796875, -0.0296630859375, -0.024658203125, -0.0196533203125, -0.0146484375, -0.0096435546875, -0.004638671875, 0.0003662109375, 0.00537109375, 0.0103759765625, 0.015380859375, 0.0203857421875, 0.025390625, 0.0303955078125, 0.035400390625, 0.0404052734375, 0.04541015625, 0.0504150390625, 0.055419921875, 0.0604248046875, 0.0654296875, 0.0704345703125, 0.075439453125, 0.0804443359375, 0.08544921875, 0.0904541015625, 0.095458984375, 0.1004638671875, 0.10546875, 0.1104736328125, 0.115478515625, 0.1204833984375, 0.12548828125, 0.1304931640625, 0.135498046875, 0.1405029296875, 0.1455078125, 0.1505126953125]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 4.0, 4.0, 3.0, 5.0, 5.0, 5.0, 7.0, 8.0, 7.0, 9.0, 13.0, 7.0, 8.0, 22.0, 25.0, 43.0, 77.0, 172.0, 240.0, 143.0, 50.0, 27.0, 20.0, 23.0, 14.0, 7.0, 9.0, 5.0, 10.0, 7.0, 3.0, 3.0, 3.0, 1.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0181121826171875, -0.017565011978149414, -0.017017841339111328, -0.016470670700073242, -0.015923500061035156, -0.01537632942199707, -0.014829158782958984, -0.014281988143920898, -0.013734817504882812, -0.013187646865844727, -0.01264047622680664, -0.012093305587768555, -0.011546134948730469, -0.010998964309692383, -0.010451793670654297, -0.009904623031616211, -0.009357452392578125, -0.008810281753540039, -0.008263111114501953, -0.007715940475463867, -0.007168769836425781, -0.006621599197387695, -0.006074428558349609, -0.0055272579193115234, -0.0049800872802734375, -0.0044329166412353516, -0.0038857460021972656, -0.0033385753631591797, -0.0027914047241210938, -0.002244234085083008, -0.0016970634460449219, -0.001149892807006836, -0.00060272216796875, -5.555152893066406e-05, 0.0004916191101074219, 0.0010387897491455078, 0.0015859603881835938, 0.0021331310272216797, 0.0026803016662597656, 0.0032274723052978516, 0.0037746429443359375, 0.0043218135833740234, 0.004868984222412109, 0.005416154861450195, 0.005963325500488281, 0.006510496139526367, 0.007057666778564453, 0.007604837417602539, 0.008152008056640625, 0.008699178695678711, 0.009246349334716797, 0.009793519973754883, 0.010340690612792969, 0.010887861251831055, 0.01143503189086914, 0.011982202529907227, 0.012529373168945312, 0.013076543807983398, 0.013623714447021484, 0.01417088508605957, 0.014718055725097656, 0.015265226364135742, 0.015812397003173828, 0.016359567642211914, 0.01690673828125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 6.0, 5.0, 3.0, 14.0, 9.0, 20.0, 24.0, 41.0, 77.0, 99.0, 210.0, 369.0, 675.0, 1551.0, 3649.0, 10609.0, 39195.0, 220565.0, 3468058.0, 374448.0, 53583.0, 13568.0, 4278.0, 1675.0, 742.0, 369.0, 172.0, 87.0, 56.0, 39.0, 33.0, 18.0, 9.0, 11.0, 8.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.1800537109375, -0.17526626586914062, -0.17047882080078125, -0.16569137573242188, -0.1609039306640625, -0.15611648559570312, -0.15132904052734375, -0.14654159545898438, -0.141754150390625, -0.13696670532226562, -0.13217926025390625, -0.12739181518554688, -0.1226043701171875, -0.11781692504882812, -0.11302947998046875, -0.10824203491210938, -0.10345458984375, -0.09866714477539062, -0.09387969970703125, -0.08909225463867188, -0.0843048095703125, -0.07951736450195312, -0.07472991943359375, -0.06994247436523438, -0.065155029296875, -0.060367584228515625, -0.05558013916015625, -0.050792694091796875, -0.0460052490234375, -0.041217803955078125, -0.03643035888671875, -0.031642913818359375, -0.02685546875, -0.022068023681640625, -0.01728057861328125, -0.012493133544921875, -0.0077056884765625, -0.002918243408203125, 0.00186920166015625, 0.006656646728515625, 0.011444091796875, 0.016231536865234375, 0.02101898193359375, 0.025806427001953125, 0.0305938720703125, 0.035381317138671875, 0.04016876220703125, 0.044956207275390625, 0.04974365234375, 0.054531097412109375, 0.05931854248046875, 0.06410598754882812, 0.0688934326171875, 0.07368087768554688, 0.07846832275390625, 0.08325576782226562, 0.088043212890625, 0.09283065795898438, 0.09761810302734375, 0.10240554809570312, 0.1071929931640625, 0.11198043823242188, 0.11676788330078125, 0.12155532836914062, 0.1263427734375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 4.0, 5.0, 6.0, 13.0, 8.0, 18.0, 19.0, 26.0, 30.0, 44.0, 49.0, 82.0, 135.0, 246.0, 504.0, 1642.0, 532.0, 258.0, 143.0, 78.0, 74.0, 51.0, 30.0, 19.0, 19.0, 8.0, 7.0, 7.0, 3.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0284271240234375, -0.02764892578125, -0.0268707275390625, -0.026092529296875, -0.0253143310546875, -0.0245361328125, -0.0237579345703125, -0.022979736328125, -0.0222015380859375, -0.02142333984375, -0.0206451416015625, -0.019866943359375, -0.0190887451171875, -0.018310546875, -0.0175323486328125, -0.016754150390625, -0.0159759521484375, -0.01519775390625, -0.0144195556640625, -0.013641357421875, -0.0128631591796875, -0.0120849609375, -0.0113067626953125, -0.010528564453125, -0.0097503662109375, -0.00897216796875, -0.0081939697265625, -0.007415771484375, -0.0066375732421875, -0.005859375, -0.0050811767578125, -0.004302978515625, -0.0035247802734375, -0.00274658203125, -0.0019683837890625, -0.001190185546875, -0.0004119873046875, 0.0003662109375, 0.0011444091796875, 0.001922607421875, 0.0027008056640625, 0.00347900390625, 0.0042572021484375, 0.005035400390625, 0.0058135986328125, 0.006591796875, 0.0073699951171875, 0.008148193359375, 0.0089263916015625, 0.00970458984375, 0.0104827880859375, 0.011260986328125, 0.0120391845703125, 0.0128173828125, 0.0135955810546875, 0.014373779296875, 0.0151519775390625, 0.01593017578125, 0.0167083740234375, 0.017486572265625, 0.0182647705078125, 0.01904296875, 0.0198211669921875, 0.020599365234375, 0.0213775634765625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 6.0, 13.0, 67.0, 389.0, 466.0, 54.0, 9.0, 4.0], "bins": [-1.1765782833099365, -1.1570041179656982, -1.1374298334121704, -1.1178556680679321, -1.0982813835144043, -1.078707218170166, -1.0591329336166382, -1.0395587682724, -1.019984483718872, -1.0004103183746338, -0.980836033821106, -0.9612618088722229, -0.9416875839233398, -0.9221134185791016, -0.9025391936302185, -0.8829649686813354, -0.8633908033370972, -0.8438165783882141, -0.824242353439331, -0.804668128490448, -0.7850939035415649, -0.7655197381973267, -0.7459455132484436, -0.7263712882995605, -0.7067970633506775, -0.6872228384017944, -0.6676486134529114, -0.6480743885040283, -0.62850022315979, -0.608925998210907, -0.5893517732620239, -0.5697775483131409, -0.5502033233642578, -0.5306290984153748, -0.5110548734664917, -0.49148067831993103, -0.471906453371048, -0.4523322284221649, -0.43275803327560425, -0.4131838083267212, -0.39360958337783813, -0.3740353584289551, -0.354461133480072, -0.33488693833351135, -0.3153127133846283, -0.29573848843574524, -0.27616429328918457, -0.2565900683403015, -0.23701582849025726, -0.2174416184425354, -0.19786739349365234, -0.1782931685447693, -0.15871895849704742, -0.13914474844932556, -0.1195705235004425, -0.09999631345272064, -0.08042208850383759, -0.060847871005535126, -0.041273653507232666, -0.021699436008930206, -0.0021252185106277466, 0.017448998987674713, 0.03702321648597717, 0.056597426533699036, 0.07617165148258209]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 6.0, 5.0, 9.0, 11.0, 17.0, 14.0, 19.0, 31.0, 37.0, 51.0, 64.0, 52.0, 68.0, 60.0, 71.0, 65.0, 64.0, 56.0, 51.0, 48.0, 48.0, 36.0, 31.0, 16.0, 18.0, 18.0, 7.0, 9.0, 9.0, 3.0, 3.0, 6.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.15123337507247925, -0.1470901519060135, -0.14294694364070892, -0.13880372047424316, -0.1346604973077774, -0.13051727414131165, -0.12637406587600708, -0.12223084270954132, -0.11808762699365616, -0.113944411277771, -0.10980118811130524, -0.10565797239542007, -0.10151475667953491, -0.09737153351306915, -0.09322831779718399, -0.08908510208129883, -0.08494187891483307, -0.0807986631989479, -0.07665544003248215, -0.07251222431659698, -0.06836900115013123, -0.06422578543424606, -0.0600825697183609, -0.05593935027718544, -0.05179613083600998, -0.04765291139483452, -0.04350969195365906, -0.039366476237773895, -0.035223256796598434, -0.031080037355422974, -0.026936819776892662, -0.02279360219836235, -0.01865038275718689, -0.014507164247334003, -0.010363945737481117, -0.006220727227628231, -0.002077508717775345, 0.002065710723400116, 0.0062089283019304276, 0.01035214588046074, 0.0144953653216362, 0.01863858476281166, 0.022781802341341972, 0.026925019919872284, 0.031068239361047745, 0.035211458802223206, 0.03935467451810837, 0.04349789395928383, 0.04764111340045929, 0.05178433284163475, 0.05592755228281021, 0.060070767998695374, 0.06421399116516113, 0.0683572068810463, 0.07250042259693146, 0.07664364576339722, 0.08078686147928238, 0.08493007719516754, 0.0890733003616333, 0.09321651607751846, 0.09735973179340363, 0.10150295495986938, 0.10564617067575455, 0.10978938639163971, 0.11393260955810547]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 2.0, 4.0, 1.0, 1.0, 2.0, 15.0, 13.0, 14.0, 35.0, 38.0, 67.0, 137.0, 172.0, 279.0, 528.0, 977.0, 2015.0, 4612.0, 11826.0, 36045.0, 256835.0, 650119.0, 56269.0, 16691.0, 6357.0, 2722.0, 1268.0, 609.0, 357.0, 229.0, 105.0, 73.0, 48.0, 30.0, 21.0, 9.0, 9.0, 7.0, 8.0, 1.0, 3.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.128662109375, -0.12425041198730469, -0.11983871459960938, -0.11542701721191406, -0.11101531982421875, -0.10660362243652344, -0.10219192504882812, -0.09778022766113281, -0.0933685302734375, -0.08895683288574219, -0.08454513549804688, -0.08013343811035156, -0.07572174072265625, -0.07131004333496094, -0.06689834594726562, -0.06248664855957031, -0.058074951171875, -0.05366325378417969, -0.049251556396484375, -0.04483985900878906, -0.04042816162109375, -0.03601646423339844, -0.031604766845703125, -0.027193069458007812, -0.0227813720703125, -0.018369674682617188, -0.013957977294921875, -0.009546279907226562, -0.00513458251953125, -0.0007228851318359375, 0.003688812255859375, 0.008100509643554688, 0.01251220703125, 0.016923904418945312, 0.021335601806640625, 0.025747299194335938, 0.03015899658203125, 0.03457069396972656, 0.038982391357421875, 0.04339408874511719, 0.0478057861328125, 0.05221748352050781, 0.056629180908203125, 0.06104087829589844, 0.06545257568359375, 0.06986427307128906, 0.07427597045898438, 0.07868766784667969, 0.083099365234375, 0.08751106262207031, 0.09192276000976562, 0.09633445739746094, 0.10074615478515625, 0.10515785217285156, 0.10956954956054688, 0.11398124694824219, 0.1183929443359375, 0.12280464172363281, 0.12721633911132812, 0.13162803649902344, 0.13603973388671875, 0.14045143127441406, 0.14486312866210938, 0.1492748260498047, 0.1536865234375]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 1.0, 2.0, 5.0, 6.0, 6.0, 10.0, 3.0, 11.0, 14.0, 15.0, 15.0, 21.0, 46.0, 80.0, 170.0, 190.0, 156.0, 88.0, 50.0, 18.0, 27.0, 16.0, 10.0, 5.0, 11.0, 5.0, 4.0, 1.0, 2.0, 3.0, 6.0, 0.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0222625732421875, -0.021650314331054688, -0.021038055419921875, -0.020425796508789062, -0.01981353759765625, -0.019201278686523438, -0.018589019775390625, -0.017976760864257812, -0.017364501953125, -0.016752243041992188, -0.016139984130859375, -0.015527725219726562, -0.01491546630859375, -0.014303207397460938, -0.013690948486328125, -0.013078689575195312, -0.0124664306640625, -0.011854171752929688, -0.011241912841796875, -0.010629653930664062, -0.01001739501953125, -0.009405136108398438, -0.008792877197265625, -0.008180618286132812, -0.007568359375, -0.0069561004638671875, -0.006343841552734375, -0.0057315826416015625, -0.00511932373046875, -0.0045070648193359375, -0.003894805908203125, -0.0032825469970703125, -0.0026702880859375, -0.0020580291748046875, -0.001445770263671875, -0.0008335113525390625, -0.00022125244140625, 0.0003910064697265625, 0.001003265380859375, 0.0016155242919921875, 0.002227783203125, 0.0028400421142578125, 0.003452301025390625, 0.0040645599365234375, 0.00467681884765625, 0.0052890777587890625, 0.005901336669921875, 0.0065135955810546875, 0.0071258544921875, 0.0077381134033203125, 0.008350372314453125, 0.008962631225585938, 0.00957489013671875, 0.010187149047851562, 0.010799407958984375, 0.011411666870117188, 0.01202392578125, 0.012636184692382812, 0.013248443603515625, 0.013860702514648438, 0.01447296142578125, 0.015085220336914062, 0.015697479248046875, 0.016309738159179688, 0.0169219970703125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 8.0, 3.0, 3.0, 11.0, 19.0, 35.0, 41.0, 61.0, 84.0, 118.0, 196.0, 325.0, 540.0, 1000.0, 1909.0, 4218.0, 10675.0, 34882.0, 162831.0, 539178.0, 224263.0, 44891.0, 12896.0, 5253.0, 2276.0, 1186.0, 651.0, 359.0, 202.0, 131.0, 80.0, 62.0, 52.0, 34.0, 27.0, 13.0, 15.0, 13.0, 5.0, 3.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06915283203125, -0.06681537628173828, -0.06447792053222656, -0.062140464782714844, -0.059803009033203125, -0.057465553283691406, -0.05512809753417969, -0.05279064178466797, -0.05045318603515625, -0.04811573028564453, -0.04577827453613281, -0.043440818786621094, -0.041103363037109375, -0.038765907287597656, -0.03642845153808594, -0.03409099578857422, -0.0317535400390625, -0.02941608428955078, -0.027078628540039062, -0.024741172790527344, -0.022403717041015625, -0.020066261291503906, -0.017728805541992188, -0.015391349792480469, -0.01305389404296875, -0.010716438293457031, -0.008378982543945312, -0.006041526794433594, -0.003704071044921875, -0.0013666152954101562, 0.0009708404541015625, 0.0033082962036132812, 0.005645751953125, 0.007983207702636719, 0.010320663452148438, 0.012658119201660156, 0.014995574951171875, 0.017333030700683594, 0.019670486450195312, 0.02200794219970703, 0.02434539794921875, 0.02668285369873047, 0.029020309448242188, 0.031357765197753906, 0.033695220947265625, 0.036032676696777344, 0.03837013244628906, 0.04070758819580078, 0.0430450439453125, 0.04538249969482422, 0.04771995544433594, 0.050057411193847656, 0.052394866943359375, 0.054732322692871094, 0.05706977844238281, 0.05940723419189453, 0.06174468994140625, 0.06408214569091797, 0.06641960144042969, 0.0687570571899414, 0.07109451293945312, 0.07343196868896484, 0.07576942443847656, 0.07810688018798828, 0.0804443359375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 6.0, 5.0, 3.0, 5.0, 11.0, 16.0, 11.0, 20.0, 18.0, 23.0, 18.0, 28.0, 26.0, 33.0, 40.0, 43.0, 45.0, 41.0, 48.0, 44.0, 48.0, 43.0, 45.0, 48.0, 54.0, 53.0, 34.0, 35.0, 29.0, 32.0, 32.0, 13.0, 7.0, 12.0, 8.0, 7.0, 7.0, 7.0, 5.0, 4.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.050079345703125, -0.048338890075683594, -0.04659843444824219, -0.04485797882080078, -0.043117523193359375, -0.04137706756591797, -0.03963661193847656, -0.037896156311035156, -0.03615570068359375, -0.034415245056152344, -0.03267478942871094, -0.03093433380126953, -0.029193878173828125, -0.02745342254638672, -0.025712966918945312, -0.023972511291503906, -0.0222320556640625, -0.020491600036621094, -0.018751144409179688, -0.01701068878173828, -0.015270233154296875, -0.013529777526855469, -0.011789321899414062, -0.010048866271972656, -0.00830841064453125, -0.006567955017089844, -0.0048274993896484375, -0.0030870437622070312, -0.001346588134765625, 0.00039386749267578125, 0.0021343231201171875, 0.0038747787475585938, 0.005615234375, 0.007355690002441406, 0.009096145629882812, 0.010836601257324219, 0.012577056884765625, 0.014317512512207031, 0.016057968139648438, 0.017798423767089844, 0.01953887939453125, 0.021279335021972656, 0.023019790649414062, 0.02476024627685547, 0.026500701904296875, 0.02824115753173828, 0.029981613159179688, 0.031722068786621094, 0.0334625244140625, 0.035202980041503906, 0.03694343566894531, 0.03868389129638672, 0.040424346923828125, 0.04216480255126953, 0.04390525817871094, 0.045645713806152344, 0.04738616943359375, 0.049126625061035156, 0.05086708068847656, 0.05260753631591797, 0.054347991943359375, 0.05608844757080078, 0.05782890319824219, 0.059569358825683594, 0.061309814453125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 6.0, 4.0, 4.0, 17.0, 15.0, 30.0, 43.0, 61.0, 81.0, 139.0, 269.0, 486.0, 1071.0, 2613.0, 7649.0, 29898.0, 212276.0, 647143.0, 117431.0, 19812.0, 5562.0, 2090.0, 872.0, 414.0, 221.0, 118.0, 74.0, 44.0, 37.0, 20.0, 19.0, 11.0, 6.0, 6.0, 3.0, 5.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09210205078125, -0.08873653411865234, -0.08537101745605469, -0.08200550079345703, -0.07863998413085938, -0.07527446746826172, -0.07190895080566406, -0.0685434341430664, -0.06517791748046875, -0.061812400817871094, -0.05844688415527344, -0.05508136749267578, -0.051715850830078125, -0.04835033416748047, -0.04498481750488281, -0.041619300842285156, -0.0382537841796875, -0.034888267517089844, -0.03152275085449219, -0.02815723419189453, -0.024791717529296875, -0.02142620086669922, -0.018060684204101562, -0.014695167541503906, -0.01132965087890625, -0.007964134216308594, -0.0045986175537109375, -0.0012331008911132812, 0.002132415771484375, 0.005497932434082031, 0.008863449096679688, 0.012228965759277344, 0.015594482421875, 0.018959999084472656, 0.022325515747070312, 0.02569103240966797, 0.029056549072265625, 0.03242206573486328, 0.03578758239746094, 0.039153099060058594, 0.04251861572265625, 0.045884132385253906, 0.04924964904785156, 0.05261516571044922, 0.055980682373046875, 0.05934619903564453, 0.06271171569824219, 0.06607723236083984, 0.0694427490234375, 0.07280826568603516, 0.07617378234863281, 0.07953929901123047, 0.08290481567382812, 0.08627033233642578, 0.08963584899902344, 0.0930013656616211, 0.09636688232421875, 0.0997323989868164, 0.10309791564941406, 0.10646343231201172, 0.10982894897460938, 0.11319446563720703, 0.11655998229980469, 0.11992549896240234, 0.123291015625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 7.0, 6.0, 12.0, 15.0, 22.0, 31.0, 44.0, 66.0, 77.0, 81.0, 96.0, 93.0, 89.0, 95.0, 74.0, 50.0, 47.0, 32.0, 24.0, 12.0, 8.0, 5.0, 7.0, 7.0, 4.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.459257125854492e-05, -9.146705269813538e-05, -8.834153413772583e-05, -8.521601557731628e-05, -8.209049701690674e-05, -7.896497845649719e-05, -7.583945989608765e-05, -7.27139413356781e-05, -6.958842277526855e-05, -6.646290421485901e-05, -6.333738565444946e-05, -6.021186709403992e-05, -5.708634853363037e-05, -5.3960829973220825e-05, -5.083531141281128e-05, -4.7709792852401733e-05, -4.458427429199219e-05, -4.145875573158264e-05, -3.8333237171173096e-05, -3.520771861076355e-05, -3.2082200050354004e-05, -2.8956681489944458e-05, -2.5831162929534912e-05, -2.2705644369125366e-05, -1.958012580871582e-05, -1.6454607248306274e-05, -1.3329088687896729e-05, -1.0203570127487183e-05, -7.078051567077637e-06, -3.952533006668091e-06, -8.270144462585449e-07, 2.298504114151001e-06, 5.424022674560547e-06, 8.549541234970093e-06, 1.1675059795379639e-05, 1.4800578355789185e-05, 1.792609691619873e-05, 2.1051615476608276e-05, 2.4177134037017822e-05, 2.7302652597427368e-05, 3.0428171157836914e-05, 3.355368971824646e-05, 3.6679208278656006e-05, 3.980472683906555e-05, 4.29302453994751e-05, 4.6055763959884644e-05, 4.918128252029419e-05, 5.2306801080703735e-05, 5.543231964111328e-05, 5.855783820152283e-05, 6.168335676193237e-05, 6.480887532234192e-05, 6.793439388275146e-05, 7.105991244316101e-05, 7.418543100357056e-05, 7.73109495639801e-05, 8.043646812438965e-05, 8.35619866847992e-05, 8.668750524520874e-05, 8.981302380561829e-05, 9.293854236602783e-05, 9.606406092643738e-05, 9.918957948684692e-05, 0.00010231509804725647, 0.00010544061660766602]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 5.0, 5.0, 8.0, 13.0, 12.0, 25.0, 41.0, 83.0, 146.0, 276.0, 613.0, 1727.0, 5590.0, 26733.0, 236267.0, 664280.0, 93282.0, 13880.0, 3394.0, 1194.0, 447.0, 226.0, 140.0, 73.0, 33.0, 25.0, 16.0, 14.0, 4.0, 3.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0826416015625, -0.07893753051757812, -0.07523345947265625, -0.07152938842773438, -0.0678253173828125, -0.06412124633789062, -0.06041717529296875, -0.056713104248046875, -0.053009033203125, -0.049304962158203125, -0.04560089111328125, -0.041896820068359375, -0.0381927490234375, -0.034488677978515625, -0.03078460693359375, -0.027080535888671875, -0.02337646484375, -0.019672393798828125, -0.01596832275390625, -0.012264251708984375, -0.0085601806640625, -0.004856109619140625, -0.00115203857421875, 0.002552032470703125, 0.006256103515625, 0.009960174560546875, 0.01366424560546875, 0.017368316650390625, 0.0210723876953125, 0.024776458740234375, 0.02848052978515625, 0.032184600830078125, 0.035888671875, 0.039592742919921875, 0.04329681396484375, 0.047000885009765625, 0.0507049560546875, 0.054409027099609375, 0.05811309814453125, 0.061817169189453125, 0.065521240234375, 0.06922531127929688, 0.07292938232421875, 0.07663345336914062, 0.0803375244140625, 0.08404159545898438, 0.08774566650390625, 0.09144973754882812, 0.09515380859375, 0.09885787963867188, 0.10256195068359375, 0.10626602172851562, 0.1099700927734375, 0.11367416381835938, 0.11737823486328125, 0.12108230590820312, 0.124786376953125, 0.12849044799804688, 0.13219451904296875, 0.13589859008789062, 0.1396026611328125, 0.14330673217773438, 0.14701080322265625, 0.15071487426757812, 0.1544189453125]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 7.0, 5.0, 9.0, 12.0, 22.0, 28.0, 41.0, 43.0, 46.0, 72.0, 120.0, 100.0, 108.0, 90.0, 73.0, 42.0, 54.0, 29.0, 28.0, 17.0, 14.0, 6.0, 8.0, 8.0, 5.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04693603515625, -0.04491138458251953, -0.04288673400878906, -0.040862083435058594, -0.038837432861328125, -0.036812782287597656, -0.03478813171386719, -0.03276348114013672, -0.03073883056640625, -0.02871417999267578, -0.026689529418945312, -0.024664878845214844, -0.022640228271484375, -0.020615577697753906, -0.018590927124023438, -0.01656627655029297, -0.0145416259765625, -0.012516975402832031, -0.010492324829101562, -0.008467674255371094, -0.006443023681640625, -0.004418373107910156, -0.0023937225341796875, -0.00036907196044921875, 0.00165557861328125, 0.0036802291870117188, 0.0057048797607421875, 0.007729530334472656, 0.009754180908203125, 0.011778831481933594, 0.013803482055664062, 0.01582813262939453, 0.017852783203125, 0.01987743377685547, 0.021902084350585938, 0.023926734924316406, 0.025951385498046875, 0.027976036071777344, 0.030000686645507812, 0.03202533721923828, 0.03404998779296875, 0.03607463836669922, 0.03809928894042969, 0.040123939514160156, 0.042148590087890625, 0.044173240661621094, 0.04619789123535156, 0.04822254180908203, 0.0502471923828125, 0.05227184295654297, 0.05429649353027344, 0.056321144104003906, 0.058345794677734375, 0.060370445251464844, 0.06239509582519531, 0.06441974639892578, 0.06644439697265625, 0.06846904754638672, 0.07049369812011719, 0.07251834869384766, 0.07454299926757812, 0.0765676498413086, 0.07859230041503906, 0.08061695098876953, 0.0826416015625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 11.0, 9.0, 37.0, 117.0, 300.0, 327.0, 152.0, 29.0, 13.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7799245715141296, -0.7462612390518188, -0.7125979661941528, -0.678934633731842, -0.6452713012695312, -0.6116080284118652, -0.5779446959495544, -0.5442813634872437, -0.5106180906295776, -0.47695478796958923, -0.44329145550727844, -0.40962815284729004, -0.37596482038497925, -0.34230151772499084, -0.30863821506500244, -0.27497488260269165, -0.24131155014038086, -0.20764823257923126, -0.17398491501808167, -0.14032161235809326, -0.10665829479694366, -0.07299497723579407, -0.039331674575805664, -0.005668357014656067, 0.02799496054649353, 0.06165827438235283, 0.09532158821821213, 0.12898489832878113, 0.16264821588993073, 0.19631153345108032, 0.22997483611106873, 0.26363813877105713, 0.29730141162872314, 0.33096471428871155, 0.36462804675102234, 0.39829134941101074, 0.43195468187332153, 0.46561798453330994, 0.49928128719329834, 0.5329446196556091, 0.5666079521179199, 0.6002712845802307, 0.6339345574378967, 0.6675978899002075, 0.7012612223625183, 0.7349245548248291, 0.7685878276824951, 0.8022511601448059, 0.8359144330024719, 0.8695777654647827, 0.9032410383224487, 0.9369043707847595, 0.9705677032470703, 1.0042309761047363, 1.0378942489624023, 1.071557641029358, 1.105220913887024, 1.13888418674469, 1.1725475788116455, 1.2062108516693115, 1.2398741245269775, 1.273537516593933, 1.3072007894515991, 1.3408640623092651, 1.3745274543762207]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 4.0, 4.0, 3.0, 6.0, 3.0, 9.0, 12.0, 9.0, 16.0, 26.0, 23.0, 50.0, 57.0, 58.0, 70.0, 85.0, 85.0, 75.0, 79.0, 71.0, 62.0, 51.0, 41.0, 22.0, 20.0, 15.0, 8.0, 8.0, 6.0, 4.0, 2.0, 2.0, 6.0, 0.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5281582474708557, -0.5105385184288025, -0.49291878938674927, -0.47529906034469604, -0.4576793313026428, -0.4400596022605896, -0.4224398732185364, -0.40482014417648315, -0.38720041513442993, -0.3695806860923767, -0.3519609570503235, -0.33434122800827026, -0.31672149896621704, -0.2991017699241638, -0.2814820408821106, -0.2638623118400574, -0.24624258279800415, -0.22862285375595093, -0.2110031247138977, -0.19338339567184448, -0.17576366662979126, -0.15814393758773804, -0.14052420854568481, -0.12290447950363159, -0.10528475046157837, -0.08766502141952515, -0.07004529237747192, -0.0524255633354187, -0.03480583429336548, -0.017186105251312256, 0.0004336237907409668, 0.01805335283279419, 0.03567302227020264, 0.05329275131225586, 0.07091248035430908, 0.0885322093963623, 0.10615193843841553, 0.12377166748046875, 0.14139139652252197, 0.1590111255645752, 0.17663085460662842, 0.19425058364868164, 0.21187031269073486, 0.22949004173278809, 0.2471097707748413, 0.26472949981689453, 0.28234922885894775, 0.299968957901001, 0.3175886869430542, 0.3352084159851074, 0.35282814502716064, 0.37044787406921387, 0.3880676031112671, 0.4056873321533203, 0.42330706119537354, 0.44092679023742676, 0.45854651927948, 0.4761662483215332, 0.4937859773635864, 0.5114057064056396, 0.5290254354476929, 0.5466451644897461, 0.5642648935317993, 0.5818846225738525, 0.5995043516159058]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 5.0, 4.0, 3.0, 1.0, 5.0, 9.0, 10.0, 17.0, 19.0, 16.0, 24.0, 42.0, 57.0, 109.0, 124.0, 193.0, 275.0, 468.0, 745.0, 1216.0, 2153.0, 4170.0, 9291.0, 28517.0, 190161.0, 3816619.0, 103852.0, 21157.0, 7206.0, 3358.0, 1722.0, 935.0, 576.0, 372.0, 247.0, 197.0, 130.0, 90.0, 61.0, 32.0, 29.0, 19.0, 13.0, 13.0, 7.0, 7.0, 6.0, 1.0, 1.0, 1.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.2208251953125, -0.2140045166015625, -0.207183837890625, -0.2003631591796875, -0.19354248046875, -0.1867218017578125, -0.179901123046875, -0.1730804443359375, -0.166259765625, -0.1594390869140625, -0.152618408203125, -0.1457977294921875, -0.13897705078125, -0.1321563720703125, -0.125335693359375, -0.1185150146484375, -0.1116943359375, -0.1048736572265625, -0.098052978515625, -0.0912322998046875, -0.08441162109375, -0.0775909423828125, -0.070770263671875, -0.0639495849609375, -0.05712890625, -0.0503082275390625, -0.043487548828125, -0.0366668701171875, -0.02984619140625, -0.0230255126953125, -0.016204833984375, -0.0093841552734375, -0.0025634765625, 0.0042572021484375, 0.011077880859375, 0.0178985595703125, 0.02471923828125, 0.0315399169921875, 0.038360595703125, 0.0451812744140625, 0.052001953125, 0.0588226318359375, 0.065643310546875, 0.0724639892578125, 0.07928466796875, 0.0861053466796875, 0.092926025390625, 0.0997467041015625, 0.1065673828125, 0.1133880615234375, 0.120208740234375, 0.1270294189453125, 0.13385009765625, 0.1406707763671875, 0.147491455078125, 0.1543121337890625, 0.1611328125, 0.1679534912109375, 0.174774169921875, 0.1815948486328125, 0.18841552734375, 0.1952362060546875, 0.202056884765625, 0.2088775634765625, 0.2156982421875]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 3.0, 0.0, 6.0, 5.0, 6.0, 7.0, 6.0, 7.0, 14.0, 18.0, 21.0, 42.0, 69.0, 126.0, 161.0, 164.0, 103.0, 86.0, 55.0, 28.0, 21.0, 13.0, 7.0, 7.0, 1.0, 8.0, 2.0, 2.0, 1.0, 6.0, 2.0, 1.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0203094482421875, -0.019712209701538086, -0.019114971160888672, -0.018517732620239258, -0.017920494079589844, -0.01732325553894043, -0.016726016998291016, -0.0161287784576416, -0.015531539916992188, -0.014934301376342773, -0.01433706283569336, -0.013739824295043945, -0.013142585754394531, -0.012545347213745117, -0.011948108673095703, -0.011350870132446289, -0.010753631591796875, -0.010156393051147461, -0.009559154510498047, -0.008961915969848633, -0.008364677429199219, -0.007767438888549805, -0.007170200347900391, -0.0065729618072509766, -0.0059757232666015625, -0.0053784847259521484, -0.004781246185302734, -0.00418400764465332, -0.0035867691040039062, -0.002989530563354492, -0.002392292022705078, -0.001795053482055664, -0.00119781494140625, -0.0006005764007568359, -3.337860107421875e-06, 0.0005939006805419922, 0.0011911392211914062, 0.0017883777618408203, 0.0023856163024902344, 0.0029828548431396484, 0.0035800933837890625, 0.0041773319244384766, 0.004774570465087891, 0.005371809005737305, 0.005969047546386719, 0.006566286087036133, 0.007163524627685547, 0.007760763168334961, 0.008358001708984375, 0.008955240249633789, 0.009552478790283203, 0.010149717330932617, 0.010746955871582031, 0.011344194412231445, 0.01194143295288086, 0.012538671493530273, 0.013135910034179688, 0.013733148574829102, 0.014330387115478516, 0.01492762565612793, 0.015524864196777344, 0.016122102737426758, 0.016719341278076172, 0.017316579818725586, 0.017913818359375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 5.0, 4.0, 9.0, 11.0, 21.0, 27.0, 39.0, 51.0, 162.0, 250.0, 758.0, 2444.0, 11059.0, 92705.0, 3811188.0, 250662.0, 19372.0, 3717.0, 993.0, 410.0, 156.0, 96.0, 44.0, 31.0, 18.0, 14.0, 7.0, 7.0, 8.0, 3.0, 0.0, 1.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32275390625, -0.3128700256347656, -0.30298614501953125, -0.2931022644042969, -0.2832183837890625, -0.2733345031738281, -0.26345062255859375, -0.2535667419433594, -0.243682861328125, -0.23379898071289062, -0.22391510009765625, -0.21403121948242188, -0.2041473388671875, -0.19426345825195312, -0.18437957763671875, -0.17449569702148438, -0.16461181640625, -0.15472793579101562, -0.14484405517578125, -0.13496017456054688, -0.1250762939453125, -0.11519241333007812, -0.10530853271484375, -0.09542465209960938, -0.085540771484375, -0.07565689086914062, -0.06577301025390625, -0.055889129638671875, -0.0460052490234375, -0.036121368408203125, -0.02623748779296875, -0.016353607177734375, -0.0064697265625, 0.003414154052734375, 0.01329803466796875, 0.023181915283203125, 0.0330657958984375, 0.042949676513671875, 0.05283355712890625, 0.06271743774414062, 0.072601318359375, 0.08248519897460938, 0.09236907958984375, 0.10225296020507812, 0.1121368408203125, 0.12202072143554688, 0.13190460205078125, 0.14178848266601562, 0.15167236328125, 0.16155624389648438, 0.17144012451171875, 0.18132400512695312, 0.1912078857421875, 0.20109176635742188, 0.21097564697265625, 0.22085952758789062, 0.230743408203125, 0.24062728881835938, 0.25051116943359375, 0.2603950500488281, 0.2702789306640625, 0.2801628112792969, 0.29004669189453125, 0.2999305725097656, 0.309814453125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 3.0, 4.0, 6.0, 5.0, 11.0, 14.0, 22.0, 17.0, 32.0, 38.0, 69.0, 97.0, 162.0, 270.0, 533.0, 1558.0, 525.0, 273.0, 129.0, 86.0, 62.0, 52.0, 26.0, 15.0, 12.0, 12.0, 9.0, 5.0, 5.0, 4.0, 3.0, 2.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0244293212890625, -0.02354121208190918, -0.02265310287475586, -0.02176499366760254, -0.02087688446044922, -0.0199887752532959, -0.019100666046142578, -0.018212556838989258, -0.017324447631835938, -0.016436338424682617, -0.015548229217529297, -0.014660120010375977, -0.013772010803222656, -0.012883901596069336, -0.011995792388916016, -0.011107683181762695, -0.010219573974609375, -0.009331464767456055, -0.008443355560302734, -0.007555246353149414, -0.006667137145996094, -0.0057790279388427734, -0.004890918731689453, -0.004002809524536133, -0.0031147003173828125, -0.002226591110229492, -0.0013384819030761719, -0.00045037269592285156, 0.00043773651123046875, 0.001325845718383789, 0.0022139549255371094, 0.0031020641326904297, 0.00399017333984375, 0.00487828254699707, 0.005766391754150391, 0.006654500961303711, 0.007542610168457031, 0.008430719375610352, 0.009318828582763672, 0.010206937789916992, 0.011095046997070312, 0.011983156204223633, 0.012871265411376953, 0.013759374618530273, 0.014647483825683594, 0.015535593032836914, 0.016423702239990234, 0.017311811447143555, 0.018199920654296875, 0.019088029861450195, 0.019976139068603516, 0.020864248275756836, 0.021752357482910156, 0.022640466690063477, 0.023528575897216797, 0.024416685104370117, 0.025304794311523438, 0.026192903518676758, 0.027081012725830078, 0.0279691219329834, 0.02885723114013672, 0.02974534034729004, 0.03063344955444336, 0.03152155876159668, 0.03240966796875]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 7.0, 2.0, 5.0, 13.0, 27.0, 38.0, 88.0, 154.0, 187.0, 201.0, 124.0, 91.0, 39.0, 11.0, 14.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17661650478839874, -0.1692686378955841, -0.16192075610160828, -0.15457288920879364, -0.147225022315979, -0.13987715542316437, -0.13252928853034973, -0.1251814067363739, -0.11783353984355927, -0.11048567295074463, -0.1031377986073494, -0.09578992426395416, -0.08844205737113953, -0.08109419047832489, -0.07374631613492966, -0.06639844179153442, -0.05905057489871979, -0.05170270428061485, -0.04435483366250992, -0.037006963044404984, -0.02965909242630005, -0.022311221808195114, -0.01496335119009018, -0.007615480571985245, -0.00026760995388031006, 0.007080260664224625, 0.01442813128232956, 0.021776001900434494, 0.02912387251853943, 0.03647174313664436, 0.0438196137547493, 0.05116748437285423, 0.05851536989212036, 0.065863236784935, 0.07321111112833023, 0.08055898547172546, 0.0879068523645401, 0.09525471925735474, 0.10260259360074997, 0.1099504679441452, 0.11729833483695984, 0.12464620172977448, 0.1319940686225891, 0.13934195041656494, 0.14668981730937958, 0.1540376842021942, 0.16138556599617004, 0.16873343288898468, 0.17608129978179932, 0.18342916667461395, 0.1907770335674286, 0.19812491536140442, 0.20547278225421906, 0.2128206491470337, 0.22016853094100952, 0.22751639783382416, 0.2348642647266388, 0.24221213161945343, 0.24955999851226807, 0.2569078803062439, 0.2642557621002197, 0.27160361409187317, 0.278951495885849, 0.28629934787750244, 0.29364722967147827]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 9.0, 9.0, 5.0, 11.0, 12.0, 16.0, 20.0, 31.0, 36.0, 36.0, 31.0, 55.0, 58.0, 58.0, 59.0, 48.0, 59.0, 53.0, 59.0, 59.0, 46.0, 41.0, 47.0, 22.0, 27.0, 19.0, 21.0, 17.0, 9.0, 6.0, 4.0, 4.0, 5.0, 2.0, 5.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13427317142486572, -0.1303783506155014, -0.12648354470729828, -0.12258872389793396, -0.11869390308856964, -0.11479908972978592, -0.1109042763710022, -0.10700945556163788, -0.10311464220285416, -0.09921982884407043, -0.09532500803470612, -0.0914301946759224, -0.08753538131713867, -0.08364056050777435, -0.07974574714899063, -0.07585093379020691, -0.07195611298084259, -0.06806129962205887, -0.06416647881269455, -0.06027166545391083, -0.05637684836983681, -0.05248203128576279, -0.048587217926979065, -0.044692400842905045, -0.040797583758831024, -0.036902766674757004, -0.03300794959068298, -0.02911313623189926, -0.02521831914782524, -0.02132350206375122, -0.01742868684232235, -0.013533871620893478, -0.009639054536819458, -0.005744238384068012, -0.0018494222313165665, 0.0020453939214348793, 0.005940210074186325, 0.009835027158260345, 0.013729842379689217, 0.017624657601118088, 0.021519474685192108, 0.02541429176926613, 0.029309106990695, 0.03320392221212387, 0.03709873929619789, 0.04099355638027191, 0.044888369739055634, 0.048783186823129654, 0.052678003907203674, 0.056572820991277695, 0.060467638075351715, 0.06436245143413544, 0.06825727224349976, 0.07215208560228348, 0.0760468989610672, 0.07994171977043152, 0.08383653312921524, 0.08773134648799896, 0.09162616729736328, 0.095520980656147, 0.09941579401493073, 0.10331061482429504, 0.10720542818307877, 0.11110024154186249, 0.1149950623512268]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 3.0, 6.0, 10.0, 10.0, 16.0, 28.0, 24.0, 36.0, 60.0, 74.0, 107.0, 210.0, 311.0, 510.0, 843.0, 1518.0, 2897.0, 5893.0, 13684.0, 40044.0, 193481.0, 595380.0, 138503.0, 32085.0, 11710.0, 5140.0, 2510.0, 1359.0, 764.0, 485.0, 278.0, 168.0, 124.0, 76.0, 50.0, 38.0, 38.0, 20.0, 17.0, 13.0, 14.0, 4.0, 1.0, 5.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.15185546875, -0.1473102569580078, -0.14276504516601562, -0.13821983337402344, -0.13367462158203125, -0.12912940979003906, -0.12458419799804688, -0.12003898620605469, -0.1154937744140625, -0.11094856262207031, -0.10640335083007812, -0.10185813903808594, -0.09731292724609375, -0.09276771545410156, -0.08822250366210938, -0.08367729187011719, -0.079132080078125, -0.07458686828613281, -0.07004165649414062, -0.06549644470214844, -0.06095123291015625, -0.05640602111816406, -0.051860809326171875, -0.04731559753417969, -0.0427703857421875, -0.03822517395019531, -0.033679962158203125, -0.029134750366210938, -0.02458953857421875, -0.020044326782226562, -0.015499114990234375, -0.010953903198242188, -0.00640869140625, -0.0018634796142578125, 0.002681732177734375, 0.0072269439697265625, 0.01177215576171875, 0.016317367553710938, 0.020862579345703125, 0.025407791137695312, 0.0299530029296875, 0.03449821472167969, 0.039043426513671875, 0.04358863830566406, 0.04813385009765625, 0.05267906188964844, 0.057224273681640625, 0.06176948547363281, 0.066314697265625, 0.07085990905761719, 0.07540512084960938, 0.07995033264160156, 0.08449554443359375, 0.08904075622558594, 0.09358596801757812, 0.09813117980957031, 0.1026763916015625, 0.10722160339355469, 0.11176681518554688, 0.11631202697753906, 0.12085723876953125, 0.12540245056152344, 0.12994766235351562, 0.1344928741455078, 0.1390380859375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 6.0, 4.0, 4.0, 11.0, 15.0, 19.0, 29.0, 40.0, 67.0, 102.0, 129.0, 146.0, 139.0, 101.0, 59.0, 48.0, 32.0, 15.0, 6.0, 8.0, 3.0, 4.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0225830078125, -0.021944284439086914, -0.021305561065673828, -0.020666837692260742, -0.020028114318847656, -0.01938939094543457, -0.018750667572021484, -0.0181119441986084, -0.017473220825195312, -0.016834497451782227, -0.01619577407836914, -0.015557050704956055, -0.014918327331542969, -0.014279603958129883, -0.013640880584716797, -0.013002157211303711, -0.012363433837890625, -0.011724710464477539, -0.011085987091064453, -0.010447263717651367, -0.009808540344238281, -0.009169816970825195, -0.00853109359741211, -0.007892370223999023, -0.0072536468505859375, -0.0066149234771728516, -0.005976200103759766, -0.00533747673034668, -0.004698753356933594, -0.004060029983520508, -0.003421306610107422, -0.002782583236694336, -0.00214385986328125, -0.001505136489868164, -0.0008664131164550781, -0.0002276897430419922, 0.00041103363037109375, 0.0010497570037841797, 0.0016884803771972656, 0.0023272037506103516, 0.0029659271240234375, 0.0036046504974365234, 0.004243373870849609, 0.004882097244262695, 0.005520820617675781, 0.006159543991088867, 0.006798267364501953, 0.007436990737915039, 0.008075714111328125, 0.008714437484741211, 0.009353160858154297, 0.009991884231567383, 0.010630607604980469, 0.011269330978393555, 0.01190805435180664, 0.012546777725219727, 0.013185501098632812, 0.013824224472045898, 0.014462947845458984, 0.01510167121887207, 0.015740394592285156, 0.016379117965698242, 0.017017841339111328, 0.017656564712524414, 0.0182952880859375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 10.0, 4.0, 8.0, 9.0, 10.0, 11.0, 26.0, 34.0, 49.0, 58.0, 79.0, 108.0, 178.0, 257.0, 412.0, 693.0, 1507.0, 3670.0, 11741.0, 48807.0, 249124.0, 523580.0, 161994.0, 32004.0, 8416.0, 2899.0, 1223.0, 609.0, 370.0, 210.0, 157.0, 92.0, 68.0, 46.0, 29.0, 21.0, 9.0, 11.0, 6.0, 6.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.1474609375, -0.14304161071777344, -0.13862228393554688, -0.1342029571533203, -0.12978363037109375, -0.1253643035888672, -0.12094497680664062, -0.11652565002441406, -0.1121063232421875, -0.10768699645996094, -0.10326766967773438, -0.09884834289550781, -0.09442901611328125, -0.09000968933105469, -0.08559036254882812, -0.08117103576660156, -0.076751708984375, -0.07233238220214844, -0.06791305541992188, -0.06349372863769531, -0.05907440185546875, -0.05465507507324219, -0.050235748291015625, -0.04581642150878906, -0.0413970947265625, -0.03697776794433594, -0.032558441162109375, -0.028139114379882812, -0.02371978759765625, -0.019300460815429688, -0.014881134033203125, -0.010461807250976562, -0.00604248046875, -0.0016231536865234375, 0.002796173095703125, 0.0072154998779296875, 0.01163482666015625, 0.016054153442382812, 0.020473480224609375, 0.024892807006835938, 0.0293121337890625, 0.03373146057128906, 0.038150787353515625, 0.04257011413574219, 0.04698944091796875, 0.05140876770019531, 0.055828094482421875, 0.06024742126464844, 0.064666748046875, 0.06908607482910156, 0.07350540161132812, 0.07792472839355469, 0.08234405517578125, 0.08676338195800781, 0.09118270874023438, 0.09560203552246094, 0.1000213623046875, 0.10444068908691406, 0.10886001586914062, 0.11327934265136719, 0.11769866943359375, 0.12211799621582031, 0.12653732299804688, 0.13095664978027344, 0.1353759765625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 5.0, 7.0, 15.0, 12.0, 8.0, 8.0, 14.0, 12.0, 13.0, 23.0, 16.0, 23.0, 25.0, 32.0, 28.0, 40.0, 42.0, 36.0, 39.0, 44.0, 40.0, 39.0, 59.0, 52.0, 45.0, 33.0, 38.0, 30.0, 28.0, 23.0, 25.0, 23.0, 17.0, 15.0, 20.0, 17.0, 7.0, 10.0, 13.0, 7.0, 3.0, 1.0, 4.0, 1.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.05181884765625, -0.05005359649658203, -0.04828834533691406, -0.046523094177246094, -0.044757843017578125, -0.042992591857910156, -0.04122734069824219, -0.03946208953857422, -0.03769683837890625, -0.03593158721923828, -0.03416633605957031, -0.032401084899902344, -0.030635833740234375, -0.028870582580566406, -0.027105331420898438, -0.02534008026123047, -0.0235748291015625, -0.02180957794189453, -0.020044326782226562, -0.018279075622558594, -0.016513824462890625, -0.014748573303222656, -0.012983322143554688, -0.011218070983886719, -0.00945281982421875, -0.007687568664550781, -0.0059223175048828125, -0.004157066345214844, -0.002391815185546875, -0.0006265640258789062, 0.0011386871337890625, 0.0029039382934570312, 0.004669189453125, 0.006434440612792969, 0.008199691772460938, 0.009964942932128906, 0.011730194091796875, 0.013495445251464844, 0.015260696411132812, 0.01702594757080078, 0.01879119873046875, 0.02055644989013672, 0.022321701049804688, 0.024086952209472656, 0.025852203369140625, 0.027617454528808594, 0.029382705688476562, 0.03114795684814453, 0.0329132080078125, 0.03467845916748047, 0.03644371032714844, 0.038208961486816406, 0.039974212646484375, 0.041739463806152344, 0.04350471496582031, 0.04526996612548828, 0.04703521728515625, 0.04880046844482422, 0.05056571960449219, 0.052330970764160156, 0.054096221923828125, 0.055861473083496094, 0.05762672424316406, 0.05939197540283203, 0.0611572265625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 7.0, 11.0, 7.0, 16.0, 28.0, 42.0, 53.0, 100.0, 153.0, 281.0, 428.0, 830.0, 1603.0, 3636.0, 9191.0, 28631.0, 134838.0, 634739.0, 180628.0, 34472.0, 10798.0, 4141.0, 1796.0, 871.0, 504.0, 266.0, 191.0, 106.0, 65.0, 34.0, 29.0, 22.0, 13.0, 6.0, 8.0, 7.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12939453125, -0.12516212463378906, -0.12092971801757812, -0.11669731140136719, -0.11246490478515625, -0.10823249816894531, -0.10400009155273438, -0.09976768493652344, -0.0955352783203125, -0.09130287170410156, -0.08707046508789062, -0.08283805847167969, -0.07860565185546875, -0.07437324523925781, -0.07014083862304688, -0.06590843200683594, -0.061676025390625, -0.05744361877441406, -0.053211212158203125, -0.04897880554199219, -0.04474639892578125, -0.04051399230957031, -0.036281585693359375, -0.03204917907714844, -0.0278167724609375, -0.023584365844726562, -0.019351959228515625, -0.015119552612304688, -0.01088714599609375, -0.0066547393798828125, -0.002422332763671875, 0.0018100738525390625, 0.00604248046875, 0.010274887084960938, 0.014507293701171875, 0.018739700317382812, 0.02297210693359375, 0.027204513549804688, 0.031436920166015625, 0.03566932678222656, 0.0399017333984375, 0.04413414001464844, 0.048366546630859375, 0.05259895324707031, 0.05683135986328125, 0.06106376647949219, 0.06529617309570312, 0.06952857971191406, 0.073760986328125, 0.07799339294433594, 0.08222579956054688, 0.08645820617675781, 0.09069061279296875, 0.09492301940917969, 0.09915542602539062, 0.10338783264160156, 0.1076202392578125, 0.11185264587402344, 0.11608505249023438, 0.12031745910644531, 0.12454986572265625, 0.1287822723388672, 0.13301467895507812, 0.13724708557128906, 0.1414794921875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 2.0, 6.0, 2.0, 4.0, 10.0, 11.0, 10.0, 19.0, 27.0, 19.0, 21.0, 33.0, 43.0, 50.0, 78.0, 80.0, 87.0, 84.0, 64.0, 70.0, 55.0, 46.0, 29.0, 39.0, 20.0, 28.0, 15.0, 13.0, 4.0, 13.0, 5.0, 5.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.051229476928711e-05, -6.824173033237457e-05, -6.597116589546204e-05, -6.37006014585495e-05, -6.143003702163696e-05, -5.9159472584724426e-05, -5.688890814781189e-05, -5.461834371089935e-05, -5.2347779273986816e-05, -5.007721483707428e-05, -4.780665040016174e-05, -4.5536085963249207e-05, -4.326552152633667e-05, -4.099495708942413e-05, -3.87243926525116e-05, -3.645382821559906e-05, -3.4183263778686523e-05, -3.191269934177399e-05, -2.964213490486145e-05, -2.7371570467948914e-05, -2.5101006031036377e-05, -2.283044159412384e-05, -2.0559877157211304e-05, -1.8289312720298767e-05, -1.601874828338623e-05, -1.3748183846473694e-05, -1.1477619409561157e-05, -9.20705497264862e-06, -6.936490535736084e-06, -4.665926098823547e-06, -2.3953616619110107e-06, -1.2479722499847412e-07, 2.1457672119140625e-06, 4.416331648826599e-06, 6.686896085739136e-06, 8.957460522651672e-06, 1.1228024959564209e-05, 1.3498589396476746e-05, 1.5769153833389282e-05, 1.803971827030182e-05, 2.0310282707214355e-05, 2.2580847144126892e-05, 2.485141158103943e-05, 2.7121976017951965e-05, 2.9392540454864502e-05, 3.166310489177704e-05, 3.3933669328689575e-05, 3.620423376560211e-05, 3.847479820251465e-05, 4.0745362639427185e-05, 4.301592707633972e-05, 4.528649151325226e-05, 4.7557055950164795e-05, 4.982762038707733e-05, 5.209818482398987e-05, 5.4368749260902405e-05, 5.663931369781494e-05, 5.890987813472748e-05, 6.118044257164001e-05, 6.345100700855255e-05, 6.572157144546509e-05, 6.799213588237762e-05, 7.026270031929016e-05, 7.25332647562027e-05, 7.480382919311523e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 4.0, 1.0, 6.0, 7.0, 6.0, 10.0, 9.0, 9.0, 18.0, 17.0, 20.0, 35.0, 57.0, 83.0, 108.0, 164.0, 337.0, 683.0, 1704.0, 4488.0, 14204.0, 69194.0, 700084.0, 217735.0, 27385.0, 7447.0, 2543.0, 1008.0, 462.0, 266.0, 131.0, 110.0, 58.0, 43.0, 18.0, 23.0, 16.0, 14.0, 5.0, 8.0, 9.0, 7.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0], "bins": [-0.200927734375, -0.1951427459716797, -0.18935775756835938, -0.18357276916503906, -0.17778778076171875, -0.17200279235839844, -0.16621780395507812, -0.1604328155517578, -0.1546478271484375, -0.1488628387451172, -0.14307785034179688, -0.13729286193847656, -0.13150787353515625, -0.12572288513183594, -0.11993789672851562, -0.11415290832519531, -0.108367919921875, -0.10258293151855469, -0.09679794311523438, -0.09101295471191406, -0.08522796630859375, -0.07944297790527344, -0.07365798950195312, -0.06787300109863281, -0.0620880126953125, -0.05630302429199219, -0.050518035888671875, -0.04473304748535156, -0.03894805908203125, -0.03316307067871094, -0.027378082275390625, -0.021593093872070312, -0.01580810546875, -0.010023117065429688, -0.004238128662109375, 0.0015468597412109375, 0.00733184814453125, 0.013116836547851562, 0.018901824951171875, 0.024686813354492188, 0.0304718017578125, 0.03625679016113281, 0.042041778564453125, 0.04782676696777344, 0.05361175537109375, 0.05939674377441406, 0.06518173217773438, 0.07096672058105469, 0.076751708984375, 0.08253669738769531, 0.08832168579101562, 0.09410667419433594, 0.09989166259765625, 0.10567665100097656, 0.11146163940429688, 0.11724662780761719, 0.1230316162109375, 0.1288166046142578, 0.13460159301757812, 0.14038658142089844, 0.14617156982421875, 0.15195655822753906, 0.15774154663085938, 0.1635265350341797, 0.1693115234375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 2.0, 4.0, 2.0, 3.0, 5.0, 3.0, 1.0, 3.0, 5.0, 10.0, 12.0, 8.0, 12.0, 20.0, 27.0, 50.0, 57.0, 90.0, 87.0, 127.0, 104.0, 85.0, 71.0, 55.0, 37.0, 33.0, 27.0, 11.0, 13.0, 5.0, 4.0, 6.0, 8.0, 7.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06842041015625, -0.06611824035644531, -0.06381607055664062, -0.06151390075683594, -0.05921173095703125, -0.05690956115722656, -0.054607391357421875, -0.05230522155761719, -0.0500030517578125, -0.04770088195800781, -0.045398712158203125, -0.04309654235839844, -0.04079437255859375, -0.03849220275878906, -0.036190032958984375, -0.03388786315917969, -0.031585693359375, -0.029283523559570312, -0.026981353759765625, -0.024679183959960938, -0.02237701416015625, -0.020074844360351562, -0.017772674560546875, -0.015470504760742188, -0.0131683349609375, -0.010866165161132812, -0.008563995361328125, -0.0062618255615234375, -0.00395965576171875, -0.0016574859619140625, 0.000644683837890625, 0.0029468536376953125, 0.0052490234375, 0.0075511932373046875, 0.009853363037109375, 0.012155532836914062, 0.01445770263671875, 0.016759872436523438, 0.019062042236328125, 0.021364212036132812, 0.0236663818359375, 0.025968551635742188, 0.028270721435546875, 0.030572891235351562, 0.03287506103515625, 0.03517723083496094, 0.037479400634765625, 0.03978157043457031, 0.042083740234375, 0.04438591003417969, 0.046688079833984375, 0.04899024963378906, 0.05129241943359375, 0.05359458923339844, 0.055896759033203125, 0.05819892883300781, 0.0605010986328125, 0.06280326843261719, 0.06510543823242188, 0.06740760803222656, 0.06970977783203125, 0.07201194763183594, 0.07431411743164062, 0.07661628723144531, 0.07891845703125]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 11.0, 31.0, 168.0, 410.0, 281.0, 71.0, 20.0, 7.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3670365810394287, -1.2896817922592163, -1.2123271226882935, -1.134972333908081, -1.0576175451278687, -0.980262815952301, -0.9029080867767334, -0.825553297996521, -0.7481985688209534, -0.6708438396453857, -0.5934890508651733, -0.5161343216896057, -0.4387795627117157, -0.3614248037338257, -0.28407007455825806, -0.20671528577804565, -0.12936055660247803, -0.05200580507516861, 0.025348946452140808, 0.10270369052886963, 0.18005844950675964, 0.25741320848464966, 0.3347679376602173, 0.4121227264404297, 0.4894774556159973, 0.5668321847915649, 0.6441869735717773, 0.721541702747345, 0.7988964319229126, 0.876251220703125, 0.9536059498786926, 1.0309607982635498, 1.1083154678344727, 1.185670256614685, 1.263024926185608, 1.3403797149658203, 1.4177345037460327, 1.4950892925262451, 1.572443962097168, 1.6497987508773804, 1.7271535396575928, 1.8045083284378052, 1.881862998008728, 1.9592177867889404, 2.0365724563598633, 2.1139273643493652, 2.191282033920288, 2.268636703491211, 2.345991611480713, 2.4233462810516357, 2.5007011890411377, 2.5780558586120605, 2.6554105281829834, 2.7327654361724854, 2.810120105743408, 2.88747501373291, 2.964829444885254, 3.0421841144561768, 3.1195390224456787, 3.1968936920166016, 3.2742483615875244, 3.3516032695770264, 3.428957939147949, 3.506312847137451, 3.583667516708374]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 10.0, 5.0, 16.0, 12.0, 10.0, 12.0, 18.0, 22.0, 18.0, 25.0, 29.0, 36.0, 34.0, 45.0, 40.0, 49.0, 42.0, 38.0, 44.0, 58.0, 55.0, 49.0, 40.0, 45.0, 31.0, 44.0, 27.0, 24.0, 24.0, 22.0, 16.0, 12.0, 8.0, 13.0, 9.0, 5.0, 7.0, 4.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5400216579437256, -0.5233773589134216, -0.5067330002784729, -0.49008867144584656, -0.4734443426132202, -0.45680004358291626, -0.4401557147502899, -0.4235113859176636, -0.40686705708503723, -0.3902227282524109, -0.37357839941978455, -0.3569340705871582, -0.34028977155685425, -0.3236454129219055, -0.30700111389160156, -0.2903567850589752, -0.2737124562263489, -0.25706812739372253, -0.2404237985610962, -0.22377948462963104, -0.2071351557970047, -0.19049082696437836, -0.1738465130329132, -0.15720218420028687, -0.14055785536766052, -0.12391352653503418, -0.10726920515298843, -0.09062488377094269, -0.07398055493831635, -0.05733622610569, -0.04069190472364426, -0.02404758334159851, -0.007403194904327393, 0.009241130203008652, 0.025885455310344696, 0.04252978041768074, 0.059174105525016785, 0.07581843435764313, 0.09246275573968887, 0.10910707712173462, 0.12575140595436096, 0.1423957347869873, 0.15904006361961365, 0.1756843775510788, 0.19232870638370514, 0.20897303521633148, 0.22561734914779663, 0.24226167798042297, 0.2589060068130493, 0.27555033564567566, 0.292194664478302, 0.30883899331092834, 0.3254833221435547, 0.34212762117385864, 0.358771950006485, 0.37541627883911133, 0.39206060767173767, 0.408704936504364, 0.42534926533699036, 0.4419935941696167, 0.45863789319992065, 0.4752822518348694, 0.49192655086517334, 0.5085709095001221, 0.525215208530426]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 1.0, 7.0, 3.0, 2.0, 10.0, 18.0, 17.0, 29.0, 47.0, 85.0, 195.0, 301.0, 724.0, 2168.0, 9740.0, 143502.0, 3992187.0, 38208.0, 4921.0, 1217.0, 453.0, 206.0, 100.0, 55.0, 36.0, 17.0, 15.0, 6.0, 3.0, 5.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.5078125, -0.4945564270019531, -0.48130035400390625, -0.4680442810058594, -0.4547882080078125, -0.4415321350097656, -0.42827606201171875, -0.4150199890136719, -0.401763916015625, -0.3885078430175781, -0.37525177001953125, -0.3619956970214844, -0.3487396240234375, -0.3354835510253906, -0.32222747802734375, -0.3089714050292969, -0.29571533203125, -0.2824592590332031, -0.26920318603515625, -0.2559471130371094, -0.2426910400390625, -0.22943496704101562, -0.21617889404296875, -0.20292282104492188, -0.189666748046875, -0.17641067504882812, -0.16315460205078125, -0.14989852905273438, -0.1366424560546875, -0.12338638305664062, -0.11013031005859375, -0.09687423706054688, -0.0836181640625, -0.07036209106445312, -0.05710601806640625, -0.043849945068359375, -0.0305938720703125, -0.017337799072265625, -0.00408172607421875, 0.009174346923828125, 0.022430419921875, 0.035686492919921875, 0.04894256591796875, 0.062198638916015625, 0.0754547119140625, 0.08871078491210938, 0.10196685791015625, 0.11522293090820312, 0.12847900390625, 0.14173507690429688, 0.15499114990234375, 0.16824722290039062, 0.1815032958984375, 0.19475936889648438, 0.20801544189453125, 0.22127151489257812, 0.234527587890625, 0.24778366088867188, 0.26103973388671875, 0.2742958068847656, 0.2875518798828125, 0.3008079528808594, 0.31406402587890625, 0.3273200988769531, 0.340576171875]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 3.0, 6.0, 8.0, 17.0, 32.0, 27.0, 44.0, 54.0, 79.0, 70.0, 92.0, 96.0, 100.0, 100.0, 77.0, 56.0, 35.0, 25.0, 19.0, 18.0, 11.0, 4.0, 6.0, 4.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.022918701171875, -0.022288799285888672, -0.021658897399902344, -0.021028995513916016, -0.020399093627929688, -0.01976919174194336, -0.01913928985595703, -0.018509387969970703, -0.017879486083984375, -0.017249584197998047, -0.01661968231201172, -0.01598978042602539, -0.015359878540039062, -0.014729976654052734, -0.014100074768066406, -0.013470172882080078, -0.01284027099609375, -0.012210369110107422, -0.011580467224121094, -0.010950565338134766, -0.010320663452148438, -0.00969076156616211, -0.009060859680175781, -0.008430957794189453, -0.007801055908203125, -0.007171154022216797, -0.006541252136230469, -0.005911350250244141, -0.0052814483642578125, -0.004651546478271484, -0.004021644592285156, -0.003391742706298828, -0.0027618408203125, -0.002131938934326172, -0.0015020370483398438, -0.0008721351623535156, -0.0002422332763671875, 0.0003876686096191406, 0.0010175704956054688, 0.0016474723815917969, 0.002277374267578125, 0.002907276153564453, 0.0035371780395507812, 0.004167079925537109, 0.0047969818115234375, 0.005426883697509766, 0.006056785583496094, 0.006686687469482422, 0.00731658935546875, 0.007946491241455078, 0.008576393127441406, 0.009206295013427734, 0.009836196899414062, 0.01046609878540039, 0.011096000671386719, 0.011725902557373047, 0.012355804443359375, 0.012985706329345703, 0.013615608215332031, 0.01424551010131836, 0.014875411987304688, 0.015505313873291016, 0.016135215759277344, 0.016765117645263672, 0.01739501953125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 8.0, 13.0, 19.0, 30.0, 47.0, 81.0, 118.0, 186.0, 360.0, 812.0, 2172.0, 7148.0, 31236.0, 247773.0, 3633773.0, 228610.0, 30587.0, 7267.0, 2200.0, 880.0, 422.0, 210.0, 114.0, 80.0, 56.0, 23.0, 19.0, 12.0, 13.0, 5.0, 6.0, 6.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.20458984375, -0.1978778839111328, -0.19116592407226562, -0.18445396423339844, -0.17774200439453125, -0.17103004455566406, -0.16431808471679688, -0.1576061248779297, -0.1508941650390625, -0.1441822052001953, -0.13747024536132812, -0.13075828552246094, -0.12404632568359375, -0.11733436584472656, -0.11062240600585938, -0.10391044616699219, -0.097198486328125, -0.09048652648925781, -0.08377456665039062, -0.07706260681152344, -0.07035064697265625, -0.06363868713378906, -0.056926727294921875, -0.05021476745605469, -0.0435028076171875, -0.03679084777832031, -0.030078887939453125, -0.023366928100585938, -0.01665496826171875, -0.009943008422851562, -0.003231048583984375, 0.0034809112548828125, 0.01019287109375, 0.016904830932617188, 0.023616790771484375, 0.030328750610351562, 0.03704071044921875, 0.04375267028808594, 0.050464630126953125, 0.05717658996582031, 0.0638885498046875, 0.07060050964355469, 0.07731246948242188, 0.08402442932128906, 0.09073638916015625, 0.09744834899902344, 0.10416030883789062, 0.11087226867675781, 0.117584228515625, 0.12429618835449219, 0.13100814819335938, 0.13772010803222656, 0.14443206787109375, 0.15114402770996094, 0.15785598754882812, 0.1645679473876953, 0.1712799072265625, 0.1779918670654297, 0.18470382690429688, 0.19141578674316406, 0.19812774658203125, 0.20483970642089844, 0.21155166625976562, 0.2182636260986328, 0.2249755859375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 7.0, 4.0, 7.0, 8.0, 12.0, 29.0, 29.0, 53.0, 88.0, 171.0, 339.0, 1370.0, 1192.0, 310.0, 165.0, 87.0, 70.0, 54.0, 25.0, 19.0, 12.0, 7.0, 5.0, 4.0, 5.0, 4.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.034027099609375, -0.0326085090637207, -0.031189918518066406, -0.02977132797241211, -0.028352737426757812, -0.026934146881103516, -0.02551555633544922, -0.024096965789794922, -0.022678375244140625, -0.021259784698486328, -0.01984119415283203, -0.018422603607177734, -0.017004013061523438, -0.01558542251586914, -0.014166831970214844, -0.012748241424560547, -0.01132965087890625, -0.009911060333251953, -0.008492469787597656, -0.007073879241943359, -0.0056552886962890625, -0.004236698150634766, -0.0028181076049804688, -0.0013995170593261719, 1.9073486328125e-05, 0.0014376640319824219, 0.0028562545776367188, 0.004274845123291016, 0.0056934356689453125, 0.007112026214599609, 0.008530616760253906, 0.009949207305908203, 0.0113677978515625, 0.012786388397216797, 0.014204978942871094, 0.01562356948852539, 0.017042160034179688, 0.018460750579833984, 0.01987934112548828, 0.021297931671142578, 0.022716522216796875, 0.024135112762451172, 0.02555370330810547, 0.026972293853759766, 0.028390884399414062, 0.02980947494506836, 0.031228065490722656, 0.03264665603637695, 0.03406524658203125, 0.03548383712768555, 0.036902427673339844, 0.03832101821899414, 0.03973960876464844, 0.041158199310302734, 0.04257678985595703, 0.04399538040161133, 0.045413970947265625, 0.04683256149291992, 0.04825115203857422, 0.049669742584228516, 0.05108833312988281, 0.05250692367553711, 0.053925514221191406, 0.0553441047668457, 0.0567626953125]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 8.0, 9.0, 33.0, 56.0, 108.0, 163.0, 189.0, 156.0, 118.0, 75.0, 39.0, 22.0, 10.0, 9.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3375924527645111, -0.32863524556159973, -0.31967806816101074, -0.31072086095809937, -0.301763653755188, -0.292806476354599, -0.2838492691516876, -0.27489209175109863, -0.26593488454818726, -0.2569776773452759, -0.2480204850435257, -0.2390632927417755, -0.23010610044002533, -0.22114890813827515, -0.21219170093536377, -0.2032345086336136, -0.1942773014307022, -0.18532010912895203, -0.17636290192604065, -0.16740570962429047, -0.15844851732254028, -0.1494913101196289, -0.14053411781787872, -0.13157692551612854, -0.12261972576379776, -0.11366252601146698, -0.1047053337097168, -0.09574813395738602, -0.08679093420505524, -0.07783374190330505, -0.06887654215097427, -0.05991934984922409, -0.05096215009689331, -0.04200495406985283, -0.03304775804281235, -0.024090558290481567, -0.015133362263441086, -0.006176166236400604, 0.0027810335159301758, 0.011738225817680359, 0.02069542557001114, 0.02965262159705162, 0.0386098176240921, 0.04756701737642288, 0.056524213403463364, 0.06548140943050385, 0.07443860918283463, 0.08339580148458481, 0.09235300123691559, 0.10131020098924637, 0.11026739329099655, 0.11922459304332733, 0.12818178534507751, 0.1371389925479889, 0.14609618484973907, 0.15505337715148926, 0.16401058435440063, 0.17296777665615082, 0.1819249838590622, 0.19088217616081238, 0.19983936846256256, 0.20879656076431274, 0.21775376796722412, 0.2267109602689743, 0.2356681525707245]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 6.0, 2.0, 5.0, 2.0, 2.0, 5.0, 3.0, 7.0, 7.0, 8.0, 16.0, 17.0, 21.0, 19.0, 20.0, 23.0, 23.0, 25.0, 28.0, 26.0, 43.0, 43.0, 42.0, 40.0, 43.0, 35.0, 34.0, 44.0, 42.0, 48.0, 41.0, 43.0, 34.0, 35.0, 19.0, 23.0, 30.0, 10.0, 9.0, 20.0, 16.0, 12.0, 12.0, 6.0, 7.0, 6.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10585081577301025, -0.10256566107273102, -0.09928051382303238, -0.09599536657333374, -0.0927102118730545, -0.08942505717277527, -0.08613990992307663, -0.08285476267337799, -0.07956960797309875, -0.07628445327281952, -0.07299930602312088, -0.06971415877342224, -0.066429004073143, -0.06314384937286377, -0.05985870212316513, -0.05657355114817619, -0.053288400173187256, -0.05000324919819832, -0.04671809822320938, -0.043432947248220444, -0.040147796273231506, -0.03686264529824257, -0.03357749432325363, -0.030292343348264694, -0.027007192373275757, -0.02372204139828682, -0.020436890423297882, -0.017151739448308945, -0.013866588473320007, -0.01058143749833107, -0.007296286523342133, -0.004011135548353195, -0.0007259845733642578, 0.0025591664016246796, 0.005844317376613617, 0.009129468351602554, 0.012414619326591492, 0.01569977030158043, 0.018984921276569366, 0.022270072251558304, 0.02555522322654724, 0.02884037420153618, 0.032125525176525116, 0.03541067615151405, 0.03869582712650299, 0.04198097810149193, 0.045266129076480865, 0.0485512800514698, 0.05183643102645874, 0.05512158200144768, 0.058406732976436615, 0.06169188395142555, 0.06497703492641449, 0.06826218962669373, 0.07154733687639236, 0.074832484126091, 0.07811763882637024, 0.08140279352664948, 0.08468794077634811, 0.08797308802604675, 0.09125824272632599, 0.09454339742660522, 0.09782854467630386, 0.1011136919260025, 0.10439884662628174]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 0.0, 3.0, 2.0, 8.0, 5.0, 2.0, 9.0, 13.0, 23.0, 21.0, 37.0, 41.0, 85.0, 119.0, 168.0, 287.0, 472.0, 725.0, 1281.0, 2579.0, 5438.0, 14161.0, 43780.0, 165267.0, 469187.0, 247590.0, 63758.0, 19405.0, 7064.0, 3188.0, 1647.0, 858.0, 486.0, 297.0, 189.0, 133.0, 86.0, 45.0, 29.0, 25.0, 11.0, 9.0, 12.0, 11.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10992431640625, -0.10594844818115234, -0.10197257995605469, -0.09799671173095703, -0.09402084350585938, -0.09004497528076172, -0.08606910705566406, -0.0820932388305664, -0.07811737060546875, -0.0741415023803711, -0.07016563415527344, -0.06618976593017578, -0.062213897705078125, -0.05823802947998047, -0.05426216125488281, -0.050286293029785156, -0.0463104248046875, -0.042334556579589844, -0.03835868835449219, -0.03438282012939453, -0.030406951904296875, -0.02643108367919922, -0.022455215454101562, -0.018479347229003906, -0.01450347900390625, -0.010527610778808594, -0.0065517425537109375, -0.0025758743286132812, 0.001399993896484375, 0.005375862121582031, 0.009351730346679688, 0.013327598571777344, 0.017303466796875, 0.021279335021972656, 0.025255203247070312, 0.02923107147216797, 0.033206939697265625, 0.03718280792236328, 0.04115867614746094, 0.045134544372558594, 0.04911041259765625, 0.053086280822753906, 0.05706214904785156, 0.06103801727294922, 0.06501388549804688, 0.06898975372314453, 0.07296562194824219, 0.07694149017333984, 0.0809173583984375, 0.08489322662353516, 0.08886909484863281, 0.09284496307373047, 0.09682083129882812, 0.10079669952392578, 0.10477256774902344, 0.1087484359741211, 0.11272430419921875, 0.1167001724243164, 0.12067604064941406, 0.12465190887451172, 0.12862777709960938, 0.13260364532470703, 0.1365795135498047, 0.14055538177490234, 0.14453125]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 8.0, 10.0, 4.0, 9.0, 14.0, 20.0, 32.0, 34.0, 50.0, 61.0, 72.0, 88.0, 80.0, 82.0, 78.0, 74.0, 62.0, 50.0, 49.0, 28.0, 30.0, 17.0, 16.0, 9.0, 4.0, 6.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.021697998046875, -0.02113056182861328, -0.020563125610351562, -0.019995689392089844, -0.019428253173828125, -0.018860816955566406, -0.018293380737304688, -0.01772594451904297, -0.01715850830078125, -0.01659107208251953, -0.016023635864257812, -0.015456199645996094, -0.014888763427734375, -0.014321327209472656, -0.013753890991210938, -0.013186454772949219, -0.0126190185546875, -0.012051582336425781, -0.011484146118164062, -0.010916709899902344, -0.010349273681640625, -0.009781837463378906, -0.009214401245117188, -0.008646965026855469, -0.00807952880859375, -0.007512092590332031, -0.0069446563720703125, -0.006377220153808594, -0.005809783935546875, -0.005242347717285156, -0.0046749114990234375, -0.004107475280761719, -0.0035400390625, -0.0029726028442382812, -0.0024051666259765625, -0.0018377304077148438, -0.001270294189453125, -0.0007028579711914062, -0.0001354217529296875, 0.00043201446533203125, 0.00099945068359375, 0.0015668869018554688, 0.0021343231201171875, 0.0027017593383789062, 0.003269195556640625, 0.0038366317749023438, 0.0044040679931640625, 0.004971504211425781, 0.0055389404296875, 0.006106376647949219, 0.0066738128662109375, 0.007241249084472656, 0.007808685302734375, 0.008376121520996094, 0.008943557739257812, 0.009510993957519531, 0.01007843017578125, 0.010645866394042969, 0.011213302612304688, 0.011780738830566406, 0.012348175048828125, 0.012915611267089844, 0.013483047485351562, 0.014050483703613281, 0.014617919921875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 8.0, 3.0, 13.0, 6.0, 14.0, 16.0, 23.0, 33.0, 55.0, 59.0, 69.0, 121.0, 149.0, 231.0, 261.0, 477.0, 752.0, 1359.0, 2761.0, 6719.0, 20161.0, 67537.0, 229906.0, 441336.0, 191495.0, 56212.0, 16827.0, 6147.0, 2486.0, 1160.0, 695.0, 475.0, 266.0, 213.0, 127.0, 98.0, 71.0, 52.0, 27.0, 33.0, 21.0, 27.0, 12.0, 9.0, 6.0, 16.0, 3.0, 3.0, 4.0, 1.0, 1.0, 2.0, 3.0, 2.0], "bins": [-0.12188720703125, -0.1182403564453125, -0.114593505859375, -0.1109466552734375, -0.1072998046875, -0.1036529541015625, -0.100006103515625, -0.0963592529296875, -0.09271240234375, -0.0890655517578125, -0.085418701171875, -0.0817718505859375, -0.078125, -0.0744781494140625, -0.070831298828125, -0.0671844482421875, -0.06353759765625, -0.0598907470703125, -0.056243896484375, -0.0525970458984375, -0.0489501953125, -0.0453033447265625, -0.041656494140625, -0.0380096435546875, -0.03436279296875, -0.0307159423828125, -0.027069091796875, -0.0234222412109375, -0.019775390625, -0.0161285400390625, -0.012481689453125, -0.0088348388671875, -0.00518798828125, -0.0015411376953125, 0.002105712890625, 0.0057525634765625, 0.0093994140625, 0.0130462646484375, 0.016693115234375, 0.0203399658203125, 0.02398681640625, 0.0276336669921875, 0.031280517578125, 0.0349273681640625, 0.03857421875, 0.0422210693359375, 0.045867919921875, 0.0495147705078125, 0.05316162109375, 0.0568084716796875, 0.060455322265625, 0.0641021728515625, 0.0677490234375, 0.0713958740234375, 0.075042724609375, 0.0786895751953125, 0.08233642578125, 0.0859832763671875, 0.089630126953125, 0.0932769775390625, 0.096923828125, 0.1005706787109375, 0.104217529296875, 0.1078643798828125, 0.11151123046875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 6.0, 2.0, 5.0, 8.0, 4.0, 14.0, 8.0, 10.0, 10.0, 17.0, 21.0, 17.0, 16.0, 16.0, 16.0, 22.0, 33.0, 39.0, 35.0, 47.0, 44.0, 41.0, 26.0, 48.0, 36.0, 38.0, 31.0, 40.0, 44.0, 34.0, 34.0, 26.0, 30.0, 20.0, 25.0, 24.0, 23.0, 18.0, 12.0, 8.0, 8.0, 8.0, 5.0, 6.0, 5.0, 4.0, 5.0, 9.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.05950927734375, -0.05758380889892578, -0.05565834045410156, -0.053732872009277344, -0.051807403564453125, -0.049881935119628906, -0.04795646667480469, -0.04603099822998047, -0.04410552978515625, -0.04218006134033203, -0.04025459289550781, -0.038329124450683594, -0.036403656005859375, -0.034478187561035156, -0.03255271911621094, -0.03062725067138672, -0.0287017822265625, -0.02677631378173828, -0.024850845336914062, -0.022925376892089844, -0.020999908447265625, -0.019074440002441406, -0.017148971557617188, -0.015223503112792969, -0.01329803466796875, -0.011372566223144531, -0.009447097778320312, -0.007521629333496094, -0.005596160888671875, -0.0036706924438476562, -0.0017452239990234375, 0.00018024444580078125, 0.002105712890625, 0.004031181335449219, 0.0059566497802734375, 0.007882118225097656, 0.009807586669921875, 0.011733055114746094, 0.013658523559570312, 0.015583992004394531, 0.01750946044921875, 0.01943492889404297, 0.021360397338867188, 0.023285865783691406, 0.025211334228515625, 0.027136802673339844, 0.029062271118164062, 0.03098773956298828, 0.0329132080078125, 0.03483867645263672, 0.03676414489746094, 0.038689613342285156, 0.040615081787109375, 0.042540550231933594, 0.04446601867675781, 0.04639148712158203, 0.04831695556640625, 0.05024242401123047, 0.05216789245605469, 0.054093360900878906, 0.056018829345703125, 0.057944297790527344, 0.05986976623535156, 0.06179523468017578, 0.063720703125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 10.0, 6.0, 5.0, 15.0, 18.0, 15.0, 49.0, 53.0, 84.0, 107.0, 168.0, 244.0, 347.0, 567.0, 1070.0, 1869.0, 4177.0, 11241.0, 47952.0, 508415.0, 412971.0, 40681.0, 10155.0, 3914.0, 1853.0, 930.0, 580.0, 317.0, 242.0, 144.0, 115.0, 63.0, 51.0, 34.0, 22.0, 16.0, 18.0, 9.0, 12.0, 6.0, 7.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1463623046875, -0.1411266326904297, -0.13589096069335938, -0.13065528869628906, -0.12541961669921875, -0.12018394470214844, -0.11494827270507812, -0.10971260070800781, -0.1044769287109375, -0.09924125671386719, -0.09400558471679688, -0.08876991271972656, -0.08353424072265625, -0.07829856872558594, -0.07306289672851562, -0.06782722473144531, -0.062591552734375, -0.05735588073730469, -0.052120208740234375, -0.04688453674316406, -0.04164886474609375, -0.03641319274902344, -0.031177520751953125, -0.025941848754882812, -0.0207061767578125, -0.015470504760742188, -0.010234832763671875, -0.0049991607666015625, 0.00023651123046875, 0.0054721832275390625, 0.010707855224609375, 0.015943527221679688, 0.02117919921875, 0.026414871215820312, 0.031650543212890625, 0.03688621520996094, 0.04212188720703125, 0.04735755920410156, 0.052593231201171875, 0.05782890319824219, 0.0630645751953125, 0.06830024719238281, 0.07353591918945312, 0.07877159118652344, 0.08400726318359375, 0.08924293518066406, 0.09447860717773438, 0.09971427917480469, 0.104949951171875, 0.11018562316894531, 0.11542129516601562, 0.12065696716308594, 0.12589263916015625, 0.13112831115722656, 0.13636398315429688, 0.1415996551513672, 0.1468353271484375, 0.1520709991455078, 0.15730667114257812, 0.16254234313964844, 0.16777801513671875, 0.17301368713378906, 0.17824935913085938, 0.1834850311279297, 0.188720703125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 4.0, 6.0, 4.0, 2.0, 14.0, 15.0, 15.0, 23.0, 22.0, 42.0, 59.0, 73.0, 89.0, 90.0, 104.0, 102.0, 83.0, 69.0, 47.0, 47.0, 28.0, 25.0, 11.0, 10.0, 9.0, 6.0, 5.0, 3.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.246566772460938e-05, -5.9925951063632965e-05, -5.7386234402656555e-05, -5.4846517741680145e-05, -5.2306801080703735e-05, -4.9767084419727325e-05, -4.7227367758750916e-05, -4.4687651097774506e-05, -4.2147934436798096e-05, -3.9608217775821686e-05, -3.7068501114845276e-05, -3.4528784453868866e-05, -3.1989067792892456e-05, -2.9449351131916046e-05, -2.6909634470939636e-05, -2.4369917809963226e-05, -2.1830201148986816e-05, -1.9290484488010406e-05, -1.6750767827033997e-05, -1.4211051166057587e-05, -1.1671334505081177e-05, -9.131617844104767e-06, -6.591901183128357e-06, -4.052184522151947e-06, -1.5124678611755371e-06, 1.0272487998008728e-06, 3.5669654607772827e-06, 6.106682121753693e-06, 8.646398782730103e-06, 1.1186115443706512e-05, 1.3725832104682922e-05, 1.6265548765659332e-05, 1.8805265426635742e-05, 2.1344982087612152e-05, 2.3884698748588562e-05, 2.6424415409564972e-05, 2.8964132070541382e-05, 3.150384873151779e-05, 3.40435653924942e-05, 3.658328205347061e-05, 3.912299871444702e-05, 4.166271537542343e-05, 4.420243203639984e-05, 4.674214869737625e-05, 4.928186535835266e-05, 5.182158201932907e-05, 5.436129868030548e-05, 5.690101534128189e-05, 5.94407320022583e-05, 6.198044866323471e-05, 6.452016532421112e-05, 6.705988198518753e-05, 6.959959864616394e-05, 7.213931530714035e-05, 7.467903196811676e-05, 7.721874862909317e-05, 7.975846529006958e-05, 8.229818195104599e-05, 8.48378986120224e-05, 8.737761527299881e-05, 8.991733193397522e-05, 9.245704859495163e-05, 9.499676525592804e-05, 9.753648191690445e-05, 0.00010007619857788086]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 4.0, 5.0, 4.0, 4.0, 10.0, 15.0, 16.0, 28.0, 48.0, 93.0, 109.0, 229.0, 515.0, 1285.0, 4050.0, 22847.0, 832427.0, 172853.0, 9766.0, 2545.0, 881.0, 382.0, 165.0, 115.0, 48.0, 38.0, 20.0, 17.0, 9.0, 10.0, 4.0, 6.0, 7.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.328857421875, -0.3191261291503906, -0.30939483642578125, -0.2996635437011719, -0.2899322509765625, -0.2802009582519531, -0.27046966552734375, -0.2607383728027344, -0.251007080078125, -0.24127578735351562, -0.23154449462890625, -0.22181320190429688, -0.2120819091796875, -0.20235061645507812, -0.19261932373046875, -0.18288803100585938, -0.17315673828125, -0.16342544555664062, -0.15369415283203125, -0.14396286010742188, -0.1342315673828125, -0.12450027465820312, -0.11476898193359375, -0.10503768920898438, -0.095306396484375, -0.08557510375976562, -0.07584381103515625, -0.06611251831054688, -0.0563812255859375, -0.046649932861328125, -0.03691864013671875, -0.027187347412109375, -0.0174560546875, -0.007724761962890625, 0.00200653076171875, 0.011737823486328125, 0.0214691162109375, 0.031200408935546875, 0.04093170166015625, 0.050662994384765625, 0.060394287109375, 0.07012557983398438, 0.07985687255859375, 0.08958816528320312, 0.0993194580078125, 0.10905075073242188, 0.11878204345703125, 0.12851333618164062, 0.13824462890625, 0.14797592163085938, 0.15770721435546875, 0.16743850708007812, 0.1771697998046875, 0.18690109252929688, 0.19663238525390625, 0.20636367797851562, 0.216094970703125, 0.22582626342773438, 0.23555755615234375, 0.24528884887695312, 0.2550201416015625, 0.2647514343261719, 0.27448272705078125, 0.2842140197753906, 0.2939453125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 6.0, 14.0, 14.0, 14.0, 42.0, 50.0, 84.0, 150.0, 208.0, 155.0, 95.0, 48.0, 48.0, 25.0, 12.0, 8.0, 6.0, 3.0, 6.0, 3.0, 0.0, 3.0, 0.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1328125, -0.1288604736328125, -0.124908447265625, -0.1209564208984375, -0.11700439453125, -0.1130523681640625, -0.109100341796875, -0.1051483154296875, -0.1011962890625, -0.0972442626953125, -0.093292236328125, -0.0893402099609375, -0.08538818359375, -0.0814361572265625, -0.077484130859375, -0.0735321044921875, -0.069580078125, -0.0656280517578125, -0.061676025390625, -0.0577239990234375, -0.05377197265625, -0.0498199462890625, -0.045867919921875, -0.0419158935546875, -0.0379638671875, -0.0340118408203125, -0.030059814453125, -0.0261077880859375, -0.02215576171875, -0.0182037353515625, -0.014251708984375, -0.0102996826171875, -0.00634765625, -0.0023956298828125, 0.001556396484375, 0.0055084228515625, 0.00946044921875, 0.0134124755859375, 0.017364501953125, 0.0213165283203125, 0.0252685546875, 0.0292205810546875, 0.033172607421875, 0.0371246337890625, 0.04107666015625, 0.0450286865234375, 0.048980712890625, 0.0529327392578125, 0.056884765625, 0.0608367919921875, 0.064788818359375, 0.0687408447265625, 0.07269287109375, 0.0766448974609375, 0.080596923828125, 0.0845489501953125, 0.0885009765625, 0.0924530029296875, 0.096405029296875, 0.1003570556640625, 0.10430908203125, 0.1082611083984375, 0.112213134765625, 0.1161651611328125, 0.1201171875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 3.0, 5.0, 7.0, 10.0, 28.0, 65.0, 91.0, 154.0, 223.0, 169.0, 127.0, 57.0, 33.0, 14.0, 5.0, 7.0, 2.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0696489810943604, -1.0295755863189697, -0.9895022511482239, -0.949428915977478, -0.9093555808067322, -0.8692822456359863, -0.8292088508605957, -0.7891355156898499, -0.749062180519104, -0.7089888453483582, -0.6689154505729675, -0.6288421154022217, -0.5887687802314758, -0.54869544506073, -0.5086220502853394, -0.4685487151145935, -0.4284753203392029, -0.38840195536613464, -0.3483286201953888, -0.30825525522232056, -0.2681819200515747, -0.22810855507850647, -0.18803519010543823, -0.14796185493469238, -0.10788848996162415, -0.0678151398897171, -0.02774178236722946, 0.012331575155258179, 0.05240492522716522, 0.09247827529907227, 0.1325516402721405, 0.17262497544288635, 0.2126983404159546, 0.2527717053890228, 0.2928450405597687, 0.3329184055328369, 0.37299174070358276, 0.413065105676651, 0.45313847064971924, 0.4932118058204651, 0.5332851409912109, 0.5733584761619568, 0.6134318709373474, 0.6535052061080933, 0.6935785412788391, 0.733651876449585, 0.7737252712249756, 0.8137986063957214, 0.8538720011711121, 0.8939453363418579, 0.9340187311172485, 0.9740920662879944, 1.0141654014587402, 1.0542387962341309, 1.0943121910095215, 1.1343854665756226, 1.1744588613510132, 1.2145322561264038, 1.2546055316925049, 1.2946789264678955, 1.3347523212432861, 1.3748255968093872, 1.4148989915847778, 1.454972267150879, 1.4950456619262695]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 6.0, 5.0, 6.0, 8.0, 13.0, 12.0, 10.0, 13.0, 16.0, 18.0, 32.0, 14.0, 18.0, 29.0, 41.0, 35.0, 46.0, 47.0, 33.0, 43.0, 60.0, 51.0, 44.0, 37.0, 35.0, 39.0, 33.0, 45.0, 30.0, 30.0, 31.0, 29.0, 21.0, 13.0, 14.0, 13.0, 7.0, 5.0, 3.0, 8.0, 6.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5479835271835327, -0.5316440463066101, -0.5153045654296875, -0.49896514415740967, -0.48262566328048706, -0.46628618240356445, -0.44994673132896423, -0.433607280254364, -0.4172677993774414, -0.4009283185005188, -0.3845888674259186, -0.36824941635131836, -0.35190993547439575, -0.33557045459747314, -0.3192310035228729, -0.3028915524482727, -0.2865520715713501, -0.2702125906944275, -0.25387313961982727, -0.23753367364406586, -0.22119420766830444, -0.20485474169254303, -0.18851527571678162, -0.1721758097410202, -0.1558363437652588, -0.13949687778949738, -0.12315741181373596, -0.10681794583797455, -0.09047847986221313, -0.07413901388645172, -0.05779954791069031, -0.041460081934928894, -0.02512061595916748, -0.008781149983406067, 0.007558315992355347, 0.02389778196811676, 0.040237247943878174, 0.05657671391963959, 0.072916179895401, 0.08925564587116241, 0.10559511184692383, 0.12193457782268524, 0.13827404379844666, 0.15461350977420807, 0.17095297574996948, 0.1872924417257309, 0.2036319077014923, 0.21997137367725372, 0.23631083965301514, 0.25265032052993774, 0.26898977160453796, 0.2853292226791382, 0.3016687035560608, 0.3180081844329834, 0.3343476355075836, 0.35068708658218384, 0.36702656745910645, 0.38336604833602905, 0.3997054994106293, 0.4160449504852295, 0.4323844313621521, 0.4487239122390747, 0.4650633633136749, 0.48140281438827515, 0.49774229526519775]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 7.0, 13.0, 13.0, 21.0, 25.0, 40.0, 44.0, 97.0, 148.0, 273.0, 518.0, 961.0, 1980.0, 5207.0, 16043.0, 79663.0, 3575029.0, 457330.0, 40627.0, 9818.0, 3346.0, 1440.0, 688.0, 371.0, 204.0, 130.0, 87.0, 55.0, 31.0, 28.0, 16.0, 14.0, 7.0, 4.0, 5.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2291259765625, -0.2229022979736328, -0.21667861938476562, -0.21045494079589844, -0.20423126220703125, -0.19800758361816406, -0.19178390502929688, -0.1855602264404297, -0.1793365478515625, -0.1731128692626953, -0.16688919067382812, -0.16066551208496094, -0.15444183349609375, -0.14821815490722656, -0.14199447631835938, -0.1357707977294922, -0.129547119140625, -0.12332344055175781, -0.11709976196289062, -0.11087608337402344, -0.10465240478515625, -0.09842872619628906, -0.09220504760742188, -0.08598136901855469, -0.0797576904296875, -0.07353401184082031, -0.06731033325195312, -0.06108665466308594, -0.05486297607421875, -0.04863929748535156, -0.042415618896484375, -0.03619194030761719, -0.02996826171875, -0.023744583129882812, -0.017520904541015625, -0.011297225952148438, -0.00507354736328125, 0.0011501312255859375, 0.007373809814453125, 0.013597488403320312, 0.0198211669921875, 0.026044845581054688, 0.032268524169921875, 0.03849220275878906, 0.04471588134765625, 0.05093955993652344, 0.057163238525390625, 0.06338691711425781, 0.069610595703125, 0.07583427429199219, 0.08205795288085938, 0.08828163146972656, 0.09450531005859375, 0.10072898864746094, 0.10695266723632812, 0.11317634582519531, 0.1194000244140625, 0.1256237030029297, 0.13184738159179688, 0.13807106018066406, 0.14429473876953125, 0.15051841735839844, 0.15674209594726562, 0.1629657745361328, 0.169189453125]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 1.0, 3.0, 4.0, 6.0, 12.0, 15.0, 13.0, 19.0, 21.0, 34.0, 36.0, 39.0, 52.0, 50.0, 55.0, 57.0, 76.0, 62.0, 83.0, 55.0, 50.0, 54.0, 47.0, 39.0, 25.0, 18.0, 18.0, 15.0, 7.0, 10.0, 7.0, 4.0, 5.0, 1.0, 5.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.020660400390625, -0.020084381103515625, -0.01950836181640625, -0.018932342529296875, -0.0183563232421875, -0.017780303955078125, -0.01720428466796875, -0.016628265380859375, -0.01605224609375, -0.015476226806640625, -0.01490020751953125, -0.014324188232421875, -0.0137481689453125, -0.013172149658203125, -0.01259613037109375, -0.012020111083984375, -0.011444091796875, -0.010868072509765625, -0.01029205322265625, -0.009716033935546875, -0.0091400146484375, -0.008563995361328125, -0.00798797607421875, -0.007411956787109375, -0.0068359375, -0.006259918212890625, -0.00568389892578125, -0.005107879638671875, -0.0045318603515625, -0.003955841064453125, -0.00337982177734375, -0.002803802490234375, -0.002227783203125, -0.001651763916015625, -0.00107574462890625, -0.000499725341796875, 7.62939453125e-05, 0.000652313232421875, 0.00122833251953125, 0.001804351806640625, 0.00238037109375, 0.002956390380859375, 0.00353240966796875, 0.004108428955078125, 0.0046844482421875, 0.005260467529296875, 0.00583648681640625, 0.006412506103515625, 0.006988525390625, 0.007564544677734375, 0.00814056396484375, 0.008716583251953125, 0.0092926025390625, 0.009868621826171875, 0.01044464111328125, 0.011020660400390625, 0.0115966796875, 0.012172698974609375, 0.01274871826171875, 0.013324737548828125, 0.0139007568359375, 0.014476776123046875, 0.01505279541015625, 0.015628814697265625, 0.016204833984375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 6.0, 5.0, 7.0, 8.0, 14.0, 24.0, 33.0, 73.0, 103.0, 181.0, 237.0, 514.0, 1000.0, 2188.0, 5660.0, 17261.0, 72474.0, 728141.0, 3199262.0, 126681.0, 26571.0, 8081.0, 3051.0, 1287.0, 624.0, 312.0, 171.0, 130.0, 70.0, 41.0, 29.0, 17.0, 10.0, 8.0, 6.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2017822265625, -0.19620132446289062, -0.19062042236328125, -0.18503952026367188, -0.1794586181640625, -0.17387771606445312, -0.16829681396484375, -0.16271591186523438, -0.157135009765625, -0.15155410766601562, -0.14597320556640625, -0.14039230346679688, -0.1348114013671875, -0.12923049926757812, -0.12364959716796875, -0.11806869506835938, -0.11248779296875, -0.10690689086914062, -0.10132598876953125, -0.09574508666992188, -0.0901641845703125, -0.08458328247070312, -0.07900238037109375, -0.07342147827148438, -0.067840576171875, -0.062259674072265625, -0.05667877197265625, -0.051097869873046875, -0.0455169677734375, -0.039936065673828125, -0.03435516357421875, -0.028774261474609375, -0.023193359375, -0.017612457275390625, -0.01203155517578125, -0.006450653076171875, -0.0008697509765625, 0.004711151123046875, 0.01029205322265625, 0.015872955322265625, 0.021453857421875, 0.027034759521484375, 0.03261566162109375, 0.038196563720703125, 0.0437774658203125, 0.049358367919921875, 0.05493927001953125, 0.060520172119140625, 0.06610107421875, 0.07168197631835938, 0.07726287841796875, 0.08284378051757812, 0.0884246826171875, 0.09400558471679688, 0.09958648681640625, 0.10516738891601562, 0.110748291015625, 0.11632919311523438, 0.12191009521484375, 0.12749099731445312, 0.1330718994140625, 0.13865280151367188, 0.14423370361328125, 0.14981460571289062, 0.1553955078125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 3.0, 6.0, 5.0, 5.0, 14.0, 18.0, 29.0, 46.0, 68.0, 96.0, 162.0, 353.0, 1701.0, 866.0, 283.0, 154.0, 72.0, 63.0, 39.0, 26.0, 16.0, 15.0, 10.0, 9.0, 8.0, 6.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05029296875, -0.04880809783935547, -0.04732322692871094, -0.045838356018066406, -0.044353485107421875, -0.042868614196777344, -0.04138374328613281, -0.03989887237548828, -0.03841400146484375, -0.03692913055419922, -0.03544425964355469, -0.033959388732910156, -0.032474517822265625, -0.030989646911621094, -0.029504776000976562, -0.02801990509033203, -0.0265350341796875, -0.02505016326904297, -0.023565292358398438, -0.022080421447753906, -0.020595550537109375, -0.019110679626464844, -0.017625808715820312, -0.01614093780517578, -0.01465606689453125, -0.013171195983886719, -0.011686325073242188, -0.010201454162597656, -0.008716583251953125, -0.007231712341308594, -0.0057468414306640625, -0.004261970520019531, -0.002777099609375, -0.0012922286987304688, 0.0001926422119140625, 0.0016775131225585938, 0.003162384033203125, 0.004647254943847656, 0.0061321258544921875, 0.007616996765136719, 0.00910186767578125, 0.010586738586425781, 0.012071609497070312, 0.013556480407714844, 0.015041351318359375, 0.016526222229003906, 0.018011093139648438, 0.01949596405029297, 0.0209808349609375, 0.02246570587158203, 0.023950576782226562, 0.025435447692871094, 0.026920318603515625, 0.028405189514160156, 0.029890060424804688, 0.03137493133544922, 0.03285980224609375, 0.03434467315673828, 0.03582954406738281, 0.037314414978027344, 0.038799285888671875, 0.040284156799316406, 0.04176902770996094, 0.04325389862060547, 0.04473876953125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 13.0, 16.0, 24.0, 52.0, 92.0, 109.0, 177.0, 171.0, 142.0, 84.0, 55.0, 24.0, 15.0, 14.0, 5.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3525882363319397, -0.3422180414199829, -0.3318478465080261, -0.32147762179374695, -0.31110742688179016, -0.3007372319698334, -0.2903670072555542, -0.2799968123435974, -0.2696266174316406, -0.25925642251968384, -0.24888621270656586, -0.23851600289344788, -0.2281458079814911, -0.2177756130695343, -0.20740540325641632, -0.19703519344329834, -0.18666499853134155, -0.17629480361938477, -0.16592459380626678, -0.1555543839931488, -0.14518418908119202, -0.13481399416923523, -0.12444378435611725, -0.11407358199357986, -0.10370337963104248, -0.0933331772685051, -0.08296297490596771, -0.07259277254343033, -0.062222570180892944, -0.05185236781835556, -0.041482165455818176, -0.031111963093280792, -0.020741790533065796, -0.010371588170528412, -1.385807991027832e-06, 0.010368816554546356, 0.02073901891708374, 0.031109221279621124, 0.04147942364215851, 0.05184962600469589, 0.062219828367233276, 0.07259003072977066, 0.08296023309230804, 0.09333043545484543, 0.10370063781738281, 0.1140708401799202, 0.12444104254245758, 0.13481125235557556, 0.14518144726753235, 0.15555164217948914, 0.16592185199260712, 0.1762920618057251, 0.18666225671768188, 0.19703245162963867, 0.20740266144275665, 0.21777287125587463, 0.22814306616783142, 0.2385132610797882, 0.2488834708929062, 0.25925368070602417, 0.26962387561798096, 0.27999407052993774, 0.29036426544189453, 0.3007344901561737, 0.3111046850681305]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 6.0, 3.0, 5.0, 10.0, 11.0, 8.0, 10.0, 9.0, 19.0, 15.0, 22.0, 21.0, 29.0, 31.0, 30.0, 42.0, 41.0, 35.0, 44.0, 47.0, 52.0, 65.0, 46.0, 52.0, 48.0, 43.0, 35.0, 34.0, 23.0, 22.0, 19.0, 22.0, 20.0, 16.0, 18.0, 8.0, 16.0, 6.0, 14.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.15605264902114868, -0.15176625549793243, -0.1474798619747162, -0.14319345355033875, -0.1389070600271225, -0.13462066650390625, -0.13033427298069, -0.12604787945747375, -0.12176147848367691, -0.11747508496046066, -0.11318868398666382, -0.10890229046344757, -0.10461589694023132, -0.10032949596643448, -0.09604310244321823, -0.09175670146942139, -0.08747030794620514, -0.08318391442298889, -0.07889751344919205, -0.0746111199259758, -0.07032471895217896, -0.06603832542896271, -0.06175193190574646, -0.057465534657239914, -0.05317913740873337, -0.04889274016022682, -0.044606342911720276, -0.04031994938850403, -0.03603355213999748, -0.031747154891490936, -0.02746075950562954, -0.023174364119768143, -0.018887966871261597, -0.014601570554077625, -0.010315174236893654, -0.0060287779197096825, -0.001742381602525711, 0.002544015645980835, 0.006830411031842232, 0.011116806417703629, 0.015403203666210175, 0.01968960091471672, 0.023975996300578117, 0.028262391686439514, 0.03254878893494606, 0.036835186183452606, 0.041121579706668854, 0.0454079769551754, 0.049694374203681946, 0.05398077145218849, 0.05826716870069504, 0.06255356222391129, 0.06683996319770813, 0.07112635672092438, 0.07541275024414062, 0.07969914376735687, 0.08398554474115372, 0.08827193826436996, 0.09255833923816681, 0.09684473276138306, 0.1011311262845993, 0.10541752725839615, 0.1097039207816124, 0.11399032175540924, 0.11827671527862549]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 8.0, 10.0, 20.0, 23.0, 35.0, 64.0, 89.0, 153.0, 251.0, 457.0, 853.0, 1752.0, 3936.0, 10513.0, 33206.0, 123985.0, 426934.0, 322897.0, 84961.0, 24122.0, 8041.0, 3151.0, 1369.0, 738.0, 380.0, 237.0, 140.0, 83.0, 54.0, 27.0, 15.0, 21.0, 9.0, 11.0, 2.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11163330078125, -0.10762691497802734, -0.10362052917480469, -0.09961414337158203, -0.09560775756835938, -0.09160137176513672, -0.08759498596191406, -0.0835886001586914, -0.07958221435546875, -0.0755758285522461, -0.07156944274902344, -0.06756305694580078, -0.06355667114257812, -0.05955028533935547, -0.05554389953613281, -0.051537513732910156, -0.0475311279296875, -0.043524742126464844, -0.03951835632324219, -0.03551197052001953, -0.031505584716796875, -0.02749919891357422, -0.023492813110351562, -0.019486427307128906, -0.01548004150390625, -0.011473655700683594, -0.0074672698974609375, -0.0034608840942382812, 0.000545501708984375, 0.004551887512207031, 0.008558273315429688, 0.012564659118652344, 0.016571044921875, 0.020577430725097656, 0.024583816528320312, 0.02859020233154297, 0.032596588134765625, 0.03660297393798828, 0.04060935974121094, 0.044615745544433594, 0.04862213134765625, 0.052628517150878906, 0.05663490295410156, 0.06064128875732422, 0.06464767456054688, 0.06865406036376953, 0.07266044616699219, 0.07666683197021484, 0.0806732177734375, 0.08467960357666016, 0.08868598937988281, 0.09269237518310547, 0.09669876098632812, 0.10070514678955078, 0.10471153259277344, 0.1087179183959961, 0.11272430419921875, 0.1167306900024414, 0.12073707580566406, 0.12474346160888672, 0.12874984741210938, 0.13275623321533203, 0.1367626190185547, 0.14076900482177734, 0.144775390625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 4.0, 2.0, 3.0, 3.0, 12.0, 14.0, 13.0, 19.0, 23.0, 25.0, 40.0, 44.0, 41.0, 65.0, 63.0, 66.0, 55.0, 68.0, 64.0, 65.0, 48.0, 56.0, 44.0, 38.0, 33.0, 24.0, 14.0, 18.0, 11.0, 7.0, 5.0, 1.0, 3.0, 4.0, 4.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.023101806640625, -0.02249312400817871, -0.021884441375732422, -0.021275758743286133, -0.020667076110839844, -0.020058393478393555, -0.019449710845947266, -0.018841028213500977, -0.018232345581054688, -0.0176236629486084, -0.01701498031616211, -0.01640629768371582, -0.01579761505126953, -0.015188932418823242, -0.014580249786376953, -0.013971567153930664, -0.013362884521484375, -0.012754201889038086, -0.012145519256591797, -0.011536836624145508, -0.010928153991699219, -0.01031947135925293, -0.00971078872680664, -0.009102106094360352, -0.008493423461914062, -0.007884740829467773, -0.007276058197021484, -0.006667375564575195, -0.006058692932128906, -0.005450010299682617, -0.004841327667236328, -0.004232645034790039, -0.00362396240234375, -0.003015279769897461, -0.002406597137451172, -0.0017979145050048828, -0.0011892318725585938, -0.0005805492401123047, 2.8133392333984375e-05, 0.0006368160247802734, 0.0012454986572265625, 0.0018541812896728516, 0.0024628639221191406, 0.0030715465545654297, 0.0036802291870117188, 0.004288911819458008, 0.004897594451904297, 0.005506277084350586, 0.006114959716796875, 0.006723642349243164, 0.007332324981689453, 0.007941007614135742, 0.008549690246582031, 0.00915837287902832, 0.00976705551147461, 0.010375738143920898, 0.010984420776367188, 0.011593103408813477, 0.012201786041259766, 0.012810468673706055, 0.013419151306152344, 0.014027833938598633, 0.014636516571044922, 0.015245199203491211, 0.0158538818359375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 4.0, 8.0, 8.0, 17.0, 35.0, 54.0, 43.0, 65.0, 130.0, 179.0, 267.0, 465.0, 792.0, 1563.0, 3691.0, 10573.0, 40137.0, 184108.0, 531848.0, 209657.0, 45134.0, 11846.0, 3995.0, 1703.0, 877.0, 513.0, 267.0, 210.0, 135.0, 81.0, 49.0, 40.0, 24.0, 13.0, 8.0, 5.0, 10.0, 3.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1368408203125, -0.13236045837402344, -0.12788009643554688, -0.12339973449707031, -0.11891937255859375, -0.11443901062011719, -0.10995864868164062, -0.10547828674316406, -0.1009979248046875, -0.09651756286621094, -0.09203720092773438, -0.08755683898925781, -0.08307647705078125, -0.07859611511230469, -0.07411575317382812, -0.06963539123535156, -0.065155029296875, -0.06067466735839844, -0.056194305419921875, -0.05171394348144531, -0.04723358154296875, -0.04275321960449219, -0.038272857666015625, -0.03379249572753906, -0.0293121337890625, -0.024831771850585938, -0.020351409912109375, -0.015871047973632812, -0.01139068603515625, -0.0069103240966796875, -0.002429962158203125, 0.0020503997802734375, 0.00653076171875, 0.011011123657226562, 0.015491485595703125, 0.019971847534179688, 0.02445220947265625, 0.028932571411132812, 0.033412933349609375, 0.03789329528808594, 0.0423736572265625, 0.04685401916503906, 0.051334381103515625, 0.05581474304199219, 0.06029510498046875, 0.06477546691894531, 0.06925582885742188, 0.07373619079589844, 0.078216552734375, 0.08269691467285156, 0.08717727661132812, 0.09165763854980469, 0.09613800048828125, 0.10061836242675781, 0.10509872436523438, 0.10957908630371094, 0.1140594482421875, 0.11853981018066406, 0.12302017211914062, 0.1275005340576172, 0.13198089599609375, 0.1364612579345703, 0.14094161987304688, 0.14542198181152344, 0.14990234375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 3.0, 5.0, 8.0, 8.0, 4.0, 13.0, 20.0, 23.0, 25.0, 24.0, 35.0, 50.0, 33.0, 59.0, 48.0, 49.0, 67.0, 53.0, 65.0, 57.0, 57.0, 47.0, 54.0, 46.0, 29.0, 22.0, 30.0, 18.0, 17.0, 3.0, 9.0, 9.0, 7.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.102294921875, -0.09900951385498047, -0.09572410583496094, -0.0924386978149414, -0.08915328979492188, -0.08586788177490234, -0.08258247375488281, -0.07929706573486328, -0.07601165771484375, -0.07272624969482422, -0.06944084167480469, -0.06615543365478516, -0.06287002563476562, -0.059584617614746094, -0.05629920959472656, -0.05301380157470703, -0.0497283935546875, -0.04644298553466797, -0.04315757751464844, -0.039872169494628906, -0.036586761474609375, -0.033301353454589844, -0.030015945434570312, -0.02673053741455078, -0.02344512939453125, -0.02015972137451172, -0.016874313354492188, -0.013588905334472656, -0.010303497314453125, -0.007018089294433594, -0.0037326812744140625, -0.00044727325439453125, 0.002838134765625, 0.006123542785644531, 0.009408950805664062, 0.012694358825683594, 0.015979766845703125, 0.019265174865722656, 0.022550582885742188, 0.02583599090576172, 0.02912139892578125, 0.03240680694580078, 0.03569221496582031, 0.038977622985839844, 0.042263031005859375, 0.045548439025878906, 0.04883384704589844, 0.05211925506591797, 0.0554046630859375, 0.05869007110595703, 0.06197547912597656, 0.0652608871459961, 0.06854629516601562, 0.07183170318603516, 0.07511711120605469, 0.07840251922607422, 0.08168792724609375, 0.08497333526611328, 0.08825874328613281, 0.09154415130615234, 0.09482955932617188, 0.0981149673461914, 0.10140037536621094, 0.10468578338623047, 0.10797119140625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 1.0, 2.0, 6.0, 5.0, 14.0, 18.0, 20.0, 40.0, 55.0, 79.0, 101.0, 155.0, 249.0, 368.0, 611.0, 975.0, 1689.0, 2833.0, 5285.0, 10731.0, 24460.0, 72016.0, 322747.0, 448990.0, 98604.0, 31032.0, 12929.0, 6325.0, 3286.0, 1886.0, 1106.0, 721.0, 421.0, 231.0, 174.0, 123.0, 91.0, 55.0, 26.0, 24.0, 19.0, 18.0, 13.0, 11.0, 4.0, 4.0, 2.0, 3.0, 4.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.09423828125, -0.0914764404296875, -0.088714599609375, -0.0859527587890625, -0.08319091796875, -0.0804290771484375, -0.077667236328125, -0.0749053955078125, -0.0721435546875, -0.0693817138671875, -0.066619873046875, -0.0638580322265625, -0.06109619140625, -0.0583343505859375, -0.055572509765625, -0.0528106689453125, -0.050048828125, -0.0472869873046875, -0.044525146484375, -0.0417633056640625, -0.03900146484375, -0.0362396240234375, -0.033477783203125, -0.0307159423828125, -0.0279541015625, -0.0251922607421875, -0.022430419921875, -0.0196685791015625, -0.01690673828125, -0.0141448974609375, -0.011383056640625, -0.0086212158203125, -0.005859375, -0.0030975341796875, -0.000335693359375, 0.0024261474609375, 0.00518798828125, 0.0079498291015625, 0.010711669921875, 0.0134735107421875, 0.0162353515625, 0.0189971923828125, 0.021759033203125, 0.0245208740234375, 0.02728271484375, 0.0300445556640625, 0.032806396484375, 0.0355682373046875, 0.038330078125, 0.0410919189453125, 0.043853759765625, 0.0466156005859375, 0.04937744140625, 0.0521392822265625, 0.054901123046875, 0.0576629638671875, 0.0604248046875, 0.0631866455078125, 0.065948486328125, 0.0687103271484375, 0.07147216796875, 0.0742340087890625, 0.076995849609375, 0.0797576904296875, 0.08251953125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 6.0, 10.0, 10.0, 19.0, 20.0, 29.0, 36.0, 46.0, 57.0, 57.0, 60.0, 75.0, 96.0, 48.0, 60.0, 72.0, 70.0, 45.0, 40.0, 32.0, 26.0, 25.0, 11.0, 9.0, 11.0, 8.0, 9.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.882978439331055e-05, -5.7044439017772675e-05, -5.52590936422348e-05, -5.347374826669693e-05, -5.168840289115906e-05, -4.9903057515621185e-05, -4.811771214008331e-05, -4.633236676454544e-05, -4.454702138900757e-05, -4.2761676013469696e-05, -4.0976330637931824e-05, -3.919098526239395e-05, -3.740563988685608e-05, -3.562029451131821e-05, -3.3834949135780334e-05, -3.204960376024246e-05, -3.026425838470459e-05, -2.8478913009166718e-05, -2.6693567633628845e-05, -2.4908222258090973e-05, -2.31228768825531e-05, -2.1337531507015228e-05, -1.9552186131477356e-05, -1.7766840755939484e-05, -1.598149538040161e-05, -1.4196150004863739e-05, -1.2410804629325867e-05, -1.0625459253787994e-05, -8.840113878250122e-06, -7.05476850271225e-06, -5.2694231271743774e-06, -3.484077751636505e-06, -1.6987323760986328e-06, 8.66129994392395e-08, 1.8719583749771118e-06, 3.657303750514984e-06, 5.4426491260528564e-06, 7.227994501590729e-06, 9.013339877128601e-06, 1.0798685252666473e-05, 1.2584030628204346e-05, 1.4369376003742218e-05, 1.615472137928009e-05, 1.7940066754817963e-05, 1.9725412130355835e-05, 2.1510757505893707e-05, 2.329610288143158e-05, 2.5081448256969452e-05, 2.6866793632507324e-05, 2.8652139008045197e-05, 3.043748438358307e-05, 3.222282975912094e-05, 3.4008175134658813e-05, 3.5793520510196686e-05, 3.757886588573456e-05, 3.936421126127243e-05, 4.11495566368103e-05, 4.2934902012348175e-05, 4.472024738788605e-05, 4.650559276342392e-05, 4.829093813896179e-05, 5.0076283514499664e-05, 5.186162889003754e-05, 5.364697426557541e-05, 5.543231964111328e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 6.0, 5.0, 5.0, 5.0, 7.0, 3.0, 10.0, 17.0, 16.0, 38.0, 37.0, 49.0, 65.0, 114.0, 180.0, 233.0, 423.0, 717.0, 1152.0, 2339.0, 4520.0, 9694.0, 25457.0, 94637.0, 562427.0, 266692.0, 49326.0, 16065.0, 6782.0, 3358.0, 1756.0, 939.0, 564.0, 305.0, 185.0, 141.0, 77.0, 57.0, 31.0, 37.0, 23.0, 13.0, 12.0, 11.0, 8.0, 6.0, 6.0, 5.0, 5.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.095947265625, -0.09282970428466797, -0.08971214294433594, -0.0865945816040039, -0.08347702026367188, -0.08035945892333984, -0.07724189758300781, -0.07412433624267578, -0.07100677490234375, -0.06788921356201172, -0.06477165222167969, -0.061654090881347656, -0.058536529541015625, -0.055418968200683594, -0.05230140686035156, -0.04918384552001953, -0.0460662841796875, -0.04294872283935547, -0.03983116149902344, -0.036713600158691406, -0.033596038818359375, -0.030478477478027344, -0.027360916137695312, -0.02424335479736328, -0.02112579345703125, -0.01800823211669922, -0.014890670776367188, -0.011773109436035156, -0.008655548095703125, -0.005537986755371094, -0.0024204254150390625, 0.0006971359252929688, 0.003814697265625, 0.006932258605957031, 0.010049819946289062, 0.013167381286621094, 0.016284942626953125, 0.019402503967285156, 0.022520065307617188, 0.02563762664794922, 0.02875518798828125, 0.03187274932861328, 0.03499031066894531, 0.038107872009277344, 0.041225433349609375, 0.044342994689941406, 0.04746055603027344, 0.05057811737060547, 0.0536956787109375, 0.05681324005126953, 0.05993080139160156, 0.0630483627319336, 0.06616592407226562, 0.06928348541259766, 0.07240104675292969, 0.07551860809326172, 0.07863616943359375, 0.08175373077392578, 0.08487129211425781, 0.08798885345458984, 0.09110641479492188, 0.0942239761352539, 0.09734153747558594, 0.10045909881591797, 0.10357666015625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 6.0, 3.0, 5.0, 7.0, 5.0, 6.0, 16.0, 9.0, 16.0, 20.0, 10.0, 29.0, 30.0, 55.0, 54.0, 89.0, 79.0, 105.0, 108.0, 76.0, 68.0, 38.0, 40.0, 27.0, 18.0, 15.0, 9.0, 10.0, 12.0, 12.0, 3.0, 4.0, 3.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0], "bins": [-0.0667724609375, -0.06485795974731445, -0.0629434585571289, -0.06102895736694336, -0.05911445617675781, -0.057199954986572266, -0.05528545379638672, -0.05337095260620117, -0.051456451416015625, -0.04954195022583008, -0.04762744903564453, -0.045712947845458984, -0.04379844665527344, -0.04188394546508789, -0.039969444274902344, -0.0380549430847168, -0.03614044189453125, -0.0342259407043457, -0.032311439514160156, -0.03039693832397461, -0.028482437133789062, -0.026567935943603516, -0.02465343475341797, -0.022738933563232422, -0.020824432373046875, -0.018909931182861328, -0.01699542999267578, -0.015080928802490234, -0.013166427612304688, -0.01125192642211914, -0.009337425231933594, -0.007422924041748047, -0.0055084228515625, -0.003593921661376953, -0.0016794204711914062, 0.00023508071899414062, 0.0021495819091796875, 0.004064083099365234, 0.005978584289550781, 0.007893085479736328, 0.009807586669921875, 0.011722087860107422, 0.013636589050292969, 0.015551090240478516, 0.017465591430664062, 0.01938009262084961, 0.021294593811035156, 0.023209095001220703, 0.02512359619140625, 0.027038097381591797, 0.028952598571777344, 0.03086709976196289, 0.03278160095214844, 0.034696102142333984, 0.03661060333251953, 0.03852510452270508, 0.040439605712890625, 0.04235410690307617, 0.04426860809326172, 0.046183109283447266, 0.04809761047363281, 0.05001211166381836, 0.051926612854003906, 0.05384111404418945, 0.055755615234375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 8.0, 21.0, 44.0, 77.0, 122.0, 171.0, 160.0, 146.0, 106.0, 61.0, 36.0, 25.0, 14.0, 8.0, 8.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.870172381401062, -0.8330138921737671, -0.7958553433418274, -0.7586967945098877, -0.7215383052825928, -0.6843798160552979, -0.6472212672233582, -0.6100627183914185, -0.5729042291641235, -0.5357457399368286, -0.4985871911048889, -0.4614286720752716, -0.4242701530456543, -0.387111634016037, -0.3499531149864197, -0.31279459595680237, -0.27563607692718506, -0.23847755789756775, -0.20131903886795044, -0.16416051983833313, -0.12700200080871582, -0.08984348177909851, -0.0526849627494812, -0.015526443719863892, 0.021632075309753418, 0.05879059433937073, 0.09594911336898804, 0.13310763239860535, 0.17026615142822266, 0.20742467045783997, 0.24458318948745728, 0.2817417085170746, 0.31890034675598145, 0.35605886578559875, 0.39321738481521606, 0.4303759038448334, 0.4675344228744507, 0.5046929121017456, 0.5418514609336853, 0.579010009765625, 0.6161684989929199, 0.6533269882202148, 0.6904855370521545, 0.7276440858840942, 0.7648025751113892, 0.8019610643386841, 0.8391196131706238, 0.8762781620025635, 0.9134366512298584, 0.9505951404571533, 0.987753689289093, 1.0249122381210327, 1.0620707273483276, 1.0992292165756226, 1.136387825012207, 1.173546314239502, 1.2107048034667969, 1.2478632926940918, 1.2850217819213867, 1.3221803903579712, 1.3593388795852661, 1.396497368812561, 1.4336559772491455, 1.4708144664764404, 1.5079729557037354]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 5.0, 4.0, 4.0, 8.0, 18.0, 10.0, 15.0, 21.0, 16.0, 16.0, 21.0, 25.0, 39.0, 32.0, 28.0, 35.0, 31.0, 43.0, 33.0, 54.0, 42.0, 50.0, 48.0, 41.0, 37.0, 42.0, 36.0, 29.0, 41.0, 21.0, 30.0, 19.0, 19.0, 21.0, 14.0, 15.0, 7.0, 9.0, 4.0, 7.0, 6.0, 3.0, 1.0, 5.0, 2.0, 5.0, 2.0], "bins": [-0.5639013051986694, -0.5490701198577881, -0.5342389941215515, -0.5194078087806702, -0.5045766234397888, -0.48974549770355225, -0.4749143123626709, -0.46008315682411194, -0.445252001285553, -0.430420845746994, -0.41558966040611267, -0.4007585048675537, -0.38592734932899475, -0.3710961937904358, -0.35626500844955444, -0.3414338529109955, -0.3266026973724365, -0.31177154183387756, -0.2969403564929962, -0.28210920095443726, -0.2672780454158783, -0.25244688987731934, -0.237615704536438, -0.22278454899787903, -0.20795336365699768, -0.19312219321727753, -0.17829103767871857, -0.1634598672389984, -0.14862871170043945, -0.1337975412607193, -0.11896637827157974, -0.10413521528244019, -0.08930405974388123, -0.07447289675474167, -0.05964173376560211, -0.044810567051172256, -0.0299794040620327, -0.015148237347602844, -0.00031707435846328735, 0.01451408863067627, 0.029345251619815826, 0.04417641460895538, 0.05900757759809494, 0.0738387405872345, 0.08866991102695465, 0.10350107401609421, 0.11833223700523376, 0.13316339254379272, 0.14799456298351288, 0.16282573342323303, 0.177656888961792, 0.19248805940151215, 0.2073192149400711, 0.22215038537979126, 0.23698154091835022, 0.2518126964569092, 0.2666438817977905, 0.2814750373363495, 0.29630622267723083, 0.3111373782157898, 0.32596853375434875, 0.3407996892929077, 0.35563087463378906, 0.370462030172348, 0.385293185710907]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 11.0, 9.0, 19.0, 17.0, 32.0, 30.0, 64.0, 101.0, 168.0, 299.0, 604.0, 1337.0, 3052.0, 8714.0, 32426.0, 257228.0, 3760837.0, 100883.0, 18845.0, 5609.0, 2064.0, 880.0, 444.0, 237.0, 128.0, 63.0, 59.0, 36.0, 27.0, 18.0, 8.0, 8.0, 8.0, 0.0, 3.0, 3.0, 6.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.209716796875, -0.20342254638671875, -0.1971282958984375, -0.19083404541015625, -0.184539794921875, -0.17824554443359375, -0.1719512939453125, -0.16565704345703125, -0.15936279296875, -0.15306854248046875, -0.1467742919921875, -0.14048004150390625, -0.134185791015625, -0.12789154052734375, -0.1215972900390625, -0.11530303955078125, -0.1090087890625, -0.10271453857421875, -0.0964202880859375, -0.09012603759765625, -0.083831787109375, -0.07753753662109375, -0.0712432861328125, -0.06494903564453125, -0.05865478515625, -0.05236053466796875, -0.0460662841796875, -0.03977203369140625, -0.033477783203125, -0.02718353271484375, -0.0208892822265625, -0.01459503173828125, -0.00830078125, -0.00200653076171875, 0.0042877197265625, 0.01058197021484375, 0.016876220703125, 0.02317047119140625, 0.0294647216796875, 0.03575897216796875, 0.04205322265625, 0.04834747314453125, 0.0546417236328125, 0.06093597412109375, 0.067230224609375, 0.07352447509765625, 0.0798187255859375, 0.08611297607421875, 0.0924072265625, 0.09870147705078125, 0.1049957275390625, 0.11128997802734375, 0.117584228515625, 0.12387847900390625, 0.1301727294921875, 0.13646697998046875, 0.14276123046875, 0.14905548095703125, 0.1553497314453125, 0.16164398193359375, 0.167938232421875, 0.17423248291015625, 0.1805267333984375, 0.18682098388671875, 0.193115234375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 4.0, 4.0, 3.0, 2.0, 9.0, 14.0, 17.0, 18.0, 22.0, 34.0, 38.0, 33.0, 44.0, 55.0, 63.0, 71.0, 56.0, 58.0, 73.0, 68.0, 53.0, 54.0, 32.0, 35.0, 36.0, 22.0, 19.0, 20.0, 10.0, 8.0, 9.0, 9.0, 5.0, 4.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0250091552734375, -0.024371623992919922, -0.023734092712402344, -0.023096561431884766, -0.022459030151367188, -0.02182149887084961, -0.02118396759033203, -0.020546436309814453, -0.019908905029296875, -0.019271373748779297, -0.01863384246826172, -0.01799631118774414, -0.017358779907226562, -0.016721248626708984, -0.016083717346191406, -0.015446186065673828, -0.01480865478515625, -0.014171123504638672, -0.013533592224121094, -0.012896060943603516, -0.012258529663085938, -0.01162099838256836, -0.010983467102050781, -0.010345935821533203, -0.009708404541015625, -0.009070873260498047, -0.008433341979980469, -0.007795810699462891, -0.0071582794189453125, -0.006520748138427734, -0.005883216857910156, -0.005245685577392578, -0.004608154296875, -0.003970623016357422, -0.0033330917358398438, -0.0026955604553222656, -0.0020580291748046875, -0.0014204978942871094, -0.0007829666137695312, -0.00014543533325195312, 0.000492095947265625, 0.0011296272277832031, 0.0017671585083007812, 0.0024046897888183594, 0.0030422210693359375, 0.0036797523498535156, 0.004317283630371094, 0.004954814910888672, 0.00559234619140625, 0.006229877471923828, 0.006867408752441406, 0.007504940032958984, 0.008142471313476562, 0.00878000259399414, 0.009417533874511719, 0.010055065155029297, 0.010692596435546875, 0.011330127716064453, 0.011967658996582031, 0.01260519027709961, 0.013242721557617188, 0.013880252838134766, 0.014517784118652344, 0.015155315399169922, 0.0157928466796875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 7.0, 4.0, 5.0, 17.0, 18.0, 37.0, 41.0, 65.0, 82.0, 173.0, 257.0, 388.0, 698.0, 1303.0, 3132.0, 8696.0, 31872.0, 202306.0, 3684335.0, 213411.0, 32371.0, 8963.0, 3087.0, 1319.0, 696.0, 336.0, 214.0, 164.0, 110.0, 67.0, 38.0, 28.0, 13.0, 12.0, 8.0, 6.0, 5.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.224609375, -0.21699905395507812, -0.20938873291015625, -0.20177841186523438, -0.1941680908203125, -0.18655776977539062, -0.17894744873046875, -0.17133712768554688, -0.163726806640625, -0.15611648559570312, -0.14850616455078125, -0.14089584350585938, -0.1332855224609375, -0.12567520141601562, -0.11806488037109375, -0.11045455932617188, -0.10284423828125, -0.09523391723632812, -0.08762359619140625, -0.08001327514648438, -0.0724029541015625, -0.06479263305664062, -0.05718231201171875, -0.049571990966796875, -0.041961669921875, -0.034351348876953125, -0.02674102783203125, -0.019130706787109375, -0.0115203857421875, -0.003910064697265625, 0.00370025634765625, 0.011310577392578125, 0.0189208984375, 0.026531219482421875, 0.03414154052734375, 0.041751861572265625, 0.0493621826171875, 0.056972503662109375, 0.06458282470703125, 0.07219314575195312, 0.079803466796875, 0.08741378784179688, 0.09502410888671875, 0.10263442993164062, 0.1102447509765625, 0.11785507202148438, 0.12546539306640625, 0.13307571411132812, 0.14068603515625, 0.14829635620117188, 0.15590667724609375, 0.16351699829101562, 0.1711273193359375, 0.17873764038085938, 0.18634796142578125, 0.19395828247070312, 0.201568603515625, 0.20917892456054688, 0.21678924560546875, 0.22439956665039062, 0.2320098876953125, 0.23962020874023438, 0.24723052978515625, 0.2548408508300781, 0.262451171875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 5.0, 2.0, 10.0, 14.0, 22.0, 33.0, 59.0, 82.0, 165.0, 375.0, 2086.0, 730.0, 205.0, 117.0, 65.0, 38.0, 16.0, 18.0, 12.0, 3.0, 7.0, 5.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.067626953125, -0.0653543472290039, -0.06308174133300781, -0.06080913543701172, -0.058536529541015625, -0.05626392364501953, -0.05399131774902344, -0.051718711853027344, -0.04944610595703125, -0.047173500061035156, -0.04490089416503906, -0.04262828826904297, -0.040355682373046875, -0.03808307647705078, -0.03581047058105469, -0.033537864685058594, -0.0312652587890625, -0.028992652893066406, -0.026720046997070312, -0.02444744110107422, -0.022174835205078125, -0.01990222930908203, -0.017629623413085938, -0.015357017517089844, -0.01308441162109375, -0.010811805725097656, -0.008539199829101562, -0.006266593933105469, -0.003993988037109375, -0.0017213821411132812, 0.0005512237548828125, 0.0028238296508789062, 0.005096435546875, 0.007369041442871094, 0.009641647338867188, 0.011914253234863281, 0.014186859130859375, 0.01645946502685547, 0.018732070922851562, 0.021004676818847656, 0.02327728271484375, 0.025549888610839844, 0.027822494506835938, 0.03009510040283203, 0.032367706298828125, 0.03464031219482422, 0.03691291809082031, 0.039185523986816406, 0.0414581298828125, 0.043730735778808594, 0.04600334167480469, 0.04827594757080078, 0.050548553466796875, 0.05282115936279297, 0.05509376525878906, 0.057366371154785156, 0.05963897705078125, 0.061911582946777344, 0.06418418884277344, 0.06645679473876953, 0.06872940063476562, 0.07100200653076172, 0.07327461242675781, 0.0755472183227539, 0.07781982421875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 5.0, 5.0, 22.0, 22.0, 33.0, 35.0, 62.0, 83.0, 114.0, 127.0, 128.0, 98.0, 92.0, 72.0, 39.0, 20.0, 16.0, 4.0, 6.0, 6.0, 4.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.22873511910438538, -0.21800638735294342, -0.20727764070034027, -0.19654890894889832, -0.18582016229629517, -0.1750914305448532, -0.16436269879341125, -0.1536339521408081, -0.14290522038936615, -0.1321764886379242, -0.12144774198532104, -0.11071901023387909, -0.09999027103185654, -0.08926153182983398, -0.07853280007839203, -0.06780406087636948, -0.057075321674346924, -0.04634658247232437, -0.03561784699559212, -0.024889111518859863, -0.01416037231683731, -0.0034316331148147583, 0.007297098636627197, 0.01802583783864975, 0.028754577040672302, 0.039483316242694855, 0.05021205171942711, 0.06094078719615936, 0.07166952639818192, 0.08239826560020447, 0.09312699735164642, 0.10385573655366898, 0.11458450555801392, 0.12531323730945587, 0.13604198396205902, 0.14677071571350098, 0.15749946236610413, 0.16822819411754608, 0.17895692586898804, 0.1896856725215912, 0.20041440427303314, 0.2111431360244751, 0.22187188267707825, 0.2326006144285202, 0.24332934617996216, 0.2540580928325653, 0.26478683948516846, 0.2755155563354492, 0.28624430298805237, 0.2969730496406555, 0.3077017664909363, 0.31843051314353943, 0.3291592597961426, 0.33988797664642334, 0.3506167232990265, 0.36134546995162964, 0.3720741868019104, 0.38280293345451355, 0.3935316503047943, 0.40426039695739746, 0.4149891436100006, 0.42571789026260376, 0.4364466071128845, 0.44717535376548767, 0.4579041004180908]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 9.0, 4.0, 5.0, 9.0, 10.0, 19.0, 21.0, 24.0, 24.0, 31.0, 43.0, 35.0, 34.0, 46.0, 50.0, 36.0, 38.0, 48.0, 43.0, 36.0, 52.0, 35.0, 41.0, 39.0, 30.0, 40.0, 33.0, 21.0, 17.0, 15.0, 21.0, 15.0, 15.0, 16.0, 10.0, 13.0, 7.0, 3.0, 5.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.2103520631790161, -0.20420262217521667, -0.19805316627025604, -0.1919037252664566, -0.18575426936149597, -0.17960482835769653, -0.1734553873538971, -0.16730594635009766, -0.16115649044513702, -0.15500704944133759, -0.14885759353637695, -0.14270815253257751, -0.13655871152877808, -0.13040925562381744, -0.124259814620018, -0.11811036616563797, -0.11196091771125793, -0.1058114692568779, -0.09966202080249786, -0.09351257979869843, -0.08736313134431839, -0.08121368288993835, -0.07506424188613892, -0.06891479343175888, -0.06276534497737885, -0.05661589652299881, -0.05046645179390907, -0.044317007064819336, -0.0381675586104393, -0.032018110156059265, -0.025868665426969528, -0.01971922069787979, -0.013569772243499756, -0.00742032565176487, -0.0012708790600299835, 0.004878567531704903, 0.011028014123439789, 0.017177460715174675, 0.02332690730690956, 0.029476352035999298, 0.035625800490379333, 0.04177524894475937, 0.047924693673849106, 0.05407413840293884, 0.06022358685731888, 0.06637303531169891, 0.07252247631549835, 0.07867192476987839, 0.08482137322425842, 0.09097082167863846, 0.0971202701330185, 0.10326971113681793, 0.10941915959119797, 0.115568608045578, 0.12171804904937744, 0.12786749005317688, 0.1340169459581375, 0.14016638696193695, 0.14631584286689758, 0.15246528387069702, 0.15861472487449646, 0.1647641807794571, 0.17091362178325653, 0.17706307768821716, 0.1832125186920166]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 7.0, 8.0, 12.0, 11.0, 14.0, 33.0, 31.0, 72.0, 113.0, 156.0, 310.0, 582.0, 1068.0, 2205.0, 5041.0, 13144.0, 39044.0, 134718.0, 438450.0, 292963.0, 80071.0, 24595.0, 8723.0, 3697.0, 1619.0, 823.0, 421.0, 261.0, 131.0, 84.0, 48.0, 35.0, 26.0, 15.0, 18.0, 7.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.14501953125, -0.14096832275390625, -0.1369171142578125, -0.13286590576171875, -0.128814697265625, -0.12476348876953125, -0.1207122802734375, -0.11666107177734375, -0.11260986328125, -0.10855865478515625, -0.1045074462890625, -0.10045623779296875, -0.096405029296875, -0.09235382080078125, -0.0883026123046875, -0.08425140380859375, -0.0802001953125, -0.07614898681640625, -0.0720977783203125, -0.06804656982421875, -0.063995361328125, -0.05994415283203125, -0.0558929443359375, -0.05184173583984375, -0.04779052734375, -0.04373931884765625, -0.0396881103515625, -0.03563690185546875, -0.031585693359375, -0.02753448486328125, -0.0234832763671875, -0.01943206787109375, -0.015380859375, -0.01132965087890625, -0.0072784423828125, -0.00322723388671875, 0.000823974609375, 0.00487518310546875, 0.0089263916015625, 0.01297760009765625, 0.01702880859375, 0.02108001708984375, 0.0251312255859375, 0.02918243408203125, 0.033233642578125, 0.03728485107421875, 0.0413360595703125, 0.04538726806640625, 0.0494384765625, 0.05348968505859375, 0.0575408935546875, 0.06159210205078125, 0.065643310546875, 0.06969451904296875, 0.0737457275390625, 0.07779693603515625, 0.08184814453125, 0.08589935302734375, 0.0899505615234375, 0.09400177001953125, 0.098052978515625, 0.10210418701171875, 0.1061553955078125, 0.11020660400390625, 0.1142578125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 4.0, 5.0, 9.0, 9.0, 14.0, 13.0, 23.0, 32.0, 41.0, 38.0, 54.0, 70.0, 70.0, 71.0, 86.0, 75.0, 70.0, 51.0, 46.0, 55.0, 38.0, 34.0, 19.0, 15.0, 16.0, 12.0, 11.0, 7.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0289764404296875, -0.02816009521484375, -0.02734375, -0.02652740478515625, -0.0257110595703125, -0.02489471435546875, -0.024078369140625, -0.02326202392578125, -0.0224456787109375, -0.02162933349609375, -0.02081298828125, -0.01999664306640625, -0.0191802978515625, -0.01836395263671875, -0.017547607421875, -0.01673126220703125, -0.0159149169921875, -0.01509857177734375, -0.0142822265625, -0.01346588134765625, -0.0126495361328125, -0.01183319091796875, -0.011016845703125, -0.01020050048828125, -0.0093841552734375, -0.00856781005859375, -0.00775146484375, -0.00693511962890625, -0.0061187744140625, -0.00530242919921875, -0.004486083984375, -0.00366973876953125, -0.0028533935546875, -0.00203704833984375, -0.001220703125, -0.00040435791015625, 0.0004119873046875, 0.00122833251953125, 0.002044677734375, 0.00286102294921875, 0.0036773681640625, 0.00449371337890625, 0.00531005859375, 0.00612640380859375, 0.0069427490234375, 0.00775909423828125, 0.008575439453125, 0.00939178466796875, 0.0102081298828125, 0.01102447509765625, 0.0118408203125, 0.01265716552734375, 0.0134735107421875, 0.01428985595703125, 0.015106201171875, 0.01592254638671875, 0.0167388916015625, 0.01755523681640625, 0.01837158203125, 0.01918792724609375, 0.0200042724609375, 0.02082061767578125, 0.021636962890625, 0.02245330810546875, 0.0232696533203125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 8.0, 3.0, 8.0, 6.0, 10.0, 9.0, 21.0, 30.0, 45.0, 57.0, 60.0, 105.0, 138.0, 207.0, 273.0, 510.0, 860.0, 1692.0, 3782.0, 10509.0, 37396.0, 163211.0, 560043.0, 203176.0, 44871.0, 12757.0, 4387.0, 1899.0, 935.0, 541.0, 324.0, 204.0, 142.0, 100.0, 62.0, 46.0, 39.0, 30.0, 19.0, 13.0, 6.0, 8.0, 6.0, 6.0, 4.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1484375, -0.1434173583984375, -0.138397216796875, -0.1333770751953125, -0.12835693359375, -0.1233367919921875, -0.118316650390625, -0.1132965087890625, -0.1082763671875, -0.1032562255859375, -0.098236083984375, -0.0932159423828125, -0.08819580078125, -0.0831756591796875, -0.078155517578125, -0.0731353759765625, -0.068115234375, -0.0630950927734375, -0.058074951171875, -0.0530548095703125, -0.04803466796875, -0.0430145263671875, -0.037994384765625, -0.0329742431640625, -0.0279541015625, -0.0229339599609375, -0.017913818359375, -0.0128936767578125, -0.00787353515625, -0.0028533935546875, 0.002166748046875, 0.0071868896484375, 0.01220703125, 0.0172271728515625, 0.022247314453125, 0.0272674560546875, 0.03228759765625, 0.0373077392578125, 0.042327880859375, 0.0473480224609375, 0.0523681640625, 0.0573883056640625, 0.062408447265625, 0.0674285888671875, 0.07244873046875, 0.0774688720703125, 0.082489013671875, 0.0875091552734375, 0.092529296875, 0.0975494384765625, 0.102569580078125, 0.1075897216796875, 0.11260986328125, 0.1176300048828125, 0.122650146484375, 0.1276702880859375, 0.1326904296875, 0.1377105712890625, 0.142730712890625, 0.1477508544921875, 0.15277099609375, 0.1577911376953125, 0.162811279296875, 0.1678314208984375, 0.1728515625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 8.0, 5.0, 8.0, 12.0, 11.0, 24.0, 29.0, 30.0, 29.0, 32.0, 46.0, 39.0, 47.0, 58.0, 51.0, 52.0, 57.0, 53.0, 50.0, 41.0, 39.0, 45.0, 38.0, 28.0, 30.0, 35.0, 19.0, 13.0, 15.0, 10.0, 8.0, 6.0, 10.0, 4.0, 8.0, 1.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1051025390625, -0.10149955749511719, -0.09789657592773438, -0.09429359436035156, -0.09069061279296875, -0.08708763122558594, -0.08348464965820312, -0.07988166809082031, -0.0762786865234375, -0.07267570495605469, -0.06907272338867188, -0.06546974182128906, -0.06186676025390625, -0.05826377868652344, -0.054660797119140625, -0.05105781555175781, -0.047454833984375, -0.04385185241699219, -0.040248870849609375, -0.03664588928222656, -0.03304290771484375, -0.029439926147460938, -0.025836944580078125, -0.022233963012695312, -0.0186309814453125, -0.015027999877929688, -0.011425018310546875, -0.007822036743164062, -0.00421905517578125, -0.0006160736083984375, 0.002986907958984375, 0.0065898895263671875, 0.01019287109375, 0.013795852661132812, 0.017398834228515625, 0.021001815795898438, 0.02460479736328125, 0.028207778930664062, 0.031810760498046875, 0.03541374206542969, 0.0390167236328125, 0.04261970520019531, 0.046222686767578125, 0.04982566833496094, 0.05342864990234375, 0.05703163146972656, 0.060634613037109375, 0.06423759460449219, 0.067840576171875, 0.07144355773925781, 0.07504653930664062, 0.07864952087402344, 0.08225250244140625, 0.08585548400878906, 0.08945846557617188, 0.09306144714355469, 0.0966644287109375, 0.10026741027832031, 0.10387039184570312, 0.10747337341308594, 0.11107635498046875, 0.11467933654785156, 0.11828231811523438, 0.12188529968261719, 0.12548828125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 4.0, 5.0, 15.0, 10.0, 21.0, 24.0, 44.0, 60.0, 83.0, 145.0, 220.0, 313.0, 568.0, 1028.0, 1926.0, 3811.0, 8576.0, 23513.0, 107516.0, 717301.0, 137928.0, 26752.0, 9588.0, 4199.0, 2077.0, 1169.0, 620.0, 415.0, 227.0, 133.0, 98.0, 61.0, 33.0, 23.0, 16.0, 11.0, 9.0, 4.0, 5.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.1756591796875, -0.1705760955810547, -0.16549301147460938, -0.16040992736816406, -0.15532684326171875, -0.15024375915527344, -0.14516067504882812, -0.1400775909423828, -0.1349945068359375, -0.1299114227294922, -0.12482833862304688, -0.11974525451660156, -0.11466217041015625, -0.10957908630371094, -0.10449600219726562, -0.09941291809082031, -0.094329833984375, -0.08924674987792969, -0.08416366577148438, -0.07908058166503906, -0.07399749755859375, -0.06891441345214844, -0.06383132934570312, -0.05874824523925781, -0.0536651611328125, -0.04858207702636719, -0.043498992919921875, -0.03841590881347656, -0.03333282470703125, -0.028249740600585938, -0.023166656494140625, -0.018083572387695312, -0.01300048828125, -0.007917404174804688, -0.002834320068359375, 0.0022487640380859375, 0.00733184814453125, 0.012414932250976562, 0.017498016357421875, 0.022581100463867188, 0.0276641845703125, 0.03274726867675781, 0.037830352783203125, 0.04291343688964844, 0.04799652099609375, 0.05307960510253906, 0.058162689208984375, 0.06324577331542969, 0.068328857421875, 0.07341194152832031, 0.07849502563476562, 0.08357810974121094, 0.08866119384765625, 0.09374427795410156, 0.09882736206054688, 0.10391044616699219, 0.1089935302734375, 0.11407661437988281, 0.11915969848632812, 0.12424278259277344, 0.12932586669921875, 0.13440895080566406, 0.13949203491210938, 0.1445751190185547, 0.149658203125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 7.0, 5.0, 13.0, 14.0, 21.0, 24.0, 32.0, 40.0, 49.0, 42.0, 72.0, 79.0, 107.0, 97.0, 84.0, 73.0, 58.0, 46.0, 39.0, 30.0, 15.0, 6.0, 12.0, 7.0, 7.0, 7.0, 4.0, 5.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.909536361694336e-05, -7.656682282686234e-05, -7.403828203678131e-05, -7.150974124670029e-05, -6.898120045661926e-05, -6.645265966653824e-05, -6.392411887645721e-05, -6.139557808637619e-05, -5.8867037296295166e-05, -5.633849650621414e-05, -5.380995571613312e-05, -5.1281414926052094e-05, -4.875287413597107e-05, -4.6224333345890045e-05, -4.369579255580902e-05, -4.1167251765728e-05, -3.863871097564697e-05, -3.611017018556595e-05, -3.3581629395484924e-05, -3.10530886054039e-05, -2.8524547815322876e-05, -2.5996007025241852e-05, -2.3467466235160828e-05, -2.0938925445079803e-05, -1.841038465499878e-05, -1.5881843864917755e-05, -1.3353303074836731e-05, -1.0824762284755707e-05, -8.296221494674683e-06, -5.7676807045936584e-06, -3.2391399145126343e-06, -7.105991244316101e-07, 1.817941665649414e-06, 4.346482455730438e-06, 6.875023245811462e-06, 9.403564035892487e-06, 1.193210482597351e-05, 1.4460645616054535e-05, 1.698918640613556e-05, 1.9517727196216583e-05, 2.2046267986297607e-05, 2.457480877637863e-05, 2.7103349566459656e-05, 2.963189035654068e-05, 3.2160431146621704e-05, 3.468897193670273e-05, 3.721751272678375e-05, 3.9746053516864777e-05, 4.22745943069458e-05, 4.4803135097026825e-05, 4.733167588710785e-05, 4.986021667718887e-05, 5.23887574672699e-05, 5.491729825735092e-05, 5.7445839047431946e-05, 5.997437983751297e-05, 6.2502920627594e-05, 6.503146141767502e-05, 6.756000220775604e-05, 7.008854299783707e-05, 7.261708378791809e-05, 7.514562457799911e-05, 7.767416536808014e-05, 8.020270615816116e-05, 8.273124694824219e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0, 1.0, 4.0, 3.0, 10.0, 4.0, 8.0, 13.0, 23.0, 30.0, 42.0, 65.0, 84.0, 146.0, 223.0, 385.0, 730.0, 1352.0, 2821.0, 6682.0, 19029.0, 84885.0, 702539.0, 184091.0, 28625.0, 9089.0, 3831.0, 1721.0, 858.0, 492.0, 285.0, 150.0, 84.0, 67.0, 57.0, 34.0, 21.0, 23.0, 13.0, 8.0, 3.0, 10.0, 6.0, 6.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.142333984375, -0.13736915588378906, -0.13240432739257812, -0.1274394989013672, -0.12247467041015625, -0.11750984191894531, -0.11254501342773438, -0.10758018493652344, -0.1026153564453125, -0.09765052795410156, -0.09268569946289062, -0.08772087097167969, -0.08275604248046875, -0.07779121398925781, -0.07282638549804688, -0.06786155700683594, -0.062896728515625, -0.05793190002441406, -0.052967071533203125, -0.04800224304199219, -0.04303741455078125, -0.03807258605957031, -0.033107757568359375, -0.028142929077148438, -0.0231781005859375, -0.018213272094726562, -0.013248443603515625, -0.008283615112304688, -0.00331878662109375, 0.0016460418701171875, 0.006610870361328125, 0.011575698852539062, 0.01654052734375, 0.021505355834960938, 0.026470184326171875, 0.03143501281738281, 0.03639984130859375, 0.04136466979980469, 0.046329498291015625, 0.05129432678222656, 0.0562591552734375, 0.06122398376464844, 0.06618881225585938, 0.07115364074707031, 0.07611846923828125, 0.08108329772949219, 0.08604812622070312, 0.09101295471191406, 0.095977783203125, 0.10094261169433594, 0.10590744018554688, 0.11087226867675781, 0.11583709716796875, 0.12080192565917969, 0.12576675415039062, 0.13073158264160156, 0.1356964111328125, 0.14066123962402344, 0.14562606811523438, 0.1505908966064453, 0.15555572509765625, 0.1605205535888672, 0.16548538208007812, 0.17045021057128906, 0.1754150390625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 6.0, 4.0, 4.0, 6.0, 7.0, 11.0, 14.0, 9.0, 22.0, 31.0, 55.0, 69.0, 89.0, 108.0, 161.0, 112.0, 75.0, 54.0, 46.0, 26.0, 26.0, 15.0, 8.0, 11.0, 7.0, 3.0, 6.0, 6.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1051025390625, -0.10175609588623047, -0.09840965270996094, -0.0950632095336914, -0.09171676635742188, -0.08837032318115234, -0.08502388000488281, -0.08167743682861328, -0.07833099365234375, -0.07498455047607422, -0.07163810729980469, -0.06829166412353516, -0.06494522094726562, -0.061598777770996094, -0.05825233459472656, -0.05490589141845703, -0.0515594482421875, -0.04821300506591797, -0.04486656188964844, -0.041520118713378906, -0.038173675537109375, -0.034827232360839844, -0.03148078918457031, -0.02813434600830078, -0.02478790283203125, -0.02144145965576172, -0.018095016479492188, -0.014748573303222656, -0.011402130126953125, -0.008055686950683594, -0.0047092437744140625, -0.0013628005981445312, 0.001983642578125, 0.005330085754394531, 0.008676528930664062, 0.012022972106933594, 0.015369415283203125, 0.018715858459472656, 0.022062301635742188, 0.02540874481201172, 0.02875518798828125, 0.03210163116455078, 0.03544807434082031, 0.038794517517089844, 0.042140960693359375, 0.045487403869628906, 0.04883384704589844, 0.05218029022216797, 0.0555267333984375, 0.05887317657470703, 0.06221961975097656, 0.0655660629272461, 0.06891250610351562, 0.07225894927978516, 0.07560539245605469, 0.07895183563232422, 0.08229827880859375, 0.08564472198486328, 0.08899116516113281, 0.09233760833740234, 0.09568405151367188, 0.0990304946899414, 0.10237693786621094, 0.10572338104248047, 0.10906982421875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 10.0, 17.0, 35.0, 54.0, 58.0, 117.0, 140.0, 169.0, 127.0, 109.0, 71.0, 41.0, 24.0, 11.0, 9.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3229131698608398, -1.2794944047927856, -1.236075758934021, -1.1926569938659668, -1.1492382287979126, -1.1058194637298584, -1.0624008178710938, -1.0189820528030396, -0.9755632877349854, -0.9321445822715759, -0.8887258172035217, -0.8453071117401123, -0.8018883466720581, -0.7584696412086487, -0.7150509357452393, -0.6716321706771851, -0.6282134652137756, -0.5847947597503662, -0.541375994682312, -0.4979572892189026, -0.4545385241508484, -0.41111981868743896, -0.36770108342170715, -0.32428234815597534, -0.28086361289024353, -0.23744487762451172, -0.1940261423587799, -0.1506074219942093, -0.10718868672847748, -0.06376995146274567, -0.02035123109817505, 0.023067504167556763, 0.06648623943328857, 0.10990497469902039, 0.1533237099647522, 0.19674243032932281, 0.24016116559505463, 0.28357988595962524, 0.32699862122535706, 0.37041735649108887, 0.4138360917568207, 0.4572548270225525, 0.5006735324859619, 0.5440922975540161, 0.5875110030174255, 0.6309297680854797, 0.6743484735488892, 0.7177672386169434, 0.7611859440803528, 0.8046046495437622, 0.8480234146118164, 0.8914421200752258, 0.93486088514328, 0.9782795906066895, 1.0216983556747437, 1.0651171207427979, 1.1085357666015625, 1.1519545316696167, 1.1953731775283813, 1.2387919425964355, 1.2822107076644897, 1.325629472732544, 1.3690481185913086, 1.4124668836593628, 1.455885648727417]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 7.0, 6.0, 5.0, 6.0, 6.0, 10.0, 14.0, 29.0, 31.0, 38.0, 26.0, 42.0, 34.0, 51.0, 46.0, 40.0, 50.0, 46.0, 54.0, 61.0, 44.0, 53.0, 55.0, 31.0, 34.0, 33.0, 23.0, 26.0, 22.0, 12.0, 7.0, 10.0, 13.0, 8.0, 2.0, 8.0, 3.0, 4.0, 4.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.698948860168457, -0.6785315871238708, -0.6581143736839294, -0.6376971006393433, -0.6172798871994019, -0.5968626141548157, -0.5764453411102295, -0.5560281276702881, -0.5356108546257019, -0.5151935815811157, -0.4947763681411743, -0.47435909509658813, -0.45394185185432434, -0.43352460861206055, -0.41310736536979675, -0.39269012212753296, -0.37227287888526917, -0.35185563564300537, -0.3314383924007416, -0.3110211491584778, -0.2906038761138916, -0.2701866328716278, -0.249769389629364, -0.22935213148593903, -0.20893488824367523, -0.18851764500141144, -0.16810038685798645, -0.14768314361572266, -0.12726590037345886, -0.10684864223003387, -0.08643139898777008, -0.06601414084434509, -0.0455968976020813, -0.025179648771882057, -0.0047623999416828156, 0.015654847025871277, 0.03607209771871567, 0.05648934841156006, 0.07690659165382385, 0.09732384979724884, 0.11774109303951263, 0.13815833628177643, 0.15857559442520142, 0.1789928376674652, 0.199410080909729, 0.219827339053154, 0.24024458229541779, 0.2606618404388428, 0.28107908368110657, 0.30149632692337036, 0.32191357016563416, 0.34233081340789795, 0.36274808645248413, 0.3831653296947479, 0.4035825729370117, 0.4239998459815979, 0.4444170594215393, 0.4648343026638031, 0.4852515459060669, 0.5056688189506531, 0.5260860323905945, 0.5465033054351807, 0.5669205188751221, 0.5873377919197083, 0.6077550649642944]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 14.0, 3.0, 10.0, 19.0, 27.0, 28.0, 40.0, 56.0, 70.0, 109.0, 166.0, 253.0, 404.0, 652.0, 1086.0, 1796.0, 3468.0, 6691.0, 14117.0, 33833.0, 98961.0, 535691.0, 3177951.0, 217138.0, 58799.0, 22101.0, 9727.0, 4766.0, 2605.0, 1397.0, 829.0, 515.0, 339.0, 200.0, 130.0, 99.0, 63.0, 40.0, 24.0, 20.0, 14.0, 11.0, 5.0, 10.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1287841796875, -0.12502670288085938, -0.12126922607421875, -0.11751174926757812, -0.1137542724609375, -0.10999679565429688, -0.10623931884765625, -0.10248184204101562, -0.098724365234375, -0.09496688842773438, -0.09120941162109375, -0.08745193481445312, -0.0836944580078125, -0.07993698120117188, -0.07617950439453125, -0.07242202758789062, -0.06866455078125, -0.06490707397460938, -0.06114959716796875, -0.057392120361328125, -0.0536346435546875, -0.049877166748046875, -0.04611968994140625, -0.042362213134765625, -0.038604736328125, -0.034847259521484375, -0.03108978271484375, -0.027332305908203125, -0.0235748291015625, -0.019817352294921875, -0.01605987548828125, -0.012302398681640625, -0.008544921875, -0.004787445068359375, -0.00102996826171875, 0.002727508544921875, 0.0064849853515625, 0.010242462158203125, 0.01399993896484375, 0.017757415771484375, 0.021514892578125, 0.025272369384765625, 0.02902984619140625, 0.032787322998046875, 0.0365447998046875, 0.040302276611328125, 0.04405975341796875, 0.047817230224609375, 0.05157470703125, 0.055332183837890625, 0.05908966064453125, 0.06284713745117188, 0.0666046142578125, 0.07036209106445312, 0.07411956787109375, 0.07787704467773438, 0.081634521484375, 0.08539199829101562, 0.08914947509765625, 0.09290695190429688, 0.0966644287109375, 0.10042190551757812, 0.10417938232421875, 0.10793685913085938, 0.1116943359375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 8.0, 7.0, 13.0, 14.0, 7.0, 16.0, 24.0, 15.0, 29.0, 52.0, 44.0, 49.0, 55.0, 60.0, 63.0, 62.0, 67.0, 52.0, 58.0, 46.0, 46.0, 37.0, 35.0, 34.0, 19.0, 15.0, 21.0, 10.0, 8.0, 6.0, 8.0, 6.0, 2.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0282135009765625, -0.02747964859008789, -0.02674579620361328, -0.026011943817138672, -0.025278091430664062, -0.024544239044189453, -0.023810386657714844, -0.023076534271240234, -0.022342681884765625, -0.021608829498291016, -0.020874977111816406, -0.020141124725341797, -0.019407272338867188, -0.018673419952392578, -0.01793956756591797, -0.01720571517944336, -0.01647186279296875, -0.01573801040649414, -0.015004158020019531, -0.014270305633544922, -0.013536453247070312, -0.012802600860595703, -0.012068748474121094, -0.011334896087646484, -0.010601043701171875, -0.009867191314697266, -0.009133338928222656, -0.008399486541748047, -0.0076656341552734375, -0.006931781768798828, -0.006197929382324219, -0.005464076995849609, -0.004730224609375, -0.003996372222900391, -0.0032625198364257812, -0.002528667449951172, -0.0017948150634765625, -0.0010609626770019531, -0.00032711029052734375, 0.0004067420959472656, 0.001140594482421875, 0.0018744468688964844, 0.0026082992553710938, 0.003342151641845703, 0.0040760040283203125, 0.004809856414794922, 0.005543708801269531, 0.006277561187744141, 0.00701141357421875, 0.007745265960693359, 0.008479118347167969, 0.009212970733642578, 0.009946823120117188, 0.010680675506591797, 0.011414527893066406, 0.012148380279541016, 0.012882232666015625, 0.013616085052490234, 0.014349937438964844, 0.015083789825439453, 0.015817642211914062, 0.016551494598388672, 0.01728534698486328, 0.01801919937133789, 0.0187530517578125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 6.0, 6.0, 6.0, 7.0, 9.0, 19.0, 23.0, 40.0, 39.0, 69.0, 102.0, 225.0, 308.0, 635.0, 1025.0, 2095.0, 4257.0, 9934.0, 28028.0, 107547.0, 1385619.0, 2476765.0, 126074.0, 30947.0, 10523.0, 4564.0, 2299.0, 1281.0, 719.0, 401.0, 271.0, 163.0, 94.0, 65.0, 47.0, 23.0, 24.0, 14.0, 6.0, 3.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2117919921875, -0.2051830291748047, -0.19857406616210938, -0.19196510314941406, -0.18535614013671875, -0.17874717712402344, -0.17213821411132812, -0.1655292510986328, -0.1589202880859375, -0.1523113250732422, -0.14570236206054688, -0.13909339904785156, -0.13248443603515625, -0.12587547302246094, -0.11926651000976562, -0.11265754699707031, -0.106048583984375, -0.09943962097167969, -0.09283065795898438, -0.08622169494628906, -0.07961273193359375, -0.07300376892089844, -0.06639480590820312, -0.05978584289550781, -0.0531768798828125, -0.04656791687011719, -0.039958953857421875, -0.03334999084472656, -0.02674102783203125, -0.020132064819335938, -0.013523101806640625, -0.0069141387939453125, -0.00030517578125, 0.0063037872314453125, 0.012912750244140625, 0.019521713256835938, 0.02613067626953125, 0.03273963928222656, 0.039348602294921875, 0.04595756530761719, 0.0525665283203125, 0.05917549133300781, 0.06578445434570312, 0.07239341735839844, 0.07900238037109375, 0.08561134338378906, 0.09222030639648438, 0.09882926940917969, 0.105438232421875, 0.11204719543457031, 0.11865615844726562, 0.12526512145996094, 0.13187408447265625, 0.13848304748535156, 0.14509201049804688, 0.1517009735107422, 0.1583099365234375, 0.1649188995361328, 0.17152786254882812, 0.17813682556152344, 0.18474578857421875, 0.19135475158691406, 0.19796371459960938, 0.2045726776123047, 0.211181640625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 11.0, 12.0, 9.0, 11.0, 22.0, 20.0, 35.0, 45.0, 60.0, 107.0, 144.0, 266.0, 586.0, 1470.0, 526.0, 271.0, 140.0, 105.0, 49.0, 45.0, 33.0, 30.0, 17.0, 12.0, 6.0, 12.0, 8.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.07586669921875, -0.07337570190429688, -0.07088470458984375, -0.06839370727539062, -0.0659027099609375, -0.06341171264648438, -0.06092071533203125, -0.058429718017578125, -0.055938720703125, -0.053447723388671875, -0.05095672607421875, -0.048465728759765625, -0.0459747314453125, -0.043483734130859375, -0.04099273681640625, -0.038501739501953125, -0.0360107421875, -0.033519744873046875, -0.03102874755859375, -0.028537750244140625, -0.0260467529296875, -0.023555755615234375, -0.02106475830078125, -0.018573760986328125, -0.016082763671875, -0.013591766357421875, -0.01110076904296875, -0.008609771728515625, -0.0061187744140625, -0.003627777099609375, -0.00113677978515625, 0.001354217529296875, 0.00384521484375, 0.006336212158203125, 0.00882720947265625, 0.011318206787109375, 0.0138092041015625, 0.016300201416015625, 0.01879119873046875, 0.021282196044921875, 0.023773193359375, 0.026264190673828125, 0.02875518798828125, 0.031246185302734375, 0.0337371826171875, 0.036228179931640625, 0.03871917724609375, 0.041210174560546875, 0.043701171875, 0.046192169189453125, 0.04868316650390625, 0.051174163818359375, 0.0536651611328125, 0.056156158447265625, 0.05864715576171875, 0.061138153076171875, 0.063629150390625, 0.06612014770507812, 0.06861114501953125, 0.07110214233398438, 0.0735931396484375, 0.07608413696289062, 0.07857513427734375, 0.08106613159179688, 0.08355712890625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 8.0, 21.0, 27.0, 42.0, 70.0, 119.0, 152.0, 150.0, 133.0, 98.0, 78.0, 42.0, 23.0, 18.0, 6.0, 3.0, 8.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6217930316925049, -0.6005716323852539, -0.5793502330780029, -0.5581288933753967, -0.5369074940681458, -0.5156860947608948, -0.4944647252559662, -0.4732433557510376, -0.4520219564437866, -0.43080055713653564, -0.40957918763160706, -0.38835781812667847, -0.3671364188194275, -0.3459150195121765, -0.3246936500072479, -0.30347228050231934, -0.28225088119506836, -0.2610294818878174, -0.2398081123828888, -0.218586727976799, -0.19736534357070923, -0.17614395916461945, -0.15492257475852966, -0.13370119035243988, -0.1124798059463501, -0.09125842154026031, -0.07003703713417053, -0.04881565272808075, -0.027594268321990967, -0.006372883915901184, 0.014848500490188599, 0.03606988489627838, 0.057291269302368164, 0.07851265370845795, 0.09973403811454773, 0.12095542252063751, 0.1421768069267273, 0.16339819133281708, 0.18461957573890686, 0.20584096014499664, 0.22706234455108643, 0.2482837289571762, 0.269505113363266, 0.2907264828681946, 0.31194788217544556, 0.33316928148269653, 0.3543906509876251, 0.3756120204925537, 0.3968334197998047, 0.41805481910705566, 0.43927618861198425, 0.46049755811691284, 0.4817189574241638, 0.5029403567314148, 0.524161696434021, 0.545383095741272, 0.566604495048523, 0.5878258943557739, 0.6090472936630249, 0.6302686333656311, 0.6514900326728821, 0.6727114319801331, 0.6939327716827393, 0.7151541709899902, 0.7363755702972412]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 4.0, 9.0, 3.0, 12.0, 10.0, 13.0, 18.0, 13.0, 24.0, 17.0, 29.0, 33.0, 32.0, 38.0, 39.0, 54.0, 43.0, 36.0, 44.0, 58.0, 49.0, 40.0, 48.0, 42.0, 32.0, 39.0, 38.0, 30.0, 27.0, 25.0, 22.0, 18.0, 16.0, 7.0, 6.0, 8.0, 10.0, 6.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.34330523014068604, -0.3336755037307739, -0.3240457773208618, -0.3144160509109497, -0.3047863245010376, -0.2951566278934479, -0.28552690148353577, -0.27589717507362366, -0.26626744866371155, -0.25663772225379944, -0.24700799584388733, -0.2373782843351364, -0.2277485579252243, -0.2181188315153122, -0.20848912000656128, -0.19885939359664917, -0.18922966718673706, -0.17959994077682495, -0.16997021436691284, -0.16034050285816193, -0.15071077644824982, -0.1410810500383377, -0.1314513385295868, -0.12182161211967468, -0.11219188570976257, -0.10256215929985046, -0.09293244034051895, -0.08330272138118744, -0.07367299497127533, -0.06404326856136322, -0.05441354960203171, -0.044783830642700195, -0.035154104232788086, -0.025524381548166275, -0.015894658863544464, -0.006264936178922653, 0.0033647865056991577, 0.012994509190320969, 0.02262423187494278, 0.03225395083427429, 0.0418836772441864, 0.05151339992880821, 0.06114312261343002, 0.07077284157276154, 0.08040256798267365, 0.09003229439258575, 0.09966201335191727, 0.10929173231124878, 0.11892145872116089, 0.128551185131073, 0.1381809115409851, 0.14781062304973602, 0.15744034945964813, 0.16707007586956024, 0.17669978737831116, 0.18632951378822327, 0.19595924019813538, 0.20558896660804749, 0.2152186930179596, 0.2248484045267105, 0.23447813093662262, 0.24410785734653473, 0.25373756885528564, 0.26336729526519775, 0.27299702167510986]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 5.0, 3.0, 8.0, 16.0, 21.0, 42.0, 75.0, 116.0, 245.0, 514.0, 1207.0, 3147.0, 10110.0, 40138.0, 189200.0, 612174.0, 146110.0, 32263.0, 8373.0, 2801.0, 1041.0, 487.0, 225.0, 107.0, 48.0, 30.0, 17.0, 15.0, 10.0, 5.0, 7.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20263671875, -0.19597625732421875, -0.1893157958984375, -0.18265533447265625, -0.175994873046875, -0.16933441162109375, -0.1626739501953125, -0.15601348876953125, -0.14935302734375, -0.14269256591796875, -0.1360321044921875, -0.12937164306640625, -0.122711181640625, -0.11605072021484375, -0.1093902587890625, -0.10272979736328125, -0.0960693359375, -0.08940887451171875, -0.0827484130859375, -0.07608795166015625, -0.069427490234375, -0.06276702880859375, -0.0561065673828125, -0.04944610595703125, -0.04278564453125, -0.03612518310546875, -0.0294647216796875, -0.02280426025390625, -0.016143798828125, -0.00948333740234375, -0.0028228759765625, 0.00383758544921875, 0.010498046875, 0.01715850830078125, 0.0238189697265625, 0.03047943115234375, 0.037139892578125, 0.04380035400390625, 0.0504608154296875, 0.05712127685546875, 0.06378173828125, 0.07044219970703125, 0.0771026611328125, 0.08376312255859375, 0.090423583984375, 0.09708404541015625, 0.1037445068359375, 0.11040496826171875, 0.1170654296875, 0.12372589111328125, 0.1303863525390625, 0.13704681396484375, 0.143707275390625, 0.15036773681640625, 0.1570281982421875, 0.16368865966796875, 0.17034912109375, 0.17700958251953125, 0.1836700439453125, 0.19033050537109375, 0.196990966796875, 0.20365142822265625, 0.2103118896484375, 0.21697235107421875, 0.2236328125]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 6.0, 4.0, 7.0, 7.0, 10.0, 15.0, 17.0, 25.0, 35.0, 26.0, 35.0, 48.0, 50.0, 55.0, 64.0, 59.0, 75.0, 62.0, 50.0, 60.0, 56.0, 39.0, 32.0, 31.0, 35.0, 22.0, 17.0, 20.0, 14.0, 9.0, 8.0, 4.0, 2.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0301513671875, -0.029324769973754883, -0.028498172760009766, -0.02767157554626465, -0.02684497833251953, -0.026018381118774414, -0.025191783905029297, -0.02436518669128418, -0.023538589477539062, -0.022711992263793945, -0.021885395050048828, -0.02105879783630371, -0.020232200622558594, -0.019405603408813477, -0.01857900619506836, -0.017752408981323242, -0.016925811767578125, -0.016099214553833008, -0.01527261734008789, -0.014446020126342773, -0.013619422912597656, -0.012792825698852539, -0.011966228485107422, -0.011139631271362305, -0.010313034057617188, -0.00948643684387207, -0.008659839630126953, -0.007833242416381836, -0.007006645202636719, -0.0061800479888916016, -0.005353450775146484, -0.004526853561401367, -0.00370025634765625, -0.002873659133911133, -0.0020470619201660156, -0.0012204647064208984, -0.00039386749267578125, 0.00043272972106933594, 0.0012593269348144531, 0.0020859241485595703, 0.0029125213623046875, 0.0037391185760498047, 0.004565715789794922, 0.005392313003540039, 0.006218910217285156, 0.0070455074310302734, 0.00787210464477539, 0.008698701858520508, 0.009525299072265625, 0.010351896286010742, 0.01117849349975586, 0.012005090713500977, 0.012831687927246094, 0.013658285140991211, 0.014484882354736328, 0.015311479568481445, 0.016138076782226562, 0.01696467399597168, 0.017791271209716797, 0.018617868423461914, 0.01944446563720703, 0.02027106285095215, 0.021097660064697266, 0.021924257278442383, 0.0227508544921875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [5.0, 4.0, 2.0, 3.0, 3.0, 5.0, 13.0, 9.0, 6.0, 12.0, 18.0, 21.0, 30.0, 39.0, 40.0, 59.0, 84.0, 121.0, 182.0, 317.0, 500.0, 946.0, 1881.0, 3976.0, 9196.0, 24256.0, 69551.0, 240727.0, 475847.0, 144565.0, 46353.0, 16630.0, 6706.0, 2987.0, 1445.0, 793.0, 396.0, 295.0, 176.0, 121.0, 68.0, 45.0, 42.0, 30.0, 16.0, 15.0, 7.0, 4.0, 7.0, 8.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11834716796875, -0.1141672134399414, -0.10998725891113281, -0.10580730438232422, -0.10162734985351562, -0.09744739532470703, -0.09326744079589844, -0.08908748626708984, -0.08490753173828125, -0.08072757720947266, -0.07654762268066406, -0.07236766815185547, -0.06818771362304688, -0.06400775909423828, -0.05982780456542969, -0.055647850036621094, -0.0514678955078125, -0.047287940979003906, -0.04310798645019531, -0.03892803192138672, -0.034748077392578125, -0.03056812286376953, -0.026388168334960938, -0.022208213806152344, -0.01802825927734375, -0.013848304748535156, -0.009668350219726562, -0.005488395690917969, -0.001308441162109375, 0.0028715133666992188, 0.0070514678955078125, 0.011231422424316406, 0.015411376953125, 0.019591331481933594, 0.023771286010742188, 0.02795124053955078, 0.032131195068359375, 0.03631114959716797, 0.04049110412597656, 0.044671058654785156, 0.04885101318359375, 0.053030967712402344, 0.05721092224121094, 0.06139087677001953, 0.06557083129882812, 0.06975078582763672, 0.07393074035644531, 0.0781106948852539, 0.0822906494140625, 0.0864706039428711, 0.09065055847167969, 0.09483051300048828, 0.09901046752929688, 0.10319042205810547, 0.10737037658691406, 0.11155033111572266, 0.11573028564453125, 0.11991024017333984, 0.12409019470214844, 0.12827014923095703, 0.13245010375976562, 0.13663005828857422, 0.1408100128173828, 0.1449899673461914, 0.149169921875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 3.0, 4.0, 7.0, 1.0, 8.0, 9.0, 9.0, 18.0, 21.0, 19.0, 11.0, 24.0, 22.0, 36.0, 27.0, 31.0, 41.0, 44.0, 42.0, 55.0, 55.0, 50.0, 40.0, 46.0, 41.0, 48.0, 40.0, 28.0, 30.0, 26.0, 32.0, 29.0, 18.0, 14.0, 15.0, 11.0, 9.0, 7.0, 10.0, 3.0, 5.0, 7.0, 6.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.11212158203125, -0.10877799987792969, -0.10543441772460938, -0.10209083557128906, -0.09874725341796875, -0.09540367126464844, -0.09206008911132812, -0.08871650695800781, -0.0853729248046875, -0.08202934265136719, -0.07868576049804688, -0.07534217834472656, -0.07199859619140625, -0.06865501403808594, -0.06531143188476562, -0.06196784973144531, -0.058624267578125, -0.05528068542480469, -0.051937103271484375, -0.04859352111816406, -0.04524993896484375, -0.04190635681152344, -0.038562774658203125, -0.03521919250488281, -0.0318756103515625, -0.028532028198242188, -0.025188446044921875, -0.021844863891601562, -0.01850128173828125, -0.015157699584960938, -0.011814117431640625, -0.008470535278320312, -0.005126953125, -0.0017833709716796875, 0.001560211181640625, 0.0049037933349609375, 0.00824737548828125, 0.011590957641601562, 0.014934539794921875, 0.018278121948242188, 0.0216217041015625, 0.024965286254882812, 0.028308868408203125, 0.03165245056152344, 0.03499603271484375, 0.03833961486816406, 0.041683197021484375, 0.04502677917480469, 0.048370361328125, 0.05171394348144531, 0.055057525634765625, 0.05840110778808594, 0.06174468994140625, 0.06508827209472656, 0.06843185424804688, 0.07177543640136719, 0.0751190185546875, 0.07846260070800781, 0.08180618286132812, 0.08514976501464844, 0.08849334716796875, 0.09183692932128906, 0.09518051147460938, 0.09852409362792969, 0.10186767578125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 9.0, 18.0, 16.0, 28.0, 35.0, 59.0, 86.0, 151.0, 263.0, 451.0, 776.0, 1428.0, 3053.0, 7072.0, 19771.0, 77671.0, 539526.0, 320395.0, 51986.0, 14913.0, 5513.0, 2445.0, 1235.0, 671.0, 397.0, 245.0, 129.0, 70.0, 57.0, 24.0, 21.0, 17.0, 10.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1591796875, -0.15385055541992188, -0.14852142333984375, -0.14319229125976562, -0.1378631591796875, -0.13253402709960938, -0.12720489501953125, -0.12187576293945312, -0.116546630859375, -0.11121749877929688, -0.10588836669921875, -0.10055923461914062, -0.0952301025390625, -0.08990097045898438, -0.08457183837890625, -0.07924270629882812, -0.07391357421875, -0.06858444213867188, -0.06325531005859375, -0.057926177978515625, -0.0525970458984375, -0.047267913818359375, -0.04193878173828125, -0.036609649658203125, -0.031280517578125, -0.025951385498046875, -0.02062225341796875, -0.015293121337890625, -0.0099639892578125, -0.004634857177734375, 0.00069427490234375, 0.006023406982421875, 0.0113525390625, 0.016681671142578125, 0.02201080322265625, 0.027339935302734375, 0.0326690673828125, 0.037998199462890625, 0.04332733154296875, 0.048656463623046875, 0.053985595703125, 0.059314727783203125, 0.06464385986328125, 0.06997299194335938, 0.0753021240234375, 0.08063125610351562, 0.08596038818359375, 0.09128952026367188, 0.09661865234375, 0.10194778442382812, 0.10727691650390625, 0.11260604858398438, 0.1179351806640625, 0.12326431274414062, 0.12859344482421875, 0.13392257690429688, 0.139251708984375, 0.14458084106445312, 0.14990997314453125, 0.15523910522460938, 0.1605682373046875, 0.16589736938476562, 0.17122650146484375, 0.17655563354492188, 0.181884765625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 8.0, 3.0, 5.0, 5.0, 9.0, 11.0, 12.0, 34.0, 49.0, 82.0, 97.0, 124.0, 145.0, 101.0, 117.0, 79.0, 49.0, 31.0, 14.0, 12.0, 10.0, 6.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011861324310302734, -0.00011481903493404388, -0.00011102482676506042, -0.00010723061859607697, -0.0001034364104270935, -9.964220225811005e-05, -9.584799408912659e-05, -9.205378592014313e-05, -8.825957775115967e-05, -8.446536958217621e-05, -8.067116141319275e-05, -7.687695324420929e-05, -7.308274507522583e-05, -6.928853690624237e-05, -6.549432873725891e-05, -6.170012056827545e-05, -5.790591239929199e-05, -5.411170423030853e-05, -5.031749606132507e-05, -4.6523287892341614e-05, -4.2729079723358154e-05, -3.8934871554374695e-05, -3.5140663385391235e-05, -3.1346455216407776e-05, -2.7552247047424316e-05, -2.3758038878440857e-05, -1.9963830709457397e-05, -1.6169622540473938e-05, -1.2375414371490479e-05, -8.581206202507019e-06, -4.7869980335235596e-06, -9.927898645401e-07, 2.8014183044433594e-06, 6.595626473426819e-06, 1.0389834642410278e-05, 1.4184042811393738e-05, 1.7978250980377197e-05, 2.1772459149360657e-05, 2.5566667318344116e-05, 2.9360875487327576e-05, 3.3155083656311035e-05, 3.6949291825294495e-05, 4.0743499994277954e-05, 4.4537708163261414e-05, 4.833191633224487e-05, 5.212612450122833e-05, 5.592033267021179e-05, 5.971454083919525e-05, 6.350874900817871e-05, 6.730295717716217e-05, 7.109716534614563e-05, 7.489137351512909e-05, 7.868558168411255e-05, 8.247978985309601e-05, 8.627399802207947e-05, 9.006820619106293e-05, 9.386241436004639e-05, 9.765662252902985e-05, 0.0001014508306980133, 0.00010524503886699677, 0.00010903924703598022, 0.00011283345520496368, 0.00011662766337394714, 0.0001204218715429306, 0.00012421607971191406]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 4.0, 6.0, 8.0, 9.0, 10.0, 8.0, 15.0, 28.0, 38.0, 38.0, 59.0, 111.0, 185.0, 272.0, 628.0, 1353.0, 3411.0, 10352.0, 45433.0, 462152.0, 462374.0, 45308.0, 10483.0, 3532.0, 1321.0, 617.0, 301.0, 151.0, 105.0, 75.0, 49.0, 31.0, 25.0, 11.0, 8.0, 15.0, 9.0, 7.0, 6.0, 4.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0], "bins": [-0.179443359375, -0.17303466796875, -0.1666259765625, -0.16021728515625, -0.15380859375, -0.14739990234375, -0.1409912109375, -0.13458251953125, -0.128173828125, -0.12176513671875, -0.1153564453125, -0.10894775390625, -0.1025390625, -0.09613037109375, -0.0897216796875, -0.08331298828125, -0.076904296875, -0.07049560546875, -0.0640869140625, -0.05767822265625, -0.05126953125, -0.04486083984375, -0.0384521484375, -0.03204345703125, -0.025634765625, -0.01922607421875, -0.0128173828125, -0.00640869140625, 0.0, 0.00640869140625, 0.0128173828125, 0.01922607421875, 0.025634765625, 0.03204345703125, 0.0384521484375, 0.04486083984375, 0.05126953125, 0.05767822265625, 0.0640869140625, 0.07049560546875, 0.076904296875, 0.08331298828125, 0.0897216796875, 0.09613037109375, 0.1025390625, 0.10894775390625, 0.1153564453125, 0.12176513671875, 0.128173828125, 0.13458251953125, 0.1409912109375, 0.14739990234375, 0.15380859375, 0.16021728515625, 0.1666259765625, 0.17303466796875, 0.179443359375, 0.18585205078125, 0.1922607421875, 0.19866943359375, 0.205078125, 0.21148681640625, 0.2178955078125, 0.22430419921875, 0.230712890625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 9.0, 10.0, 11.0, 15.0, 13.0, 25.0, 33.0, 40.0, 71.0, 140.0, 158.0, 144.0, 98.0, 59.0, 57.0, 34.0, 27.0, 18.0, 13.0, 7.0, 9.0, 8.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1805419921875, -0.17622756958007812, -0.17191314697265625, -0.16759872436523438, -0.1632843017578125, -0.15896987915039062, -0.15465545654296875, -0.15034103393554688, -0.146026611328125, -0.14171218872070312, -0.13739776611328125, -0.13308334350585938, -0.1287689208984375, -0.12445449829101562, -0.12014007568359375, -0.11582565307617188, -0.11151123046875, -0.10719680786132812, -0.10288238525390625, -0.09856796264648438, -0.0942535400390625, -0.08993911743164062, -0.08562469482421875, -0.08131027221679688, -0.076995849609375, -0.07268142700195312, -0.06836700439453125, -0.06405258178710938, -0.0597381591796875, -0.055423736572265625, -0.05110931396484375, -0.046794891357421875, -0.04248046875, -0.038166046142578125, -0.03385162353515625, -0.029537200927734375, -0.0252227783203125, -0.020908355712890625, -0.01659393310546875, -0.012279510498046875, -0.007965087890625, -0.003650665283203125, 0.00066375732421875, 0.004978179931640625, 0.0092926025390625, 0.013607025146484375, 0.01792144775390625, 0.022235870361328125, 0.02655029296875, 0.030864715576171875, 0.03517913818359375, 0.039493560791015625, 0.0438079833984375, 0.048122406005859375, 0.05243682861328125, 0.056751251220703125, 0.061065673828125, 0.06538009643554688, 0.06969451904296875, 0.07400894165039062, 0.0783233642578125, 0.08263778686523438, 0.08695220947265625, 0.09126663208007812, 0.0955810546875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 6.0, 6.0, 18.0, 24.0, 29.0, 46.0, 61.0, 83.0, 88.0, 99.0, 94.0, 102.0, 94.0, 64.0, 52.0, 41.0, 36.0, 16.0, 15.0, 5.0, 6.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0270849466323853, -0.9951000809669495, -0.9631152749061584, -0.9311304092407227, -0.8991455435752869, -0.8671606779098511, -0.8351758718490601, -0.8031910061836243, -0.7712061405181885, -0.7392212748527527, -0.7072364687919617, -0.6752516031265259, -0.6432667374610901, -0.6112818717956543, -0.5792970657348633, -0.5473122000694275, -0.5153273940086365, -0.48334255814552307, -0.4513576924800873, -0.4193728566169739, -0.3873879909515381, -0.3554031550884247, -0.3234183192253113, -0.2914334535598755, -0.2594486176967621, -0.2274637669324875, -0.1954789161682129, -0.1634940803050995, -0.1315092295408249, -0.09952437877655029, -0.06753954291343689, -0.03555469214916229, -0.0035698413848876953, 0.028415005654096603, 0.0603998526930809, 0.0923846960067749, 0.1243695467710495, 0.1563543975353241, 0.1883392333984375, 0.2203240841627121, 0.2523089349269867, 0.2842937707901001, 0.3162786364555359, 0.3482634723186493, 0.3802483081817627, 0.4122331738471985, 0.4442180097103119, 0.4762028455734253, 0.5081877112388611, 0.5401725769042969, 0.5721573829650879, 0.6041422486305237, 0.6361271142959595, 0.6681119203567505, 0.7000967860221863, 0.7320816516876221, 0.7640664577484131, 0.7960513234138489, 0.8280361294746399, 0.8600209951400757, 0.8920058608055115, 0.9239907264709473, 0.9559755325317383, 0.9879603981971741, 1.0199452638626099]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 4.0, 2.0, 5.0, 4.0, 5.0, 15.0, 7.0, 9.0, 25.0, 20.0, 19.0, 25.0, 29.0, 32.0, 35.0, 42.0, 39.0, 39.0, 63.0, 46.0, 54.0, 44.0, 46.0, 59.0, 47.0, 47.0, 32.0, 28.0, 43.0, 23.0, 24.0, 15.0, 17.0, 16.0, 15.0, 9.0, 4.0, 2.0, 4.0, 5.0, 0.0, 7.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.8435479998588562, -0.821363091468811, -0.7991781234741211, -0.7769932150840759, -0.7548083066940308, -0.7326233386993408, -0.7104384303092957, -0.6882535219192505, -0.6660685539245605, -0.6438836455345154, -0.6216986775398254, -0.5995137691497803, -0.5773288607597351, -0.5551439523696899, -0.532958984375, -0.5107740759849548, -0.48858916759490967, -0.4664042294025421, -0.44421932101249695, -0.4220343828201294, -0.39984947443008423, -0.3776645362377167, -0.3554795980453491, -0.33329468965530396, -0.3111097514629364, -0.28892481327056885, -0.2667399048805237, -0.24455496668815613, -0.22237004339694977, -0.2001851201057434, -0.17800018191337585, -0.1558152586221695, -0.13363027572631836, -0.111445352435112, -0.08926042169332504, -0.06707549095153809, -0.044890567660331726, -0.022705644369125366, -0.0005207061767578125, 0.021664217114448547, 0.04384914040565491, 0.06603406369686127, 0.08821899443864822, 0.11040392518043518, 0.13258884847164154, 0.1547737717628479, 0.17695870995521545, 0.19914363324642181, 0.22132855653762817, 0.24351347982883453, 0.2656984031200409, 0.28788334131240845, 0.3100682497024536, 0.33225318789482117, 0.3544381260871887, 0.3766230344772339, 0.39880797266960144, 0.420992910861969, 0.44317781925201416, 0.4653627574443817, 0.48754769563674927, 0.5097326040267944, 0.5319175720214844, 0.5541024804115295, 0.5762873888015747]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 2.0, 9.0, 13.0, 17.0, 17.0, 32.0, 44.0, 74.0, 112.0, 229.0, 323.0, 596.0, 1150.0, 2351.0, 5197.0, 13582.0, 46395.0, 397465.0, 3586956.0, 102443.0, 22752.0, 7916.0, 3244.0, 1553.0, 784.0, 420.0, 250.0, 137.0, 81.0, 52.0, 37.0, 18.0, 8.0, 9.0, 5.0, 4.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.192626953125, -0.1858043670654297, -0.17898178100585938, -0.17215919494628906, -0.16533660888671875, -0.15851402282714844, -0.15169143676757812, -0.1448688507080078, -0.1380462646484375, -0.1312236785888672, -0.12440109252929688, -0.11757850646972656, -0.11075592041015625, -0.10393333435058594, -0.09711074829101562, -0.09028816223144531, -0.083465576171875, -0.07664299011230469, -0.06982040405273438, -0.06299781799316406, -0.05617523193359375, -0.04935264587402344, -0.042530059814453125, -0.03570747375488281, -0.0288848876953125, -0.022062301635742188, -0.015239715576171875, -0.008417129516601562, -0.00159454345703125, 0.0052280426025390625, 0.012050628662109375, 0.018873214721679688, 0.02569580078125, 0.03251838684082031, 0.039340972900390625, 0.04616355895996094, 0.05298614501953125, 0.05980873107910156, 0.06663131713867188, 0.07345390319824219, 0.0802764892578125, 0.08709907531738281, 0.09392166137695312, 0.10074424743652344, 0.10756683349609375, 0.11438941955566406, 0.12121200561523438, 0.1280345916748047, 0.134857177734375, 0.1416797637939453, 0.14850234985351562, 0.15532493591308594, 0.16214752197265625, 0.16897010803222656, 0.17579269409179688, 0.1826152801513672, 0.1894378662109375, 0.1962604522705078, 0.20308303833007812, 0.20990562438964844, 0.21672821044921875, 0.22355079650878906, 0.23037338256835938, 0.2371959686279297, 0.2440185546875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 12.0, 6.0, 14.0, 16.0, 17.0, 20.0, 28.0, 33.0, 37.0, 40.0, 48.0, 53.0, 55.0, 74.0, 61.0, 58.0, 57.0, 54.0, 53.0, 43.0, 41.0, 42.0, 32.0, 26.0, 22.0, 14.0, 15.0, 12.0, 7.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.031982421875, -0.031085968017578125, -0.03018951416015625, -0.029293060302734375, -0.0283966064453125, -0.027500152587890625, -0.02660369873046875, -0.025707244873046875, -0.024810791015625, -0.023914337158203125, -0.02301788330078125, -0.022121429443359375, -0.0212249755859375, -0.020328521728515625, -0.01943206787109375, -0.018535614013671875, -0.01763916015625, -0.016742706298828125, -0.01584625244140625, -0.014949798583984375, -0.0140533447265625, -0.013156890869140625, -0.01226043701171875, -0.011363983154296875, -0.010467529296875, -0.009571075439453125, -0.00867462158203125, -0.007778167724609375, -0.0068817138671875, -0.005985260009765625, -0.00508880615234375, -0.004192352294921875, -0.0032958984375, -0.002399444580078125, -0.00150299072265625, -0.000606536865234375, 0.0002899169921875, 0.001186370849609375, 0.00208282470703125, 0.002979278564453125, 0.003875732421875, 0.004772186279296875, 0.00566864013671875, 0.006565093994140625, 0.0074615478515625, 0.008358001708984375, 0.00925445556640625, 0.010150909423828125, 0.01104736328125, 0.011943817138671875, 0.01284027099609375, 0.013736724853515625, 0.0146331787109375, 0.015529632568359375, 0.01642608642578125, 0.017322540283203125, 0.018218994140625, 0.019115447998046875, 0.02001190185546875, 0.020908355712890625, 0.0218048095703125, 0.022701263427734375, 0.02359771728515625, 0.024494171142578125, 0.025390625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 4.0, 6.0, 8.0, 6.0, 10.0, 9.0, 13.0, 19.0, 30.0, 40.0, 52.0, 90.0, 171.0, 253.0, 432.0, 743.0, 1528.0, 2682.0, 5334.0, 11381.0, 28163.0, 91582.0, 1019317.0, 2858331.0, 116020.0, 32696.0, 12929.0, 5867.0, 2869.0, 1622.0, 826.0, 492.0, 295.0, 171.0, 106.0, 56.0, 39.0, 24.0, 18.0, 17.0, 9.0, 5.0, 7.0, 8.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27783203125, -0.26943206787109375, -0.2610321044921875, -0.25263214111328125, -0.244232177734375, -0.23583221435546875, -0.2274322509765625, -0.21903228759765625, -0.21063232421875, -0.20223236083984375, -0.1938323974609375, -0.18543243408203125, -0.177032470703125, -0.16863250732421875, -0.1602325439453125, -0.15183258056640625, -0.1434326171875, -0.13503265380859375, -0.1266326904296875, -0.11823272705078125, -0.109832763671875, -0.10143280029296875, -0.0930328369140625, -0.08463287353515625, -0.07623291015625, -0.06783294677734375, -0.0594329833984375, -0.05103302001953125, -0.042633056640625, -0.03423309326171875, -0.0258331298828125, -0.01743316650390625, -0.009033203125, -0.00063323974609375, 0.0077667236328125, 0.01616668701171875, 0.024566650390625, 0.03296661376953125, 0.0413665771484375, 0.04976654052734375, 0.05816650390625, 0.06656646728515625, 0.0749664306640625, 0.08336639404296875, 0.091766357421875, 0.10016632080078125, 0.1085662841796875, 0.11696624755859375, 0.1253662109375, 0.13376617431640625, 0.1421661376953125, 0.15056610107421875, 0.158966064453125, 0.16736602783203125, 0.1757659912109375, 0.18416595458984375, 0.19256591796875, 0.20096588134765625, 0.2093658447265625, 0.21776580810546875, 0.226165771484375, 0.23456573486328125, 0.2429656982421875, 0.25136566162109375, 0.259765625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 9.0, 4.0, 5.0, 10.0, 10.0, 12.0, 16.0, 26.0, 33.0, 61.0, 86.0, 151.0, 406.0, 1998.0, 676.0, 228.0, 135.0, 72.0, 33.0, 32.0, 26.0, 13.0, 14.0, 5.0, 2.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.154296875, -0.15050697326660156, -0.14671707153320312, -0.1429271697998047, -0.13913726806640625, -0.1353473663330078, -0.13155746459960938, -0.12776756286621094, -0.1239776611328125, -0.12018775939941406, -0.11639785766601562, -0.11260795593261719, -0.10881805419921875, -0.10502815246582031, -0.10123825073242188, -0.09744834899902344, -0.093658447265625, -0.08986854553222656, -0.08607864379882812, -0.08228874206542969, -0.07849884033203125, -0.07470893859863281, -0.07091903686523438, -0.06712913513183594, -0.0633392333984375, -0.05954933166503906, -0.055759429931640625, -0.05196952819824219, -0.04817962646484375, -0.04438972473144531, -0.040599822998046875, -0.03680992126464844, -0.03302001953125, -0.029230117797851562, -0.025440216064453125, -0.021650314331054688, -0.01786041259765625, -0.014070510864257812, -0.010280609130859375, -0.0064907073974609375, -0.0027008056640625, 0.0010890960693359375, 0.004878997802734375, 0.008668899536132812, 0.01245880126953125, 0.016248703002929688, 0.020038604736328125, 0.023828506469726562, 0.027618408203125, 0.03140830993652344, 0.035198211669921875, 0.03898811340332031, 0.04277801513671875, 0.04656791687011719, 0.050357818603515625, 0.05414772033691406, 0.0579376220703125, 0.06172752380371094, 0.06551742553710938, 0.06930732727050781, 0.07309722900390625, 0.07688713073730469, 0.08067703247070312, 0.08446693420410156, 0.0882568359375]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 3.0, 12.0, 12.0, 17.0, 35.0, 50.0, 81.0, 104.0, 128.0, 117.0, 131.0, 101.0, 84.0, 57.0, 22.0, 18.0, 9.0, 13.0, 5.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6314496994018555, -0.6076474785804749, -0.5838451981544495, -0.5600429773330688, -0.5362407565116882, -0.5124384760856628, -0.4886362552642822, -0.4648340046405792, -0.4410317540168762, -0.4172295033931732, -0.3934272825717926, -0.3696250319480896, -0.3458227813243866, -0.3220205307006836, -0.298218309879303, -0.2744160592556, -0.25061383843421936, -0.22681160271167755, -0.20300935208797455, -0.17920711636543274, -0.15540486574172974, -0.13160263001918793, -0.10780039429664612, -0.08399814367294312, -0.060195907950401306, -0.0363936647772789, -0.012591425329446793, 0.011210814118385315, 0.03501305729150772, 0.05881530046463013, 0.08261753618717194, 0.10641978681087494, 0.13022202253341675, 0.15402425825595856, 0.17782650887966156, 0.20162874460220337, 0.22543099522590637, 0.24923323094844818, 0.27303546667099, 0.296837717294693, 0.320639967918396, 0.344442218542099, 0.3682444393634796, 0.3920466899871826, 0.4158489406108856, 0.4396511912345886, 0.46345341205596924, 0.48725566267967224, 0.5110578536987305, 0.5348600745201111, 0.5586623549461365, 0.5824645757675171, 0.6062667965888977, 0.6300690770149231, 0.6538712978363037, 0.6776735782623291, 0.7014757990837097, 0.7252780199050903, 0.7490803003311157, 0.7728825211524963, 0.796684741973877, 0.8204870223999023, 0.844289243221283, 0.8680914640426636, 0.891893744468689]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 6.0, 8.0, 2.0, 9.0, 10.0, 7.0, 18.0, 10.0, 15.0, 25.0, 19.0, 30.0, 34.0, 34.0, 49.0, 50.0, 55.0, 43.0, 55.0, 53.0, 49.0, 49.0, 47.0, 44.0, 26.0, 33.0, 22.0, 41.0, 35.0, 29.0, 20.0, 17.0, 20.0, 10.0, 6.0, 10.0, 3.0, 7.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.47905051708221436, -0.4659593403339386, -0.45286816358566284, -0.4397769570350647, -0.42668578028678894, -0.4135946035385132, -0.4005034267902374, -0.38741225004196167, -0.3743210434913635, -0.36122986674308777, -0.348138689994812, -0.33504748344421387, -0.3219563066959381, -0.30886512994766235, -0.2957739531993866, -0.28268277645111084, -0.2695915699005127, -0.25650039315223694, -0.2434092015028, -0.23031802475452423, -0.21722683310508728, -0.20413565635681152, -0.19104447960853577, -0.17795328795909882, -0.16486212611198425, -0.1517709493637085, -0.13867975771427155, -0.1255885809659958, -0.11249738931655884, -0.09940621256828308, -0.08631502836942673, -0.07322384417057037, -0.06013265252113342, -0.04704146832227707, -0.033950284123420715, -0.02085910364985466, -0.007767919450998306, 0.005323261022567749, 0.018414445221424103, 0.03150562942028046, 0.04459681361913681, 0.057687997817993164, 0.07077918201684952, 0.08387036621570587, 0.09696154296398163, 0.11005272716283798, 0.12314391136169434, 0.1362350881099701, 0.14932627975940704, 0.1624174565076828, 0.17550864815711975, 0.1885998249053955, 0.20169101655483246, 0.21478219330310822, 0.22787338495254517, 0.24096456170082092, 0.2540557384490967, 0.26714691519737244, 0.2802380919456482, 0.29332929849624634, 0.3064204752445221, 0.31951165199279785, 0.3326028287410736, 0.34569400548934937, 0.3587852120399475]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 5.0, 1.0, 3.0, 9.0, 5.0, 6.0, 8.0, 13.0, 11.0, 14.0, 28.0, 37.0, 45.0, 67.0, 116.0, 202.0, 322.0, 584.0, 945.0, 1752.0, 3454.0, 7258.0, 15509.0, 37312.0, 95073.0, 279521.0, 384841.0, 132030.0, 50419.0, 20456.0, 9159.0, 4310.0, 2187.0, 1154.0, 639.0, 362.0, 249.0, 138.0, 92.0, 48.0, 55.0, 40.0, 19.0, 21.0, 12.0, 16.0, 5.0, 6.0, 4.0, 2.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1488037109375, -0.14370155334472656, -0.13859939575195312, -0.1334972381591797, -0.12839508056640625, -0.12329292297363281, -0.11819076538085938, -0.11308860778808594, -0.1079864501953125, -0.10288429260253906, -0.09778213500976562, -0.09267997741699219, -0.08757781982421875, -0.08247566223144531, -0.07737350463867188, -0.07227134704589844, -0.067169189453125, -0.06206703186035156, -0.056964874267578125, -0.05186271667480469, -0.04676055908203125, -0.04165840148925781, -0.036556243896484375, -0.03145408630371094, -0.0263519287109375, -0.021249771118164062, -0.016147613525390625, -0.011045455932617188, -0.00594329833984375, -0.0008411407470703125, 0.004261016845703125, 0.009363174438476562, 0.01446533203125, 0.019567489624023438, 0.024669647216796875, 0.029771804809570312, 0.03487396240234375, 0.03997611999511719, 0.045078277587890625, 0.05018043518066406, 0.0552825927734375, 0.06038475036621094, 0.06548690795898438, 0.07058906555175781, 0.07569122314453125, 0.08079338073730469, 0.08589553833007812, 0.09099769592285156, 0.096099853515625, 0.10120201110839844, 0.10630416870117188, 0.11140632629394531, 0.11650848388671875, 0.12161064147949219, 0.12671279907226562, 0.13181495666503906, 0.1369171142578125, 0.14201927185058594, 0.14712142944335938, 0.1522235870361328, 0.15732574462890625, 0.1624279022216797, 0.16753005981445312, 0.17263221740722656, 0.177734375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 0.0, 6.0, 5.0, 6.0, 9.0, 4.0, 14.0, 14.0, 18.0, 30.0, 30.0, 36.0, 50.0, 61.0, 60.0, 50.0, 73.0, 69.0, 65.0, 59.0, 63.0, 42.0, 47.0, 44.0, 28.0, 33.0, 22.0, 14.0, 24.0, 14.0, 8.0, 5.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.029876708984375, -0.02874898910522461, -0.02762126922607422, -0.026493549346923828, -0.025365829467773438, -0.024238109588623047, -0.023110389709472656, -0.021982669830322266, -0.020854949951171875, -0.019727230072021484, -0.018599510192871094, -0.017471790313720703, -0.016344070434570312, -0.015216350555419922, -0.014088630676269531, -0.01296091079711914, -0.01183319091796875, -0.01070547103881836, -0.009577751159667969, -0.008450031280517578, -0.0073223114013671875, -0.006194591522216797, -0.005066871643066406, -0.003939151763916016, -0.002811431884765625, -0.0016837120056152344, -0.0005559921264648438, 0.0005717277526855469, 0.0016994476318359375, 0.002827167510986328, 0.003954887390136719, 0.005082607269287109, 0.0062103271484375, 0.007338047027587891, 0.008465766906738281, 0.009593486785888672, 0.010721206665039062, 0.011848926544189453, 0.012976646423339844, 0.014104366302490234, 0.015232086181640625, 0.016359806060791016, 0.017487525939941406, 0.018615245819091797, 0.019742965698242188, 0.020870685577392578, 0.02199840545654297, 0.02312612533569336, 0.02425384521484375, 0.02538156509399414, 0.02650928497314453, 0.027637004852294922, 0.028764724731445312, 0.029892444610595703, 0.031020164489746094, 0.032147884368896484, 0.033275604248046875, 0.034403324127197266, 0.035531044006347656, 0.03665876388549805, 0.03778648376464844, 0.03891420364379883, 0.04004192352294922, 0.04116964340209961, 0.04229736328125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 7.0, 4.0, 12.0, 17.0, 17.0, 18.0, 19.0, 30.0, 30.0, 70.0, 104.0, 101.0, 165.0, 265.0, 393.0, 735.0, 1524.0, 3472.0, 9379.0, 32683.0, 156862.0, 644097.0, 151004.0, 31449.0, 9350.0, 3339.0, 1486.0, 709.0, 413.0, 258.0, 156.0, 103.0, 63.0, 54.0, 25.0, 30.0, 28.0, 18.0, 13.0, 12.0, 10.0, 7.0, 7.0, 8.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.255126953125, -0.2464752197265625, -0.237823486328125, -0.2291717529296875, -0.22052001953125, -0.2118682861328125, -0.203216552734375, -0.1945648193359375, -0.1859130859375, -0.1772613525390625, -0.168609619140625, -0.1599578857421875, -0.15130615234375, -0.1426544189453125, -0.134002685546875, -0.1253509521484375, -0.11669921875, -0.1080474853515625, -0.099395751953125, -0.0907440185546875, -0.08209228515625, -0.0734405517578125, -0.064788818359375, -0.0561370849609375, -0.0474853515625, -0.0388336181640625, -0.030181884765625, -0.0215301513671875, -0.01287841796875, -0.0042266845703125, 0.004425048828125, 0.0130767822265625, 0.021728515625, 0.0303802490234375, 0.039031982421875, 0.0476837158203125, 0.05633544921875, 0.0649871826171875, 0.073638916015625, 0.0822906494140625, 0.0909423828125, 0.0995941162109375, 0.108245849609375, 0.1168975830078125, 0.12554931640625, 0.1342010498046875, 0.142852783203125, 0.1515045166015625, 0.16015625, 0.1688079833984375, 0.177459716796875, 0.1861114501953125, 0.19476318359375, 0.2034149169921875, 0.212066650390625, 0.2207183837890625, 0.2293701171875, 0.2380218505859375, 0.246673583984375, 0.2553253173828125, 0.26397705078125, 0.2726287841796875, 0.281280517578125, 0.2899322509765625, 0.298583984375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 3.0, 5.0, 6.0, 2.0, 8.0, 8.0, 12.0, 12.0, 14.0, 23.0, 19.0, 29.0, 24.0, 21.0, 23.0, 35.0, 50.0, 36.0, 50.0, 38.0, 39.0, 42.0, 55.0, 48.0, 54.0, 51.0, 34.0, 43.0, 27.0, 31.0, 13.0, 23.0, 21.0, 13.0, 18.0, 22.0, 11.0, 12.0, 7.0, 9.0, 4.0, 4.0, 0.0, 3.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1533203125, -0.14864349365234375, -0.1439666748046875, -0.13928985595703125, -0.134613037109375, -0.12993621826171875, -0.1252593994140625, -0.12058258056640625, -0.11590576171875, -0.11122894287109375, -0.1065521240234375, -0.10187530517578125, -0.097198486328125, -0.09252166748046875, -0.0878448486328125, -0.08316802978515625, -0.0784912109375, -0.07381439208984375, -0.0691375732421875, -0.06446075439453125, -0.059783935546875, -0.05510711669921875, -0.0504302978515625, -0.04575347900390625, -0.04107666015625, -0.03639984130859375, -0.0317230224609375, -0.02704620361328125, -0.022369384765625, -0.01769256591796875, -0.0130157470703125, -0.00833892822265625, -0.003662109375, 0.00101470947265625, 0.0056915283203125, 0.01036834716796875, 0.015045166015625, 0.01972198486328125, 0.0243988037109375, 0.02907562255859375, 0.03375244140625, 0.03842926025390625, 0.0431060791015625, 0.04778289794921875, 0.052459716796875, 0.05713653564453125, 0.0618133544921875, 0.06649017333984375, 0.0711669921875, 0.07584381103515625, 0.0805206298828125, 0.08519744873046875, 0.089874267578125, 0.09455108642578125, 0.0992279052734375, 0.10390472412109375, 0.10858154296875, 0.11325836181640625, 0.1179351806640625, 0.12261199951171875, 0.127288818359375, 0.13196563720703125, 0.1366424560546875, 0.14131927490234375, 0.14599609375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 4.0, 2.0, 5.0, 9.0, 9.0, 7.0, 22.0, 20.0, 42.0, 85.0, 166.0, 238.0, 528.0, 943.0, 2024.0, 5441.0, 17332.0, 77802.0, 571008.0, 308564.0, 45621.0, 11498.0, 3925.0, 1640.0, 719.0, 367.0, 211.0, 125.0, 77.0, 33.0, 26.0, 23.0, 12.0, 10.0, 4.0, 5.0, 4.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.22021484375, -0.21370697021484375, -0.2071990966796875, -0.20069122314453125, -0.194183349609375, -0.18767547607421875, -0.1811676025390625, -0.17465972900390625, -0.16815185546875, -0.16164398193359375, -0.1551361083984375, -0.14862823486328125, -0.142120361328125, -0.13561248779296875, -0.1291046142578125, -0.12259674072265625, -0.1160888671875, -0.10958099365234375, -0.1030731201171875, -0.09656524658203125, -0.090057373046875, -0.08354949951171875, -0.0770416259765625, -0.07053375244140625, -0.06402587890625, -0.05751800537109375, -0.0510101318359375, -0.04450225830078125, -0.037994384765625, -0.03148651123046875, -0.0249786376953125, -0.01847076416015625, -0.011962890625, -0.00545501708984375, 0.0010528564453125, 0.00756072998046875, 0.014068603515625, 0.02057647705078125, 0.0270843505859375, 0.03359222412109375, 0.04010009765625, 0.04660797119140625, 0.0531158447265625, 0.05962371826171875, 0.066131591796875, 0.07263946533203125, 0.0791473388671875, 0.08565521240234375, 0.0921630859375, 0.09867095947265625, 0.1051788330078125, 0.11168670654296875, 0.118194580078125, 0.12470245361328125, 0.1312103271484375, 0.13771820068359375, 0.14422607421875, 0.15073394775390625, 0.1572418212890625, 0.16374969482421875, 0.170257568359375, 0.17676544189453125, 0.1832733154296875, 0.18978118896484375, 0.1962890625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 4.0, 1.0, 6.0, 7.0, 4.0, 10.0, 12.0, 13.0, 8.0, 26.0, 36.0, 43.0, 41.0, 65.0, 70.0, 50.0, 68.0, 65.0, 59.0, 52.0, 48.0, 63.0, 46.0, 42.0, 37.0, 37.0, 21.0, 9.0, 14.0, 10.0, 7.0, 9.0, 6.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.9664249420166016e-05, -5.7853758335113525e-05, -5.6043267250061035e-05, -5.4232776165008545e-05, -5.2422285079956055e-05, -5.0611793994903564e-05, -4.8801302909851074e-05, -4.6990811824798584e-05, -4.5180320739746094e-05, -4.3369829654693604e-05, -4.155933856964111e-05, -3.974884748458862e-05, -3.793835639953613e-05, -3.612786531448364e-05, -3.431737422943115e-05, -3.250688314437866e-05, -3.069639205932617e-05, -2.888590097427368e-05, -2.707540988922119e-05, -2.52649188041687e-05, -2.345442771911621e-05, -2.164393663406372e-05, -1.983344554901123e-05, -1.802295446395874e-05, -1.621246337890625e-05, -1.440197229385376e-05, -1.259148120880127e-05, -1.078099012374878e-05, -8.970499038696289e-06, -7.160007953643799e-06, -5.349516868591309e-06, -3.5390257835388184e-06, -1.7285346984863281e-06, 8.195638656616211e-08, 1.8924474716186523e-06, 3.7029385566711426e-06, 5.513429641723633e-06, 7.323920726776123e-06, 9.134411811828613e-06, 1.0944902896881104e-05, 1.2755393981933594e-05, 1.4565885066986084e-05, 1.6376376152038574e-05, 1.8186867237091064e-05, 1.9997358322143555e-05, 2.1807849407196045e-05, 2.3618340492248535e-05, 2.5428831577301025e-05, 2.7239322662353516e-05, 2.9049813747406006e-05, 3.0860304832458496e-05, 3.2670795917510986e-05, 3.4481287002563477e-05, 3.629177808761597e-05, 3.810226917266846e-05, 3.991276025772095e-05, 4.172325134277344e-05, 4.353374242782593e-05, 4.534423351287842e-05, 4.715472459793091e-05, 4.89652156829834e-05, 5.077570676803589e-05, 5.258619785308838e-05, 5.439668893814087e-05, 5.620718002319336e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 2.0, 2.0, 5.0, 10.0, 14.0, 14.0, 28.0, 28.0, 50.0, 90.0, 131.0, 202.0, 314.0, 552.0, 1115.0, 2298.0, 5742.0, 17204.0, 72012.0, 548640.0, 331712.0, 47140.0, 12582.0, 4568.0, 1937.0, 936.0, 473.0, 271.0, 167.0, 113.0, 66.0, 39.0, 28.0, 18.0, 19.0, 10.0, 9.0, 2.0, 2.0, 1.0, 5.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.2078857421875, -0.20174789428710938, -0.19561004638671875, -0.18947219848632812, -0.1833343505859375, -0.17719650268554688, -0.17105865478515625, -0.16492080688476562, -0.158782958984375, -0.15264511108398438, -0.14650726318359375, -0.14036941528320312, -0.1342315673828125, -0.12809371948242188, -0.12195587158203125, -0.11581802368164062, -0.10968017578125, -0.10354232788085938, -0.09740447998046875, -0.09126663208007812, -0.0851287841796875, -0.07899093627929688, -0.07285308837890625, -0.06671524047851562, -0.060577392578125, -0.054439544677734375, -0.04830169677734375, -0.042163848876953125, -0.0360260009765625, -0.029888153076171875, -0.02375030517578125, -0.017612457275390625, -0.011474609375, -0.005336761474609375, 0.00080108642578125, 0.006938934326171875, 0.0130767822265625, 0.019214630126953125, 0.02535247802734375, 0.031490325927734375, 0.037628173828125, 0.043766021728515625, 0.04990386962890625, 0.056041717529296875, 0.0621795654296875, 0.06831741333007812, 0.07445526123046875, 0.08059310913085938, 0.08673095703125, 0.09286880493164062, 0.09900665283203125, 0.10514450073242188, 0.1112823486328125, 0.11742019653320312, 0.12355804443359375, 0.12969589233398438, 0.135833740234375, 0.14197158813476562, 0.14810943603515625, 0.15424728393554688, 0.1603851318359375, 0.16652297973632812, 0.17266082763671875, 0.17879867553710938, 0.1849365234375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 2.0, 6.0, 4.0, 5.0, 7.0, 4.0, 4.0, 10.0, 10.0, 11.0, 22.0, 19.0, 32.0, 47.0, 69.0, 85.0, 105.0, 91.0, 115.0, 105.0, 55.0, 44.0, 43.0, 23.0, 21.0, 16.0, 10.0, 6.0, 5.0, 10.0, 9.0, 5.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1326904296875, -0.1284942626953125, -0.124298095703125, -0.1201019287109375, -0.11590576171875, -0.1117095947265625, -0.107513427734375, -0.1033172607421875, -0.09912109375, -0.0949249267578125, -0.090728759765625, -0.0865325927734375, -0.08233642578125, -0.0781402587890625, -0.073944091796875, -0.0697479248046875, -0.0655517578125, -0.0613555908203125, -0.057159423828125, -0.0529632568359375, -0.04876708984375, -0.0445709228515625, -0.040374755859375, -0.0361785888671875, -0.031982421875, -0.0277862548828125, -0.023590087890625, -0.0193939208984375, -0.01519775390625, -0.0110015869140625, -0.006805419921875, -0.0026092529296875, 0.0015869140625, 0.0057830810546875, 0.009979248046875, 0.0141754150390625, 0.01837158203125, 0.0225677490234375, 0.026763916015625, 0.0309600830078125, 0.03515625, 0.0393524169921875, 0.043548583984375, 0.0477447509765625, 0.05194091796875, 0.0561370849609375, 0.060333251953125, 0.0645294189453125, 0.0687255859375, 0.0729217529296875, 0.077117919921875, 0.0813140869140625, 0.08551025390625, 0.0897064208984375, 0.093902587890625, 0.0980987548828125, 0.102294921875, 0.1064910888671875, 0.110687255859375, 0.1148834228515625, 0.11907958984375, 0.1232757568359375, 0.127471923828125, 0.1316680908203125, 0.1358642578125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 1.0, 14.0, 35.0, 58.0, 100.0, 164.0, 201.0, 198.0, 122.0, 66.0, 22.0, 13.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2188172340393066, -2.1281116008758545, -2.0374059677124023, -1.9467002153396606, -1.855994462966919, -1.7652888298034668, -1.6745831966400146, -1.5838775634765625, -1.4931718111038208, -1.4024661779403687, -1.311760425567627, -1.2210547924041748, -1.1303491592407227, -1.039643406867981, -0.9489377737045288, -0.8582320809364319, -0.767526388168335, -0.676820695400238, -0.5861150026321411, -0.49540936946868896, -0.40470367670059204, -0.3139979839324951, -0.22329235076904297, -0.13258665800094604, -0.04188096523284912, 0.04882471263408661, 0.13953039050102234, 0.23023605346679688, 0.3209417462348938, 0.4116474390029907, 0.5023530721664429, 0.5930587649345398, 0.6837644577026367, 0.7744701504707336, 0.8651758432388306, 0.9558814764022827, 1.0465872287750244, 1.1372928619384766, 1.2279984951019287, 1.3187041282653809, 1.4094098806381226, 1.5001155138015747, 1.5908212661743164, 1.6815268993377686, 1.7722325325012207, 1.8629382848739624, 1.9536439180374146, 2.0443496704101562, 2.1350553035736084, 2.2257609367370605, 2.3164665699005127, 2.407172203063965, 2.497878074645996, 2.5885837078094482, 2.6792893409729004, 2.7699949741363525, 2.8607006072998047, 2.951406240463257, 3.042111873626709, 3.1328177452087402, 3.2235233783721924, 3.3142290115356445, 3.4049346446990967, 3.495640277862549, 3.58634614944458]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 7.0, 1.0, 5.0, 5.0, 5.0, 10.0, 9.0, 11.0, 6.0, 15.0, 18.0, 22.0, 16.0, 14.0, 28.0, 24.0, 30.0, 30.0, 34.0, 42.0, 26.0, 28.0, 31.0, 35.0, 26.0, 27.0, 35.0, 44.0, 39.0, 29.0, 39.0, 30.0, 35.0, 23.0, 20.0, 35.0, 20.0, 13.0, 19.0, 22.0, 11.0, 5.0, 12.0, 12.0, 7.0, 11.0, 8.0, 9.0, 9.0, 6.0, 2.0, 7.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.6889705061912537, -0.667195737361908, -0.6454209089279175, -0.6236461400985718, -0.6018713712692261, -0.5800965428352356, -0.5583217740058899, -0.5365469455718994, -0.5147721767425537, -0.4929973781108856, -0.4712226092815399, -0.4494478106498718, -0.42767301201820374, -0.40589821338653564, -0.38412344455718994, -0.36234864592552185, -0.34057387709617615, -0.31879907846450806, -0.29702430963516235, -0.27524951100349426, -0.25347471237182617, -0.23169992864131927, -0.20992514491081238, -0.1881503462791443, -0.1663755625486374, -0.1446007788181305, -0.1228259801864624, -0.1010511964559555, -0.07927640527486801, -0.05750161409378052, -0.03572683036327362, -0.01395203173160553, 0.007822751998901367, 0.029597541317343712, 0.051372330635786057, 0.07314711809158325, 0.09492190927267075, 0.11669670045375824, 0.13847148418426514, 0.16024628281593323, 0.18202106654644012, 0.20379585027694702, 0.2255706489086151, 0.247345432639122, 0.2691202163696289, 0.290895015001297, 0.3126698136329651, 0.3344445824623108, 0.3562193810939789, 0.377994179725647, 0.3997689485549927, 0.42154374718666077, 0.44331854581832886, 0.46509331464767456, 0.48686811327934265, 0.5086429119110107, 0.5304176807403564, 0.5521924495697021, 0.5739672780036926, 0.5957420468330383, 0.617516815662384, 0.6392916440963745, 0.6610664129257202, 0.6828411817550659, 0.7046160101890564]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 8.0, 1.0, 1.0, 7.0, 9.0, 16.0, 23.0, 33.0, 40.0, 74.0, 119.0, 211.0, 328.0, 644.0, 1175.0, 2358.0, 5660.0, 14422.0, 47686.0, 265944.0, 3600214.0, 195515.0, 39286.0, 12093.0, 4593.0, 1876.0, 912.0, 430.0, 252.0, 117.0, 82.0, 49.0, 36.0, 21.0, 22.0, 9.0, 5.0, 7.0, 5.0, 2.0, 2.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2210693359375, -0.21329307556152344, -0.20551681518554688, -0.1977405548095703, -0.18996429443359375, -0.1821880340576172, -0.17441177368164062, -0.16663551330566406, -0.1588592529296875, -0.15108299255371094, -0.14330673217773438, -0.1355304718017578, -0.12775421142578125, -0.11997795104980469, -0.11220169067382812, -0.10442543029785156, -0.096649169921875, -0.08887290954589844, -0.08109664916992188, -0.07332038879394531, -0.06554412841796875, -0.05776786804199219, -0.049991607666015625, -0.04221534729003906, -0.0344390869140625, -0.026662826538085938, -0.018886566162109375, -0.011110305786132812, -0.00333404541015625, 0.0044422149658203125, 0.012218475341796875, 0.019994735717773438, 0.02777099609375, 0.03554725646972656, 0.043323516845703125, 0.05109977722167969, 0.05887603759765625, 0.06665229797363281, 0.07442855834960938, 0.08220481872558594, 0.0899810791015625, 0.09775733947753906, 0.10553359985351562, 0.11330986022949219, 0.12108612060546875, 0.1288623809814453, 0.13663864135742188, 0.14441490173339844, 0.152191162109375, 0.15996742248535156, 0.16774368286132812, 0.1755199432373047, 0.18329620361328125, 0.1910724639892578, 0.19884872436523438, 0.20662498474121094, 0.2144012451171875, 0.22217750549316406, 0.22995376586914062, 0.2377300262451172, 0.24550628662109375, 0.2532825469970703, 0.2610588073730469, 0.26883506774902344, 0.276611328125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 10.0, 13.0, 15.0, 15.0, 21.0, 30.0, 25.0, 34.0, 41.0, 43.0, 55.0, 63.0, 65.0, 74.0, 67.0, 66.0, 60.0, 57.0, 40.0, 49.0, 33.0, 29.0, 22.0, 19.0, 15.0, 16.0, 10.0, 6.0, 4.0, 3.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04229736328125, -0.041054725646972656, -0.03981208801269531, -0.03856945037841797, -0.037326812744140625, -0.03608417510986328, -0.03484153747558594, -0.033598899841308594, -0.03235626220703125, -0.031113624572753906, -0.029870986938476562, -0.02862834930419922, -0.027385711669921875, -0.02614307403564453, -0.024900436401367188, -0.023657798767089844, -0.0224151611328125, -0.021172523498535156, -0.019929885864257812, -0.01868724822998047, -0.017444610595703125, -0.01620197296142578, -0.014959335327148438, -0.013716697692871094, -0.01247406005859375, -0.011231422424316406, -0.009988784790039062, -0.008746147155761719, -0.007503509521484375, -0.006260871887207031, -0.0050182342529296875, -0.0037755966186523438, -0.002532958984375, -0.0012903213500976562, -4.76837158203125e-05, 0.0011949539184570312, 0.002437591552734375, 0.0036802291870117188, 0.0049228668212890625, 0.006165504455566406, 0.00740814208984375, 0.008650779724121094, 0.009893417358398438, 0.011136054992675781, 0.012378692626953125, 0.013621330261230469, 0.014863967895507812, 0.016106605529785156, 0.0173492431640625, 0.018591880798339844, 0.019834518432617188, 0.02107715606689453, 0.022319793701171875, 0.02356243133544922, 0.024805068969726562, 0.026047706604003906, 0.02729034423828125, 0.028532981872558594, 0.029775619506835938, 0.03101825714111328, 0.032260894775390625, 0.03350353240966797, 0.03474617004394531, 0.035988807678222656, 0.0372314453125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 11.0, 13.0, 18.0, 46.0, 54.0, 94.0, 145.0, 249.0, 434.0, 829.0, 1508.0, 3205.0, 6945.0, 17862.0, 54965.0, 249667.0, 3427182.0, 331950.0, 63995.0, 20455.0, 7934.0, 3349.0, 1535.0, 798.0, 434.0, 247.0, 135.0, 87.0, 48.0, 25.0, 19.0, 14.0, 11.0, 4.0, 6.0, 3.0, 7.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.298095703125, -0.2880134582519531, -0.27793121337890625, -0.2678489685058594, -0.2577667236328125, -0.24768447875976562, -0.23760223388671875, -0.22751998901367188, -0.217437744140625, -0.20735549926757812, -0.19727325439453125, -0.18719100952148438, -0.1771087646484375, -0.16702651977539062, -0.15694427490234375, -0.14686203002929688, -0.13677978515625, -0.12669754028320312, -0.11661529541015625, -0.10653305053710938, -0.0964508056640625, -0.08636856079101562, -0.07628631591796875, -0.06620407104492188, -0.056121826171875, -0.046039581298828125, -0.03595733642578125, -0.025875091552734375, -0.0157928466796875, -0.005710601806640625, 0.00437164306640625, 0.014453887939453125, 0.0245361328125, 0.034618377685546875, 0.04470062255859375, 0.054782867431640625, 0.0648651123046875, 0.07494735717773438, 0.08502960205078125, 0.09511184692382812, 0.105194091796875, 0.11527633666992188, 0.12535858154296875, 0.13544082641601562, 0.1455230712890625, 0.15560531616210938, 0.16568756103515625, 0.17576980590820312, 0.18585205078125, 0.19593429565429688, 0.20601654052734375, 0.21609878540039062, 0.2261810302734375, 0.23626327514648438, 0.24634552001953125, 0.2564277648925781, 0.266510009765625, 0.2765922546386719, 0.28667449951171875, 0.2967567443847656, 0.3068389892578125, 0.3169212341308594, 0.32700347900390625, 0.3370857238769531, 0.34716796875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 4.0, 5.0, 6.0, 1.0, 8.0, 4.0, 12.0, 9.0, 22.0, 34.0, 42.0, 47.0, 66.0, 90.0, 164.0, 338.0, 1294.0, 1135.0, 314.0, 158.0, 86.0, 60.0, 50.0, 35.0, 26.0, 18.0, 16.0, 10.0, 12.0, 3.0, 5.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.159423828125, -0.15486717224121094, -0.15031051635742188, -0.1457538604736328, -0.14119720458984375, -0.1366405487060547, -0.13208389282226562, -0.12752723693847656, -0.1229705810546875, -0.11841392517089844, -0.11385726928710938, -0.10930061340332031, -0.10474395751953125, -0.10018730163574219, -0.09563064575195312, -0.09107398986816406, -0.086517333984375, -0.08196067810058594, -0.07740402221679688, -0.07284736633300781, -0.06829071044921875, -0.06373405456542969, -0.059177398681640625, -0.05462074279785156, -0.0500640869140625, -0.04550743103027344, -0.040950775146484375, -0.03639411926269531, -0.03183746337890625, -0.027280807495117188, -0.022724151611328125, -0.018167495727539062, -0.01361083984375, -0.009054183959960938, -0.004497528076171875, 5.91278076171875e-05, 0.00461578369140625, 0.009172439575195312, 0.013729095458984375, 0.018285751342773438, 0.0228424072265625, 0.027399063110351562, 0.031955718994140625, 0.03651237487792969, 0.04106903076171875, 0.04562568664550781, 0.050182342529296875, 0.05473899841308594, 0.059295654296875, 0.06385231018066406, 0.06840896606445312, 0.07296562194824219, 0.07752227783203125, 0.08207893371582031, 0.08663558959960938, 0.09119224548339844, 0.0957489013671875, 0.10030555725097656, 0.10486221313476562, 0.10941886901855469, 0.11397552490234375, 0.11853218078613281, 0.12308883666992188, 0.12764549255371094, 0.1322021484375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 2.0, 9.0, 6.0, 18.0, 14.0, 19.0, 44.0, 60.0, 81.0, 107.0, 139.0, 129.0, 106.0, 84.0, 59.0, 46.0, 23.0, 17.0, 11.0, 5.0, 11.0, 2.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8910911679267883, -0.8627834320068359, -0.8344757556915283, -0.8061680197715759, -0.7778603434562683, -0.7495526075363159, -0.7212449312210083, -0.6929371953010559, -0.6646295189857483, -0.6363217830657959, -0.6080141067504883, -0.5797063708305359, -0.5513986945152283, -0.5230909585952759, -0.49478328227996826, -0.46647554636001587, -0.43816784024238586, -0.40986013412475586, -0.38155242800712585, -0.35324472188949585, -0.32493701577186584, -0.29662930965423584, -0.26832157373428345, -0.24001388251781464, -0.21170617640018463, -0.18339847028255463, -0.15509076416492462, -0.12678304314613342, -0.09847534447908401, -0.07016763091087341, -0.04185992479324341, -0.013552218675613403, 0.014755487442016602, 0.043063193559646606, 0.07137089967727661, 0.09967861324548721, 0.12798631191253662, 0.15629403293132782, 0.18460173904895782, 0.21290944516658783, 0.24121715128421783, 0.26952487230300903, 0.29783257842063904, 0.32614028453826904, 0.35444799065589905, 0.38275569677352905, 0.41106340289115906, 0.43937110900878906, 0.46767881512641907, 0.4959865212440491, 0.5242942571640015, 0.5526019334793091, 0.5809096693992615, 0.6092173457145691, 0.6375250816345215, 0.6658327579498291, 0.6941404938697815, 0.7224482297897339, 0.7507559061050415, 0.7790636420249939, 0.8073713183403015, 0.8356790542602539, 0.8639867305755615, 0.8922944664955139, 0.9206021428108215]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 7.0, 5.0, 10.0, 7.0, 21.0, 20.0, 26.0, 31.0, 32.0, 27.0, 45.0, 50.0, 51.0, 52.0, 68.0, 73.0, 58.0, 60.0, 50.0, 57.0, 49.0, 42.0, 36.0, 31.0, 27.0, 18.0, 17.0, 12.0, 8.0, 5.0, 4.0, 3.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6114271283149719, -0.589939296245575, -0.5684515237808228, -0.5469636917114258, -0.5254758596420288, -0.5039880871772766, -0.48250025510787964, -0.46101245284080505, -0.43952465057373047, -0.4180368483066559, -0.3965490162372589, -0.3750612139701843, -0.35357341170310974, -0.33208560943603516, -0.3105977773666382, -0.2891099750995636, -0.2676221430301666, -0.24613432586193085, -0.22464652359485626, -0.20315870642662048, -0.1816709041595459, -0.16018308699131012, -0.13869526982307434, -0.11720746755599976, -0.09571965038776398, -0.0742318406701088, -0.052744027227163315, -0.031256213784217834, -0.009768404066562653, 0.01171940565109253, 0.03320722281932831, 0.05469502508640289, 0.07618284225463867, 0.09767065197229385, 0.11915846168994904, 0.14064627885818481, 0.1621340811252594, 0.18362189829349518, 0.20510971546173096, 0.22659751772880554, 0.24808533489704132, 0.2695731520652771, 0.2910609543323517, 0.31254875659942627, 0.33403658866882324, 0.3555243909358978, 0.3770121932029724, 0.3985000252723694, 0.41998782753944397, 0.44147562980651855, 0.4629634618759155, 0.4844512641429901, 0.5059390664100647, 0.5274268984794617, 0.5489146709442139, 0.5704025030136108, 0.5918903350830078, 0.6133781671524048, 0.634865939617157, 0.656353771686554, 0.6778416037559509, 0.6993293762207031, 0.7208172082901001, 0.7423050403594971, 0.7637928128242493]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 11.0, 12.0, 20.0, 24.0, 35.0, 56.0, 91.0, 158.0, 349.0, 706.0, 1901.0, 4919.0, 16913.0, 62855.0, 529176.0, 356680.0, 53040.0, 14244.0, 4432.0, 1572.0, 652.0, 300.0, 171.0, 87.0, 57.0, 31.0, 21.0, 15.0, 7.0, 5.0, 6.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2283935546875, -0.21843528747558594, -0.20847702026367188, -0.1985187530517578, -0.18856048583984375, -0.1786022186279297, -0.16864395141601562, -0.15868568420410156, -0.1487274169921875, -0.13876914978027344, -0.12881088256835938, -0.11885261535644531, -0.10889434814453125, -0.09893608093261719, -0.08897781372070312, -0.07901954650878906, -0.069061279296875, -0.05910301208496094, -0.049144744873046875, -0.03918647766113281, -0.02922821044921875, -0.019269943237304688, -0.009311676025390625, 0.0006465911865234375, 0.0106048583984375, 0.020563125610351562, 0.030521392822265625, 0.04047966003417969, 0.05043792724609375, 0.06039619445800781, 0.07035446166992188, 0.08031272888183594, 0.09027099609375, 0.10022926330566406, 0.11018753051757812, 0.12014579772949219, 0.13010406494140625, 0.1400623321533203, 0.15002059936523438, 0.15997886657714844, 0.1699371337890625, 0.17989540100097656, 0.18985366821289062, 0.1998119354248047, 0.20977020263671875, 0.2197284698486328, 0.22968673706054688, 0.23964500427246094, 0.249603271484375, 0.25956153869628906, 0.2695198059082031, 0.2794780731201172, 0.28943634033203125, 0.2993946075439453, 0.3093528747558594, 0.31931114196777344, 0.3292694091796875, 0.33922767639160156, 0.3491859436035156, 0.3591442108154297, 0.36910247802734375, 0.3790607452392578, 0.3890190124511719, 0.39897727966308594, 0.408935546875]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 6.0, 4.0, 8.0, 10.0, 14.0, 16.0, 25.0, 35.0, 39.0, 46.0, 62.0, 60.0, 71.0, 79.0, 65.0, 57.0, 64.0, 71.0, 44.0, 47.0, 44.0, 34.0, 34.0, 27.0, 13.0, 10.0, 7.0, 8.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.06378173828125, -0.062213897705078125, -0.06064605712890625, -0.059078216552734375, -0.0575103759765625, -0.055942535400390625, -0.05437469482421875, -0.052806854248046875, -0.051239013671875, -0.049671173095703125, -0.04810333251953125, -0.046535491943359375, -0.0449676513671875, -0.043399810791015625, -0.04183197021484375, -0.040264129638671875, -0.0386962890625, -0.037128448486328125, -0.03556060791015625, -0.033992767333984375, -0.0324249267578125, -0.030857086181640625, -0.02928924560546875, -0.027721405029296875, -0.026153564453125, -0.024585723876953125, -0.02301788330078125, -0.021450042724609375, -0.0198822021484375, -0.018314361572265625, -0.01674652099609375, -0.015178680419921875, -0.01361083984375, -0.012042999267578125, -0.01047515869140625, -0.008907318115234375, -0.0073394775390625, -0.005771636962890625, -0.00420379638671875, -0.002635955810546875, -0.001068115234375, 0.000499725341796875, 0.00206756591796875, 0.003635406494140625, 0.0052032470703125, 0.006771087646484375, 0.00833892822265625, 0.009906768798828125, 0.011474609375, 0.013042449951171875, 0.01461029052734375, 0.016178131103515625, 0.0177459716796875, 0.019313812255859375, 0.02088165283203125, 0.022449493408203125, 0.024017333984375, 0.025585174560546875, 0.02715301513671875, 0.028720855712890625, 0.0302886962890625, 0.031856536865234375, 0.03342437744140625, 0.034992218017578125, 0.03656005859375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 8.0, 8.0, 21.0, 21.0, 43.0, 89.0, 122.0, 276.0, 603.0, 1935.0, 11487.0, 202420.0, 802796.0, 24191.0, 2953.0, 862.0, 319.0, 182.0, 90.0, 48.0, 27.0, 20.0, 15.0, 7.0, 5.0, 0.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.73291015625, -0.7120590209960938, -0.6912078857421875, -0.6703567504882812, -0.649505615234375, -0.6286544799804688, -0.6078033447265625, -0.5869522094726562, -0.56610107421875, -0.5452499389648438, -0.5243988037109375, -0.5035476684570312, -0.482696533203125, -0.46184539794921875, -0.4409942626953125, -0.42014312744140625, -0.3992919921875, -0.37844085693359375, -0.3575897216796875, -0.33673858642578125, -0.315887451171875, -0.29503631591796875, -0.2741851806640625, -0.25333404541015625, -0.23248291015625, -0.21163177490234375, -0.1907806396484375, -0.16992950439453125, -0.149078369140625, -0.12822723388671875, -0.1073760986328125, -0.08652496337890625, -0.065673828125, -0.04482269287109375, -0.0239715576171875, -0.00312042236328125, 0.017730712890625, 0.03858184814453125, 0.0594329833984375, 0.08028411865234375, 0.10113525390625, 0.12198638916015625, 0.1428375244140625, 0.16368865966796875, 0.184539794921875, 0.20539093017578125, 0.2262420654296875, 0.24709320068359375, 0.2679443359375, 0.28879547119140625, 0.3096466064453125, 0.33049774169921875, 0.351348876953125, 0.37220001220703125, 0.3930511474609375, 0.41390228271484375, 0.43475341796875, 0.45560455322265625, 0.4764556884765625, 0.49730682373046875, 0.518157958984375, 0.5390090942382812, 0.5598602294921875, 0.5807113647460938, 0.6015625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 5.0, 2.0, 4.0, 8.0, 13.0, 15.0, 24.0, 32.0, 28.0, 33.0, 33.0, 45.0, 60.0, 39.0, 55.0, 63.0, 48.0, 62.0, 67.0, 64.0, 64.0, 48.0, 24.0, 34.0, 24.0, 27.0, 28.0, 17.0, 19.0, 6.0, 6.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2178955078125, -0.21079444885253906, -0.20369338989257812, -0.1965923309326172, -0.18949127197265625, -0.1823902130126953, -0.17528915405273438, -0.16818809509277344, -0.1610870361328125, -0.15398597717285156, -0.14688491821289062, -0.1397838592529297, -0.13268280029296875, -0.1255817413330078, -0.11848068237304688, -0.11137962341308594, -0.104278564453125, -0.09717750549316406, -0.09007644653320312, -0.08297538757324219, -0.07587432861328125, -0.06877326965332031, -0.061672210693359375, -0.05457115173339844, -0.0474700927734375, -0.04036903381347656, -0.033267974853515625, -0.026166915893554688, -0.01906585693359375, -0.011964797973632812, -0.004863739013671875, 0.0022373199462890625, 0.00933837890625, 0.016439437866210938, 0.023540496826171875, 0.030641555786132812, 0.03774261474609375, 0.04484367370605469, 0.051944732666015625, 0.05904579162597656, 0.0661468505859375, 0.07324790954589844, 0.08034896850585938, 0.08745002746582031, 0.09455108642578125, 0.10165214538574219, 0.10875320434570312, 0.11585426330566406, 0.122955322265625, 0.13005638122558594, 0.13715744018554688, 0.1442584991455078, 0.15135955810546875, 0.1584606170654297, 0.16556167602539062, 0.17266273498535156, 0.1797637939453125, 0.18686485290527344, 0.19396591186523438, 0.2010669708251953, 0.20816802978515625, 0.2152690887451172, 0.22237014770507812, 0.22947120666503906, 0.236572265625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 4.0, 11.0, 12.0, 25.0, 31.0, 69.0, 151.0, 272.0, 560.0, 1473.0, 4105.0, 14944.0, 86747.0, 853791.0, 67543.0, 12788.0, 3663.0, 1329.0, 516.0, 241.0, 107.0, 65.0, 37.0, 24.0, 18.0, 10.0, 6.0, 4.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.353271484375, -0.340850830078125, -0.32843017578125, -0.316009521484375, -0.3035888671875, -0.291168212890625, -0.27874755859375, -0.266326904296875, -0.25390625, -0.241485595703125, -0.22906494140625, -0.216644287109375, -0.2042236328125, -0.191802978515625, -0.17938232421875, -0.166961669921875, -0.154541015625, -0.142120361328125, -0.12969970703125, -0.117279052734375, -0.1048583984375, -0.092437744140625, -0.08001708984375, -0.067596435546875, -0.05517578125, -0.042755126953125, -0.03033447265625, -0.017913818359375, -0.0054931640625, 0.006927490234375, 0.01934814453125, 0.031768798828125, 0.044189453125, 0.056610107421875, 0.06903076171875, 0.081451416015625, 0.0938720703125, 0.106292724609375, 0.11871337890625, 0.131134033203125, 0.1435546875, 0.155975341796875, 0.16839599609375, 0.180816650390625, 0.1932373046875, 0.205657958984375, 0.21807861328125, 0.230499267578125, 0.242919921875, 0.255340576171875, 0.26776123046875, 0.280181884765625, 0.2926025390625, 0.305023193359375, 0.31744384765625, 0.329864501953125, 0.34228515625, 0.354705810546875, 0.36712646484375, 0.379547119140625, 0.3919677734375, 0.404388427734375, 0.41680908203125, 0.429229736328125, 0.441650390625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 5.0, 6.0, 20.0, 12.0, 22.0, 34.0, 37.0, 52.0, 77.0, 100.0, 119.0, 109.0, 95.0, 94.0, 64.0, 40.0, 29.0, 19.0, 19.0, 10.0, 10.0, 6.0, 4.0, 4.0, 1.0, 2.0, 5.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.00011110305786132812, -0.00010819640010595322, -0.00010528974235057831, -0.0001023830845952034, -9.947642683982849e-05, -9.656976908445358e-05, -9.366311132907867e-05, -9.075645357370377e-05, -8.784979581832886e-05, -8.494313806295395e-05, -8.203648030757904e-05, -7.912982255220413e-05, -7.622316479682922e-05, -7.331650704145432e-05, -7.04098492860794e-05, -6.75031915307045e-05, -6.459653377532959e-05, -6.168987601995468e-05, -5.878321826457977e-05, -5.5876560509204865e-05, -5.2969902753829956e-05, -5.006324499845505e-05, -4.715658724308014e-05, -4.424992948770523e-05, -4.134327173233032e-05, -3.8436613976955414e-05, -3.5529956221580505e-05, -3.26232984662056e-05, -2.971664071083069e-05, -2.680998295545578e-05, -2.390332520008087e-05, -2.0996667444705963e-05, -1.8090009689331055e-05, -1.5183351933956146e-05, -1.2276694178581238e-05, -9.37003642320633e-06, -6.463378667831421e-06, -3.5567209124565125e-06, -6.50063157081604e-07, 2.2565945982933044e-06, 5.163252353668213e-06, 8.069910109043121e-06, 1.097656786441803e-05, 1.3883225619792938e-05, 1.6789883375167847e-05, 1.9696541130542755e-05, 2.2603198885917664e-05, 2.5509856641292572e-05, 2.841651439666748e-05, 3.132317215204239e-05, 3.42298299074173e-05, 3.7136487662792206e-05, 4.0043145418167114e-05, 4.294980317354202e-05, 4.585646092891693e-05, 4.876311868429184e-05, 5.166977643966675e-05, 5.4576434195041656e-05, 5.7483091950416565e-05, 6.0389749705791473e-05, 6.329640746116638e-05, 6.620306521654129e-05, 6.91097229719162e-05, 7.201638072729111e-05, 7.492303848266602e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 10.0, 10.0, 28.0, 44.0, 111.0, 269.0, 743.0, 3287.0, 33080.0, 951941.0, 53060.0, 4528.0, 905.0, 315.0, 115.0, 52.0, 21.0, 8.0, 9.0, 7.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.72998046875, -0.7088699340820312, -0.6877593994140625, -0.6666488647460938, -0.645538330078125, -0.6244277954101562, -0.6033172607421875, -0.5822067260742188, -0.56109619140625, -0.5399856567382812, -0.5188751220703125, -0.49776458740234375, -0.476654052734375, -0.45554351806640625, -0.4344329833984375, -0.41332244873046875, -0.3922119140625, -0.37110137939453125, -0.3499908447265625, -0.32888031005859375, -0.307769775390625, -0.28665924072265625, -0.2655487060546875, -0.24443817138671875, -0.22332763671875, -0.20221710205078125, -0.1811065673828125, -0.15999603271484375, -0.138885498046875, -0.11777496337890625, -0.0966644287109375, -0.07555389404296875, -0.054443359375, -0.03333282470703125, -0.0122222900390625, 0.00888824462890625, 0.029998779296875, 0.05110931396484375, 0.0722198486328125, 0.09333038330078125, 0.11444091796875, 0.13555145263671875, 0.1566619873046875, 0.17777252197265625, 0.198883056640625, 0.21999359130859375, 0.2411041259765625, 0.26221466064453125, 0.2833251953125, 0.30443572998046875, 0.3255462646484375, 0.34665679931640625, 0.367767333984375, 0.38887786865234375, 0.4099884033203125, 0.43109893798828125, 0.45220947265625, 0.47332000732421875, 0.4944305419921875, 0.5155410766601562, 0.536651611328125, 0.5577621459960938, 0.5788726806640625, 0.5999832153320312, 0.62109375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 7.0, 8.0, 14.0, 26.0, 21.0, 35.0, 58.0, 289.0, 339.0, 101.0, 36.0, 27.0, 21.0, 6.0, 8.0, 6.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.419189453125, -0.40819549560546875, -0.3972015380859375, -0.38620758056640625, -0.375213623046875, -0.36421966552734375, -0.3532257080078125, -0.34223175048828125, -0.33123779296875, -0.32024383544921875, -0.3092498779296875, -0.29825592041015625, -0.287261962890625, -0.27626800537109375, -0.2652740478515625, -0.25428009033203125, -0.2432861328125, -0.23229217529296875, -0.2212982177734375, -0.21030426025390625, -0.199310302734375, -0.18831634521484375, -0.1773223876953125, -0.16632843017578125, -0.15533447265625, -0.14434051513671875, -0.1333465576171875, -0.12235260009765625, -0.111358642578125, -0.10036468505859375, -0.0893707275390625, -0.07837677001953125, -0.0673828125, -0.05638885498046875, -0.0453948974609375, -0.03440093994140625, -0.023406982421875, -0.01241302490234375, -0.0014190673828125, 0.00957489013671875, 0.02056884765625, 0.03156280517578125, 0.0425567626953125, 0.05355072021484375, 0.064544677734375, 0.07553863525390625, 0.0865325927734375, 0.09752655029296875, 0.1085205078125, 0.11951446533203125, 0.1305084228515625, 0.14150238037109375, 0.152496337890625, 0.16349029541015625, 0.1744842529296875, 0.18547821044921875, 0.19647216796875, 0.20746612548828125, 0.2184600830078125, 0.22945404052734375, 0.240447998046875, 0.25144195556640625, 0.2624359130859375, 0.27342987060546875, 0.284423828125]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 5.0, 2.0, 13.0, 18.0, 25.0, 35.0, 54.0, 70.0, 90.0, 83.0, 100.0, 93.0, 93.0, 91.0, 64.0, 55.0, 30.0, 27.0, 16.0, 9.0, 10.0, 4.0, 7.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1051135063171387, -2.050590753555298, -1.996067762374878, -1.9415448904037476, -1.8870220184326172, -1.8324991464614868, -1.7779762744903564, -1.7234535217285156, -1.6689305305480957, -1.6144076585769653, -1.559884786605835, -1.5053619146347046, -1.4508390426635742, -1.3963161706924438, -1.3417932987213135, -1.2872705459594727, -1.2327476739883423, -1.178224802017212, -1.1237019300460815, -1.0691790580749512, -1.0146561861038208, -0.9601333141326904, -0.9056105017662048, -0.8510876297950745, -0.7965647578239441, -0.7420418858528137, -0.6875190138816833, -0.6329962015151978, -0.5784733295440674, -0.523950457572937, -0.46942758560180664, -0.41490471363067627, -0.3603818416595459, -0.3058589696884155, -0.25133609771728516, -0.19681325554847717, -0.1422903835773468, -0.08776751160621643, -0.03324466943740845, 0.021278202533721924, 0.0758010745048523, 0.13032394647598267, 0.18484680354595184, 0.23936966061592102, 0.2938925325870514, 0.34841540455818176, 0.40293824672698975, 0.4574611186981201, 0.5119839906692505, 0.5665068626403809, 0.6210297346115112, 0.6755526065826416, 0.730075478553772, 0.7845983505249023, 0.8391211628913879, 0.8936440348625183, 0.9481669068336487, 1.0026897192001343, 1.0572125911712646, 1.111735463142395, 1.1662583351135254, 1.2207812070846558, 1.2753040790557861, 1.3298269510269165, 1.3843498229980469]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 4.0, 2.0, 7.0, 8.0, 8.0, 18.0, 12.0, 16.0, 19.0, 27.0, 23.0, 25.0, 38.0, 38.0, 42.0, 42.0, 59.0, 46.0, 52.0, 47.0, 52.0, 44.0, 39.0, 47.0, 39.0, 47.0, 35.0, 29.0, 25.0, 22.0, 18.0, 10.0, 16.0, 10.0, 6.0, 8.0, 8.0, 4.0, 2.0, 8.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.0756940841674805, -1.0431574583053589, -1.0106208324432373, -0.9780842065811157, -0.9455475807189941, -0.9130109548568726, -0.880474328994751, -0.8479377031326294, -0.8154010772705078, -0.7828644514083862, -0.7503278255462646, -0.7177911996841431, -0.6852545738220215, -0.6527179479598999, -0.6201813220977783, -0.5876446962356567, -0.5551080703735352, -0.5225714445114136, -0.490034818649292, -0.4574981927871704, -0.42496156692504883, -0.39242494106292725, -0.35988831520080566, -0.3273516893386841, -0.2948150634765625, -0.2622784376144409, -0.22974181175231934, -0.19720518589019775, -0.16466856002807617, -0.1321319341659546, -0.09959530830383301, -0.06705868244171143, -0.03452193737030029, -0.001985311508178711, 0.03055131435394287, 0.06308794021606445, 0.09562456607818604, 0.12816119194030762, 0.1606978178024292, 0.19323444366455078, 0.22577106952667236, 0.25830769538879395, 0.2908443212509155, 0.3233809471130371, 0.3559175729751587, 0.3884541988372803, 0.42099082469940186, 0.45352745056152344, 0.486064076423645, 0.5186007022857666, 0.5511373281478882, 0.5836739540100098, 0.6162105798721313, 0.6487472057342529, 0.6812838315963745, 0.7138204574584961, 0.7463570833206177, 0.7788937091827393, 0.8114303350448608, 0.8439669609069824, 0.876503586769104, 0.9090402126312256, 0.9415768384933472, 0.9741134643554688, 1.0066500902175903]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 11.0, 10.0, 15.0, 22.0, 35.0, 49.0, 80.0, 110.0, 214.0, 399.0, 776.0, 1791.0, 4683.0, 15552.0, 78816.0, 3801006.0, 247783.0, 30342.0, 7955.0, 2671.0, 967.0, 447.0, 221.0, 138.0, 71.0, 41.0, 30.0, 14.0, 16.0, 6.0, 4.0, 1.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.417236328125, -0.4031982421875, -0.38916015625, -0.3751220703125, -0.361083984375, -0.3470458984375, -0.3330078125, -0.3189697265625, -0.304931640625, -0.2908935546875, -0.27685546875, -0.2628173828125, -0.248779296875, -0.2347412109375, -0.220703125, -0.2066650390625, -0.192626953125, -0.1785888671875, -0.16455078125, -0.1505126953125, -0.136474609375, -0.1224365234375, -0.1083984375, -0.0943603515625, -0.080322265625, -0.0662841796875, -0.05224609375, -0.0382080078125, -0.024169921875, -0.0101318359375, 0.00390625, 0.0179443359375, 0.031982421875, 0.0460205078125, 0.06005859375, 0.0740966796875, 0.088134765625, 0.1021728515625, 0.1162109375, 0.1302490234375, 0.144287109375, 0.1583251953125, 0.17236328125, 0.1864013671875, 0.200439453125, 0.2144775390625, 0.228515625, 0.2425537109375, 0.256591796875, 0.2706298828125, 0.28466796875, 0.2987060546875, 0.312744140625, 0.3267822265625, 0.3408203125, 0.3548583984375, 0.368896484375, 0.3829345703125, 0.39697265625, 0.4110107421875, 0.425048828125, 0.4390869140625, 0.453125, 0.4671630859375, 0.481201171875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 2.0, 3.0, 5.0, 13.0, 16.0, 19.0, 26.0, 42.0, 45.0, 52.0, 60.0, 78.0, 73.0, 77.0, 80.0, 77.0, 75.0, 59.0, 44.0, 53.0, 30.0, 18.0, 17.0, 15.0, 13.0, 4.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07183837890625, -0.06993675231933594, -0.06803512573242188, -0.06613349914550781, -0.06423187255859375, -0.06233024597167969, -0.060428619384765625, -0.05852699279785156, -0.0566253662109375, -0.05472373962402344, -0.052822113037109375, -0.05092048645019531, -0.04901885986328125, -0.04711723327636719, -0.045215606689453125, -0.04331398010253906, -0.041412353515625, -0.03951072692871094, -0.037609100341796875, -0.03570747375488281, -0.03380584716796875, -0.03190422058105469, -0.030002593994140625, -0.028100967407226562, -0.0261993408203125, -0.024297714233398438, -0.022396087646484375, -0.020494461059570312, -0.01859283447265625, -0.016691207885742188, -0.014789581298828125, -0.012887954711914062, -0.010986328125, -0.009084701538085938, -0.007183074951171875, -0.0052814483642578125, -0.00337982177734375, -0.0014781951904296875, 0.000423431396484375, 0.0023250579833984375, 0.0042266845703125, 0.0061283111572265625, 0.008029937744140625, 0.009931564331054688, 0.01183319091796875, 0.013734817504882812, 0.015636444091796875, 0.017538070678710938, 0.019439697265625, 0.021341323852539062, 0.023242950439453125, 0.025144577026367188, 0.02704620361328125, 0.028947830200195312, 0.030849456787109375, 0.03275108337402344, 0.0346527099609375, 0.03655433654785156, 0.038455963134765625, 0.04035758972167969, 0.04225921630859375, 0.04416084289550781, 0.046062469482421875, 0.04796409606933594, 0.04986572265625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 6.0, 7.0, 14.0, 12.0, 24.0, 59.0, 67.0, 111.0, 213.0, 355.0, 648.0, 1315.0, 2792.0, 6601.0, 19127.0, 72355.0, 1124808.0, 2847077.0, 84126.0, 21497.0, 7211.0, 2878.0, 1391.0, 713.0, 359.0, 179.0, 111.0, 89.0, 51.0, 37.0, 20.0, 9.0, 11.0, 10.0, 5.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3291015625, -0.3154144287109375, -0.301727294921875, -0.2880401611328125, -0.27435302734375, -0.2606658935546875, -0.246978759765625, -0.2332916259765625, -0.2196044921875, -0.2059173583984375, -0.192230224609375, -0.1785430908203125, -0.16485595703125, -0.1511688232421875, -0.137481689453125, -0.1237945556640625, -0.110107421875, -0.0964202880859375, -0.082733154296875, -0.0690460205078125, -0.05535888671875, -0.0416717529296875, -0.027984619140625, -0.0142974853515625, -0.0006103515625, 0.0130767822265625, 0.026763916015625, 0.0404510498046875, 0.05413818359375, 0.0678253173828125, 0.081512451171875, 0.0951995849609375, 0.10888671875, 0.1225738525390625, 0.136260986328125, 0.1499481201171875, 0.16363525390625, 0.1773223876953125, 0.191009521484375, 0.2046966552734375, 0.2183837890625, 0.2320709228515625, 0.245758056640625, 0.2594451904296875, 0.27313232421875, 0.2868194580078125, 0.300506591796875, 0.3141937255859375, 0.327880859375, 0.3415679931640625, 0.355255126953125, 0.3689422607421875, 0.38262939453125, 0.3963165283203125, 0.410003662109375, 0.4236907958984375, 0.4373779296875, 0.4510650634765625, 0.464752197265625, 0.4784393310546875, 0.49212646484375, 0.5058135986328125, 0.519500732421875, 0.5331878662109375, 0.546875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 4.0, 7.0, 12.0, 17.0, 18.0, 23.0, 23.0, 36.0, 69.0, 83.0, 163.0, 515.0, 2145.0, 486.0, 167.0, 84.0, 67.0, 30.0, 34.0, 25.0, 21.0, 12.0, 6.0, 10.0, 2.0, 4.0, 2.0, 3.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.170654296875, -0.1655559539794922, -0.16045761108398438, -0.15535926818847656, -0.15026092529296875, -0.14516258239746094, -0.14006423950195312, -0.1349658966064453, -0.1298675537109375, -0.12476921081542969, -0.11967086791992188, -0.11457252502441406, -0.10947418212890625, -0.10437583923339844, -0.09927749633789062, -0.09417915344238281, -0.089080810546875, -0.08398246765136719, -0.07888412475585938, -0.07378578186035156, -0.06868743896484375, -0.06358909606933594, -0.058490753173828125, -0.05339241027832031, -0.0482940673828125, -0.04319572448730469, -0.038097381591796875, -0.03299903869628906, -0.02790069580078125, -0.022802352905273438, -0.017704010009765625, -0.012605667114257812, -0.00750732421875, -0.0024089813232421875, 0.002689361572265625, 0.0077877044677734375, 0.01288604736328125, 0.017984390258789062, 0.023082733154296875, 0.028181076049804688, 0.0332794189453125, 0.03837776184082031, 0.043476104736328125, 0.04857444763183594, 0.05367279052734375, 0.05877113342285156, 0.06386947631835938, 0.06896781921386719, 0.074066162109375, 0.07916450500488281, 0.08426284790039062, 0.08936119079589844, 0.09445953369140625, 0.09955787658691406, 0.10465621948242188, 0.10975456237792969, 0.1148529052734375, 0.11995124816894531, 0.12504959106445312, 0.13014793395996094, 0.13524627685546875, 0.14034461975097656, 0.14544296264648438, 0.1505413055419922, 0.1556396484375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 8.0, 20.0, 57.0, 123.0, 249.0, 261.0, 153.0, 90.0, 20.0, 12.0, 10.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2433688640594482, -1.1813781261444092, -1.1193873882293701, -1.0573965311050415, -0.9954057931900024, -0.9334150552749634, -0.8714243173599243, -0.8094335198402405, -0.7474427223205566, -0.6854519844055176, -0.6234611868858337, -0.5614704489707947, -0.49947965145111084, -0.4374889135360718, -0.3754981458187103, -0.3135073781013489, -0.2515166401863098, -0.18952587246894836, -0.12753510475158691, -0.06554435193538666, -0.0035535842180252075, 0.05843716859817505, 0.1204279363155365, 0.18241870403289795, 0.2444094717502594, 0.30640023946762085, 0.3683910071849823, 0.43038177490234375, 0.4923725128173828, 0.5543632507324219, 0.6163540482521057, 0.6783448457717896, 0.7403355836868286, 0.8023263216018677, 0.8643171191215515, 0.9263078570365906, 0.9882986545562744, 1.0502893924713135, 1.1122801303863525, 1.1742708683013916, 1.2362617254257202, 1.2982524633407593, 1.3602432012557983, 1.422234058380127, 1.484224796295166, 1.546215534210205, 1.6082062721252441, 1.6701970100402832, 1.7321877479553223, 1.7941784858703613, 1.8561692237854004, 1.918160080909729, 1.980150818824768, 2.0421414375305176, 2.1041324138641357, 2.166123151779175, 2.228113889694214, 2.290104627609253, 2.352095365524292, 2.414086103439331, 2.47607684135437, 2.5380678176879883, 2.6000585556030273, 2.6620492935180664, 2.7240400314331055]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 6.0, 12.0, 3.0, 10.0, 10.0, 14.0, 15.0, 14.0, 30.0, 24.0, 32.0, 32.0, 29.0, 34.0, 41.0, 35.0, 49.0, 54.0, 40.0, 50.0, 55.0, 36.0, 37.0, 27.0, 31.0, 45.0, 30.0, 30.0, 25.0, 13.0, 19.0, 20.0, 11.0, 20.0, 19.0, 7.0, 11.0, 7.0, 11.0, 3.0, 3.0, 2.0, 2.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.47076505422592163, -0.4563966989517212, -0.44202831387519836, -0.4276599586009979, -0.4132915735244751, -0.39892321825027466, -0.3845548629760742, -0.3701864778995514, -0.35581812262535095, -0.3414497673511505, -0.3270813822746277, -0.31271302700042725, -0.2983446419239044, -0.283976286649704, -0.26960790157318115, -0.2552395462989807, -0.24087117612361908, -0.22650280594825745, -0.2121344357728958, -0.19776606559753418, -0.18339771032333374, -0.1690293401479721, -0.15466096997261047, -0.14029261469841003, -0.1259242296218872, -0.11155585944652557, -0.09718749672174454, -0.0828191265463829, -0.06845076382160187, -0.054082393646240234, -0.0397140234708786, -0.025345660746097565, -0.010977298021316528, 0.003391069360077381, 0.01775943674147129, 0.032127805054187775, 0.04649617150425911, 0.060864537954330444, 0.07523290812969208, 0.08960127085447311, 0.10396964102983475, 0.11833801120519638, 0.13270637392997742, 0.14707474410533905, 0.16144311428070068, 0.17581146955490112, 0.19017985463142395, 0.2045482099056244, 0.21891658008098602, 0.23328495025634766, 0.2476533204317093, 0.2620216906070709, 0.27639004588127136, 0.2907584309577942, 0.30512678623199463, 0.31949514150619507, 0.3338635265827179, 0.34823188185691833, 0.36260026693344116, 0.3769686222076416, 0.39133700728416443, 0.40570536255836487, 0.4200737476348877, 0.43444210290908813, 0.4488104581832886]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 5.0, 4.0, 2.0, 8.0, 19.0, 19.0, 43.0, 42.0, 70.0, 128.0, 270.0, 688.0, 2159.0, 7836.0, 30892.0, 188867.0, 737570.0, 59393.0, 14745.0, 3794.0, 1117.0, 408.0, 207.0, 98.0, 63.0, 38.0, 21.0, 22.0, 12.0, 9.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.337890625, -0.32671356201171875, -0.3155364990234375, -0.30435943603515625, -0.293182373046875, -0.28200531005859375, -0.2708282470703125, -0.25965118408203125, -0.24847412109375, -0.23729705810546875, -0.2261199951171875, -0.21494293212890625, -0.203765869140625, -0.19258880615234375, -0.1814117431640625, -0.17023468017578125, -0.1590576171875, -0.14788055419921875, -0.1367034912109375, -0.12552642822265625, -0.114349365234375, -0.10317230224609375, -0.0919952392578125, -0.08081817626953125, -0.06964111328125, -0.05846405029296875, -0.0472869873046875, -0.03610992431640625, -0.024932861328125, -0.01375579833984375, -0.0025787353515625, 0.00859832763671875, 0.019775390625, 0.03095245361328125, 0.0421295166015625, 0.05330657958984375, 0.064483642578125, 0.07566070556640625, 0.0868377685546875, 0.09801483154296875, 0.10919189453125, 0.12036895751953125, 0.1315460205078125, 0.14272308349609375, 0.153900146484375, 0.16507720947265625, 0.1762542724609375, 0.18743133544921875, 0.1986083984375, 0.20978546142578125, 0.2209625244140625, 0.23213958740234375, 0.243316650390625, 0.25449371337890625, 0.2656707763671875, 0.27684783935546875, 0.28802490234375, 0.29920196533203125, 0.3103790283203125, 0.32155609130859375, 0.332733154296875, 0.34391021728515625, 0.3550872802734375, 0.36626434326171875, 0.37744140625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 6.0, 5.0, 9.0, 11.0, 6.0, 19.0, 22.0, 32.0, 49.0, 64.0, 73.0, 67.0, 85.0, 76.0, 75.0, 84.0, 72.0, 55.0, 43.0, 46.0, 29.0, 28.0, 18.0, 8.0, 12.0, 4.0, 7.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0953369140625, -0.09305763244628906, -0.09077835083007812, -0.08849906921386719, -0.08621978759765625, -0.08394050598144531, -0.08166122436523438, -0.07938194274902344, -0.0771026611328125, -0.07482337951660156, -0.07254409790039062, -0.07026481628417969, -0.06798553466796875, -0.06570625305175781, -0.06342697143554688, -0.06114768981933594, -0.058868408203125, -0.05658912658691406, -0.054309844970703125, -0.05203056335449219, -0.04975128173828125, -0.04747200012207031, -0.045192718505859375, -0.04291343688964844, -0.0406341552734375, -0.03835487365722656, -0.036075592041015625, -0.03379631042480469, -0.03151702880859375, -0.029237747192382812, -0.026958465576171875, -0.024679183959960938, -0.02239990234375, -0.020120620727539062, -0.017841339111328125, -0.015562057495117188, -0.01328277587890625, -0.011003494262695312, -0.008724212646484375, -0.0064449310302734375, -0.0041656494140625, -0.0018863677978515625, 0.000392913818359375, 0.0026721954345703125, 0.00495147705078125, 0.0072307586669921875, 0.009510040283203125, 0.011789321899414062, 0.014068603515625, 0.016347885131835938, 0.018627166748046875, 0.020906448364257812, 0.02318572998046875, 0.025465011596679688, 0.027744293212890625, 0.030023574829101562, 0.0323028564453125, 0.03458213806152344, 0.036861419677734375, 0.03914070129394531, 0.04141998291015625, 0.04369926452636719, 0.045978546142578125, 0.04825782775878906, 0.050537109375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 5.0, 8.0, 5.0, 10.0, 23.0, 30.0, 42.0, 82.0, 150.0, 330.0, 870.0, 2752.0, 11652.0, 56269.0, 814091.0, 133282.0, 21833.0, 4870.0, 1322.0, 433.0, 239.0, 118.0, 50.0, 32.0, 24.0, 13.0, 7.0, 15.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.429931640625, -0.41678619384765625, -0.4036407470703125, -0.39049530029296875, -0.377349853515625, -0.36420440673828125, -0.3510589599609375, -0.33791351318359375, -0.32476806640625, -0.31162261962890625, -0.2984771728515625, -0.28533172607421875, -0.272186279296875, -0.25904083251953125, -0.2458953857421875, -0.23274993896484375, -0.2196044921875, -0.20645904541015625, -0.1933135986328125, -0.18016815185546875, -0.167022705078125, -0.15387725830078125, -0.1407318115234375, -0.12758636474609375, -0.11444091796875, -0.10129547119140625, -0.0881500244140625, -0.07500457763671875, -0.061859130859375, -0.04871368408203125, -0.0355682373046875, -0.02242279052734375, -0.00927734375, 0.00386810302734375, 0.0170135498046875, 0.03015899658203125, 0.043304443359375, 0.05644989013671875, 0.0695953369140625, 0.08274078369140625, 0.09588623046875, 0.10903167724609375, 0.1221771240234375, 0.13532257080078125, 0.148468017578125, 0.16161346435546875, 0.1747589111328125, 0.18790435791015625, 0.2010498046875, 0.21419525146484375, 0.2273406982421875, 0.24048614501953125, 0.253631591796875, 0.26677703857421875, 0.2799224853515625, 0.29306793212890625, 0.30621337890625, 0.31935882568359375, 0.3325042724609375, 0.34564971923828125, 0.358795166015625, 0.37194061279296875, 0.3850860595703125, 0.39823150634765625, 0.411376953125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 3.0, 4.0, 5.0, 10.0, 8.0, 14.0, 18.0, 25.0, 31.0, 42.0, 53.0, 61.0, 61.0, 70.0, 75.0, 74.0, 68.0, 77.0, 65.0, 54.0, 47.0, 34.0, 31.0, 22.0, 16.0, 16.0, 5.0, 12.0, 1.0, 3.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35693359375, -0.3458442687988281, -0.33475494384765625, -0.3236656188964844, -0.3125762939453125, -0.3014869689941406, -0.29039764404296875, -0.2793083190917969, -0.268218994140625, -0.2571296691894531, -0.24604034423828125, -0.23495101928710938, -0.2238616943359375, -0.21277236938476562, -0.20168304443359375, -0.19059371948242188, -0.17950439453125, -0.16841506958007812, -0.15732574462890625, -0.14623641967773438, -0.1351470947265625, -0.12405776977539062, -0.11296844482421875, -0.10187911987304688, -0.090789794921875, -0.07970046997070312, -0.06861114501953125, -0.057521820068359375, -0.0464324951171875, -0.035343170166015625, -0.02425384521484375, -0.013164520263671875, -0.0020751953125, 0.009014129638671875, 0.02010345458984375, 0.031192779541015625, 0.0422821044921875, 0.053371429443359375, 0.06446075439453125, 0.07555007934570312, 0.086639404296875, 0.09772872924804688, 0.10881805419921875, 0.11990737915039062, 0.1309967041015625, 0.14208602905273438, 0.15317535400390625, 0.16426467895507812, 0.17535400390625, 0.18644332885742188, 0.19753265380859375, 0.20862197875976562, 0.2197113037109375, 0.23080062866210938, 0.24188995361328125, 0.2529792785644531, 0.264068603515625, 0.2751579284667969, 0.28624725341796875, 0.2973365783691406, 0.3084259033203125, 0.3195152282714844, 0.33060455322265625, 0.3416938781738281, 0.352783203125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 5.0, 2.0, 7.0, 5.0, 18.0, 16.0, 31.0, 50.0, 65.0, 140.0, 243.0, 477.0, 925.0, 1986.0, 4297.0, 10809.0, 27812.0, 86254.0, 666063.0, 180840.0, 41957.0, 15233.0, 5917.0, 2724.0, 1246.0, 605.0, 359.0, 174.0, 114.0, 63.0, 46.0, 23.0, 14.0, 11.0, 11.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11993408203125, -0.1160268783569336, -0.11211967468261719, -0.10821247100830078, -0.10430526733398438, -0.10039806365966797, -0.09649085998535156, -0.09258365631103516, -0.08867645263671875, -0.08476924896240234, -0.08086204528808594, -0.07695484161376953, -0.07304763793945312, -0.06914043426513672, -0.06523323059082031, -0.061326026916503906, -0.0574188232421875, -0.053511619567871094, -0.04960441589355469, -0.04569721221923828, -0.041790008544921875, -0.03788280487060547, -0.03397560119628906, -0.030068397521972656, -0.02616119384765625, -0.022253990173339844, -0.018346786499023438, -0.014439582824707031, -0.010532379150390625, -0.006625175476074219, -0.0027179718017578125, 0.0011892318725585938, 0.005096435546875, 0.009003639221191406, 0.012910842895507812, 0.01681804656982422, 0.020725250244140625, 0.02463245391845703, 0.028539657592773438, 0.032446861267089844, 0.03635406494140625, 0.040261268615722656, 0.04416847229003906, 0.04807567596435547, 0.051982879638671875, 0.05589008331298828, 0.05979728698730469, 0.0637044906616211, 0.0676116943359375, 0.0715188980102539, 0.07542610168457031, 0.07933330535888672, 0.08324050903320312, 0.08714771270751953, 0.09105491638183594, 0.09496212005615234, 0.09886932373046875, 0.10277652740478516, 0.10668373107910156, 0.11059093475341797, 0.11449813842773438, 0.11840534210205078, 0.12231254577636719, 0.1262197494506836, 0.130126953125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 5.0, 6.0, 4.0, 9.0, 7.0, 15.0, 28.0, 41.0, 50.0, 100.0, 98.0, 106.0, 129.0, 120.0, 85.0, 69.0, 41.0, 26.0, 17.0, 14.0, 5.0, 12.0, 9.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.50422477722168e-05, -7.217936217784882e-05, -6.931647658348083e-05, -6.645359098911285e-05, -6.359070539474487e-05, -6.072781980037689e-05, -5.786493420600891e-05, -5.500204861164093e-05, -5.213916301727295e-05, -4.927627742290497e-05, -4.641339182853699e-05, -4.3550506234169006e-05, -4.0687620639801025e-05, -3.7824735045433044e-05, -3.4961849451065063e-05, -3.209896385669708e-05, -2.92360782623291e-05, -2.637319266796112e-05, -2.351030707359314e-05, -2.064742147922516e-05, -1.7784535884857178e-05, -1.4921650290489197e-05, -1.2058764696121216e-05, -9.195879101753235e-06, -6.332993507385254e-06, -3.470107913017273e-06, -6.07222318649292e-07, 2.255663275718689e-06, 5.11854887008667e-06, 7.981434464454651e-06, 1.0844320058822632e-05, 1.3707205653190613e-05, 1.6570091247558594e-05, 1.9432976841926575e-05, 2.2295862436294556e-05, 2.5158748030662537e-05, 2.8021633625030518e-05, 3.08845192193985e-05, 3.374740481376648e-05, 3.661029040813446e-05, 3.947317600250244e-05, 4.233606159687042e-05, 4.51989471912384e-05, 4.8061832785606384e-05, 5.0924718379974365e-05, 5.3787603974342346e-05, 5.665048956871033e-05, 5.951337516307831e-05, 6.237626075744629e-05, 6.523914635181427e-05, 6.810203194618225e-05, 7.096491754055023e-05, 7.382780313491821e-05, 7.66906887292862e-05, 7.955357432365417e-05, 8.241645991802216e-05, 8.527934551239014e-05, 8.814223110675812e-05, 9.10051167011261e-05, 9.386800229549408e-05, 9.673088788986206e-05, 9.959377348423004e-05, 0.00010245665907859802, 0.000105319544672966, 0.00010818243026733398]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 7.0, 10.0, 11.0, 15.0, 8.0, 26.0, 48.0, 45.0, 76.0, 182.0, 293.0, 601.0, 1189.0, 2534.0, 6277.0, 17559.0, 57561.0, 378121.0, 485570.0, 66351.0, 19733.0, 6882.0, 2849.0, 1253.0, 589.0, 293.0, 177.0, 104.0, 49.0, 38.0, 28.0, 19.0, 14.0, 14.0, 10.0, 5.0, 3.0, 4.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.13623046875, -0.1321086883544922, -0.12798690795898438, -0.12386512756347656, -0.11974334716796875, -0.11562156677246094, -0.11149978637695312, -0.10737800598144531, -0.1032562255859375, -0.09913444519042969, -0.09501266479492188, -0.09089088439941406, -0.08676910400390625, -0.08264732360839844, -0.07852554321289062, -0.07440376281738281, -0.070281982421875, -0.06616020202636719, -0.062038421630859375, -0.05791664123535156, -0.05379486083984375, -0.04967308044433594, -0.045551300048828125, -0.04142951965332031, -0.0373077392578125, -0.03318595886230469, -0.029064178466796875, -0.024942398071289062, -0.02082061767578125, -0.016698837280273438, -0.012577056884765625, -0.008455276489257812, -0.00433349609375, -0.0002117156982421875, 0.003910064697265625, 0.008031845092773438, 0.01215362548828125, 0.016275405883789062, 0.020397186279296875, 0.024518966674804688, 0.0286407470703125, 0.03276252746582031, 0.036884307861328125, 0.04100608825683594, 0.04512786865234375, 0.04924964904785156, 0.053371429443359375, 0.05749320983886719, 0.061614990234375, 0.06573677062988281, 0.06985855102539062, 0.07398033142089844, 0.07810211181640625, 0.08222389221191406, 0.08634567260742188, 0.09046745300292969, 0.0945892333984375, 0.09871101379394531, 0.10283279418945312, 0.10695457458496094, 0.11107635498046875, 0.11519813537597656, 0.11931991577148438, 0.12344169616699219, 0.1275634765625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 3.0, 5.0, 4.0, 8.0, 9.0, 14.0, 11.0, 17.0, 33.0, 40.0, 61.0, 103.0, 168.0, 177.0, 99.0, 71.0, 48.0, 27.0, 18.0, 23.0, 8.0, 12.0, 11.0, 5.0, 4.0, 6.0, 1.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.128173828125, -0.1244049072265625, -0.120635986328125, -0.1168670654296875, -0.11309814453125, -0.1093292236328125, -0.105560302734375, -0.1017913818359375, -0.0980224609375, -0.0942535400390625, -0.090484619140625, -0.0867156982421875, -0.08294677734375, -0.0791778564453125, -0.075408935546875, -0.0716400146484375, -0.06787109375, -0.0641021728515625, -0.060333251953125, -0.0565643310546875, -0.05279541015625, -0.0490264892578125, -0.045257568359375, -0.0414886474609375, -0.0377197265625, -0.0339508056640625, -0.030181884765625, -0.0264129638671875, -0.02264404296875, -0.0188751220703125, -0.015106201171875, -0.0113372802734375, -0.007568359375, -0.0037994384765625, -3.0517578125e-05, 0.0037384033203125, 0.00750732421875, 0.0112762451171875, 0.015045166015625, 0.0188140869140625, 0.0225830078125, 0.0263519287109375, 0.030120849609375, 0.0338897705078125, 0.03765869140625, 0.0414276123046875, 0.045196533203125, 0.0489654541015625, 0.052734375, 0.0565032958984375, 0.060272216796875, 0.0640411376953125, 0.06781005859375, 0.0715789794921875, 0.075347900390625, 0.0791168212890625, 0.0828857421875, 0.0866546630859375, 0.090423583984375, 0.0941925048828125, 0.09796142578125, 0.1017303466796875, 0.105499267578125, 0.1092681884765625, 0.113037109375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 11.0, 34.0, 67.0, 124.0, 198.0, 227.0, 156.0, 102.0, 48.0, 14.0, 11.0, 8.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5935535430908203, -3.5121028423309326, -3.430651903152466, -3.349201202392578, -3.2677502632141113, -3.1862995624542236, -3.104848861694336, -3.023397922515869, -2.9419472217559814, -2.8604965209960938, -2.779045581817627, -2.6975948810577393, -2.6161441802978516, -2.5346932411193848, -2.453242540359497, -2.3717918395996094, -2.2903409004211426, -2.208890199661255, -2.127439260482788, -2.0459885597229004, -1.9645377397537231, -1.883086919784546, -1.8016362190246582, -1.720185399055481, -1.6387345790863037, -1.5572837591171265, -1.4758329391479492, -1.3943822383880615, -1.3129314184188843, -1.231480598449707, -1.1500298976898193, -1.068579077720642, -0.9871282577514648, -0.9056774377822876, -0.8242266774177551, -0.7427759170532227, -0.6613250970840454, -0.5798742771148682, -0.4984235167503357, -0.4169727563858032, -0.335521936416626, -0.2540711462497711, -0.17262035608291626, -0.0911695659160614, -0.009718775749206543, 0.07173201441764832, 0.15318280458450317, 0.23463356494903564, 0.3160843849182129, 0.39753517508506775, 0.4789859652519226, 0.5604367256164551, 0.6418875455856323, 0.7233383655548096, 0.804789125919342, 0.8862398862838745, 0.9676907062530518, 1.049141526222229, 1.1305923461914062, 1.212043046951294, 1.2934938669204712, 1.3749446868896484, 1.4563953876495361, 1.5378462076187134, 1.6192970275878906]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 4.0, 2.0, 4.0, 3.0, 6.0, 6.0, 12.0, 12.0, 18.0, 19.0, 20.0, 29.0, 30.0, 28.0, 37.0, 35.0, 39.0, 39.0, 50.0, 54.0, 44.0, 48.0, 35.0, 46.0, 38.0, 44.0, 35.0, 33.0, 32.0, 28.0, 26.0, 30.0, 22.0, 19.0, 22.0, 12.0, 13.0, 12.0, 6.0, 1.0, 12.0, 6.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2355091571807861, -1.2025368213653564, -1.1695646047592163, -1.1365922689437866, -1.103619933128357, -1.0706475973129272, -1.037675380706787, -1.0047030448913574, -0.9717307090759277, -0.9387584328651428, -0.9057860970497131, -0.8728138208389282, -0.8398414850234985, -0.8068692088127136, -0.7738969326019287, -0.740924596786499, -0.7079523205757141, -0.6749800443649292, -0.6420077085494995, -0.6090354323387146, -0.5760630965232849, -0.5430908203125, -0.5101184844970703, -0.4771462082862854, -0.4441739022731781, -0.4112015962600708, -0.3782292902469635, -0.3452569842338562, -0.3122847080230713, -0.2793123722076416, -0.2463400959968567, -0.2133677899837494, -0.18039542436599731, -0.14742311835289001, -0.11445081979036331, -0.08147852122783661, -0.04850621521472931, -0.01553390920162201, 0.017438381910324097, 0.050410687923431396, 0.0833829939365387, 0.116355299949646, 0.1493276059627533, 0.1822998970746994, 0.2152722030878067, 0.248244509100914, 0.2812168002128601, 0.3141891062259674, 0.3471614122390747, 0.380133718252182, 0.4131060242652893, 0.4460783004760742, 0.4790506362915039, 0.5120229125022888, 0.5449951887130737, 0.5779675245285034, 0.6109398603439331, 0.643912136554718, 0.6768844723701477, 0.7098567485809326, 0.7428290843963623, 0.7758013606071472, 0.8087736368179321, 0.8417459726333618, 0.8747182488441467]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 6.0, 8.0, 14.0, 14.0, 32.0, 64.0, 106.0, 237.0, 539.0, 1495.0, 5268.0, 28271.0, 662841.0, 3449899.0, 36617.0, 6213.0, 1627.0, 568.0, 243.0, 107.0, 53.0, 24.0, 15.0, 5.0, 5.0, 7.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6376953125, -0.6178054809570312, -0.5979156494140625, -0.5780258178710938, -0.558135986328125, -0.5382461547851562, -0.5183563232421875, -0.49846649169921875, -0.47857666015625, -0.45868682861328125, -0.4387969970703125, -0.41890716552734375, -0.399017333984375, -0.37912750244140625, -0.3592376708984375, -0.33934783935546875, -0.3194580078125, -0.29956817626953125, -0.2796783447265625, -0.25978851318359375, -0.239898681640625, -0.22000885009765625, -0.2001190185546875, -0.18022918701171875, -0.16033935546875, -0.14044952392578125, -0.1205596923828125, -0.10066986083984375, -0.080780029296875, -0.06089019775390625, -0.0410003662109375, -0.02111053466796875, -0.001220703125, 0.01866912841796875, 0.0385589599609375, 0.05844879150390625, 0.078338623046875, 0.09822845458984375, 0.1181182861328125, 0.13800811767578125, 0.15789794921875, 0.17778778076171875, 0.1976776123046875, 0.21756744384765625, 0.237457275390625, 0.25734710693359375, 0.2772369384765625, 0.29712677001953125, 0.3170166015625, 0.33690643310546875, 0.3567962646484375, 0.37668609619140625, 0.396575927734375, 0.41646575927734375, 0.4363555908203125, 0.45624542236328125, 0.47613525390625, 0.49602508544921875, 0.5159149169921875, 0.5358047485351562, 0.555694580078125, 0.5755844116210938, 0.5954742431640625, 0.6153640747070312, 0.63525390625]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 7.0, 7.0, 12.0, 22.0, 18.0, 26.0, 36.0, 51.0, 51.0, 73.0, 67.0, 90.0, 83.0, 91.0, 69.0, 65.0, 50.0, 61.0, 31.0, 29.0, 25.0, 17.0, 11.0, 5.0, 9.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08447265625, -0.08215618133544922, -0.07983970642089844, -0.07752323150634766, -0.07520675659179688, -0.0728902816772461, -0.07057380676269531, -0.06825733184814453, -0.06594085693359375, -0.06362438201904297, -0.06130790710449219, -0.058991432189941406, -0.056674957275390625, -0.054358482360839844, -0.05204200744628906, -0.04972553253173828, -0.0474090576171875, -0.04509258270263672, -0.04277610778808594, -0.040459632873535156, -0.038143157958984375, -0.035826683044433594, -0.03351020812988281, -0.03119373321533203, -0.02887725830078125, -0.02656078338623047, -0.024244308471679688, -0.021927833557128906, -0.019611358642578125, -0.017294883728027344, -0.014978408813476562, -0.012661933898925781, -0.010345458984375, -0.008028984069824219, -0.0057125091552734375, -0.0033960342407226562, -0.001079559326171875, 0.0012369155883789062, 0.0035533905029296875, 0.005869865417480469, 0.00818634033203125, 0.010502815246582031, 0.012819290161132812, 0.015135765075683594, 0.017452239990234375, 0.019768714904785156, 0.022085189819335938, 0.02440166473388672, 0.0267181396484375, 0.02903461456298828, 0.03135108947753906, 0.033667564392089844, 0.035984039306640625, 0.038300514221191406, 0.04061698913574219, 0.04293346405029297, 0.04524993896484375, 0.04756641387939453, 0.04988288879394531, 0.052199363708496094, 0.054515838623046875, 0.056832313537597656, 0.05914878845214844, 0.06146526336669922, 0.06378173828125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 7.0, 7.0, 8.0, 12.0, 33.0, 33.0, 52.0, 67.0, 111.0, 186.0, 273.0, 493.0, 988.0, 2340.0, 6440.0, 23293.0, 134238.0, 3727970.0, 248522.0, 35012.0, 8724.0, 2892.0, 1170.0, 515.0, 343.0, 186.0, 127.0, 64.0, 49.0, 45.0, 29.0, 16.0, 21.0, 9.0, 6.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6279296875, -0.6103057861328125, -0.592681884765625, -0.5750579833984375, -0.55743408203125, -0.5398101806640625, -0.522186279296875, -0.5045623779296875, -0.4869384765625, -0.4693145751953125, -0.451690673828125, -0.4340667724609375, -0.41644287109375, -0.3988189697265625, -0.381195068359375, -0.3635711669921875, -0.345947265625, -0.3283233642578125, -0.310699462890625, -0.2930755615234375, -0.27545166015625, -0.2578277587890625, -0.240203857421875, -0.2225799560546875, -0.2049560546875, -0.1873321533203125, -0.169708251953125, -0.1520843505859375, -0.13446044921875, -0.1168365478515625, -0.099212646484375, -0.0815887451171875, -0.06396484375, -0.0463409423828125, -0.028717041015625, -0.0110931396484375, 0.00653076171875, 0.0241546630859375, 0.041778564453125, 0.0594024658203125, 0.0770263671875, 0.0946502685546875, 0.112274169921875, 0.1298980712890625, 0.14752197265625, 0.1651458740234375, 0.182769775390625, 0.2003936767578125, 0.218017578125, 0.2356414794921875, 0.253265380859375, 0.2708892822265625, 0.28851318359375, 0.3061370849609375, 0.323760986328125, 0.3413848876953125, 0.3590087890625, 0.3766326904296875, 0.394256591796875, 0.4118804931640625, 0.42950439453125, 0.4471282958984375, 0.464752197265625, 0.4823760986328125, 0.5]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 8.0, 8.0, 8.0, 17.0, 17.0, 30.0, 48.0, 68.0, 165.0, 312.0, 2449.0, 523.0, 178.0, 80.0, 54.0, 38.0, 28.0, 16.0, 13.0, 3.0, 2.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2081298828125, -0.2015514373779297, -0.19497299194335938, -0.18839454650878906, -0.18181610107421875, -0.17523765563964844, -0.16865921020507812, -0.1620807647705078, -0.1555023193359375, -0.1489238739013672, -0.14234542846679688, -0.13576698303222656, -0.12918853759765625, -0.12261009216308594, -0.11603164672851562, -0.10945320129394531, -0.102874755859375, -0.09629631042480469, -0.08971786499023438, -0.08313941955566406, -0.07656097412109375, -0.06998252868652344, -0.06340408325195312, -0.05682563781738281, -0.0502471923828125, -0.04366874694824219, -0.037090301513671875, -0.030511856079101562, -0.02393341064453125, -0.017354965209960938, -0.010776519775390625, -0.0041980743408203125, 0.00238037109375, 0.008958816528320312, 0.015537261962890625, 0.022115707397460938, 0.02869415283203125, 0.03527259826660156, 0.041851043701171875, 0.04842948913574219, 0.0550079345703125, 0.06158638000488281, 0.06816482543945312, 0.07474327087402344, 0.08132171630859375, 0.08790016174316406, 0.09447860717773438, 0.10105705261230469, 0.107635498046875, 0.11421394348144531, 0.12079238891601562, 0.12737083435058594, 0.13394927978515625, 0.14052772521972656, 0.14710617065429688, 0.1536846160888672, 0.1602630615234375, 0.1668415069580078, 0.17341995239257812, 0.17999839782714844, 0.18657684326171875, 0.19315528869628906, 0.19973373413085938, 0.2063121795654297, 0.212890625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 6.0, 17.0, 26.0, 59.0, 110.0, 167.0, 217.0, 189.0, 96.0, 60.0, 25.0, 22.0, 9.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3730878829956055, -1.323355793952942, -1.2736235857009888, -1.2238914966583252, -1.174159288406372, -1.1244271993637085, -1.074695110321045, -1.0249629020690918, -0.9752307534217834, -0.9254986047744751, -0.8757664561271667, -0.8260343074798584, -0.7763022184371948, -0.7265700101852417, -0.6768379211425781, -0.6271057724952698, -0.5773736238479614, -0.5276414752006531, -0.4779093265533447, -0.42817720770835876, -0.3784450590610504, -0.32871291041374207, -0.2789807915687561, -0.22924864292144775, -0.1795164942741394, -0.12978434562683105, -0.0800522118806839, -0.030320078134536743, 0.019412070512771606, 0.06914421916007996, 0.11887633800506592, 0.16860848665237427, 0.21834063529968262, 0.26807278394699097, 0.3178049325942993, 0.3675370514392853, 0.41726920008659363, 0.467001348733902, 0.5167334675788879, 0.5664656162261963, 0.6161977648735046, 0.665929913520813, 0.7156620621681213, 0.7653942108154297, 0.8151262998580933, 0.8648585081100464, 0.91459059715271, 0.9643227458000183, 1.0140548944473267, 1.0637869834899902, 1.1135191917419434, 1.163251280784607, 1.21298348903656, 1.2627155780792236, 1.3124477863311768, 1.3621798753738403, 1.411911964416504, 1.4616440534591675, 1.5113762617111206, 1.5611083507537842, 1.6108405590057373, 1.6605726480484009, 1.7103047370910645, 1.7600369453430176, 1.8097691535949707]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 10.0, 1.0, 4.0, 6.0, 5.0, 14.0, 22.0, 19.0, 14.0, 22.0, 21.0, 34.0, 32.0, 31.0, 26.0, 37.0, 30.0, 41.0, 49.0, 35.0, 42.0, 45.0, 38.0, 44.0, 38.0, 43.0, 40.0, 29.0, 37.0, 28.0, 18.0, 27.0, 17.0, 19.0, 14.0, 19.0, 9.0, 13.0, 7.0, 4.0, 4.0, 5.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.4628755450248718, -0.4484281539916992, -0.4339807331562042, -0.4195333421230316, -0.4050859212875366, -0.390638530254364, -0.3761911392211914, -0.3617437183856964, -0.3472963273525238, -0.3328489363193512, -0.3184015154838562, -0.3039541244506836, -0.2895067036151886, -0.275059312582016, -0.260611891746521, -0.2461645007133484, -0.2317170947790146, -0.2172696888446808, -0.20282228291034698, -0.18837487697601318, -0.17392748594284058, -0.15948008000850677, -0.14503267407417297, -0.13058528304100037, -0.11613786965608597, -0.10169046372175217, -0.08724306523799896, -0.07279565930366516, -0.05834825709462166, -0.043900854885578156, -0.029453448951244354, -0.01500605046749115, -0.0005586445331573486, 0.013888758607208729, 0.028336161747574806, 0.04278356581926346, 0.05723096802830696, 0.07167837023735046, 0.08612577617168427, 0.10057317465543747, 0.11502058058977127, 0.12946797907352448, 0.14391538500785828, 0.15836279094219208, 0.17281019687652588, 0.1872575879096985, 0.20170500874519348, 0.2161523997783661, 0.2305998057126999, 0.2450472116470337, 0.2594946026802063, 0.2739420235157013, 0.2883894145488739, 0.3028368353843689, 0.3172842264175415, 0.3317316174507141, 0.3461790382862091, 0.3606264293193817, 0.3750738501548767, 0.3895212411880493, 0.4039686620235443, 0.4184160530567169, 0.4328634738922119, 0.4473108649253845, 0.46175825595855713]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 6.0, 9.0, 11.0, 10.0, 24.0, 31.0, 78.0, 135.0, 252.0, 686.0, 2430.0, 9610.0, 43586.0, 225758.0, 610230.0, 122111.0, 25252.0, 5834.0, 1580.0, 489.0, 204.0, 91.0, 58.0, 29.0, 10.0, 13.0, 5.0, 6.0, 4.0, 2.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3271484375, -0.31472015380859375, -0.3022918701171875, -0.28986358642578125, -0.277435302734375, -0.26500701904296875, -0.2525787353515625, -0.24015045166015625, -0.22772216796875, -0.21529388427734375, -0.2028656005859375, -0.19043731689453125, -0.178009033203125, -0.16558074951171875, -0.1531524658203125, -0.14072418212890625, -0.1282958984375, -0.11586761474609375, -0.1034393310546875, -0.09101104736328125, -0.078582763671875, -0.06615447998046875, -0.0537261962890625, -0.04129791259765625, -0.02886962890625, -0.01644134521484375, -0.0040130615234375, 0.00841522216796875, 0.020843505859375, 0.03327178955078125, 0.0457000732421875, 0.05812835693359375, 0.070556640625, 0.08298492431640625, 0.0954132080078125, 0.10784149169921875, 0.120269775390625, 0.13269805908203125, 0.1451263427734375, 0.15755462646484375, 0.16998291015625, 0.18241119384765625, 0.1948394775390625, 0.20726776123046875, 0.219696044921875, 0.23212432861328125, 0.2445526123046875, 0.25698089599609375, 0.2694091796875, 0.28183746337890625, 0.2942657470703125, 0.30669403076171875, 0.319122314453125, 0.33155059814453125, 0.3439788818359375, 0.35640716552734375, 0.36883544921875, 0.38126373291015625, 0.3936920166015625, 0.40612030029296875, 0.418548583984375, 0.43097686767578125, 0.4434051513671875, 0.45583343505859375, 0.46826171875]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 5.0, 3.0, 12.0, 10.0, 21.0, 20.0, 29.0, 47.0, 38.0, 56.0, 50.0, 66.0, 70.0, 62.0, 61.0, 66.0, 63.0, 61.0, 52.0, 36.0, 47.0, 37.0, 21.0, 19.0, 10.0, 17.0, 10.0, 9.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0865478515625, -0.08422279357910156, -0.08189773559570312, -0.07957267761230469, -0.07724761962890625, -0.07492256164550781, -0.07259750366210938, -0.07027244567871094, -0.0679473876953125, -0.06562232971191406, -0.06329727172851562, -0.06097221374511719, -0.05864715576171875, -0.05632209777832031, -0.053997039794921875, -0.05167198181152344, -0.049346923828125, -0.04702186584472656, -0.044696807861328125, -0.04237174987792969, -0.04004669189453125, -0.03772163391113281, -0.035396575927734375, -0.03307151794433594, -0.0307464599609375, -0.028421401977539062, -0.026096343994140625, -0.023771286010742188, -0.02144622802734375, -0.019121170043945312, -0.016796112060546875, -0.014471054077148438, -0.01214599609375, -0.009820938110351562, -0.007495880126953125, -0.0051708221435546875, -0.00284576416015625, -0.0005207061767578125, 0.001804351806640625, 0.0041294097900390625, 0.0064544677734375, 0.008779525756835938, 0.011104583740234375, 0.013429641723632812, 0.01575469970703125, 0.018079757690429688, 0.020404815673828125, 0.022729873657226562, 0.025054931640625, 0.027379989624023438, 0.029705047607421875, 0.03203010559082031, 0.03435516357421875, 0.03668022155761719, 0.039005279541015625, 0.04133033752441406, 0.0436553955078125, 0.04598045349121094, 0.048305511474609375, 0.05063056945800781, 0.05295562744140625, 0.05528068542480469, 0.057605743408203125, 0.05993080139160156, 0.062255859375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 8.0, 6.0, 12.0, 15.0, 20.0, 8.0, 18.0, 27.0, 31.0, 45.0, 54.0, 75.0, 114.0, 136.0, 204.0, 307.0, 565.0, 966.0, 2085.0, 4843.0, 14386.0, 49958.0, 198363.0, 592716.0, 130293.0, 35012.0, 10602.0, 3775.0, 1626.0, 799.0, 469.0, 277.0, 215.0, 139.0, 98.0, 80.0, 54.0, 33.0, 17.0, 24.0, 16.0, 15.0, 11.0, 15.0, 11.0, 6.0, 5.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.296142578125, -0.2863883972167969, -0.27663421630859375, -0.2668800354003906, -0.2571258544921875, -0.24737167358398438, -0.23761749267578125, -0.22786331176757812, -0.218109130859375, -0.20835494995117188, -0.19860076904296875, -0.18884658813476562, -0.1790924072265625, -0.16933822631835938, -0.15958404541015625, -0.14982986450195312, -0.14007568359375, -0.13032150268554688, -0.12056732177734375, -0.11081314086914062, -0.1010589599609375, -0.09130477905273438, -0.08155059814453125, -0.07179641723632812, -0.062042236328125, -0.052288055419921875, -0.04253387451171875, -0.032779693603515625, -0.0230255126953125, -0.013271331787109375, -0.00351715087890625, 0.006237030029296875, 0.0159912109375, 0.025745391845703125, 0.03549957275390625, 0.045253753662109375, 0.0550079345703125, 0.06476211547851562, 0.07451629638671875, 0.08427047729492188, 0.094024658203125, 0.10377883911132812, 0.11353302001953125, 0.12328720092773438, 0.1330413818359375, 0.14279556274414062, 0.15254974365234375, 0.16230392456054688, 0.17205810546875, 0.18181228637695312, 0.19156646728515625, 0.20132064819335938, 0.2110748291015625, 0.22082901000976562, 0.23058319091796875, 0.24033737182617188, 0.250091552734375, 0.2598457336425781, 0.26959991455078125, 0.2793540954589844, 0.2891082763671875, 0.2988624572753906, 0.30861663818359375, 0.3183708190917969, 0.328125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 5.0, 2.0, 4.0, 5.0, 10.0, 5.0, 13.0, 14.0, 13.0, 19.0, 17.0, 26.0, 23.0, 31.0, 23.0, 36.0, 43.0, 33.0, 42.0, 40.0, 38.0, 35.0, 44.0, 40.0, 36.0, 31.0, 43.0, 31.0, 36.0, 21.0, 32.0, 24.0, 26.0, 28.0, 21.0, 16.0, 11.0, 15.0, 7.0, 13.0, 8.0, 7.0, 16.0, 5.0, 1.0, 5.0, 3.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.2149658203125, -0.20830917358398438, -0.20165252685546875, -0.19499588012695312, -0.1883392333984375, -0.18168258666992188, -0.17502593994140625, -0.16836929321289062, -0.161712646484375, -0.15505599975585938, -0.14839935302734375, -0.14174270629882812, -0.1350860595703125, -0.12842941284179688, -0.12177276611328125, -0.11511611938476562, -0.10845947265625, -0.10180282592773438, -0.09514617919921875, -0.08848953247070312, -0.0818328857421875, -0.07517623901367188, -0.06851959228515625, -0.061862945556640625, -0.055206298828125, -0.048549652099609375, -0.04189300537109375, -0.035236358642578125, -0.0285797119140625, -0.021923065185546875, -0.01526641845703125, -0.008609771728515625, -0.001953125, 0.004703521728515625, 0.01136016845703125, 0.018016815185546875, 0.0246734619140625, 0.031330108642578125, 0.03798675537109375, 0.044643402099609375, 0.051300048828125, 0.057956695556640625, 0.06461334228515625, 0.07126998901367188, 0.0779266357421875, 0.08458328247070312, 0.09123992919921875, 0.09789657592773438, 0.10455322265625, 0.11120986938476562, 0.11786651611328125, 0.12452316284179688, 0.1311798095703125, 0.13783645629882812, 0.14449310302734375, 0.15114974975585938, 0.157806396484375, 0.16446304321289062, 0.17111968994140625, 0.17777633666992188, 0.1844329833984375, 0.19108963012695312, 0.19774627685546875, 0.20440292358398438, 0.2110595703125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 4.0, 4.0, 6.0, 9.0, 22.0, 30.0, 39.0, 79.0, 126.0, 204.0, 361.0, 655.0, 1426.0, 3153.0, 8282.0, 27380.0, 104144.0, 501760.0, 299262.0, 71200.0, 19353.0, 6158.0, 2503.0, 1069.0, 582.0, 297.0, 173.0, 101.0, 53.0, 34.0, 26.0, 32.0, 9.0, 13.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1884765625, -0.18349838256835938, -0.17852020263671875, -0.17354202270507812, -0.1685638427734375, -0.16358566284179688, -0.15860748291015625, -0.15362930297851562, -0.148651123046875, -0.14367294311523438, -0.13869476318359375, -0.13371658325195312, -0.1287384033203125, -0.12376022338867188, -0.11878204345703125, -0.11380386352539062, -0.10882568359375, -0.10384750366210938, -0.09886932373046875, -0.09389114379882812, -0.0889129638671875, -0.08393478393554688, -0.07895660400390625, -0.07397842407226562, -0.069000244140625, -0.06402206420898438, -0.05904388427734375, -0.054065704345703125, -0.0490875244140625, -0.044109344482421875, -0.03913116455078125, -0.034152984619140625, -0.0291748046875, -0.024196624755859375, -0.01921844482421875, -0.014240264892578125, -0.0092620849609375, -0.004283905029296875, 0.00069427490234375, 0.005672454833984375, 0.010650634765625, 0.015628814697265625, 0.02060699462890625, 0.025585174560546875, 0.0305633544921875, 0.035541534423828125, 0.04051971435546875, 0.045497894287109375, 0.05047607421875, 0.055454254150390625, 0.06043243408203125, 0.06541061401367188, 0.0703887939453125, 0.07536697387695312, 0.08034515380859375, 0.08532333374023438, 0.090301513671875, 0.09527969360351562, 0.10025787353515625, 0.10523605346679688, 0.1102142333984375, 0.11519241333007812, 0.12017059326171875, 0.12514877319335938, 0.130126953125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 6.0, 5.0, 8.0, 13.0, 12.0, 14.0, 17.0, 24.0, 29.0, 40.0, 39.0, 63.0, 69.0, 76.0, 63.0, 60.0, 79.0, 70.0, 62.0, 43.0, 41.0, 29.0, 30.0, 22.0, 19.0, 9.0, 15.0, 11.0, 5.0, 6.0, 4.0, 5.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.349252700805664e-05, -7.14082270860672e-05, -6.932392716407776e-05, -6.723962724208832e-05, -6.515532732009888e-05, -6.307102739810944e-05, -6.0986727476119995e-05, -5.8902427554130554e-05, -5.681812763214111e-05, -5.473382771015167e-05, -5.264952778816223e-05, -5.056522786617279e-05, -4.848092794418335e-05, -4.639662802219391e-05, -4.431232810020447e-05, -4.222802817821503e-05, -4.0143728256225586e-05, -3.8059428334236145e-05, -3.5975128412246704e-05, -3.389082849025726e-05, -3.180652856826782e-05, -2.972222864627838e-05, -2.763792872428894e-05, -2.55536288022995e-05, -2.346932888031006e-05, -2.1385028958320618e-05, -1.9300729036331177e-05, -1.7216429114341736e-05, -1.5132129192352295e-05, -1.3047829270362854e-05, -1.0963529348373413e-05, -8.879229426383972e-06, -6.794929504394531e-06, -4.71062958240509e-06, -2.6263296604156494e-06, -5.420297384262085e-07, 1.5422701835632324e-06, 3.6265701055526733e-06, 5.710870027542114e-06, 7.795169949531555e-06, 9.879469871520996e-06, 1.1963769793510437e-05, 1.4048069715499878e-05, 1.613236963748932e-05, 1.821666955947876e-05, 2.03009694814682e-05, 2.238526940345764e-05, 2.4469569325447083e-05, 2.6553869247436523e-05, 2.8638169169425964e-05, 3.0722469091415405e-05, 3.2806769013404846e-05, 3.489106893539429e-05, 3.697536885738373e-05, 3.905966877937317e-05, 4.114396870136261e-05, 4.322826862335205e-05, 4.531256854534149e-05, 4.739686846733093e-05, 4.9481168389320374e-05, 5.1565468311309814e-05, 5.3649768233299255e-05, 5.5734068155288696e-05, 5.781836807727814e-05, 5.990266799926758e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 6.0, 4.0, 5.0, 8.0, 14.0, 18.0, 30.0, 39.0, 82.0, 182.0, 273.0, 541.0, 1502.0, 5006.0, 27955.0, 285353.0, 645762.0, 68275.0, 9556.0, 2313.0, 812.0, 368.0, 177.0, 107.0, 62.0, 48.0, 22.0, 18.0, 11.0, 8.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26806640625, -0.25974273681640625, -0.2514190673828125, -0.24309539794921875, -0.234771728515625, -0.22644805908203125, -0.2181243896484375, -0.20980072021484375, -0.20147705078125, -0.19315338134765625, -0.1848297119140625, -0.17650604248046875, -0.168182373046875, -0.15985870361328125, -0.1515350341796875, -0.14321136474609375, -0.1348876953125, -0.12656402587890625, -0.1182403564453125, -0.10991668701171875, -0.101593017578125, -0.09326934814453125, -0.0849456787109375, -0.07662200927734375, -0.06829833984375, -0.05997467041015625, -0.0516510009765625, -0.04332733154296875, -0.035003662109375, -0.02667999267578125, -0.0183563232421875, -0.01003265380859375, -0.001708984375, 0.00661468505859375, 0.0149383544921875, 0.02326202392578125, 0.031585693359375, 0.03990936279296875, 0.0482330322265625, 0.05655670166015625, 0.06488037109375, 0.07320404052734375, 0.0815277099609375, 0.08985137939453125, 0.098175048828125, 0.10649871826171875, 0.1148223876953125, 0.12314605712890625, 0.1314697265625, 0.13979339599609375, 0.1481170654296875, 0.15644073486328125, 0.164764404296875, 0.17308807373046875, 0.1814117431640625, 0.18973541259765625, 0.19805908203125, 0.20638275146484375, 0.2147064208984375, 0.22303009033203125, 0.231353759765625, 0.23967742919921875, 0.2480010986328125, 0.25632476806640625, 0.2646484375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 7.0, 4.0, 5.0, 3.0, 4.0, 5.0, 6.0, 9.0, 10.0, 14.0, 22.0, 31.0, 22.0, 36.0, 36.0, 63.0, 81.0, 95.0, 80.0, 67.0, 59.0, 58.0, 54.0, 49.0, 39.0, 23.0, 29.0, 16.0, 12.0, 17.0, 10.0, 7.0, 3.0, 8.0, 3.0, 2.0, 4.0, 1.0, 7.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.1307373046875, -0.12703990936279297, -0.12334251403808594, -0.1196451187133789, -0.11594772338867188, -0.11225032806396484, -0.10855293273925781, -0.10485553741455078, -0.10115814208984375, -0.09746074676513672, -0.09376335144042969, -0.09006595611572266, -0.08636856079101562, -0.0826711654663086, -0.07897377014160156, -0.07527637481689453, -0.0715789794921875, -0.06788158416748047, -0.06418418884277344, -0.060486793518066406, -0.056789398193359375, -0.053092002868652344, -0.04939460754394531, -0.04569721221923828, -0.04199981689453125, -0.03830242156982422, -0.03460502624511719, -0.030907630920410156, -0.027210235595703125, -0.023512840270996094, -0.019815444946289062, -0.01611804962158203, -0.012420654296875, -0.008723258972167969, -0.0050258636474609375, -0.0013284683227539062, 0.002368927001953125, 0.006066322326660156, 0.009763717651367188, 0.013461112976074219, 0.01715850830078125, 0.02085590362548828, 0.024553298950195312, 0.028250694274902344, 0.031948089599609375, 0.035645484924316406, 0.03934288024902344, 0.04304027557373047, 0.0467376708984375, 0.05043506622314453, 0.05413246154785156, 0.057829856872558594, 0.061527252197265625, 0.06522464752197266, 0.06892204284667969, 0.07261943817138672, 0.07631683349609375, 0.08001422882080078, 0.08371162414550781, 0.08740901947021484, 0.09110641479492188, 0.0948038101196289, 0.09850120544433594, 0.10219860076904297, 0.10589599609375]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 6.0, 3.0, 7.0, 13.0, 12.0, 27.0, 39.0, 64.0, 92.0, 118.0, 152.0, 157.0, 116.0, 80.0, 54.0, 31.0, 16.0, 12.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.618297815322876, -2.538825750350952, -2.4593536853790283, -2.3798816204071045, -2.3004095554351807, -2.220937490463257, -2.141465425491333, -2.0619935989379883, -1.982521414756775, -1.903049349784851, -1.8235772848129272, -1.7441052198410034, -1.6646332740783691, -1.5851612091064453, -1.5056891441345215, -1.4262170791625977, -1.3467450141906738, -1.26727294921875, -1.1878008842468262, -1.1083288192749023, -1.0288567543029785, -0.9493847489356995, -0.8699127435684204, -0.7904406785964966, -0.7109686136245728, -0.6314965486526489, -0.5520244836807251, -0.47255247831344604, -0.3930804133415222, -0.3136083483695984, -0.23413631319999695, -0.1546642780303955, -0.07519245147705078, 0.004279598593711853, 0.08375164866447449, 0.16322369873523712, 0.24269574880599976, 0.3221678137779236, 0.401639848947525, 0.48111188411712646, 0.5605839490890503, 0.6400560140609741, 0.719528079032898, 0.799000084400177, 0.8784721493721008, 0.9579442143440247, 1.0374162197113037, 1.1168882846832275, 1.1963603496551514, 1.2758324146270752, 1.355304479598999, 1.4347765445709229, 1.5142486095428467, 1.5937206745147705, 1.6731926202774048, 1.7526646852493286, 1.8321367502212524, 1.9116088151931763, 1.9910808801651, 2.0705528259277344, 2.150024890899658, 2.229496955871582, 2.308969020843506, 2.3884410858154297, 2.4679131507873535]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 2.0, 5.0, 8.0, 5.0, 5.0, 11.0, 10.0, 19.0, 16.0, 16.0, 13.0, 20.0, 23.0, 22.0, 35.0, 27.0, 36.0, 27.0, 40.0, 56.0, 55.0, 50.0, 42.0, 47.0, 47.0, 40.0, 35.0, 33.0, 40.0, 31.0, 28.0, 22.0, 15.0, 26.0, 11.0, 16.0, 15.0, 11.0, 13.0, 12.0, 7.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.1948093175888062, -1.1562271118164062, -1.117645025253296, -1.079062819480896, -1.040480613708496, -1.0018985271453857, -0.9633163213729858, -0.9247341156005859, -0.8861519694328308, -0.8475698232650757, -0.8089876174926758, -0.7704054713249207, -0.7318233251571655, -0.6932411193847656, -0.6546589732170105, -0.6160768270492554, -0.5774946212768555, -0.5389124751091003, -0.5003302693367004, -0.4617481231689453, -0.4231659471988678, -0.3845837712287903, -0.34600162506103516, -0.30741944909095764, -0.2688372731208801, -0.2302550971508026, -0.1916729360818863, -0.15309077501296997, -0.11450859904289246, -0.07592642307281494, -0.03734426200389862, 0.0012378990650177002, 0.039820194244384766, 0.07840236276388168, 0.1169845312833786, 0.15556669235229492, 0.19414886832237244, 0.23273104429244995, 0.2713131904602051, 0.3098953664302826, 0.3484775424003601, 0.3870597183704376, 0.42564189434051514, 0.46422404050827026, 0.5028061866760254, 0.5413883924484253, 0.5799705386161804, 0.6185526847839355, 0.6571348905563354, 0.6957170367240906, 0.7342992424964905, 0.7728813886642456, 0.8114635944366455, 0.8500457406044006, 0.8886278867721558, 0.9272100925445557, 0.9657922387123108, 1.004374384880066, 1.0429565906524658, 1.0815387964248657, 1.120120882987976, 1.158703088760376, 1.1972852945327759, 1.2358673810958862, 1.2744495868682861]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 2.0, 2.0, 3.0, 6.0, 6.0, 10.0, 12.0, 15.0, 28.0, 32.0, 40.0, 67.0, 104.0, 158.0, 317.0, 604.0, 1350.0, 3397.0, 9068.0, 29617.0, 155319.0, 3697635.0, 240453.0, 37836.0, 11000.0, 3962.0, 1613.0, 778.0, 358.0, 173.0, 107.0, 62.0, 41.0, 24.0, 23.0, 27.0, 11.0, 2.0, 7.0, 9.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.4052734375, -0.3932075500488281, -0.38114166259765625, -0.3690757751464844, -0.3570098876953125, -0.3449440002441406, -0.33287811279296875, -0.3208122253417969, -0.308746337890625, -0.2966804504394531, -0.28461456298828125, -0.2725486755371094, -0.2604827880859375, -0.24841690063476562, -0.23635101318359375, -0.22428512573242188, -0.21221923828125, -0.20015335083007812, -0.18808746337890625, -0.17602157592773438, -0.1639556884765625, -0.15188980102539062, -0.13982391357421875, -0.12775802612304688, -0.115692138671875, -0.10362625122070312, -0.09156036376953125, -0.07949447631835938, -0.0674285888671875, -0.055362701416015625, -0.04329681396484375, -0.031230926513671875, -0.0191650390625, -0.007099151611328125, 0.00496673583984375, 0.017032623291015625, 0.0290985107421875, 0.041164398193359375, 0.05323028564453125, 0.06529617309570312, 0.077362060546875, 0.08942794799804688, 0.10149383544921875, 0.11355972290039062, 0.1256256103515625, 0.13769149780273438, 0.14975738525390625, 0.16182327270507812, 0.17388916015625, 0.18595504760742188, 0.19802093505859375, 0.21008682250976562, 0.2221527099609375, 0.23421859741210938, 0.24628448486328125, 0.2583503723144531, 0.270416259765625, 0.2824821472167969, 0.29454803466796875, 0.3066139221191406, 0.3186798095703125, 0.3307456970214844, 0.34281158447265625, 0.3548774719238281, 0.366943359375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 4.0, 9.0, 8.0, 12.0, 20.0, 26.0, 29.0, 55.0, 61.0, 64.0, 59.0, 80.0, 85.0, 59.0, 72.0, 71.0, 59.0, 63.0, 41.0, 41.0, 23.0, 25.0, 15.0, 9.0, 11.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09820556640625, -0.09555721282958984, -0.09290885925292969, -0.09026050567626953, -0.08761215209960938, -0.08496379852294922, -0.08231544494628906, -0.0796670913696289, -0.07701873779296875, -0.0743703842163086, -0.07172203063964844, -0.06907367706298828, -0.06642532348632812, -0.06377696990966797, -0.06112861633300781, -0.058480262756347656, -0.0558319091796875, -0.053183555603027344, -0.05053520202636719, -0.04788684844970703, -0.045238494873046875, -0.04259014129638672, -0.03994178771972656, -0.037293434143066406, -0.03464508056640625, -0.031996726989746094, -0.029348373413085938, -0.02670001983642578, -0.024051666259765625, -0.02140331268310547, -0.018754959106445312, -0.016106605529785156, -0.013458251953125, -0.010809898376464844, -0.008161544799804688, -0.005513191223144531, -0.002864837646484375, -0.00021648406982421875, 0.0024318695068359375, 0.005080223083496094, 0.00772857666015625, 0.010376930236816406, 0.013025283813476562, 0.01567363739013672, 0.018321990966796875, 0.02097034454345703, 0.023618698120117188, 0.026267051696777344, 0.0289154052734375, 0.031563758850097656, 0.03421211242675781, 0.03686046600341797, 0.039508819580078125, 0.04215717315673828, 0.04480552673339844, 0.047453880310058594, 0.05010223388671875, 0.052750587463378906, 0.05539894104003906, 0.05804729461669922, 0.060695648193359375, 0.06334400177001953, 0.06599235534667969, 0.06864070892333984, 0.0712890625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 4.0, 9.0, 3.0, 12.0, 8.0, 22.0, 24.0, 18.0, 50.0, 89.0, 138.0, 224.0, 303.0, 500.0, 1082.0, 2015.0, 4810.0, 13880.0, 54693.0, 460577.0, 3479290.0, 134832.0, 27056.0, 8141.0, 3208.0, 1420.0, 786.0, 467.0, 233.0, 142.0, 88.0, 59.0, 31.0, 25.0, 14.0, 14.0, 5.0, 3.0, 8.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.482666015625, -0.4661674499511719, -0.44966888427734375, -0.4331703186035156, -0.4166717529296875, -0.4001731872558594, -0.38367462158203125, -0.3671760559082031, -0.350677490234375, -0.3341789245605469, -0.31768035888671875, -0.3011817932128906, -0.2846832275390625, -0.2681846618652344, -0.25168609619140625, -0.23518753051757812, -0.21868896484375, -0.20219039916992188, -0.18569183349609375, -0.16919326782226562, -0.1526947021484375, -0.13619613647460938, -0.11969757080078125, -0.10319900512695312, -0.086700439453125, -0.07020187377929688, -0.05370330810546875, -0.037204742431640625, -0.0207061767578125, -0.004207611083984375, 0.01229095458984375, 0.028789520263671875, 0.0452880859375, 0.061786651611328125, 0.07828521728515625, 0.09478378295898438, 0.1112823486328125, 0.12778091430664062, 0.14427947998046875, 0.16077804565429688, 0.177276611328125, 0.19377517700195312, 0.21027374267578125, 0.22677230834960938, 0.2432708740234375, 0.2597694396972656, 0.27626800537109375, 0.2927665710449219, 0.30926513671875, 0.3257637023925781, 0.34226226806640625, 0.3587608337402344, 0.3752593994140625, 0.3917579650878906, 0.40825653076171875, 0.4247550964355469, 0.441253662109375, 0.4577522277832031, 0.47425079345703125, 0.4907493591308594, 0.5072479248046875, 0.5237464904785156, 0.5402450561523438, 0.5567436218261719, 0.5732421875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 7.0, 5.0, 10.0, 10.0, 21.0, 25.0, 49.0, 88.0, 130.0, 277.0, 1226.0, 1558.0, 289.0, 123.0, 84.0, 47.0, 36.0, 27.0, 29.0, 15.0, 4.0, 1.0, 1.0, 6.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.326416015625, -0.3182640075683594, -0.31011199951171875, -0.3019599914550781, -0.2938079833984375, -0.2856559753417969, -0.27750396728515625, -0.2693519592285156, -0.261199951171875, -0.2530479431152344, -0.24489593505859375, -0.23674392700195312, -0.2285919189453125, -0.22043991088867188, -0.21228790283203125, -0.20413589477539062, -0.19598388671875, -0.18783187866210938, -0.17967987060546875, -0.17152786254882812, -0.1633758544921875, -0.15522384643554688, -0.14707183837890625, -0.13891983032226562, -0.130767822265625, -0.12261581420898438, -0.11446380615234375, -0.10631179809570312, -0.0981597900390625, -0.09000778198242188, -0.08185577392578125, -0.07370376586914062, -0.0655517578125, -0.057399749755859375, -0.04924774169921875, -0.041095733642578125, -0.0329437255859375, -0.024791717529296875, -0.01663970947265625, -0.008487701416015625, -0.000335693359375, 0.007816314697265625, 0.01596832275390625, 0.024120330810546875, 0.0322723388671875, 0.040424346923828125, 0.04857635498046875, 0.056728363037109375, 0.06488037109375, 0.07303237915039062, 0.08118438720703125, 0.08933639526367188, 0.0974884033203125, 0.10564041137695312, 0.11379241943359375, 0.12194442749023438, 0.130096435546875, 0.13824844360351562, 0.14640045166015625, 0.15455245971679688, 0.1627044677734375, 0.17085647583007812, 0.17900848388671875, 0.18716049194335938, 0.1953125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 7.0, 12.0, 8.0, 18.0, 32.0, 44.0, 67.0, 97.0, 128.0, 131.0, 120.0, 111.0, 85.0, 61.0, 27.0, 14.0, 15.0, 9.0, 11.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9450716376304626, -0.899733304977417, -0.8543950319290161, -0.8090566992759705, -0.7637183666229248, -0.7183800339698792, -0.6730417013168335, -0.6277034282684326, -0.582365095615387, -0.5370267629623413, -0.49168846011161804, -0.4463501572608948, -0.4010118246078491, -0.35567349195480347, -0.3103351891040802, -0.26499688625335693, -0.21965855360031128, -0.17432023584842682, -0.12898191809654236, -0.0836436003446579, -0.03830528259277344, 0.007033035159111023, 0.05237135291099548, 0.09770965576171875, 0.1430479884147644, 0.18838630616664886, 0.23372462391853333, 0.2790629267692566, 0.32440125942230225, 0.3697395920753479, 0.41507789492607117, 0.46041619777679443, 0.5057544708251953, 0.551092803478241, 0.5964311361312866, 0.6417694091796875, 0.6871077418327332, 0.7324460744857788, 0.7777843475341797, 0.8231226801872253, 0.868461012840271, 0.9137993454933167, 0.9591376781463623, 1.0044759511947632, 1.049814224243164, 1.0951526165008545, 1.1404908895492554, 1.1858291625976562, 1.2311675548553467, 1.2765058279037476, 1.321844220161438, 1.3671824932098389, 1.4125208854675293, 1.4578591585159302, 1.503197431564331, 1.5485358238220215, 1.5938740968704224, 1.6392123699188232, 1.6845507621765137, 1.7298890352249146, 1.7752273082733154, 1.8205657005310059, 1.8659039735794067, 1.9112422466278076, 1.956580638885498]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 3.0, 5.0, 3.0, 5.0, 11.0, 10.0, 11.0, 12.0, 10.0, 29.0, 23.0, 29.0, 26.0, 41.0, 43.0, 27.0, 35.0, 39.0, 47.0, 47.0, 46.0, 49.0, 46.0, 24.0, 42.0, 34.0, 39.0, 35.0, 28.0, 27.0, 25.0, 21.0, 24.0, 19.0, 19.0, 16.0, 16.0, 11.0, 7.0, 6.0, 4.0, 3.0, 5.0, 0.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5808115005493164, -0.5603252649307251, -0.5398390293121338, -0.5193527936935425, -0.4988665282726288, -0.4783802926540375, -0.4578940272331238, -0.43740779161453247, -0.41692155599594116, -0.39643532037734985, -0.37594908475875854, -0.35546281933784485, -0.33497658371925354, -0.31449034810066223, -0.29400408267974854, -0.2735178470611572, -0.2530316114425659, -0.2325453758239746, -0.2120591253042221, -0.1915728747844696, -0.1710866391658783, -0.150600403547287, -0.13011415302753448, -0.10962790250778198, -0.08914166688919067, -0.06865542382001877, -0.04816918075084686, -0.027682937681674957, -0.007196694612503052, 0.013289548456668854, 0.03377579152584076, 0.05426204204559326, 0.07474833726882935, 0.09523458033800125, 0.11572082340717316, 0.13620707392692566, 0.15669330954551697, 0.17717954516410828, 0.19766579568386078, 0.21815204620361328, 0.2386382818222046, 0.2591245174407959, 0.2796107530593872, 0.3000970184803009, 0.3205832540988922, 0.3410694897174835, 0.3615557551383972, 0.3820419907569885, 0.40252822637557983, 0.42301446199417114, 0.44350069761276245, 0.46398696303367615, 0.48447319865226746, 0.5049594640731812, 0.5254456996917725, 0.5459319353103638, 0.5664181709289551, 0.5869044065475464, 0.6073906421661377, 0.627876877784729, 0.6483631134033203, 0.6688494086265564, 0.6893356442451477, 0.709821879863739, 0.7303081154823303]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 7.0, 3.0, 2.0, 7.0, 9.0, 13.0, 22.0, 24.0, 15.0, 33.0, 47.0, 82.0, 139.0, 278.0, 449.0, 840.0, 1797.0, 3962.0, 9441.0, 24673.0, 69857.0, 211121.0, 417466.0, 201596.0, 66575.0, 23591.0, 9070.0, 3875.0, 1698.0, 779.0, 405.0, 208.0, 144.0, 100.0, 60.0, 40.0, 20.0, 24.0, 13.0, 20.0, 7.0, 9.0, 12.0, 4.0, 5.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.257568359375, -0.24938583374023438, -0.24120330810546875, -0.23302078247070312, -0.2248382568359375, -0.21665573120117188, -0.20847320556640625, -0.20029067993164062, -0.192108154296875, -0.18392562866210938, -0.17574310302734375, -0.16756057739257812, -0.1593780517578125, -0.15119552612304688, -0.14301300048828125, -0.13483047485351562, -0.12664794921875, -0.11846542358398438, -0.11028289794921875, -0.10210037231445312, -0.0939178466796875, -0.08573532104492188, -0.07755279541015625, -0.06937026977539062, -0.061187744140625, -0.053005218505859375, -0.04482269287109375, -0.036640167236328125, -0.0284576416015625, -0.020275115966796875, -0.01209259033203125, -0.003910064697265625, 0.0042724609375, 0.012454986572265625, 0.02063751220703125, 0.028820037841796875, 0.0370025634765625, 0.045185089111328125, 0.05336761474609375, 0.061550140380859375, 0.069732666015625, 0.07791519165039062, 0.08609771728515625, 0.09428024291992188, 0.1024627685546875, 0.11064529418945312, 0.11882781982421875, 0.12701034545898438, 0.13519287109375, 0.14337539672851562, 0.15155792236328125, 0.15974044799804688, 0.1679229736328125, 0.17610549926757812, 0.18428802490234375, 0.19247055053710938, 0.200653076171875, 0.20883560180664062, 0.21701812744140625, 0.22520065307617188, 0.2333831787109375, 0.24156570434570312, 0.24974822998046875, 0.2579307556152344, 0.26611328125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 2.0, 6.0, 15.0, 21.0, 18.0, 22.0, 26.0, 35.0, 38.0, 48.0, 49.0, 57.0, 47.0, 70.0, 63.0, 53.0, 60.0, 69.0, 46.0, 57.0, 32.0, 38.0, 32.0, 27.0, 20.0, 14.0, 11.0, 9.0, 4.0, 10.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0887451171875, -0.08612346649169922, -0.08350181579589844, -0.08088016510009766, -0.07825851440429688, -0.0756368637084961, -0.07301521301269531, -0.07039356231689453, -0.06777191162109375, -0.06515026092529297, -0.06252861022949219, -0.059906959533691406, -0.057285308837890625, -0.054663658142089844, -0.05204200744628906, -0.04942035675048828, -0.0467987060546875, -0.04417705535888672, -0.04155540466308594, -0.038933753967285156, -0.036312103271484375, -0.033690452575683594, -0.031068801879882812, -0.02844715118408203, -0.02582550048828125, -0.02320384979248047, -0.020582199096679688, -0.017960548400878906, -0.015338897705078125, -0.012717247009277344, -0.010095596313476562, -0.007473945617675781, -0.004852294921875, -0.0022306442260742188, 0.0003910064697265625, 0.0030126571655273438, 0.005634307861328125, 0.008255958557128906, 0.010877609252929688, 0.013499259948730469, 0.01612091064453125, 0.01874256134033203, 0.021364212036132812, 0.023985862731933594, 0.026607513427734375, 0.029229164123535156, 0.03185081481933594, 0.03447246551513672, 0.0370941162109375, 0.03971576690673828, 0.04233741760253906, 0.044959068298339844, 0.047580718994140625, 0.050202369689941406, 0.05282402038574219, 0.05544567108154297, 0.05806732177734375, 0.06068897247314453, 0.06331062316894531, 0.0659322738647461, 0.06855392456054688, 0.07117557525634766, 0.07379722595214844, 0.07641887664794922, 0.07904052734375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 4.0, 7.0, 12.0, 19.0, 26.0, 39.0, 53.0, 73.0, 158.0, 254.0, 579.0, 1396.0, 4203.0, 21577.0, 224801.0, 719689.0, 62321.0, 9252.0, 2314.0, 891.0, 362.0, 197.0, 127.0, 68.0, 39.0, 28.0, 27.0, 15.0, 8.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.57763671875, -0.557891845703125, -0.53814697265625, -0.518402099609375, -0.4986572265625, -0.478912353515625, -0.45916748046875, -0.439422607421875, -0.419677734375, -0.399932861328125, -0.38018798828125, -0.360443115234375, -0.3406982421875, -0.320953369140625, -0.30120849609375, -0.281463623046875, -0.26171875, -0.241973876953125, -0.22222900390625, -0.202484130859375, -0.1827392578125, -0.162994384765625, -0.14324951171875, -0.123504638671875, -0.103759765625, -0.084014892578125, -0.06427001953125, -0.044525146484375, -0.0247802734375, -0.005035400390625, 0.01470947265625, 0.034454345703125, 0.05419921875, 0.073944091796875, 0.09368896484375, 0.113433837890625, 0.1331787109375, 0.152923583984375, 0.17266845703125, 0.192413330078125, 0.212158203125, 0.231903076171875, 0.25164794921875, 0.271392822265625, 0.2911376953125, 0.310882568359375, 0.33062744140625, 0.350372314453125, 0.3701171875, 0.389862060546875, 0.40960693359375, 0.429351806640625, 0.4490966796875, 0.468841552734375, 0.48858642578125, 0.508331298828125, 0.528076171875, 0.547821044921875, 0.56756591796875, 0.587310791015625, 0.6070556640625, 0.626800537109375, 0.64654541015625, 0.666290283203125, 0.68603515625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 6.0, 4.0, 3.0, 6.0, 8.0, 9.0, 9.0, 12.0, 10.0, 24.0, 20.0, 16.0, 23.0, 20.0, 25.0, 34.0, 34.0, 38.0, 41.0, 42.0, 34.0, 46.0, 48.0, 45.0, 38.0, 33.0, 42.0, 32.0, 36.0, 26.0, 37.0, 28.0, 26.0, 19.0, 19.0, 30.0, 12.0, 8.0, 14.0, 5.0, 6.0, 11.0, 2.0, 5.0, 5.0, 3.0, 6.0, 4.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.340087890625, -0.33039093017578125, -0.3206939697265625, -0.31099700927734375, -0.301300048828125, -0.29160308837890625, -0.2819061279296875, -0.27220916748046875, -0.26251220703125, -0.25281524658203125, -0.2431182861328125, -0.23342132568359375, -0.223724365234375, -0.21402740478515625, -0.2043304443359375, -0.19463348388671875, -0.1849365234375, -0.17523956298828125, -0.1655426025390625, -0.15584564208984375, -0.146148681640625, -0.13645172119140625, -0.1267547607421875, -0.11705780029296875, -0.10736083984375, -0.09766387939453125, -0.0879669189453125, -0.07826995849609375, -0.068572998046875, -0.05887603759765625, -0.0491790771484375, -0.03948211669921875, -0.02978515625, -0.02008819580078125, -0.0103912353515625, -0.00069427490234375, 0.009002685546875, 0.01869964599609375, 0.0283966064453125, 0.03809356689453125, 0.04779052734375, 0.05748748779296875, 0.0671844482421875, 0.07688140869140625, 0.086578369140625, 0.09627532958984375, 0.1059722900390625, 0.11566925048828125, 0.1253662109375, 0.13506317138671875, 0.1447601318359375, 0.15445709228515625, 0.164154052734375, 0.17385101318359375, 0.1835479736328125, 0.19324493408203125, 0.20294189453125, 0.21263885498046875, 0.2223358154296875, 0.23203277587890625, 0.241729736328125, 0.25142669677734375, 0.2611236572265625, 0.27082061767578125, 0.280517578125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 7.0, 15.0, 36.0, 36.0, 98.0, 218.0, 499.0, 1053.0, 2695.0, 8985.0, 52067.0, 591029.0, 348646.0, 32841.0, 6502.0, 2195.0, 844.0, 373.0, 210.0, 94.0, 46.0, 25.0, 12.0, 15.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.403564453125, -0.3923187255859375, -0.381072998046875, -0.3698272705078125, -0.35858154296875, -0.3473358154296875, -0.336090087890625, -0.3248443603515625, -0.3135986328125, -0.3023529052734375, -0.291107177734375, -0.2798614501953125, -0.26861572265625, -0.2573699951171875, -0.246124267578125, -0.2348785400390625, -0.2236328125, -0.2123870849609375, -0.201141357421875, -0.1898956298828125, -0.17864990234375, -0.1674041748046875, -0.156158447265625, -0.1449127197265625, -0.1336669921875, -0.1224212646484375, -0.111175537109375, -0.0999298095703125, -0.08868408203125, -0.0774383544921875, -0.066192626953125, -0.0549468994140625, -0.043701171875, -0.0324554443359375, -0.021209716796875, -0.0099639892578125, 0.00128173828125, 0.0125274658203125, 0.023773193359375, 0.0350189208984375, 0.0462646484375, 0.0575103759765625, 0.068756103515625, 0.0800018310546875, 0.09124755859375, 0.1024932861328125, 0.113739013671875, 0.1249847412109375, 0.13623046875, 0.1474761962890625, 0.158721923828125, 0.1699676513671875, 0.18121337890625, 0.1924591064453125, 0.203704833984375, 0.2149505615234375, 0.2261962890625, 0.2374420166015625, 0.248687744140625, 0.2599334716796875, 0.27117919921875, 0.2824249267578125, 0.293670654296875, 0.3049163818359375, 0.316162109375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 2.0, 9.0, 8.0, 17.0, 16.0, 29.0, 39.0, 40.0, 70.0, 64.0, 71.0, 89.0, 107.0, 71.0, 76.0, 52.0, 65.0, 54.0, 33.0, 32.0, 15.0, 16.0, 10.0, 3.0, 4.0, 3.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.823373794555664e-05, -5.536247044801712e-05, -5.24912029504776e-05, -4.961993545293808e-05, -4.674866795539856e-05, -4.387740045785904e-05, -4.100613296031952e-05, -3.813486546278e-05, -3.526359796524048e-05, -3.239233046770096e-05, -2.9521062970161438e-05, -2.6649795472621918e-05, -2.3778527975082397e-05, -2.0907260477542877e-05, -1.8035992980003357e-05, -1.5164725482463837e-05, -1.2293457984924316e-05, -9.422190487384796e-06, -6.550922989845276e-06, -3.6796554923057556e-06, -8.083879947662354e-07, 2.062879502773285e-06, 4.934147000312805e-06, 7.805414497852325e-06, 1.0676681995391846e-05, 1.3547949492931366e-05, 1.6419216990470886e-05, 1.9290484488010406e-05, 2.2161751985549927e-05, 2.5033019483089447e-05, 2.7904286980628967e-05, 3.077555447816849e-05, 3.364682197570801e-05, 3.651808947324753e-05, 3.938935697078705e-05, 4.226062446832657e-05, 4.513189196586609e-05, 4.800315946340561e-05, 5.087442696094513e-05, 5.374569445848465e-05, 5.661696195602417e-05, 5.948822945356369e-05, 6.235949695110321e-05, 6.523076444864273e-05, 6.810203194618225e-05, 7.097329944372177e-05, 7.384456694126129e-05, 7.671583443880081e-05, 7.958710193634033e-05, 8.245836943387985e-05, 8.532963693141937e-05, 8.820090442895889e-05, 9.107217192649841e-05, 9.394343942403793e-05, 9.681470692157745e-05, 9.968597441911697e-05, 0.0001025572419166565, 0.00010542850941419601, 0.00010829977691173553, 0.00011117104440927505, 0.00011404231190681458, 0.0001169135794043541, 0.00011978484690189362, 0.00012265611439943314, 0.00012552738189697266]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 11.0, 10.0, 13.0, 20.0, 24.0, 32.0, 42.0, 61.0, 99.0, 175.0, 264.0, 413.0, 787.0, 1561.0, 3146.0, 7159.0, 21334.0, 91505.0, 480619.0, 350121.0, 63289.0, 16188.0, 5934.0, 2727.0, 1277.0, 677.0, 394.0, 217.0, 145.0, 81.0, 59.0, 40.0, 33.0, 18.0, 27.0, 14.0, 11.0, 9.0, 6.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2467041015625, -0.23920249938964844, -0.23170089721679688, -0.2241992950439453, -0.21669769287109375, -0.2091960906982422, -0.20169448852539062, -0.19419288635253906, -0.1866912841796875, -0.17918968200683594, -0.17168807983398438, -0.1641864776611328, -0.15668487548828125, -0.1491832733154297, -0.14168167114257812, -0.13418006896972656, -0.126678466796875, -0.11917686462402344, -0.11167526245117188, -0.10417366027832031, -0.09667205810546875, -0.08917045593261719, -0.08166885375976562, -0.07416725158691406, -0.0666656494140625, -0.05916404724121094, -0.051662445068359375, -0.04416084289550781, -0.03665924072265625, -0.029157638549804688, -0.021656036376953125, -0.014154434204101562, -0.00665283203125, 0.0008487701416015625, 0.008350372314453125, 0.015851974487304688, 0.02335357666015625, 0.030855178833007812, 0.038356781005859375, 0.04585838317871094, 0.0533599853515625, 0.06086158752441406, 0.06836318969726562, 0.07586479187011719, 0.08336639404296875, 0.09086799621582031, 0.09836959838867188, 0.10587120056152344, 0.113372802734375, 0.12087440490722656, 0.12837600708007812, 0.1358776092529297, 0.14337921142578125, 0.1508808135986328, 0.15838241577148438, 0.16588401794433594, 0.1733856201171875, 0.18088722229003906, 0.18838882446289062, 0.1958904266357422, 0.20339202880859375, 0.2108936309814453, 0.21839523315429688, 0.22589683532714844, 0.2333984375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 1.0, 1.0, 3.0, 3.0, 4.0, 15.0, 9.0, 12.0, 12.0, 14.0, 29.0, 25.0, 33.0, 42.0, 45.0, 56.0, 74.0, 73.0, 98.0, 89.0, 60.0, 60.0, 36.0, 38.0, 31.0, 32.0, 21.0, 19.0, 18.0, 12.0, 5.0, 9.0, 4.0, 3.0, 6.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1318359375, -0.1268329620361328, -0.12182998657226562, -0.11682701110839844, -0.11182403564453125, -0.10682106018066406, -0.10181808471679688, -0.09681510925292969, -0.0918121337890625, -0.08680915832519531, -0.08180618286132812, -0.07680320739746094, -0.07180023193359375, -0.06679725646972656, -0.061794281005859375, -0.05679130554199219, -0.051788330078125, -0.04678535461425781, -0.041782379150390625, -0.03677940368652344, -0.03177642822265625, -0.026773452758789062, -0.021770477294921875, -0.016767501831054688, -0.0117645263671875, -0.0067615509033203125, -0.001758575439453125, 0.0032444000244140625, 0.00824737548828125, 0.013250350952148438, 0.018253326416015625, 0.023256301879882812, 0.02825927734375, 0.03326225280761719, 0.038265228271484375, 0.04326820373535156, 0.04827117919921875, 0.05327415466308594, 0.058277130126953125, 0.06328010559082031, 0.0682830810546875, 0.07328605651855469, 0.07828903198242188, 0.08329200744628906, 0.08829498291015625, 0.09329795837402344, 0.09830093383789062, 0.10330390930175781, 0.108306884765625, 0.11330986022949219, 0.11831283569335938, 0.12331581115722656, 0.12831878662109375, 0.13332176208496094, 0.13832473754882812, 0.1433277130126953, 0.1483306884765625, 0.1533336639404297, 0.15833663940429688, 0.16333961486816406, 0.16834259033203125, 0.17334556579589844, 0.17834854125976562, 0.1833515167236328, 0.1883544921875]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 5.0, 2.0, 3.0, 3.0, 4.0, 11.0, 26.0, 56.0, 88.0, 125.0, 129.0, 155.0, 138.0, 110.0, 62.0, 41.0, 20.0, 14.0, 8.0, 3.0, 5.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.39874267578125, -4.286345958709717, -4.173948764801025, -4.061552047729492, -3.949154853820801, -3.8367581367492676, -3.7243611812591553, -3.611964225769043, -3.4995672702789307, -3.3871703147888184, -3.274773359298706, -3.1623764038085938, -3.0499796867370605, -2.937582492828369, -2.825185775756836, -2.7127888202667236, -2.6003918647766113, -2.487994909286499, -2.3755979537963867, -2.2632009983062744, -2.150804042816162, -2.038407325744629, -1.9260103702545166, -1.8136134147644043, -1.701216459274292, -1.5888195037841797, -1.4764225482940674, -1.3640257120132446, -1.2516287565231323, -1.13923180103302, -1.0268349647521973, -0.914438009262085, -0.8020412921905518, -0.6896443367004395, -0.5772474408149719, -0.464850515127182, -0.3524535894393921, -0.24005663394927979, -0.12765973806381226, -0.015262842178344727, 0.09713411331176758, 0.2095310389995575, 0.3219279646873474, 0.43432489037513733, 0.5467218160629272, 0.6591187715530396, 0.7715156674385071, 0.8839125633239746, 0.9963095188140869, 1.1087064743041992, 1.2211034297943115, 1.3335002660751343, 1.4458972215652466, 1.5582941770553589, 1.6706910133361816, 1.783087968826294, 1.8954849243164062, 2.0078818798065186, 2.120278835296631, 2.232675790786743, 2.3450727462768555, 2.4574694633483887, 2.569866418838501, 2.6822633743286133, 2.7946603298187256]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 5.0, 2.0, 10.0, 6.0, 5.0, 12.0, 10.0, 3.0, 9.0, 18.0, 12.0, 16.0, 22.0, 18.0, 29.0, 29.0, 31.0, 37.0, 32.0, 36.0, 26.0, 45.0, 51.0, 43.0, 50.0, 40.0, 41.0, 43.0, 37.0, 25.0, 29.0, 24.0, 37.0, 20.0, 18.0, 15.0, 23.0, 11.0, 15.0, 17.0, 11.0, 11.0, 9.0, 4.0, 3.0, 4.0, 4.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.4752309322357178, -1.4266610145568848, -1.3780912160873413, -1.3295212984085083, -1.2809514999389648, -1.2323815822601318, -1.1838117837905884, -1.1352418661117554, -1.086672067642212, -1.038102149963379, -0.9895323514938354, -0.9409624934196472, -0.892392635345459, -0.8438227772712708, -0.7952529191970825, -0.7466830015182495, -0.6981131434440613, -0.649543285369873, -0.6009734272956848, -0.5524035692214966, -0.5038337111473083, -0.4552638530731201, -0.4066939651966095, -0.35812410712242126, -0.30955424904823303, -0.2609843909740448, -0.21241453289985657, -0.16384465992450714, -0.11527480185031891, -0.06670494377613068, -0.01813507080078125, 0.030434787273406982, 0.07900464534759521, 0.12757450342178345, 0.17614436149597168, 0.2247142344713211, 0.27328407764434814, 0.3218539357185364, 0.370423823595047, 0.41899368166923523, 0.46756353974342346, 0.5161334276199341, 0.5647032856941223, 0.6132731437683105, 0.6618430018424988, 0.710412859916687, 0.7589827179908752, 0.8075525760650635, 0.8561224341392517, 0.9046922922134399, 0.9532621502876282, 1.0018320083618164, 1.0504019260406494, 1.0989717245101929, 1.1475416421890259, 1.1961114406585693, 1.2446813583374023, 1.2932512760162354, 1.3418210744857788, 1.3903909921646118, 1.4389607906341553, 1.4875307083129883, 1.5361005067825317, 1.5846704244613647, 1.6332402229309082]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 6.0, 9.0, 9.0, 12.0, 12.0, 22.0, 33.0, 36.0, 63.0, 99.0, 140.0, 199.0, 358.0, 568.0, 1015.0, 2027.0, 4738.0, 16254.0, 210063.0, 3921801.0, 25198.0, 6140.0, 2485.0, 1142.0, 671.0, 392.0, 246.0, 165.0, 110.0, 70.0, 56.0, 29.0, 35.0, 21.0, 17.0, 16.0, 6.0, 5.0, 6.0, 2.0, 3.0, 5.0, 3.0, 1.0, 3.0], "bins": [-0.5751953125, -0.5601119995117188, -0.5450286865234375, -0.5299453735351562, -0.514862060546875, -0.49977874755859375, -0.4846954345703125, -0.46961212158203125, -0.45452880859375, -0.43944549560546875, -0.4243621826171875, -0.40927886962890625, -0.394195556640625, -0.37911224365234375, -0.3640289306640625, -0.34894561767578125, -0.3338623046875, -0.31877899169921875, -0.3036956787109375, -0.28861236572265625, -0.273529052734375, -0.25844573974609375, -0.2433624267578125, -0.22827911376953125, -0.21319580078125, -0.19811248779296875, -0.1830291748046875, -0.16794586181640625, -0.152862548828125, -0.13777923583984375, -0.1226959228515625, -0.10761260986328125, -0.092529296875, -0.07744598388671875, -0.0623626708984375, -0.04727935791015625, -0.032196044921875, -0.01711273193359375, -0.0020294189453125, 0.01305389404296875, 0.02813720703125, 0.04322052001953125, 0.0583038330078125, 0.07338714599609375, 0.088470458984375, 0.10355377197265625, 0.1186370849609375, 0.13372039794921875, 0.1488037109375, 0.16388702392578125, 0.1789703369140625, 0.19405364990234375, 0.209136962890625, 0.22422027587890625, 0.2393035888671875, 0.25438690185546875, 0.26947021484375, 0.28455352783203125, 0.2996368408203125, 0.31472015380859375, 0.329803466796875, 0.34488677978515625, 0.3599700927734375, 0.37505340576171875, 0.39013671875]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 5.0, 6.0, 11.0, 16.0, 18.0, 24.0, 23.0, 30.0, 41.0, 41.0, 46.0, 37.0, 50.0, 55.0, 39.0, 74.0, 36.0, 51.0, 44.0, 60.0, 55.0, 42.0, 41.0, 35.0, 26.0, 17.0, 25.0, 12.0, 15.0, 10.0, 7.0, 4.0, 3.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.061767578125, -0.059174537658691406, -0.05658149719238281, -0.05398845672607422, -0.051395416259765625, -0.04880237579345703, -0.04620933532714844, -0.043616294860839844, -0.04102325439453125, -0.038430213928222656, -0.03583717346191406, -0.03324413299560547, -0.030651092529296875, -0.02805805206298828, -0.025465011596679688, -0.022871971130371094, -0.0202789306640625, -0.017685890197753906, -0.015092849731445312, -0.012499809265136719, -0.009906768798828125, -0.007313728332519531, -0.0047206878662109375, -0.0021276473999023438, 0.00046539306640625, 0.0030584335327148438, 0.0056514739990234375, 0.008244514465332031, 0.010837554931640625, 0.013430595397949219, 0.016023635864257812, 0.018616676330566406, 0.021209716796875, 0.023802757263183594, 0.026395797729492188, 0.02898883819580078, 0.031581878662109375, 0.03417491912841797, 0.03676795959472656, 0.039361000061035156, 0.04195404052734375, 0.044547080993652344, 0.04714012145996094, 0.04973316192626953, 0.052326202392578125, 0.05491924285888672, 0.05751228332519531, 0.060105323791503906, 0.0626983642578125, 0.0652914047241211, 0.06788444519042969, 0.07047748565673828, 0.07307052612304688, 0.07566356658935547, 0.07825660705566406, 0.08084964752197266, 0.08344268798828125, 0.08603572845458984, 0.08862876892089844, 0.09122180938720703, 0.09381484985351562, 0.09640789031982422, 0.09900093078613281, 0.1015939712524414, 0.10418701171875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 5.0, 4.0, 13.0, 14.0, 14.0, 21.0, 28.0, 36.0, 38.0, 67.0, 117.0, 389.0, 2191.0, 40301.0, 4142022.0, 7632.0, 901.0, 226.0, 81.0, 64.0, 40.0, 31.0, 25.0, 12.0, 6.0, 7.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.53125, -2.452789306640625, -2.37432861328125, -2.295867919921875, -2.2174072265625, -2.138946533203125, -2.06048583984375, -1.982025146484375, -1.903564453125, -1.825103759765625, -1.74664306640625, -1.668182373046875, -1.5897216796875, -1.511260986328125, -1.43280029296875, -1.354339599609375, -1.27587890625, -1.197418212890625, -1.11895751953125, -1.040496826171875, -0.9620361328125, -0.883575439453125, -0.80511474609375, -0.726654052734375, -0.648193359375, -0.569732666015625, -0.49127197265625, -0.412811279296875, -0.3343505859375, -0.255889892578125, -0.17742919921875, -0.098968505859375, -0.0205078125, 0.057952880859375, 0.13641357421875, 0.214874267578125, 0.2933349609375, 0.371795654296875, 0.45025634765625, 0.528717041015625, 0.607177734375, 0.685638427734375, 0.76409912109375, 0.842559814453125, 0.9210205078125, 0.999481201171875, 1.07794189453125, 1.156402587890625, 1.23486328125, 1.313323974609375, 1.39178466796875, 1.470245361328125, 1.5487060546875, 1.627166748046875, 1.70562744140625, 1.784088134765625, 1.862548828125, 1.941009521484375, 2.01947021484375, 2.097930908203125, 2.1763916015625, 2.254852294921875, 2.33331298828125, 2.411773681640625, 2.490234375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 7.0, 18.0, 40.0, 135.0, 3645.0, 159.0, 33.0, 15.0, 9.0, 11.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.4248046875, -0.41640281677246094, -0.4080009460449219, -0.3995990753173828, -0.39119720458984375, -0.3827953338623047, -0.3743934631347656, -0.36599159240722656, -0.3575897216796875, -0.34918785095214844, -0.3407859802246094, -0.3323841094970703, -0.32398223876953125, -0.3155803680419922, -0.3071784973144531, -0.29877662658691406, -0.290374755859375, -0.28197288513183594, -0.2735710144042969, -0.2651691436767578, -0.25676727294921875, -0.2483654022216797, -0.23996353149414062, -0.23156166076660156, -0.2231597900390625, -0.21475791931152344, -0.20635604858398438, -0.1979541778564453, -0.18955230712890625, -0.1811504364013672, -0.17274856567382812, -0.16434669494628906, -0.15594482421875, -0.14754295349121094, -0.13914108276367188, -0.1307392120361328, -0.12233734130859375, -0.11393547058105469, -0.10553359985351562, -0.09713172912597656, -0.0887298583984375, -0.08032798767089844, -0.07192611694335938, -0.06352424621582031, -0.05512237548828125, -0.04672050476074219, -0.038318634033203125, -0.029916763305664062, -0.021514892578125, -0.013113021850585938, -0.004711151123046875, 0.0036907196044921875, 0.01209259033203125, 0.020494461059570312, 0.028896331787109375, 0.03729820251464844, 0.0457000732421875, 0.05410194396972656, 0.06250381469726562, 0.07090568542480469, 0.07930755615234375, 0.08770942687988281, 0.09611129760742188, 0.10451316833496094, 0.1129150390625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 6.0, 3.0, 5.0, 13.0, 7.0, 7.0, 16.0, 17.0, 30.0, 34.0, 53.0, 40.0, 77.0, 109.0, 110.0, 102.0, 106.0, 75.0, 67.0, 41.0, 20.0, 17.0, 18.0, 5.0, 8.0, 4.0, 7.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.6309416890144348, -0.6151684522628784, -0.5993952751159668, -0.5836220979690552, -0.5678488612174988, -0.5520756244659424, -0.5363024473190308, -0.5205292701721191, -0.5047560334205627, -0.48898282647132874, -0.4732096195220947, -0.4574364125728607, -0.4416632056236267, -0.4258899986743927, -0.4101167917251587, -0.3943435847759247, -0.3785703778266907, -0.36279717087745667, -0.34702396392822266, -0.33125075697898865, -0.31547755002975464, -0.29970434308052063, -0.2839311361312866, -0.2681579291820526, -0.2523847222328186, -0.2366115152835846, -0.22083830833435059, -0.20506510138511658, -0.18929189443588257, -0.17351868748664856, -0.15774548053741455, -0.14197227358818054, -0.1261991262435913, -0.1104259192943573, -0.09465271234512329, -0.07887950539588928, -0.06310629844665527, -0.047333091497421265, -0.031559884548187256, -0.015786677598953247, -1.3470649719238281e-05, 0.01575973629951477, 0.03153294324874878, 0.04730615019798279, 0.0630793571472168, 0.0788525640964508, 0.09462577104568481, 0.11039897799491882, 0.12617218494415283, 0.14194539189338684, 0.15771859884262085, 0.17349180579185486, 0.18926501274108887, 0.20503821969032288, 0.22081142663955688, 0.2365846335887909, 0.2523578405380249, 0.2681310474872589, 0.2839042544364929, 0.29967746138572693, 0.31545066833496094, 0.33122387528419495, 0.34699708223342896, 0.36277028918266296, 0.378543496131897]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 9.0, 10.0, 16.0, 15.0, 18.0, 19.0, 14.0, 16.0, 19.0, 16.0, 18.0, 20.0, 24.0, 26.0, 32.0, 28.0, 28.0, 27.0, 37.0, 40.0, 36.0, 34.0, 35.0, 35.0, 24.0, 30.0, 39.0, 23.0, 25.0, 31.0, 28.0, 19.0, 33.0, 23.0, 27.0, 26.0, 13.0, 17.0, 13.0, 7.0, 6.0, 9.0, 8.0, 6.0, 4.0, 2.0, 5.0, 2.0, 2.0, 4.0, 1.0, 1.0, 3.0, 2.0], "bins": [-0.2320060133934021, -0.22464530169963837, -0.21728459000587463, -0.2099238634109497, -0.20256315171718597, -0.19520244002342224, -0.18784171342849731, -0.18048100173473358, -0.17312029004096985, -0.16575957834720612, -0.15839886665344238, -0.15103814005851746, -0.14367742836475372, -0.13631671667099, -0.12895599007606506, -0.12159527838230133, -0.1142345666885376, -0.10687385499477386, -0.09951313585042953, -0.0921524167060852, -0.08479170501232147, -0.07743099331855774, -0.07007027417421341, -0.06270955502986908, -0.05534884333610535, -0.047988127917051315, -0.040627412497997284, -0.03326669707894325, -0.02590598165988922, -0.01854526624083519, -0.011184550821781158, -0.003823835402727127, 0.0035368800163269043, 0.010897595435380936, 0.018258310854434967, 0.025619026273489, 0.03297974169254303, 0.04034045711159706, 0.04770117253065109, 0.055061887949705124, 0.062422603368759155, 0.06978331506252289, 0.07714403420686722, 0.08450475335121155, 0.09186546504497528, 0.09922617673873901, 0.10658689588308334, 0.11394761502742767, 0.1213083267211914, 0.12866903841495514, 0.13602975010871887, 0.1433904767036438, 0.15075118839740753, 0.15811190009117126, 0.1654726266860962, 0.17283333837985992, 0.18019405007362366, 0.1875547617673874, 0.19491547346115112, 0.20227620005607605, 0.20963691174983978, 0.21699762344360352, 0.22435835003852844, 0.23171906173229218, 0.2390797734260559]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 5.0, 8.0, 7.0, 2.0, 6.0, 16.0, 12.0, 23.0, 22.0, 51.0, 55.0, 85.0, 116.0, 191.0, 310.0, 572.0, 1091.0, 2300.0, 4861.0, 11367.0, 26153.0, 62985.0, 147343.0, 282900.0, 270795.0, 135643.0, 58153.0, 24051.0, 10379.0, 4473.0, 2156.0, 1032.0, 521.0, 293.0, 208.0, 100.0, 86.0, 40.0, 46.0, 21.0, 24.0, 15.0, 11.0, 13.0, 6.0, 8.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.222900390625, -0.2156982421875, -0.20849609375, -0.2012939453125, -0.194091796875, -0.1868896484375, -0.1796875, -0.1724853515625, -0.165283203125, -0.1580810546875, -0.15087890625, -0.1436767578125, -0.136474609375, -0.1292724609375, -0.1220703125, -0.1148681640625, -0.107666015625, -0.1004638671875, -0.09326171875, -0.0860595703125, -0.078857421875, -0.0716552734375, -0.064453125, -0.0572509765625, -0.050048828125, -0.0428466796875, -0.03564453125, -0.0284423828125, -0.021240234375, -0.0140380859375, -0.0068359375, 0.0003662109375, 0.007568359375, 0.0147705078125, 0.02197265625, 0.0291748046875, 0.036376953125, 0.0435791015625, 0.05078125, 0.0579833984375, 0.065185546875, 0.0723876953125, 0.07958984375, 0.0867919921875, 0.093994140625, 0.1011962890625, 0.1083984375, 0.1156005859375, 0.122802734375, 0.1300048828125, 0.13720703125, 0.1444091796875, 0.151611328125, 0.1588134765625, 0.166015625, 0.1732177734375, 0.180419921875, 0.1876220703125, 0.19482421875, 0.2020263671875, 0.209228515625, 0.2164306640625, 0.2236328125, 0.2308349609375, 0.238037109375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 3.0, 7.0, 8.0, 14.0, 12.0, 14.0, 16.0, 26.0, 22.0, 23.0, 24.0, 43.0, 39.0, 37.0, 39.0, 50.0, 49.0, 42.0, 58.0, 60.0, 50.0, 43.0, 49.0, 40.0, 37.0, 34.0, 26.0, 31.0, 23.0, 17.0, 19.0, 12.0, 12.0, 8.0, 7.0, 1.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07659912109375, -0.07368755340576172, -0.07077598571777344, -0.06786441802978516, -0.06495285034179688, -0.062041282653808594, -0.05912971496582031, -0.05621814727783203, -0.05330657958984375, -0.05039501190185547, -0.04748344421386719, -0.044571876525878906, -0.041660308837890625, -0.038748741149902344, -0.03583717346191406, -0.03292560577392578, -0.0300140380859375, -0.02710247039794922, -0.024190902709960938, -0.021279335021972656, -0.018367767333984375, -0.015456199645996094, -0.012544631958007812, -0.009633064270019531, -0.00672149658203125, -0.0038099288940429688, -0.0008983612060546875, 0.0020132064819335938, 0.004924774169921875, 0.007836341857910156, 0.010747909545898438, 0.013659477233886719, 0.016571044921875, 0.01948261260986328, 0.022394180297851562, 0.025305747985839844, 0.028217315673828125, 0.031128883361816406, 0.03404045104980469, 0.03695201873779297, 0.03986358642578125, 0.04277515411376953, 0.04568672180175781, 0.048598289489746094, 0.051509857177734375, 0.054421424865722656, 0.05733299255371094, 0.06024456024169922, 0.0631561279296875, 0.06606769561767578, 0.06897926330566406, 0.07189083099365234, 0.07480239868164062, 0.0777139663696289, 0.08062553405761719, 0.08353710174560547, 0.08644866943359375, 0.08936023712158203, 0.09227180480957031, 0.0951833724975586, 0.09809494018554688, 0.10100650787353516, 0.10391807556152344, 0.10682964324951172, 0.1097412109375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 8.0, 2.0, 7.0, 6.0, 8.0, 17.0, 17.0, 36.0, 32.0, 50.0, 67.0, 103.0, 140.0, 188.0, 262.0, 364.0, 619.0, 1067.0, 2330.0, 5616.0, 16865.0, 63173.0, 287724.0, 496609.0, 126590.0, 30201.0, 9188.0, 3375.0, 1489.0, 785.0, 480.0, 356.0, 204.0, 178.0, 113.0, 73.0, 42.0, 49.0, 38.0, 22.0, 25.0, 16.0, 7.0, 8.0, 2.0, 2.0, 4.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.38525390625, -0.3736610412597656, -0.36206817626953125, -0.3504753112792969, -0.3388824462890625, -0.3272895812988281, -0.31569671630859375, -0.3041038513183594, -0.292510986328125, -0.2809181213378906, -0.26932525634765625, -0.2577323913574219, -0.2461395263671875, -0.23454666137695312, -0.22295379638671875, -0.21136093139648438, -0.19976806640625, -0.18817520141601562, -0.17658233642578125, -0.16498947143554688, -0.1533966064453125, -0.14180374145507812, -0.13021087646484375, -0.11861801147460938, -0.107025146484375, -0.09543228149414062, -0.08383941650390625, -0.07224655151367188, -0.0606536865234375, -0.049060821533203125, -0.03746795654296875, -0.025875091552734375, -0.0142822265625, -0.002689361572265625, 0.00890350341796875, 0.020496368408203125, 0.0320892333984375, 0.043682098388671875, 0.05527496337890625, 0.06686782836914062, 0.078460693359375, 0.09005355834960938, 0.10164642333984375, 0.11323928833007812, 0.1248321533203125, 0.13642501831054688, 0.14801788330078125, 0.15961074829101562, 0.17120361328125, 0.18279647827148438, 0.19438934326171875, 0.20598220825195312, 0.2175750732421875, 0.22916793823242188, 0.24076080322265625, 0.2523536682128906, 0.263946533203125, 0.2755393981933594, 0.28713226318359375, 0.2987251281738281, 0.3103179931640625, 0.3219108581542969, 0.33350372314453125, 0.3450965881347656, 0.356689453125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 8.0, 8.0, 9.0, 7.0, 12.0, 17.0, 24.0, 28.0, 26.0, 30.0, 31.0, 46.0, 37.0, 49.0, 58.0, 59.0, 54.0, 49.0, 55.0, 43.0, 35.0, 50.0, 44.0, 37.0, 23.0, 25.0, 26.0, 27.0, 27.0, 18.0, 9.0, 11.0, 8.0, 3.0, 6.0, 0.0, 3.0, 3.0, 1.0, 2.0, 1.0], "bins": [-0.6376953125, -0.621856689453125, -0.60601806640625, -0.590179443359375, -0.5743408203125, -0.558502197265625, -0.54266357421875, -0.526824951171875, -0.510986328125, -0.495147705078125, -0.47930908203125, -0.463470458984375, -0.4476318359375, -0.431793212890625, -0.41595458984375, -0.400115966796875, -0.38427734375, -0.368438720703125, -0.35260009765625, -0.336761474609375, -0.3209228515625, -0.305084228515625, -0.28924560546875, -0.273406982421875, -0.257568359375, -0.241729736328125, -0.22589111328125, -0.210052490234375, -0.1942138671875, -0.178375244140625, -0.16253662109375, -0.146697998046875, -0.130859375, -0.115020751953125, -0.09918212890625, -0.083343505859375, -0.0675048828125, -0.051666259765625, -0.03582763671875, -0.019989013671875, -0.004150390625, 0.011688232421875, 0.02752685546875, 0.043365478515625, 0.0592041015625, 0.075042724609375, 0.09088134765625, 0.106719970703125, 0.12255859375, 0.138397216796875, 0.15423583984375, 0.170074462890625, 0.1859130859375, 0.201751708984375, 0.21759033203125, 0.233428955078125, 0.249267578125, 0.265106201171875, 0.28094482421875, 0.296783447265625, 0.3126220703125, 0.328460693359375, 0.34429931640625, 0.360137939453125, 0.3759765625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 4.0, 2.0, 5.0, 6.0, 10.0, 13.0, 14.0, 17.0, 37.0, 59.0, 88.0, 152.0, 227.0, 553.0, 1336.0, 3544.0, 12259.0, 58474.0, 413467.0, 471729.0, 66589.0, 13389.0, 3829.0, 1415.0, 643.0, 289.0, 162.0, 82.0, 41.0, 45.0, 19.0, 13.0, 20.0, 8.0, 7.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2313232421875, -0.2233562469482422, -0.21538925170898438, -0.20742225646972656, -0.19945526123046875, -0.19148826599121094, -0.18352127075195312, -0.1755542755126953, -0.1675872802734375, -0.1596202850341797, -0.15165328979492188, -0.14368629455566406, -0.13571929931640625, -0.12775230407714844, -0.11978530883789062, -0.11181831359863281, -0.103851318359375, -0.09588432312011719, -0.08791732788085938, -0.07995033264160156, -0.07198333740234375, -0.06401634216308594, -0.056049346923828125, -0.04808235168457031, -0.0401153564453125, -0.03214836120605469, -0.024181365966796875, -0.016214370727539062, -0.00824737548828125, -0.0002803802490234375, 0.007686614990234375, 0.015653610229492188, 0.02362060546875, 0.03158760070800781, 0.039554595947265625, 0.04752159118652344, 0.05548858642578125, 0.06345558166503906, 0.07142257690429688, 0.07938957214355469, 0.0873565673828125, 0.09532356262207031, 0.10329055786132812, 0.11125755310058594, 0.11922454833984375, 0.12719154357910156, 0.13515853881835938, 0.1431255340576172, 0.151092529296875, 0.1590595245361328, 0.16702651977539062, 0.17499351501464844, 0.18296051025390625, 0.19092750549316406, 0.19889450073242188, 0.2068614959716797, 0.2148284912109375, 0.2227954864501953, 0.23076248168945312, 0.23872947692871094, 0.24669647216796875, 0.25466346740722656, 0.2626304626464844, 0.2705974578857422, 0.278564453125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 6.0, 6.0, 7.0, 6.0, 19.0, 21.0, 19.0, 32.0, 33.0, 49.0, 61.0, 49.0, 80.0, 69.0, 80.0, 78.0, 75.0, 66.0, 50.0, 30.0, 34.0, 25.0, 30.0, 22.0, 16.0, 16.0, 9.0, 2.0, 4.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.683038711547852e-05, -7.431674748659134e-05, -7.180310785770416e-05, -6.928946822881699e-05, -6.677582859992981e-05, -6.426218897104263e-05, -6.174854934215546e-05, -5.923490971326828e-05, -5.6721270084381104e-05, -5.420763045549393e-05, -5.169399082660675e-05, -4.9180351197719574e-05, -4.66667115688324e-05, -4.415307193994522e-05, -4.1639432311058044e-05, -3.912579268217087e-05, -3.661215305328369e-05, -3.4098513424396515e-05, -3.158487379550934e-05, -2.9071234166622162e-05, -2.6557594537734985e-05, -2.404395490884781e-05, -2.1530315279960632e-05, -1.9016675651073456e-05, -1.650303602218628e-05, -1.3989396393299103e-05, -1.1475756764411926e-05, -8.96211713552475e-06, -6.448477506637573e-06, -3.934837877750397e-06, -1.4211982488632202e-06, 1.0924413800239563e-06, 3.606081008911133e-06, 6.119720637798309e-06, 8.633360266685486e-06, 1.1146999895572662e-05, 1.3660639524459839e-05, 1.6174279153347015e-05, 1.8687918782234192e-05, 2.120155841112137e-05, 2.3715198040008545e-05, 2.622883766889572e-05, 2.8742477297782898e-05, 3.1256116926670074e-05, 3.376975655555725e-05, 3.628339618444443e-05, 3.8797035813331604e-05, 4.131067544221878e-05, 4.382431507110596e-05, 4.6337954699993134e-05, 4.885159432888031e-05, 5.1365233957767487e-05, 5.387887358665466e-05, 5.639251321554184e-05, 5.8906152844429016e-05, 6.141979247331619e-05, 6.393343210220337e-05, 6.644707173109055e-05, 6.896071135997772e-05, 7.14743509888649e-05, 7.398799061775208e-05, 7.650163024663925e-05, 7.901526987552643e-05, 8.15289095044136e-05, 8.404254913330078e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 3.0, 4.0, 13.0, 13.0, 34.0, 39.0, 90.0, 188.0, 325.0, 879.0, 2306.0, 8352.0, 49440.0, 574368.0, 371114.0, 31940.0, 6236.0, 1889.0, 682.0, 281.0, 171.0, 69.0, 41.0, 27.0, 19.0, 14.0, 6.0, 5.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.342041015625, -0.33097076416015625, -0.3199005126953125, -0.30883026123046875, -0.297760009765625, -0.28668975830078125, -0.2756195068359375, -0.26454925537109375, -0.25347900390625, -0.24240875244140625, -0.2313385009765625, -0.22026824951171875, -0.209197998046875, -0.19812774658203125, -0.1870574951171875, -0.17598724365234375, -0.1649169921875, -0.15384674072265625, -0.1427764892578125, -0.13170623779296875, -0.120635986328125, -0.10956573486328125, -0.0984954833984375, -0.08742523193359375, -0.07635498046875, -0.06528472900390625, -0.0542144775390625, -0.04314422607421875, -0.032073974609375, -0.02100372314453125, -0.0099334716796875, 0.00113677978515625, 0.01220703125, 0.02327728271484375, 0.0343475341796875, 0.04541778564453125, 0.056488037109375, 0.06755828857421875, 0.0786285400390625, 0.08969879150390625, 0.10076904296875, 0.11183929443359375, 0.1229095458984375, 0.13397979736328125, 0.145050048828125, 0.15612030029296875, 0.1671905517578125, 0.17826080322265625, 0.1893310546875, 0.20040130615234375, 0.2114715576171875, 0.22254180908203125, 0.233612060546875, 0.24468231201171875, 0.2557525634765625, 0.26682281494140625, 0.27789306640625, 0.28896331787109375, 0.3000335693359375, 0.31110382080078125, 0.322174072265625, 0.33324432373046875, 0.3443145751953125, 0.35538482666015625, 0.366455078125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 8.0, 8.0, 14.0, 16.0, 29.0, 38.0, 54.0, 83.0, 117.0, 103.0, 115.0, 114.0, 97.0, 68.0, 49.0, 28.0, 15.0, 19.0, 10.0, 4.0, 2.0, 0.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.3974609375, -0.38864898681640625, -0.3798370361328125, -0.37102508544921875, -0.362213134765625, -0.35340118408203125, -0.3445892333984375, -0.33577728271484375, -0.32696533203125, -0.31815338134765625, -0.3093414306640625, -0.30052947998046875, -0.291717529296875, -0.28290557861328125, -0.2740936279296875, -0.26528167724609375, -0.2564697265625, -0.24765777587890625, -0.2388458251953125, -0.23003387451171875, -0.221221923828125, -0.21240997314453125, -0.2035980224609375, -0.19478607177734375, -0.18597412109375, -0.17716217041015625, -0.1683502197265625, -0.15953826904296875, -0.150726318359375, -0.14191436767578125, -0.1331024169921875, -0.12429046630859375, -0.115478515625, -0.10666656494140625, -0.0978546142578125, -0.08904266357421875, -0.080230712890625, -0.07141876220703125, -0.0626068115234375, -0.05379486083984375, -0.04498291015625, -0.03617095947265625, -0.0273590087890625, -0.01854705810546875, -0.009735107421875, -0.00092315673828125, 0.0078887939453125, 0.01670074462890625, 0.0255126953125, 0.03432464599609375, 0.0431365966796875, 0.05194854736328125, 0.060760498046875, 0.06957244873046875, 0.0783843994140625, 0.08719635009765625, 0.09600830078125, 0.10482025146484375, 0.1136322021484375, 0.12244415283203125, 0.131256103515625, 0.14006805419921875, 0.1488800048828125, 0.15769195556640625, 0.16650390625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 7.0, 6.0, 11.0, 26.0, 49.0, 63.0, 133.0, 130.0, 154.0, 145.0, 106.0, 66.0, 50.0, 20.0, 14.0, 8.0, 7.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7330493927001953, -2.610830068588257, -2.4886107444763184, -2.366391181945801, -2.2441718578338623, -2.121952533721924, -1.9997330904006958, -1.8775136470794678, -1.7552943229675293, -1.6330749988555908, -1.5108555555343628, -1.3886361122131348, -1.2664167881011963, -1.1441974639892578, -1.0219780206680298, -0.8997586369514465, -0.7775392532348633, -0.65531986951828, -0.5331004858016968, -0.4108811020851135, -0.2886617183685303, -0.16644233465194702, -0.04422295093536377, 0.07799643278121948, 0.20021581649780273, 0.322435200214386, 0.44465458393096924, 0.5668739676475525, 0.6890933513641357, 0.811312735080719, 0.9335321187973022, 1.0557515621185303, 1.1779708862304688, 1.3001902103424072, 1.4224096536636353, 1.5446290969848633, 1.6668484210968018, 1.7890677452087402, 1.9112871885299683, 2.0335066318511963, 2.1557259559631348, 2.2779452800750732, 2.4001646041870117, 2.5223841667175293, 2.6446034908294678, 2.7668228149414062, 2.889042377471924, 3.0112617015838623, 3.133481025695801, 3.2557003498077393, 3.3779196739196777, 3.5001392364501953, 3.622358560562134, 3.7445778846740723, 3.86679744720459, 3.9890167713165283, 4.111236095428467, 4.233455657958984, 4.355674743652344, 4.477894306182861, 4.600113868713379, 4.722332954406738, 4.844552516937256, 4.966771602630615, 5.088991165161133]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 7.0, 3.0, 7.0, 5.0, 8.0, 8.0, 8.0, 17.0, 16.0, 17.0, 23.0, 32.0, 14.0, 20.0, 26.0, 32.0, 49.0, 47.0, 30.0, 47.0, 42.0, 49.0, 43.0, 40.0, 27.0, 39.0, 35.0, 56.0, 27.0, 35.0, 29.0, 22.0, 19.0, 22.0, 22.0, 10.0, 8.0, 7.0, 11.0, 12.0, 6.0, 7.0, 7.0, 4.0, 4.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0], "bins": [-2.189267158508301, -2.1211721897125244, -2.053077220916748, -1.9849822521209717, -1.9168872833251953, -1.848792314529419, -1.780697226524353, -1.7126022577285767, -1.6445072889328003, -1.576412320137024, -1.5083173513412476, -1.4402223825454712, -1.3721272945404053, -1.304032325744629, -1.2359373569488525, -1.1678423881530762, -1.0997474193572998, -1.0316524505615234, -0.9635574817657471, -0.8954624533653259, -0.8273674845695496, -0.7592725157737732, -0.691177487373352, -0.6230825185775757, -0.5549875497817993, -0.48689258098602295, -0.4187975823879242, -0.35070258378982544, -0.2826076149940491, -0.2145126461982727, -0.14641764760017395, -0.0783226490020752, -0.010227680206298828, 0.05786730349063873, 0.1259622871875763, 0.19405727088451385, 0.2621522545814514, 0.3302472233772278, 0.39834222197532654, 0.4664372205734253, 0.5345321893692017, 0.602627158164978, 0.6707221269607544, 0.7388171553611755, 0.8069121241569519, 0.8750070929527283, 0.9431021213531494, 1.0111970901489258, 1.0792920589447021, 1.1473870277404785, 1.2154819965362549, 1.2835769653320312, 1.3516719341278076, 1.419766902923584, 1.48786199092865, 1.5559569597244263, 1.6240519285202026, 1.692146897315979, 1.7602418661117554, 1.8283368349075317, 1.8964319229125977, 1.964526891708374, 2.0326218605041504, 2.1007168292999268, 2.168811798095703]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 6.0, 5.0, 10.0, 13.0, 15.0, 29.0, 34.0, 50.0, 80.0, 116.0, 194.0, 302.0, 506.0, 1023.0, 2413.0, 8373.0, 73473.0, 4072426.0, 26637.0, 5008.0, 1654.0, 766.0, 415.0, 241.0, 169.0, 100.0, 64.0, 47.0, 33.0, 24.0, 22.0, 12.0, 15.0, 3.0, 7.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53271484375, -0.5124740600585938, -0.4922332763671875, -0.47199249267578125, -0.451751708984375, -0.43151092529296875, -0.4112701416015625, -0.39102935791015625, -0.37078857421875, -0.35054779052734375, -0.3303070068359375, -0.31006622314453125, -0.289825439453125, -0.26958465576171875, -0.2493438720703125, -0.22910308837890625, -0.2088623046875, -0.18862152099609375, -0.1683807373046875, -0.14813995361328125, -0.127899169921875, -0.10765838623046875, -0.0874176025390625, -0.06717681884765625, -0.04693603515625, -0.02669525146484375, -0.0064544677734375, 0.01378631591796875, 0.034027099609375, 0.05426788330078125, 0.0745086669921875, 0.09474945068359375, 0.114990234375, 0.13523101806640625, 0.1554718017578125, 0.17571258544921875, 0.195953369140625, 0.21619415283203125, 0.2364349365234375, 0.25667572021484375, 0.27691650390625, 0.29715728759765625, 0.3173980712890625, 0.33763885498046875, 0.357879638671875, 0.37812042236328125, 0.3983612060546875, 0.41860198974609375, 0.4388427734375, 0.45908355712890625, 0.4793243408203125, 0.49956512451171875, 0.519805908203125, 0.5400466918945312, 0.5602874755859375, 0.5805282592773438, 0.60076904296875, 0.6210098266601562, 0.6412506103515625, 0.6614913940429688, 0.681732177734375, 0.7019729614257812, 0.7222137451171875, 0.7424545288085938, 0.7626953125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 8.0, 6.0, 5.0, 12.0, 13.0, 15.0, 20.0, 24.0, 29.0, 48.0, 46.0, 55.0, 47.0, 51.0, 50.0, 60.0, 57.0, 58.0, 61.0, 54.0, 48.0, 56.0, 27.0, 22.0, 34.0, 25.0, 14.0, 19.0, 9.0, 4.0, 6.0, 5.0, 5.0, 0.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1077880859375, -0.10442638397216797, -0.10106468200683594, -0.0977029800415039, -0.09434127807617188, -0.09097957611083984, -0.08761787414550781, -0.08425617218017578, -0.08089447021484375, -0.07753276824951172, -0.07417106628417969, -0.07080936431884766, -0.06744766235351562, -0.0640859603881836, -0.06072425842285156, -0.05736255645751953, -0.0540008544921875, -0.05063915252685547, -0.04727745056152344, -0.043915748596191406, -0.040554046630859375, -0.037192344665527344, -0.03383064270019531, -0.03046894073486328, -0.02710723876953125, -0.02374553680419922, -0.020383834838867188, -0.017022132873535156, -0.013660430908203125, -0.010298728942871094, -0.0069370269775390625, -0.0035753250122070312, -0.000213623046875, 0.0031480789184570312, 0.0065097808837890625, 0.009871482849121094, 0.013233184814453125, 0.016594886779785156, 0.019956588745117188, 0.02331829071044922, 0.02667999267578125, 0.03004169464111328, 0.03340339660644531, 0.036765098571777344, 0.040126800537109375, 0.043488502502441406, 0.04685020446777344, 0.05021190643310547, 0.0535736083984375, 0.05693531036376953, 0.06029701232910156, 0.0636587142944336, 0.06702041625976562, 0.07038211822509766, 0.07374382019042969, 0.07710552215576172, 0.08046722412109375, 0.08382892608642578, 0.08719062805175781, 0.09055233001708984, 0.09391403198242188, 0.0972757339477539, 0.10063743591308594, 0.10399913787841797, 0.10736083984375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 2.0, 6.0, 5.0, 5.0, 4.0, 11.0, 9.0, 19.0, 20.0, 25.0, 34.0, 28.0, 44.0, 53.0, 72.0, 93.0, 155.0, 224.0, 342.0, 586.0, 973.0, 1878.0, 4071.0, 11605.0, 64638.0, 4020659.0, 68134.0, 11782.0, 4168.0, 1910.0, 1034.0, 564.0, 341.0, 239.0, 142.0, 81.0, 76.0, 44.0, 44.0, 30.0, 36.0, 21.0, 23.0, 14.0, 10.0, 7.0, 7.0, 6.0, 8.0, 4.0, 2.0, 2.0, 4.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6220703125, -0.6009902954101562, -0.5799102783203125, -0.5588302612304688, -0.537750244140625, -0.5166702270507812, -0.4955902099609375, -0.47451019287109375, -0.45343017578125, -0.43235015869140625, -0.4112701416015625, -0.39019012451171875, -0.369110107421875, -0.34803009033203125, -0.3269500732421875, -0.30587005615234375, -0.2847900390625, -0.26371002197265625, -0.2426300048828125, -0.22154998779296875, -0.200469970703125, -0.17938995361328125, -0.1583099365234375, -0.13722991943359375, -0.11614990234375, -0.09506988525390625, -0.0739898681640625, -0.05290985107421875, -0.031829833984375, -0.01074981689453125, 0.0103302001953125, 0.03141021728515625, 0.052490234375, 0.07357025146484375, 0.0946502685546875, 0.11573028564453125, 0.136810302734375, 0.15789031982421875, 0.1789703369140625, 0.20005035400390625, 0.22113037109375, 0.24221038818359375, 0.2632904052734375, 0.28437042236328125, 0.305450439453125, 0.32653045654296875, 0.3476104736328125, 0.36869049072265625, 0.3897705078125, 0.41085052490234375, 0.4319305419921875, 0.45301055908203125, 0.474090576171875, 0.49517059326171875, 0.5162506103515625, 0.5373306274414062, 0.55841064453125, 0.5794906616210938, 0.6005706787109375, 0.6216506958007812, 0.642730712890625, 0.6638107299804688, 0.6848907470703125, 0.7059707641601562, 0.72705078125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 5.0, 7.0, 16.0, 14.0, 31.0, 59.0, 182.0, 3318.0, 268.0, 76.0, 35.0, 14.0, 11.0, 9.0, 7.0, 3.0, 4.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.11273193359375, -0.10774517059326172, -0.10275840759277344, -0.09777164459228516, -0.09278488159179688, -0.0877981185913086, -0.08281135559082031, -0.07782459259033203, -0.07283782958984375, -0.06785106658935547, -0.06286430358886719, -0.057877540588378906, -0.052890777587890625, -0.047904014587402344, -0.04291725158691406, -0.03793048858642578, -0.0329437255859375, -0.02795696258544922, -0.022970199584960938, -0.017983436584472656, -0.012996673583984375, -0.008009910583496094, -0.0030231475830078125, 0.0019636154174804688, 0.00695037841796875, 0.011937141418457031, 0.016923904418945312, 0.021910667419433594, 0.026897430419921875, 0.031884193420410156, 0.03687095642089844, 0.04185771942138672, 0.046844482421875, 0.05183124542236328, 0.05681800842285156, 0.061804771423339844, 0.06679153442382812, 0.0717782974243164, 0.07676506042480469, 0.08175182342529297, 0.08673858642578125, 0.09172534942626953, 0.09671211242675781, 0.1016988754272461, 0.10668563842773438, 0.11167240142822266, 0.11665916442871094, 0.12164592742919922, 0.1266326904296875, 0.13161945343017578, 0.13660621643066406, 0.14159297943115234, 0.14657974243164062, 0.1515665054321289, 0.1565532684326172, 0.16154003143310547, 0.16652679443359375, 0.17151355743408203, 0.1765003204345703, 0.1814870834350586, 0.18647384643554688, 0.19146060943603516, 0.19644737243652344, 0.20143413543701172, 0.2064208984375]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 5.0, 5.0, 13.0, 21.0, 43.0, 33.0, 62.0, 57.0, 89.0, 98.0, 109.0, 102.0, 82.0, 55.0, 56.0, 49.0, 24.0, 29.0, 19.0, 11.0, 12.0, 4.0, 9.0, 2.0, 5.0, 0.0, 5.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36404624581336975, -0.34841758012771606, -0.33278894424438477, -0.3171602785587311, -0.3015316128730774, -0.2859029769897461, -0.2702743113040924, -0.2546456456184387, -0.23901700973510742, -0.22338835895061493, -0.20775970816612244, -0.19213104248046875, -0.17650239169597626, -0.16087374091148376, -0.14524507522583008, -0.12961642444133759, -0.11398777365684509, -0.0983591228723526, -0.08273046463727951, -0.06710180640220642, -0.05147315561771393, -0.035844504833221436, -0.020215846598148346, -0.004587188363075256, 0.011041462421417236, 0.026670116931200027, 0.04229877144098282, 0.05792742595076561, 0.0735560804605484, 0.0891847312450409, 0.10481338948011398, 0.12044204771518707, 0.13607066869735718, 0.15169931948184967, 0.16732797026634216, 0.18295663595199585, 0.19858528673648834, 0.21421393752098083, 0.22984260320663452, 0.24547125399112701, 0.2610999047756195, 0.2767285704612732, 0.2923572063446045, 0.3079858720302582, 0.32361453771591187, 0.33924317359924316, 0.35487183928489685, 0.37050050497055054, 0.38612914085388184, 0.4017578065395355, 0.4173864424228668, 0.4330151081085205, 0.4486437439918518, 0.4642724096775055, 0.4799010753631592, 0.4955297112464905, 0.5111583471298218, 0.5267869830131531, 0.5424156785011292, 0.5580443143844604, 0.5736729502677917, 0.589301586151123, 0.6049302816390991, 0.6205589175224304, 0.6361876130104065]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 2.0, 6.0, 2.0, 5.0, 11.0, 7.0, 10.0, 13.0, 19.0, 19.0, 28.0, 22.0, 27.0, 24.0, 24.0, 29.0, 34.0, 39.0, 42.0, 41.0, 45.0, 34.0, 51.0, 45.0, 44.0, 42.0, 37.0, 26.0, 41.0, 31.0, 25.0, 17.0, 19.0, 18.0, 12.0, 28.0, 14.0, 7.0, 16.0, 12.0, 10.0, 4.0, 12.0, 6.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.30475783348083496, -0.29590699076652527, -0.2870561480522156, -0.2782053053379059, -0.2693544626235962, -0.2605036199092865, -0.2516527771949768, -0.24280193448066711, -0.23395109176635742, -0.22510024905204773, -0.21624940633773804, -0.20739856362342834, -0.19854772090911865, -0.18969687819480896, -0.18084603548049927, -0.17199519276618958, -0.16314436495304108, -0.15429352223873138, -0.1454426795244217, -0.136591836810112, -0.1277409940958023, -0.11889015138149261, -0.11003931611776352, -0.10118847340345383, -0.09233763068914413, -0.08348678797483444, -0.07463594526052475, -0.06578510999679565, -0.05693426355719566, -0.04808342084288597, -0.03923258185386658, -0.030381739139556885, -0.021530896425247192, -0.012680054642260075, -0.003829212859272957, 0.005021627992391586, 0.013872470706701279, 0.02272331342101097, 0.031574152410030365, 0.04042499512434006, 0.04927583783864975, 0.05812668055295944, 0.06697752326726913, 0.07582835853099823, 0.08467920124530792, 0.09353004395961761, 0.10238088667392731, 0.111231729388237, 0.12008257210254669, 0.12893341481685638, 0.13778425753116608, 0.14663510024547577, 0.15548594295978546, 0.16433678567409515, 0.17318761348724365, 0.18203845620155334, 0.19088929891586304, 0.19974014163017273, 0.20859098434448242, 0.21744182705879211, 0.2262926697731018, 0.2351435124874115, 0.2439943552017212, 0.2528451979160309, 0.2616960406303406]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 7.0, 5.0, 7.0, 14.0, 13.0, 37.0, 39.0, 84.0, 129.0, 216.0, 402.0, 774.0, 1642.0, 4061.0, 11306.0, 37876.0, 161177.0, 515222.0, 237660.0, 53549.0, 14977.0, 5150.0, 2164.0, 947.0, 448.0, 260.0, 136.0, 83.0, 58.0, 30.0, 22.0, 24.0, 18.0, 9.0, 6.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.351806640625, -0.3406829833984375, -0.329559326171875, -0.3184356689453125, -0.30731201171875, -0.2961883544921875, -0.285064697265625, -0.2739410400390625, -0.2628173828125, -0.2516937255859375, -0.240570068359375, -0.2294464111328125, -0.21832275390625, -0.2071990966796875, -0.196075439453125, -0.1849517822265625, -0.173828125, -0.1627044677734375, -0.151580810546875, -0.1404571533203125, -0.12933349609375, -0.1182098388671875, -0.107086181640625, -0.0959625244140625, -0.0848388671875, -0.0737152099609375, -0.062591552734375, -0.0514678955078125, -0.04034423828125, -0.0292205810546875, -0.018096923828125, -0.0069732666015625, 0.004150390625, 0.0152740478515625, 0.026397705078125, 0.0375213623046875, 0.04864501953125, 0.0597686767578125, 0.070892333984375, 0.0820159912109375, 0.0931396484375, 0.1042633056640625, 0.115386962890625, 0.1265106201171875, 0.13763427734375, 0.1487579345703125, 0.159881591796875, 0.1710052490234375, 0.18212890625, 0.1932525634765625, 0.204376220703125, 0.2154998779296875, 0.22662353515625, 0.2377471923828125, 0.248870849609375, 0.2599945068359375, 0.2711181640625, 0.2822418212890625, 0.293365478515625, 0.3044891357421875, 0.31561279296875, 0.3267364501953125, 0.337860107421875, 0.3489837646484375, 0.360107421875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 6.0, 4.0, 7.0, 8.0, 8.0, 22.0, 12.0, 19.0, 22.0, 37.0, 27.0, 30.0, 37.0, 59.0, 46.0, 45.0, 50.0, 62.0, 68.0, 43.0, 64.0, 52.0, 37.0, 41.0, 33.0, 23.0, 31.0, 17.0, 28.0, 19.0, 17.0, 8.0, 11.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.11529541015625, -0.11187362670898438, -0.10845184326171875, -0.10503005981445312, -0.1016082763671875, -0.09818649291992188, -0.09476470947265625, -0.09134292602539062, -0.087921142578125, -0.08449935913085938, -0.08107757568359375, -0.07765579223632812, -0.0742340087890625, -0.07081222534179688, -0.06739044189453125, -0.06396865844726562, -0.060546875, -0.057125091552734375, -0.05370330810546875, -0.050281524658203125, -0.0468597412109375, -0.043437957763671875, -0.04001617431640625, -0.036594390869140625, -0.033172607421875, -0.029750823974609375, -0.02632904052734375, -0.022907257080078125, -0.0194854736328125, -0.016063690185546875, -0.01264190673828125, -0.009220123291015625, -0.00579833984375, -0.002376556396484375, 0.00104522705078125, 0.004467010498046875, 0.0078887939453125, 0.011310577392578125, 0.01473236083984375, 0.018154144287109375, 0.021575927734375, 0.024997711181640625, 0.02841949462890625, 0.031841278076171875, 0.0352630615234375, 0.038684844970703125, 0.04210662841796875, 0.045528411865234375, 0.0489501953125, 0.052371978759765625, 0.05579376220703125, 0.059215545654296875, 0.0626373291015625, 0.06605911254882812, 0.06948089599609375, 0.07290267944335938, 0.076324462890625, 0.07974624633789062, 0.08316802978515625, 0.08658981323242188, 0.0900115966796875, 0.09343338012695312, 0.09685516357421875, 0.10027694702148438, 0.10369873046875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 8.0, 22.0, 7.0, 23.0, 31.0, 28.0, 47.0, 75.0, 128.0, 157.0, 273.0, 435.0, 836.0, 1607.0, 3969.0, 12406.0, 59985.0, 542849.0, 366305.0, 42660.0, 10086.0, 3271.0, 1471.0, 724.0, 401.0, 264.0, 153.0, 95.0, 72.0, 40.0, 36.0, 32.0, 19.0, 11.0, 9.0, 8.0, 4.0, 2.0, 8.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.42919921875, -0.41484832763671875, -0.4004974365234375, -0.38614654541015625, -0.371795654296875, -0.35744476318359375, -0.3430938720703125, -0.32874298095703125, -0.31439208984375, -0.30004119873046875, -0.2856903076171875, -0.27133941650390625, -0.256988525390625, -0.24263763427734375, -0.2282867431640625, -0.21393585205078125, -0.1995849609375, -0.18523406982421875, -0.1708831787109375, -0.15653228759765625, -0.142181396484375, -0.12783050537109375, -0.1134796142578125, -0.09912872314453125, -0.08477783203125, -0.07042694091796875, -0.0560760498046875, -0.04172515869140625, -0.027374267578125, -0.01302337646484375, 0.0013275146484375, 0.01567840576171875, 0.030029296875, 0.04438018798828125, 0.0587310791015625, 0.07308197021484375, 0.087432861328125, 0.10178375244140625, 0.1161346435546875, 0.13048553466796875, 0.14483642578125, 0.15918731689453125, 0.1735382080078125, 0.18788909912109375, 0.202239990234375, 0.21659088134765625, 0.2309417724609375, 0.24529266357421875, 0.2596435546875, 0.27399444580078125, 0.2883453369140625, 0.30269622802734375, 0.317047119140625, 0.33139801025390625, 0.3457489013671875, 0.36009979248046875, 0.37445068359375, 0.38880157470703125, 0.4031524658203125, 0.41750335693359375, 0.431854248046875, 0.44620513916015625, 0.4605560302734375, 0.47490692138671875, 0.4892578125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 2.0, 3.0, 4.0, 6.0, 4.0, 16.0, 10.0, 18.0, 8.0, 29.0, 25.0, 12.0, 24.0, 24.0, 41.0, 39.0, 49.0, 43.0, 44.0, 46.0, 47.0, 52.0, 40.0, 48.0, 41.0, 42.0, 37.0, 24.0, 39.0, 35.0, 22.0, 20.0, 22.0, 14.0, 16.0, 9.0, 7.0, 9.0, 9.0, 9.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.400146484375, -0.3865089416503906, -0.37287139892578125, -0.3592338562011719, -0.3455963134765625, -0.3319587707519531, -0.31832122802734375, -0.3046836853027344, -0.291046142578125, -0.2774085998535156, -0.26377105712890625, -0.2501335144042969, -0.2364959716796875, -0.22285842895507812, -0.20922088623046875, -0.19558334350585938, -0.18194580078125, -0.16830825805664062, -0.15467071533203125, -0.14103317260742188, -0.1273956298828125, -0.11375808715820312, -0.10012054443359375, -0.08648300170898438, -0.072845458984375, -0.059207916259765625, -0.04557037353515625, -0.031932830810546875, -0.0182952880859375, -0.004657745361328125, 0.00897979736328125, 0.022617340087890625, 0.0362548828125, 0.049892425537109375, 0.06352996826171875, 0.07716751098632812, 0.0908050537109375, 0.10444259643554688, 0.11808013916015625, 0.13171768188476562, 0.145355224609375, 0.15899276733398438, 0.17263031005859375, 0.18626785278320312, 0.1999053955078125, 0.21354293823242188, 0.22718048095703125, 0.24081802368164062, 0.25445556640625, 0.2680931091308594, 0.28173065185546875, 0.2953681945800781, 0.3090057373046875, 0.3226432800292969, 0.33628082275390625, 0.3499183654785156, 0.363555908203125, 0.3771934509277344, 0.39083099365234375, 0.4044685363769531, 0.4181060791015625, 0.4317436218261719, 0.44538116455078125, 0.4590187072753906, 0.47265625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 1.0, 4.0, 8.0, 9.0, 14.0, 23.0, 37.0, 46.0, 96.0, 144.0, 285.0, 621.0, 1492.0, 4161.0, 15615.0, 103011.0, 674209.0, 212739.0, 26470.0, 5938.0, 1941.0, 797.0, 375.0, 194.0, 117.0, 81.0, 44.0, 22.0, 13.0, 18.0, 11.0, 5.0, 5.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.195068359375, -0.18746566772460938, -0.17986297607421875, -0.17226028442382812, -0.1646575927734375, -0.15705490112304688, -0.14945220947265625, -0.14184951782226562, -0.134246826171875, -0.12664413452148438, -0.11904144287109375, -0.11143875122070312, -0.1038360595703125, -0.09623336791992188, -0.08863067626953125, -0.08102798461914062, -0.07342529296875, -0.06582260131835938, -0.05821990966796875, -0.050617218017578125, -0.0430145263671875, -0.035411834716796875, -0.02780914306640625, -0.020206451416015625, -0.012603759765625, -0.005001068115234375, 0.00260162353515625, 0.010204315185546875, 0.0178070068359375, 0.025409698486328125, 0.03301239013671875, 0.040615081787109375, 0.0482177734375, 0.055820465087890625, 0.06342315673828125, 0.07102584838867188, 0.0786285400390625, 0.08623123168945312, 0.09383392333984375, 0.10143661499023438, 0.109039306640625, 0.11664199829101562, 0.12424468994140625, 0.13184738159179688, 0.1394500732421875, 0.14705276489257812, 0.15465545654296875, 0.16225814819335938, 0.16986083984375, 0.17746353149414062, 0.18506622314453125, 0.19266891479492188, 0.2002716064453125, 0.20787429809570312, 0.21547698974609375, 0.22307968139648438, 0.230682373046875, 0.23828506469726562, 0.24588775634765625, 0.2534904479980469, 0.2610931396484375, 0.2686958312988281, 0.27629852294921875, 0.2839012145996094, 0.29150390625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 7.0, 4.0, 4.0, 5.0, 4.0, 10.0, 17.0, 16.0, 23.0, 21.0, 33.0, 25.0, 53.0, 51.0, 57.0, 61.0, 88.0, 74.0, 65.0, 70.0, 58.0, 49.0, 36.0, 27.0, 30.0, 24.0, 22.0, 14.0, 12.0, 11.0, 7.0, 5.0, 5.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.204843521118164e-05, -6.000790745019913e-05, -5.7967379689216614e-05, -5.59268519282341e-05, -5.388632416725159e-05, -5.1845796406269073e-05, -4.980526864528656e-05, -4.776474088430405e-05, -4.572421312332153e-05, -4.368368536233902e-05, -4.1643157601356506e-05, -3.960262984037399e-05, -3.756210207939148e-05, -3.5521574318408966e-05, -3.348104655742645e-05, -3.144051879644394e-05, -2.9399991035461426e-05, -2.7359463274478912e-05, -2.53189355134964e-05, -2.3278407752513885e-05, -2.1237879991531372e-05, -1.919735223054886e-05, -1.7156824469566345e-05, -1.5116296708583832e-05, -1.3075768947601318e-05, -1.1035241186618805e-05, -8.994713425636292e-06, -6.954185664653778e-06, -4.913657903671265e-06, -2.8731301426887512e-06, -8.326023817062378e-07, 1.2079253792762756e-06, 3.248453140258789e-06, 5.2889809012413025e-06, 7.329508662223816e-06, 9.37003642320633e-06, 1.1410564184188843e-05, 1.3451091945171356e-05, 1.549161970615387e-05, 1.7532147467136383e-05, 1.9572675228118896e-05, 2.161320298910141e-05, 2.3653730750083923e-05, 2.5694258511066437e-05, 2.773478627204895e-05, 2.9775314033031464e-05, 3.181584179401398e-05, 3.385636955499649e-05, 3.5896897315979004e-05, 3.793742507696152e-05, 3.997795283794403e-05, 4.2018480598926544e-05, 4.405900835990906e-05, 4.609953612089157e-05, 4.8140063881874084e-05, 5.01805916428566e-05, 5.222111940383911e-05, 5.4261647164821625e-05, 5.630217492580414e-05, 5.834270268678665e-05, 6.0383230447769165e-05, 6.242375820875168e-05, 6.446428596973419e-05, 6.65048137307167e-05, 6.854534149169922e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 5.0, 1.0, 1.0, 4.0, 5.0, 13.0, 17.0, 24.0, 31.0, 61.0, 158.0, 265.0, 525.0, 1258.0, 4348.0, 26269.0, 386985.0, 580102.0, 40034.0, 5707.0, 1528.0, 597.0, 291.0, 136.0, 86.0, 35.0, 34.0, 16.0, 10.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.383056640625, -0.3732566833496094, -0.36345672607421875, -0.3536567687988281, -0.3438568115234375, -0.3340568542480469, -0.32425689697265625, -0.3144569396972656, -0.304656982421875, -0.2948570251464844, -0.28505706787109375, -0.2752571105957031, -0.2654571533203125, -0.2556571960449219, -0.24585723876953125, -0.23605728149414062, -0.22625732421875, -0.21645736694335938, -0.20665740966796875, -0.19685745239257812, -0.1870574951171875, -0.17725753784179688, -0.16745758056640625, -0.15765762329101562, -0.147857666015625, -0.13805770874023438, -0.12825775146484375, -0.11845779418945312, -0.1086578369140625, -0.09885787963867188, -0.08905792236328125, -0.07925796508789062, -0.0694580078125, -0.059658050537109375, -0.04985809326171875, -0.040058135986328125, -0.0302581787109375, -0.020458221435546875, -0.01065826416015625, -0.000858306884765625, 0.008941650390625, 0.018741607666015625, 0.02854156494140625, 0.038341522216796875, 0.0481414794921875, 0.057941436767578125, 0.06774139404296875, 0.07754135131835938, 0.08734130859375, 0.09714126586914062, 0.10694122314453125, 0.11674118041992188, 0.1265411376953125, 0.13634109497070312, 0.14614105224609375, 0.15594100952148438, 0.165740966796875, 0.17554092407226562, 0.18534088134765625, 0.19514083862304688, 0.2049407958984375, 0.21474075317382812, 0.22454071044921875, 0.23434066772460938, 0.244140625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 6.0, 14.0, 13.0, 17.0, 31.0, 36.0, 41.0, 70.0, 91.0, 102.0, 116.0, 85.0, 98.0, 76.0, 58.0, 42.0, 32.0, 22.0, 13.0, 15.0, 9.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2034912109375, -0.1968860626220703, -0.19028091430664062, -0.18367576599121094, -0.17707061767578125, -0.17046546936035156, -0.16386032104492188, -0.1572551727294922, -0.1506500244140625, -0.1440448760986328, -0.13743972778320312, -0.13083457946777344, -0.12422943115234375, -0.11762428283691406, -0.11101913452148438, -0.10441398620605469, -0.097808837890625, -0.09120368957519531, -0.08459854125976562, -0.07799339294433594, -0.07138824462890625, -0.06478309631347656, -0.058177947998046875, -0.05157279968261719, -0.0449676513671875, -0.03836250305175781, -0.031757354736328125, -0.025152206420898438, -0.01854705810546875, -0.011941909790039062, -0.005336761474609375, 0.0012683868408203125, 0.00787353515625, 0.014478683471679688, 0.021083831787109375, 0.027688980102539062, 0.03429412841796875, 0.04089927673339844, 0.047504425048828125, 0.05410957336425781, 0.0607147216796875, 0.06731986999511719, 0.07392501831054688, 0.08053016662597656, 0.08713531494140625, 0.09374046325683594, 0.10034561157226562, 0.10695075988769531, 0.113555908203125, 0.12016105651855469, 0.12676620483398438, 0.13337135314941406, 0.13997650146484375, 0.14658164978027344, 0.15318679809570312, 0.1597919464111328, 0.1663970947265625, 0.1730022430419922, 0.17960739135742188, 0.18621253967285156, 0.19281768798828125, 0.19942283630371094, 0.20602798461914062, 0.2126331329345703, 0.21923828125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 5.0, 10.0, 18.0, 35.0, 58.0, 106.0, 196.0, 214.0, 158.0, 106.0, 57.0, 24.0, 10.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8017022609710693, -2.6483891010284424, -2.4950761795043945, -2.3417630195617676, -2.1884500980377197, -2.0351369380950928, -1.8818238973617554, -1.728510856628418, -1.5751978158950806, -1.4218847751617432, -1.2685717344284058, -1.1152586936950684, -0.9619455933570862, -0.8086325526237488, -0.6553194522857666, -0.5020064115524292, -0.3486933708190918, -0.1953803151845932, -0.042067259550094604, 0.11124581098556519, 0.2645588517189026, 0.41787189245224, 0.5711849927902222, 0.7244980335235596, 0.877811074256897, 1.0311241149902344, 1.1844371557235718, 1.3377501964569092, 1.4910633563995361, 1.644376277923584, 1.797689437866211, 1.9510024785995483, 2.1043152809143066, 2.2576284408569336, 2.4109413623809814, 2.5642545223236084, 2.7175674438476562, 2.870880603790283, 3.02419376373291, 3.177506685256958, 3.330819606781006, 3.484132766723633, 3.6374456882476807, 3.7907588481903076, 3.9440717697143555, 4.097384929656982, 4.250698089599609, 4.404010772705078, 4.557324409484863, 4.71063756942749, 4.863950729370117, 5.017263412475586, 5.170576572418213, 5.32388973236084, 5.477202892303467, 5.630516052246094, 5.7838287353515625, 5.9371418952941895, 6.090455055236816, 6.243767738342285, 6.397080898284912, 6.550394058227539, 6.703707218170166, 6.857020378112793, 7.010333061218262]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 7.0, 6.0, 2.0, 10.0, 14.0, 5.0, 7.0, 7.0, 21.0, 22.0, 20.0, 19.0, 30.0, 23.0, 38.0, 41.0, 40.0, 44.0, 41.0, 50.0, 51.0, 53.0, 57.0, 41.0, 45.0, 50.0, 38.0, 34.0, 30.0, 30.0, 27.0, 15.0, 17.0, 14.0, 7.0, 16.0, 9.0, 2.0, 4.0, 6.0, 2.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.297757625579834, -2.229525566101074, -2.1612935066223145, -2.0930614471435547, -2.024829387664795, -1.9565974473953247, -1.8883655071258545, -1.8201334476470947, -1.751901388168335, -1.6836693286895752, -1.6154372692108154, -1.5472053289413452, -1.4789732694625854, -1.4107412099838257, -1.3425092697143555, -1.2742772102355957, -1.206045150756836, -1.1378130912780762, -1.0695810317993164, -1.0013490915298462, -0.9331170320510864, -0.8648849725723267, -0.7966529726982117, -0.7284209728240967, -0.6601889133453369, -0.5919568538665771, -0.5237248539924622, -0.4554928243160248, -0.3872607946395874, -0.31902876496315, -0.25079673528671265, -0.18256470561027527, -0.11433291435241699, -0.046100884675979614, 0.022131145000457764, 0.09036317467689514, 0.15859520435333252, 0.2268272340297699, 0.2950592637062073, 0.36329129338264465, 0.43152332305908203, 0.4997553527355194, 0.5679873824119568, 0.6362193822860718, 0.7044514417648315, 0.7726835012435913, 0.8409155011177063, 0.9091475009918213, 0.977379560470581, 1.0456116199493408, 1.1138436794281006, 1.1820756196975708, 1.2503076791763306, 1.3185397386550903, 1.3867716789245605, 1.4550037384033203, 1.52323579788208, 1.5914678573608398, 1.6596999168395996, 1.7279318571090698, 1.7961639165878296, 1.8643959760665894, 1.9326279163360596, 2.0008599758148193, 2.069092035293579]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 0.0, 0.0, 3.0, 4.0, 2.0, 8.0, 5.0, 8.0, 10.0, 21.0, 28.0, 27.0, 41.0, 57.0, 78.0, 85.0, 119.0, 168.0, 260.0, 366.0, 618.0, 1173.0, 2579.0, 7463.0, 40046.0, 4097511.0, 31726.0, 6592.0, 2347.0, 1102.0, 555.0, 376.0, 253.0, 159.0, 122.0, 92.0, 67.0, 58.0, 37.0, 31.0, 25.0, 21.0, 10.0, 8.0, 6.0, 5.0, 2.0, 6.0, 3.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.488525390625, -0.4713554382324219, -0.45418548583984375, -0.4370155334472656, -0.4198455810546875, -0.4026756286621094, -0.38550567626953125, -0.3683357238769531, -0.351165771484375, -0.3339958190917969, -0.31682586669921875, -0.2996559143066406, -0.2824859619140625, -0.2653160095214844, -0.24814605712890625, -0.23097610473632812, -0.21380615234375, -0.19663619995117188, -0.17946624755859375, -0.16229629516601562, -0.1451263427734375, -0.12795639038085938, -0.11078643798828125, -0.09361648559570312, -0.076446533203125, -0.059276580810546875, -0.04210662841796875, -0.024936676025390625, -0.0077667236328125, 0.009403228759765625, 0.02657318115234375, 0.043743133544921875, 0.0609130859375, 0.07808303833007812, 0.09525299072265625, 0.11242294311523438, 0.1295928955078125, 0.14676284790039062, 0.16393280029296875, 0.18110275268554688, 0.198272705078125, 0.21544265747070312, 0.23261260986328125, 0.24978256225585938, 0.2669525146484375, 0.2841224670410156, 0.30129241943359375, 0.3184623718261719, 0.33563232421875, 0.3528022766113281, 0.36997222900390625, 0.3871421813964844, 0.4043121337890625, 0.4214820861816406, 0.43865203857421875, 0.4558219909667969, 0.472991943359375, 0.4901618957519531, 0.5073318481445312, 0.5245018005371094, 0.5416717529296875, 0.5588417053222656, 0.5760116577148438, 0.5931816101074219, 0.6103515625]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 10.0, 12.0, 12.0, 18.0, 23.0, 25.0, 23.0, 46.0, 31.0, 56.0, 65.0, 60.0, 78.0, 61.0, 65.0, 74.0, 64.0, 56.0, 53.0, 43.0, 29.0, 27.0, 21.0, 14.0, 16.0, 10.0, 2.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11627197265625, -0.11190509796142578, -0.10753822326660156, -0.10317134857177734, -0.09880447387695312, -0.0944375991821289, -0.09007072448730469, -0.08570384979248047, -0.08133697509765625, -0.07697010040283203, -0.07260322570800781, -0.0682363510131836, -0.06386947631835938, -0.059502601623535156, -0.05513572692871094, -0.05076885223388672, -0.0464019775390625, -0.04203510284423828, -0.03766822814941406, -0.033301353454589844, -0.028934478759765625, -0.024567604064941406, -0.020200729370117188, -0.01583385467529297, -0.01146697998046875, -0.007100105285644531, -0.0027332305908203125, 0.0016336441040039062, 0.006000518798828125, 0.010367393493652344, 0.014734268188476562, 0.01910114288330078, 0.023468017578125, 0.02783489227294922, 0.03220176696777344, 0.036568641662597656, 0.040935516357421875, 0.045302391052246094, 0.04966926574707031, 0.05403614044189453, 0.05840301513671875, 0.06276988983154297, 0.06713676452636719, 0.0715036392211914, 0.07587051391601562, 0.08023738861083984, 0.08460426330566406, 0.08897113800048828, 0.0933380126953125, 0.09770488739013672, 0.10207176208496094, 0.10643863677978516, 0.11080551147460938, 0.1151723861694336, 0.11953926086425781, 0.12390613555908203, 0.12827301025390625, 0.13263988494873047, 0.1370067596435547, 0.1413736343383789, 0.14574050903320312, 0.15010738372802734, 0.15447425842285156, 0.15884113311767578, 0.1632080078125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 0.0, 2.0, 3.0, 6.0, 4.0, 10.0, 6.0, 17.0, 22.0, 29.0, 45.0, 65.0, 84.0, 115.0, 125.0, 185.0, 277.0, 417.0, 707.0, 1125.0, 2174.0, 5002.0, 14671.0, 121151.0, 4005783.0, 27934.0, 7385.0, 2949.0, 1460.0, 833.0, 486.0, 351.0, 243.0, 151.0, 131.0, 85.0, 64.0, 61.0, 38.0, 23.0, 15.0, 17.0, 7.0, 8.0, 9.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.6669921875, -0.6480484008789062, -0.6291046142578125, -0.6101608276367188, -0.591217041015625, -0.5722732543945312, -0.5533294677734375, -0.5343856811523438, -0.51544189453125, -0.49649810791015625, -0.4775543212890625, -0.45861053466796875, -0.439666748046875, -0.42072296142578125, -0.4017791748046875, -0.38283538818359375, -0.3638916015625, -0.34494781494140625, -0.3260040283203125, -0.30706024169921875, -0.288116455078125, -0.26917266845703125, -0.2502288818359375, -0.23128509521484375, -0.21234130859375, -0.19339752197265625, -0.1744537353515625, -0.15550994873046875, -0.136566162109375, -0.11762237548828125, -0.0986785888671875, -0.07973480224609375, -0.060791015625, -0.04184722900390625, -0.0229034423828125, -0.00395965576171875, 0.014984130859375, 0.03392791748046875, 0.0528717041015625, 0.07181549072265625, 0.09075927734375, 0.10970306396484375, 0.1286468505859375, 0.14759063720703125, 0.166534423828125, 0.18547821044921875, 0.2044219970703125, 0.22336578369140625, 0.2423095703125, 0.26125335693359375, 0.2801971435546875, 0.29914093017578125, 0.318084716796875, 0.33702850341796875, 0.3559722900390625, 0.37491607666015625, 0.39385986328125, 0.41280364990234375, 0.4317474365234375, 0.45069122314453125, 0.469635009765625, 0.48857879638671875, 0.5075225830078125, 0.5264663696289062, 0.54541015625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 2.0, 5.0, 1.0, 4.0, 9.0, 4.0, 12.0, 18.0, 46.0, 121.0, 3552.0, 178.0, 53.0, 29.0, 9.0, 12.0, 6.0, 6.0, 4.0, 5.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1622314453125, -0.15767860412597656, -0.15312576293945312, -0.1485729217529297, -0.14402008056640625, -0.1394672393798828, -0.13491439819335938, -0.13036155700683594, -0.1258087158203125, -0.12125587463378906, -0.11670303344726562, -0.11215019226074219, -0.10759735107421875, -0.10304450988769531, -0.09849166870117188, -0.09393882751464844, -0.089385986328125, -0.08483314514160156, -0.08028030395507812, -0.07572746276855469, -0.07117462158203125, -0.06662178039550781, -0.062068939208984375, -0.05751609802246094, -0.0529632568359375, -0.04841041564941406, -0.043857574462890625, -0.03930473327636719, -0.03475189208984375, -0.030199050903320312, -0.025646209716796875, -0.021093368530273438, -0.01654052734375, -0.011987686157226562, -0.007434844970703125, -0.0028820037841796875, 0.00167083740234375, 0.0062236785888671875, 0.010776519775390625, 0.015329360961914062, 0.0198822021484375, 0.024435043334960938, 0.028987884521484375, 0.03354072570800781, 0.03809356689453125, 0.04264640808105469, 0.047199249267578125, 0.05175209045410156, 0.056304931640625, 0.06085777282714844, 0.06541061401367188, 0.06996345520019531, 0.07451629638671875, 0.07906913757324219, 0.08362197875976562, 0.08817481994628906, 0.0927276611328125, 0.09728050231933594, 0.10183334350585938, 0.10638618469238281, 0.11093902587890625, 0.11549186706542969, 0.12004470825195312, 0.12459754943847656, 0.129150390625]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 4.0, 4.0, 6.0, 8.0, 16.0, 16.0, 23.0, 35.0, 45.0, 83.0, 98.0, 146.0, 156.0, 111.0, 101.0, 60.0, 40.0, 12.0, 13.0, 9.0, 5.0, 3.0, 1.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7845587730407715, -0.7639135122299194, -0.7432682514190674, -0.7226229310035706, -0.7019776701927185, -0.6813324093818665, -0.6606871485710144, -0.6400418877601624, -0.6193965673446655, -0.5987513065338135, -0.5781060457229614, -0.5574607253074646, -0.5368154644966125, -0.5161702036857605, -0.49552494287490845, -0.4748796820640564, -0.45423442125320435, -0.4335891604423523, -0.41294386982917786, -0.3922986090183258, -0.37165331840515137, -0.3510080575942993, -0.33036279678344727, -0.3097175359725952, -0.2890722453594208, -0.2684269845485687, -0.2477816939353943, -0.22713643312454224, -0.206491157412529, -0.18584588170051575, -0.1652006208896637, -0.14455534517765045, -0.12391000986099243, -0.10326473414897919, -0.08261946588754654, -0.06197419390082359, -0.04132892191410065, -0.020683646202087402, -3.837794065475464e-05, 0.020606890320777893, 0.04125216603279114, 0.061897438019514084, 0.08254271000623703, 0.10318797826766968, 0.12383325397968292, 0.14447852969169617, 0.16512379050254822, 0.18576906621456146, 0.2064143419265747, 0.22705961763858795, 0.2477048933506012, 0.26835015416145325, 0.2889954447746277, 0.30964070558547974, 0.3302859663963318, 0.35093122720718384, 0.3715765178203583, 0.3922217786312103, 0.41286706924438477, 0.4335123300552368, 0.45415759086608887, 0.4748028814792633, 0.49544814229011536, 0.5160934329032898, 0.5367386937141418]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 4.0, 5.0, 6.0, 7.0, 8.0, 6.0, 9.0, 12.0, 7.0, 19.0, 20.0, 19.0, 28.0, 22.0, 25.0, 32.0, 31.0, 26.0, 19.0, 40.0, 34.0, 38.0, 34.0, 44.0, 47.0, 38.0, 40.0, 37.0, 38.0, 42.0, 26.0, 27.0, 17.0, 22.0, 26.0, 19.0, 13.0, 18.0, 15.0, 13.0, 16.0, 12.0, 12.0, 4.0, 6.0, 9.0, 5.0, 3.0, 3.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.21090805530548096, -0.20432889461517334, -0.19774973392486572, -0.1911705732345581, -0.18459142744541168, -0.17801226675510406, -0.17143310606479645, -0.16485394537448883, -0.1582747995853424, -0.1516956388950348, -0.14511647820472717, -0.13853731751441956, -0.13195817172527313, -0.12537901103496552, -0.1187998503446579, -0.11222068965435028, -0.10564152896404266, -0.09906236827373505, -0.09248321503400803, -0.08590405434370041, -0.07932490110397339, -0.07274574041366577, -0.06616657972335815, -0.059587422758340836, -0.05300826579332352, -0.0464291088283062, -0.03984995186328888, -0.03327079117298126, -0.026691634207963943, -0.020112477242946625, -0.013533316552639008, -0.006954159587621689, -0.0003750026226043701, 0.006204155273735523, 0.012783313170075417, 0.019362471997737885, 0.025941628962755203, 0.03252078592777252, 0.03909994661808014, 0.04567910358309746, 0.05225826054811478, 0.058837417513132095, 0.06541657447814941, 0.07199573516845703, 0.07857489585876465, 0.08515404909849167, 0.09173320978879929, 0.0983123630285263, 0.10489152371883392, 0.11147068440914154, 0.11804983764886856, 0.12462899833917618, 0.1312081515789032, 0.13778731226921082, 0.14436647295951843, 0.15094563364982605, 0.15752479434013367, 0.16410395503044128, 0.1706831157207489, 0.17726227641105652, 0.18384142220020294, 0.19042058289051056, 0.19699974358081818, 0.2035789042711258, 0.21015805006027222]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 9.0, 6.0, 15.0, 16.0, 25.0, 27.0, 37.0, 74.0, 121.0, 212.0, 380.0, 681.0, 1329.0, 2933.0, 6709.0, 17165.0, 50491.0, 170057.0, 466526.0, 228919.0, 65902.0, 21917.0, 8141.0, 3488.0, 1583.0, 742.0, 447.0, 206.0, 148.0, 91.0, 51.0, 36.0, 23.0, 21.0, 10.0, 8.0, 7.0, 1.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.307373046875, -0.29874229431152344, -0.2901115417480469, -0.2814807891845703, -0.27285003662109375, -0.2642192840576172, -0.2555885314941406, -0.24695777893066406, -0.2383270263671875, -0.22969627380371094, -0.22106552124023438, -0.2124347686767578, -0.20380401611328125, -0.1951732635498047, -0.18654251098632812, -0.17791175842285156, -0.169281005859375, -0.16065025329589844, -0.15201950073242188, -0.1433887481689453, -0.13475799560546875, -0.1261272430419922, -0.11749649047851562, -0.10886573791503906, -0.1002349853515625, -0.09160423278808594, -0.08297348022460938, -0.07434272766113281, -0.06571197509765625, -0.05708122253417969, -0.048450469970703125, -0.03981971740722656, -0.03118896484375, -0.022558212280273438, -0.013927459716796875, -0.0052967071533203125, 0.00333404541015625, 0.011964797973632812, 0.020595550537109375, 0.029226303100585938, 0.0378570556640625, 0.04648780822753906, 0.055118560791015625, 0.06374931335449219, 0.07238006591796875, 0.08101081848144531, 0.08964157104492188, 0.09827232360839844, 0.106903076171875, 0.11553382873535156, 0.12416458129882812, 0.1327953338623047, 0.14142608642578125, 0.1500568389892578, 0.15868759155273438, 0.16731834411621094, 0.1759490966796875, 0.18457984924316406, 0.19321060180664062, 0.2018413543701172, 0.21047210693359375, 0.2191028594970703, 0.22773361206054688, 0.23636436462402344, 0.2449951171875]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 8.0, 3.0, 9.0, 14.0, 7.0, 19.0, 17.0, 22.0, 26.0, 25.0, 44.0, 47.0, 43.0, 62.0, 60.0, 51.0, 61.0, 56.0, 50.0, 60.0, 50.0, 43.0, 45.0, 35.0, 38.0, 22.0, 24.0, 15.0, 9.0, 13.0, 5.0, 7.0, 3.0, 3.0, 3.0, 5.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.134033203125, -0.1300678253173828, -0.12610244750976562, -0.12213706970214844, -0.11817169189453125, -0.11420631408691406, -0.11024093627929688, -0.10627555847167969, -0.1023101806640625, -0.09834480285644531, -0.09437942504882812, -0.09041404724121094, -0.08644866943359375, -0.08248329162597656, -0.07851791381835938, -0.07455253601074219, -0.070587158203125, -0.06662178039550781, -0.06265640258789062, -0.05869102478027344, -0.05472564697265625, -0.05076026916503906, -0.046794891357421875, -0.04282951354980469, -0.0388641357421875, -0.03489875793457031, -0.030933380126953125, -0.026968002319335938, -0.02300262451171875, -0.019037246704101562, -0.015071868896484375, -0.011106491088867188, -0.00714111328125, -0.0031757354736328125, 0.000789642333984375, 0.0047550201416015625, 0.00872039794921875, 0.012685775756835938, 0.016651153564453125, 0.020616531372070312, 0.0245819091796875, 0.028547286987304688, 0.032512664794921875, 0.03647804260253906, 0.04044342041015625, 0.04440879821777344, 0.048374176025390625, 0.05233955383300781, 0.056304931640625, 0.06027030944824219, 0.06423568725585938, 0.06820106506347656, 0.07216644287109375, 0.07613182067871094, 0.08009719848632812, 0.08406257629394531, 0.0880279541015625, 0.09199333190917969, 0.09595870971679688, 0.09992408752441406, 0.10388946533203125, 0.10785484313964844, 0.11182022094726562, 0.11578559875488281, 0.1197509765625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 5.0, 2.0, 5.0, 4.0, 4.0, 5.0, 16.0, 18.0, 19.0, 22.0, 22.0, 40.0, 43.0, 73.0, 126.0, 143.0, 198.0, 280.0, 425.0, 711.0, 1162.0, 2653.0, 6793.0, 24080.0, 133889.0, 683713.0, 153620.0, 26508.0, 7578.0, 2766.0, 1346.0, 691.0, 479.0, 329.0, 228.0, 161.0, 111.0, 95.0, 46.0, 36.0, 36.0, 21.0, 19.0, 11.0, 11.0, 6.0, 6.0, 5.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.316650390625, -0.3055534362792969, -0.29445648193359375, -0.2833595275878906, -0.2722625732421875, -0.2611656188964844, -0.25006866455078125, -0.23897171020507812, -0.227874755859375, -0.21677780151367188, -0.20568084716796875, -0.19458389282226562, -0.1834869384765625, -0.17238998413085938, -0.16129302978515625, -0.15019607543945312, -0.13909912109375, -0.12800216674804688, -0.11690521240234375, -0.10580825805664062, -0.0947113037109375, -0.08361434936523438, -0.07251739501953125, -0.061420440673828125, -0.050323486328125, -0.039226531982421875, -0.02812957763671875, -0.017032623291015625, -0.0059356689453125, 0.005161285400390625, 0.01625823974609375, 0.027355194091796875, 0.0384521484375, 0.049549102783203125, 0.06064605712890625, 0.07174301147460938, 0.0828399658203125, 0.09393692016601562, 0.10503387451171875, 0.11613082885742188, 0.127227783203125, 0.13832473754882812, 0.14942169189453125, 0.16051864624023438, 0.1716156005859375, 0.18271255493164062, 0.19380950927734375, 0.20490646362304688, 0.21600341796875, 0.22710037231445312, 0.23819732666015625, 0.24929428100585938, 0.2603912353515625, 0.2714881896972656, 0.28258514404296875, 0.2936820983886719, 0.304779052734375, 0.3158760070800781, 0.32697296142578125, 0.3380699157714844, 0.3491668701171875, 0.3602638244628906, 0.37136077880859375, 0.3824577331542969, 0.3935546875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 3.0, 6.0, 7.0, 11.0, 15.0, 14.0, 13.0, 23.0, 25.0, 26.0, 31.0, 31.0, 44.0, 44.0, 40.0, 46.0, 39.0, 51.0, 38.0, 42.0, 56.0, 34.0, 39.0, 40.0, 32.0, 32.0, 35.0, 33.0, 19.0, 22.0, 28.0, 12.0, 11.0, 10.0, 16.0, 8.0, 6.0, 7.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41845703125, -0.4046669006347656, -0.39087677001953125, -0.3770866394042969, -0.3632965087890625, -0.3495063781738281, -0.33571624755859375, -0.3219261169433594, -0.308135986328125, -0.2943458557128906, -0.28055572509765625, -0.2667655944824219, -0.2529754638671875, -0.23918533325195312, -0.22539520263671875, -0.21160507202148438, -0.19781494140625, -0.18402481079101562, -0.17023468017578125, -0.15644454956054688, -0.1426544189453125, -0.12886428833007812, -0.11507415771484375, -0.10128402709960938, -0.087493896484375, -0.07370376586914062, -0.05991363525390625, -0.046123504638671875, -0.0323333740234375, -0.018543243408203125, -0.00475311279296875, 0.009037017822265625, 0.0228271484375, 0.036617279052734375, 0.05040740966796875, 0.06419754028320312, 0.0779876708984375, 0.09177780151367188, 0.10556793212890625, 0.11935806274414062, 0.133148193359375, 0.14693832397460938, 0.16072845458984375, 0.17451858520507812, 0.1883087158203125, 0.20209884643554688, 0.21588897705078125, 0.22967910766601562, 0.24346923828125, 0.2572593688964844, 0.27104949951171875, 0.2848396301269531, 0.2986297607421875, 0.3124198913574219, 0.32621002197265625, 0.3400001525878906, 0.353790283203125, 0.3675804138183594, 0.38137054443359375, 0.3951606750488281, 0.4089508056640625, 0.4227409362792969, 0.43653106689453125, 0.4503211975097656, 0.464111328125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 5.0, 1.0, 1.0, 3.0, 4.0, 8.0, 12.0, 13.0, 27.0, 28.0, 57.0, 91.0, 212.0, 512.0, 1626.0, 7892.0, 91143.0, 870528.0, 67482.0, 6500.0, 1487.0, 456.0, 206.0, 95.0, 57.0, 39.0, 17.0, 19.0, 9.0, 8.0, 5.0, 4.0, 5.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.412841796875, -0.4015159606933594, -0.39019012451171875, -0.3788642883300781, -0.3675384521484375, -0.3562126159667969, -0.34488677978515625, -0.3335609436035156, -0.322235107421875, -0.3109092712402344, -0.29958343505859375, -0.2882575988769531, -0.2769317626953125, -0.2656059265136719, -0.25428009033203125, -0.24295425415039062, -0.23162841796875, -0.22030258178710938, -0.20897674560546875, -0.19765090942382812, -0.1863250732421875, -0.17499923706054688, -0.16367340087890625, -0.15234756469726562, -0.141021728515625, -0.12969589233398438, -0.11837005615234375, -0.10704421997070312, -0.0957183837890625, -0.08439254760742188, -0.07306671142578125, -0.061740875244140625, -0.0504150390625, -0.039089202880859375, -0.02776336669921875, -0.016437530517578125, -0.0051116943359375, 0.006214141845703125, 0.01753997802734375, 0.028865814208984375, 0.040191650390625, 0.051517486572265625, 0.06284332275390625, 0.07416915893554688, 0.0854949951171875, 0.09682083129882812, 0.10814666748046875, 0.11947250366210938, 0.13079833984375, 0.14212417602539062, 0.15345001220703125, 0.16477584838867188, 0.1761016845703125, 0.18742752075195312, 0.19875335693359375, 0.21007919311523438, 0.221405029296875, 0.23273086547851562, 0.24405670166015625, 0.2553825378417969, 0.2667083740234375, 0.2780342102050781, 0.28936004638671875, 0.3006858825683594, 0.31201171875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 5.0, 5.0, 2.0, 3.0, 5.0, 6.0, 7.0, 15.0, 11.0, 20.0, 31.0, 41.0, 48.0, 50.0, 61.0, 68.0, 98.0, 71.0, 98.0, 84.0, 66.0, 47.0, 38.0, 27.0, 15.0, 17.0, 17.0, 11.0, 11.0, 8.0, 6.0, 4.0, 6.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.826089859008789e-05, -7.590930908918381e-05, -7.355771958827972e-05, -7.120613008737564e-05, -6.885454058647156e-05, -6.650295108556747e-05, -6.415136158466339e-05, -6.179977208375931e-05, -5.9448182582855225e-05, -5.709659308195114e-05, -5.474500358104706e-05, -5.2393414080142975e-05, -5.004182457923889e-05, -4.769023507833481e-05, -4.5338645577430725e-05, -4.298705607652664e-05, -4.063546657562256e-05, -3.8283877074718475e-05, -3.593228757381439e-05, -3.358069807291031e-05, -3.1229108572006226e-05, -2.8877519071102142e-05, -2.652592957019806e-05, -2.4174340069293976e-05, -2.1822750568389893e-05, -1.947116106748581e-05, -1.7119571566581726e-05, -1.4767982065677643e-05, -1.241639256477356e-05, -1.0064803063869476e-05, -7.713213562965393e-06, -5.36162406206131e-06, -3.0100345611572266e-06, -6.584450602531433e-07, 1.69314444065094e-06, 4.044733941555023e-06, 6.3963234424591064e-06, 8.74791294336319e-06, 1.1099502444267273e-05, 1.3451091945171356e-05, 1.580268144607544e-05, 1.8154270946979523e-05, 2.0505860447883606e-05, 2.285744994878769e-05, 2.5209039449691772e-05, 2.7560628950595856e-05, 2.991221845149994e-05, 3.226380795240402e-05, 3.4615397453308105e-05, 3.696698695421219e-05, 3.931857645511627e-05, 4.1670165956020355e-05, 4.402175545692444e-05, 4.637334495782852e-05, 4.8724934458732605e-05, 5.107652395963669e-05, 5.342811346054077e-05, 5.5779702961444855e-05, 5.813129246234894e-05, 6.048288196325302e-05, 6.28344714641571e-05, 6.518606096506119e-05, 6.753765046596527e-05, 6.988923996686935e-05, 7.224082946777344e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 3.0, 7.0, 8.0, 4.0, 22.0, 23.0, 34.0, 81.0, 131.0, 229.0, 535.0, 1491.0, 6216.0, 58665.0, 843380.0, 124865.0, 9602.0, 1993.0, 641.0, 289.0, 144.0, 75.0, 36.0, 32.0, 14.0, 10.0, 6.0, 8.0, 4.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.34521484375, -0.33315277099609375, -0.3210906982421875, -0.30902862548828125, -0.296966552734375, -0.28490447998046875, -0.2728424072265625, -0.26078033447265625, -0.24871826171875, -0.23665618896484375, -0.2245941162109375, -0.21253204345703125, -0.200469970703125, -0.18840789794921875, -0.1763458251953125, -0.16428375244140625, -0.1522216796875, -0.14015960693359375, -0.1280975341796875, -0.11603546142578125, -0.103973388671875, -0.09191131591796875, -0.0798492431640625, -0.06778717041015625, -0.05572509765625, -0.04366302490234375, -0.0316009521484375, -0.01953887939453125, -0.007476806640625, 0.00458526611328125, 0.0166473388671875, 0.02870941162109375, 0.040771484375, 0.05283355712890625, 0.0648956298828125, 0.07695770263671875, 0.089019775390625, 0.10108184814453125, 0.1131439208984375, 0.12520599365234375, 0.13726806640625, 0.14933013916015625, 0.1613922119140625, 0.17345428466796875, 0.185516357421875, 0.19757843017578125, 0.2096405029296875, 0.22170257568359375, 0.2337646484375, 0.24582672119140625, 0.2578887939453125, 0.26995086669921875, 0.282012939453125, 0.29407501220703125, 0.3061370849609375, 0.31819915771484375, 0.33026123046875, 0.34232330322265625, 0.3543853759765625, 0.36644744873046875, 0.378509521484375, 0.39057159423828125, 0.4026336669921875, 0.41469573974609375, 0.4267578125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 4.0, 14.0, 17.0, 26.0, 43.0, 66.0, 98.0, 127.0, 165.0, 154.0, 102.0, 52.0, 35.0, 37.0, 24.0, 14.0, 11.0, 7.0, 9.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.304443359375, -0.29449462890625, -0.2845458984375, -0.27459716796875, -0.2646484375, -0.25469970703125, -0.2447509765625, -0.23480224609375, -0.224853515625, -0.21490478515625, -0.2049560546875, -0.19500732421875, -0.18505859375, -0.17510986328125, -0.1651611328125, -0.15521240234375, -0.145263671875, -0.13531494140625, -0.1253662109375, -0.11541748046875, -0.10546875, -0.09552001953125, -0.0855712890625, -0.07562255859375, -0.065673828125, -0.05572509765625, -0.0457763671875, -0.03582763671875, -0.02587890625, -0.01593017578125, -0.0059814453125, 0.00396728515625, 0.013916015625, 0.02386474609375, 0.0338134765625, 0.04376220703125, 0.0537109375, 0.06365966796875, 0.0736083984375, 0.08355712890625, 0.093505859375, 0.10345458984375, 0.1134033203125, 0.12335205078125, 0.13330078125, 0.14324951171875, 0.1531982421875, 0.16314697265625, 0.173095703125, 0.18304443359375, 0.1929931640625, 0.20294189453125, 0.212890625, 0.22283935546875, 0.2327880859375, 0.24273681640625, 0.252685546875, 0.26263427734375, 0.2725830078125, 0.28253173828125, 0.29248046875, 0.30242919921875, 0.3123779296875, 0.32232666015625, 0.332275390625]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 1.0, 2.0, 5.0, 8.0, 8.0, 20.0, 52.0, 89.0, 185.0, 208.0, 175.0, 115.0, 53.0, 41.0, 18.0, 11.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0], "bins": [-7.870377540588379, -7.715275287628174, -7.560173034667969, -7.405071258544922, -7.249969005584717, -7.094866752624512, -6.939764499664307, -6.784662246704102, -6.629560470581055, -6.47445821762085, -6.3193559646606445, -6.164254188537598, -6.009151935577393, -5.8540496826171875, -5.698947429656982, -5.543845176696777, -5.388742923736572, -5.233640670776367, -5.078538417816162, -4.923436641693115, -4.76833438873291, -4.613232135772705, -4.4581298828125, -4.303027629852295, -4.14792537689209, -3.9928231239318848, -3.837721109390259, -3.6826188564300537, -3.5275168418884277, -3.3724145889282227, -3.2173123359680176, -3.0622100830078125, -2.907108783721924, -2.7520065307617188, -2.5969045162200928, -2.4418022632598877, -2.2867002487182617, -2.1315979957580566, -1.9764957427978516, -1.821393609046936, -1.6662914752960205, -1.511189341545105, -1.3560872077941895, -1.2009849548339844, -1.0458828210830688, -0.8907806873321533, -0.735678493976593, -0.5805763006210327, -0.4254741668701172, -0.2703720033168793, -0.11526983976364136, 0.03983232378959656, 0.19493448734283447, 0.35003662109375, 0.5051388144493103, 0.6602410078048706, 0.8153431415557861, 0.9704452753067017, 1.1255474090576172, 1.2806496620178223, 1.4357517957687378, 1.5908539295196533, 1.7459561824798584, 1.901058316230774, 2.0561604499816895]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 6.0, 3.0, 1.0, 3.0, 8.0, 6.0, 7.0, 9.0, 16.0, 19.0, 24.0, 20.0, 31.0, 42.0, 37.0, 37.0, 42.0, 45.0, 51.0, 49.0, 59.0, 58.0, 55.0, 62.0, 46.0, 38.0, 33.0, 27.0, 33.0, 33.0, 20.0, 17.0, 19.0, 13.0, 4.0, 9.0, 13.0, 6.0, 4.0, 3.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.454786777496338, -2.3776750564575195, -2.3005635738372803, -2.223451852798462, -2.1463403701782227, -2.0692286491394043, -1.992116928100586, -1.9150053262710571, -1.8378937244415283, -1.7607821226119995, -1.6836705207824707, -1.6065587997436523, -1.5294471979141235, -1.4523355960845947, -1.3752238750457764, -1.2981122732162476, -1.2210006713867188, -1.14388906955719, -1.0667774677276611, -0.9896657466888428, -0.912554144859314, -0.8354425430297852, -0.7583308815956116, -0.681219220161438, -0.6041076183319092, -0.5269960165023804, -0.4498843550682068, -0.3727727234363556, -0.2956610918045044, -0.2185494601726532, -0.141437828540802, -0.06432616710662842, 0.01278543472290039, 0.08989706635475159, 0.16700869798660278, 0.24412032961845398, 0.3212319612503052, 0.39834359288215637, 0.47545522451400757, 0.5525668859481812, 0.62967848777771, 0.7067900896072388, 0.7839017510414124, 0.8610134124755859, 0.9381250143051147, 1.0152366161346436, 1.092348337173462, 1.1694599390029907, 1.2465715408325195, 1.3236831426620483, 1.4007947444915771, 1.4779064655303955, 1.5550180673599243, 1.6321296691894531, 1.7092413902282715, 1.7863529920578003, 1.863464593887329, 1.940576195716858, 2.0176877975463867, 2.094799518585205, 2.1719112396240234, 2.2490227222442627, 2.326134443283081, 2.4032459259033203, 2.4803576469421387]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 7.0, 6.0, 14.0, 9.0, 14.0, 25.0, 41.0, 57.0, 71.0, 101.0, 184.0, 252.0, 431.0, 767.0, 1373.0, 3024.0, 9445.0, 86877.0, 4049244.0, 31639.0, 5679.0, 2233.0, 1121.0, 603.0, 352.0, 234.0, 157.0, 99.0, 56.0, 51.0, 38.0, 28.0, 20.0, 8.0, 9.0, 5.0, 6.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.55078125, -0.5306243896484375, -0.510467529296875, -0.4903106689453125, -0.47015380859375, -0.4499969482421875, -0.429840087890625, -0.4096832275390625, -0.3895263671875, -0.3693695068359375, -0.349212646484375, -0.3290557861328125, -0.30889892578125, -0.2887420654296875, -0.268585205078125, -0.2484283447265625, -0.228271484375, -0.2081146240234375, -0.187957763671875, -0.1678009033203125, -0.14764404296875, -0.1274871826171875, -0.107330322265625, -0.0871734619140625, -0.0670166015625, -0.0468597412109375, -0.026702880859375, -0.0065460205078125, 0.01361083984375, 0.0337677001953125, 0.053924560546875, 0.0740814208984375, 0.09423828125, 0.1143951416015625, 0.134552001953125, 0.1547088623046875, 0.17486572265625, 0.1950225830078125, 0.215179443359375, 0.2353363037109375, 0.2554931640625, 0.2756500244140625, 0.295806884765625, 0.3159637451171875, 0.33612060546875, 0.3562774658203125, 0.376434326171875, 0.3965911865234375, 0.416748046875, 0.4369049072265625, 0.457061767578125, 0.4772186279296875, 0.49737548828125, 0.5175323486328125, 0.537689208984375, 0.5578460693359375, 0.5780029296875, 0.5981597900390625, 0.618316650390625, 0.6384735107421875, 0.65863037109375, 0.6787872314453125, 0.698944091796875, 0.7191009521484375, 0.7392578125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 7.0, 8.0, 11.0, 11.0, 12.0, 20.0, 14.0, 31.0, 25.0, 42.0, 39.0, 46.0, 59.0, 59.0, 44.0, 76.0, 63.0, 57.0, 55.0, 55.0, 38.0, 30.0, 35.0, 35.0, 29.0, 18.0, 18.0, 15.0, 4.0, 8.0, 6.0, 5.0, 4.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.12139892578125, -0.1176919937133789, -0.11398506164550781, -0.11027812957763672, -0.10657119750976562, -0.10286426544189453, -0.09915733337402344, -0.09545040130615234, -0.09174346923828125, -0.08803653717041016, -0.08432960510253906, -0.08062267303466797, -0.07691574096679688, -0.07320880889892578, -0.06950187683105469, -0.0657949447631836, -0.0620880126953125, -0.058381080627441406, -0.05467414855957031, -0.05096721649169922, -0.047260284423828125, -0.04355335235595703, -0.03984642028808594, -0.036139488220214844, -0.03243255615234375, -0.028725624084472656, -0.025018692016601562, -0.02131175994873047, -0.017604827880859375, -0.013897895812988281, -0.010190963745117188, -0.006484031677246094, -0.002777099609375, 0.0009298324584960938, 0.0046367645263671875, 0.008343696594238281, 0.012050628662109375, 0.01575756072998047, 0.019464492797851562, 0.023171424865722656, 0.02687835693359375, 0.030585289001464844, 0.03429222106933594, 0.03799915313720703, 0.041706085205078125, 0.04541301727294922, 0.04911994934082031, 0.052826881408691406, 0.0565338134765625, 0.060240745544433594, 0.06394767761230469, 0.06765460968017578, 0.07136154174804688, 0.07506847381591797, 0.07877540588378906, 0.08248233795166016, 0.08618927001953125, 0.08989620208740234, 0.09360313415527344, 0.09731006622314453, 0.10101699829101562, 0.10472393035888672, 0.10843086242675781, 0.1121377944946289, 0.1158447265625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 7.0, 4.0, 7.0, 5.0, 14.0, 16.0, 15.0, 25.0, 29.0, 58.0, 60.0, 109.0, 152.0, 315.0, 787.0, 1812.0, 5877.0, 31559.0, 3989293.0, 146385.0, 12272.0, 3239.0, 1151.0, 458.0, 209.0, 133.0, 76.0, 58.0, 29.0, 26.0, 17.0, 24.0, 14.0, 10.0, 16.0, 10.0, 5.0, 2.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.84765625, -0.82177734375, -0.7958984375, -0.77001953125, -0.744140625, -0.71826171875, -0.6923828125, -0.66650390625, -0.640625, -0.61474609375, -0.5888671875, -0.56298828125, -0.537109375, -0.51123046875, -0.4853515625, -0.45947265625, -0.43359375, -0.40771484375, -0.3818359375, -0.35595703125, -0.330078125, -0.30419921875, -0.2783203125, -0.25244140625, -0.2265625, -0.20068359375, -0.1748046875, -0.14892578125, -0.123046875, -0.09716796875, -0.0712890625, -0.04541015625, -0.01953125, 0.00634765625, 0.0322265625, 0.05810546875, 0.083984375, 0.10986328125, 0.1357421875, 0.16162109375, 0.1875, 0.21337890625, 0.2392578125, 0.26513671875, 0.291015625, 0.31689453125, 0.3427734375, 0.36865234375, 0.39453125, 0.42041015625, 0.4462890625, 0.47216796875, 0.498046875, 0.52392578125, 0.5498046875, 0.57568359375, 0.6015625, 0.62744140625, 0.6533203125, 0.67919921875, 0.705078125, 0.73095703125, 0.7568359375, 0.78271484375, 0.80859375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 2.0, 6.0, 14.0, 16.0, 37.0, 76.0, 300.0, 3226.0, 242.0, 73.0, 31.0, 20.0, 10.0, 8.0, 7.0, 3.0, 2.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.221923828125, -0.211578369140625, -0.20123291015625, -0.190887451171875, -0.1805419921875, -0.170196533203125, -0.15985107421875, -0.149505615234375, -0.13916015625, -0.128814697265625, -0.11846923828125, -0.108123779296875, -0.0977783203125, -0.087432861328125, -0.07708740234375, -0.066741943359375, -0.056396484375, -0.046051025390625, -0.03570556640625, -0.025360107421875, -0.0150146484375, -0.004669189453125, 0.00567626953125, 0.016021728515625, 0.0263671875, 0.036712646484375, 0.04705810546875, 0.057403564453125, 0.0677490234375, 0.078094482421875, 0.08843994140625, 0.098785400390625, 0.109130859375, 0.119476318359375, 0.12982177734375, 0.140167236328125, 0.1505126953125, 0.160858154296875, 0.17120361328125, 0.181549072265625, 0.19189453125, 0.202239990234375, 0.21258544921875, 0.222930908203125, 0.2332763671875, 0.243621826171875, 0.25396728515625, 0.264312744140625, 0.274658203125, 0.285003662109375, 0.29534912109375, 0.305694580078125, 0.3160400390625, 0.326385498046875, 0.33673095703125, 0.347076416015625, 0.357421875, 0.367767333984375, 0.37811279296875, 0.388458251953125, 0.3988037109375, 0.409149169921875, 0.41949462890625, 0.429840087890625, 0.440185546875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 6.0, 2.0, 5.0, 1.0, 6.0, 11.0, 19.0, 37.0, 46.0, 81.0, 117.0, 125.0, 126.0, 120.0, 89.0, 71.0, 44.0, 37.0, 20.0, 8.0, 8.0, 5.0, 4.0, 6.0, 2.0, 4.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.697595477104187, -0.6671168804168701, -0.636638343334198, -0.6061597466468811, -0.575681209564209, -0.5452026128768921, -0.51472407579422, -0.4842454791069031, -0.45376694202423096, -0.42328837513923645, -0.39280980825424194, -0.36233124136924744, -0.33185267448425293, -0.30137407779693604, -0.2708955407142639, -0.24041695892810822, -0.20993837714195251, -0.179459810256958, -0.1489812433719635, -0.1185026690363884, -0.08802410215139389, -0.05754552781581879, -0.02706696093082428, 0.003411605954170227, 0.033890172839164734, 0.06436873972415924, 0.09484730660915375, 0.12532588839530945, 0.15580445528030396, 0.18628302216529846, 0.21676158905029297, 0.24724015593528748, 0.277718722820282, 0.3081972897052765, 0.338675856590271, 0.3691544234752655, 0.39963299036026, 0.4301115870475769, 0.460590124130249, 0.4910687208175659, 0.521547257900238, 0.5520258545875549, 0.582504391670227, 0.612982988357544, 0.6434615254402161, 0.673940122127533, 0.7044186592102051, 0.734897255897522, 0.7653758525848389, 0.7958544492721558, 0.8263329863548279, 0.8568115830421448, 0.8872901201248169, 0.9177687168121338, 0.9482472538948059, 0.9787258505821228, 1.009204387664795, 1.0396829843521118, 1.0701615810394287, 1.100640058517456, 1.131118655204773, 1.1615972518920898, 1.1920758485794067, 1.222554326057434, 1.253032922744751]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 7.0, 7.0, 6.0, 10.0, 16.0, 14.0, 18.0, 18.0, 17.0, 25.0, 24.0, 27.0, 33.0, 25.0, 31.0, 51.0, 43.0, 50.0, 40.0, 47.0, 40.0, 44.0, 50.0, 35.0, 49.0, 39.0, 36.0, 41.0, 24.0, 28.0, 20.0, 13.0, 20.0, 5.0, 14.0, 10.0, 6.0, 7.0, 5.0, 4.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.4916629195213318, -0.47459128499031067, -0.45751968026161194, -0.4404480457305908, -0.4233764410018921, -0.40630480647087097, -0.38923317193984985, -0.3721615672111511, -0.3550899624824524, -0.3380183279514313, -0.32094672322273254, -0.3038750886917114, -0.2868034839630127, -0.2697318494319916, -0.25266021490097046, -0.23558861017227173, -0.2185169756412506, -0.20144535601139069, -0.18437373638153076, -0.16730210185050964, -0.1502304971218109, -0.1331588625907898, -0.11608724296092987, -0.09901562333106995, -0.08194400370121002, -0.0648723840713501, -0.047800760716199875, -0.030729137361049652, -0.013657517731189728, 0.0034141018986701965, 0.020485728979110718, 0.03755734860897064, 0.054628968238830566, 0.07170058786869049, 0.08877220749855042, 0.10584383457899094, 0.12291545420885086, 0.13998708128929138, 0.1570587009191513, 0.17413032054901123, 0.19120194017887115, 0.20827355980873108, 0.225345179438591, 0.24241679906845093, 0.25948843359947205, 0.2765600383281708, 0.2936316728591919, 0.3107032775878906, 0.32777491211891174, 0.34484654664993286, 0.3619181513786316, 0.3789897859096527, 0.39606139063835144, 0.41313302516937256, 0.4302046298980713, 0.4472762644290924, 0.4643478989601135, 0.48141953349113464, 0.4984911382198334, 0.5155627727508545, 0.5326343774795532, 0.549705982208252, 0.5667776465415955, 0.5838492512702942, 0.6009208559989929]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 14.0, 15.0, 23.0, 17.0, 43.0, 51.0, 89.0, 149.0, 227.0, 501.0, 945.0, 1804.0, 3877.0, 9184.0, 23220.0, 66424.0, 222738.0, 491103.0, 149491.0, 48064.0, 17604.0, 6929.0, 2956.0, 1390.0, 717.0, 398.0, 208.0, 135.0, 80.0, 57.0, 32.0, 21.0, 17.0, 7.0, 7.0, 3.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.402099609375, -0.3900413513183594, -0.37798309326171875, -0.3659248352050781, -0.3538665771484375, -0.3418083190917969, -0.32975006103515625, -0.3176918029785156, -0.305633544921875, -0.2935752868652344, -0.28151702880859375, -0.2694587707519531, -0.2574005126953125, -0.24534225463867188, -0.23328399658203125, -0.22122573852539062, -0.20916748046875, -0.19710922241210938, -0.18505096435546875, -0.17299270629882812, -0.1609344482421875, -0.14887619018554688, -0.13681793212890625, -0.12475967407226562, -0.112701416015625, -0.10064315795898438, -0.08858489990234375, -0.07652664184570312, -0.0644683837890625, -0.052410125732421875, -0.04035186767578125, -0.028293609619140625, -0.0162353515625, -0.004177093505859375, 0.00788116455078125, 0.019939422607421875, 0.0319976806640625, 0.044055938720703125, 0.05611419677734375, 0.06817245483398438, 0.080230712890625, 0.09228897094726562, 0.10434722900390625, 0.11640548706054688, 0.1284637451171875, 0.14052200317382812, 0.15258026123046875, 0.16463851928710938, 0.17669677734375, 0.18875503540039062, 0.20081329345703125, 0.21287155151367188, 0.2249298095703125, 0.23698806762695312, 0.24904632568359375, 0.2611045837402344, 0.273162841796875, 0.2852210998535156, 0.29727935791015625, 0.3093376159667969, 0.3213958740234375, 0.3334541320800781, 0.34551239013671875, 0.3575706481933594, 0.36962890625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 4.0, 2.0, 4.0, 4.0, 8.0, 10.0, 7.0, 19.0, 28.0, 26.0, 40.0, 39.0, 49.0, 51.0, 59.0, 70.0, 62.0, 69.0, 49.0, 68.0, 50.0, 59.0, 50.0, 43.0, 25.0, 37.0, 25.0, 14.0, 12.0, 9.0, 2.0, 5.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1591796875, -0.15453720092773438, -0.14989471435546875, -0.14525222778320312, -0.1406097412109375, -0.13596725463867188, -0.13132476806640625, -0.12668228149414062, -0.122039794921875, -0.11739730834960938, -0.11275482177734375, -0.10811233520507812, -0.1034698486328125, -0.09882736206054688, -0.09418487548828125, -0.08954238891601562, -0.08489990234375, -0.08025741577148438, -0.07561492919921875, -0.07097244262695312, -0.0663299560546875, -0.061687469482421875, -0.05704498291015625, -0.052402496337890625, -0.047760009765625, -0.043117523193359375, -0.03847503662109375, -0.033832550048828125, -0.0291900634765625, -0.024547576904296875, -0.01990509033203125, -0.015262603759765625, -0.0106201171875, -0.005977630615234375, -0.00133514404296875, 0.003307342529296875, 0.0079498291015625, 0.012592315673828125, 0.01723480224609375, 0.021877288818359375, 0.026519775390625, 0.031162261962890625, 0.03580474853515625, 0.040447235107421875, 0.0450897216796875, 0.049732208251953125, 0.05437469482421875, 0.059017181396484375, 0.06365966796875, 0.06830215454101562, 0.07294464111328125, 0.07758712768554688, 0.0822296142578125, 0.08687210083007812, 0.09151458740234375, 0.09615707397460938, 0.100799560546875, 0.10544204711914062, 0.11008453369140625, 0.11472702026367188, 0.1193695068359375, 0.12401199340820312, 0.12865447998046875, 0.13329696655273438, 0.137939453125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 1.0, 5.0, 4.0, 6.0, 11.0, 14.0, 14.0, 19.0, 29.0, 34.0, 41.0, 60.0, 98.0, 134.0, 187.0, 279.0, 443.0, 726.0, 1375.0, 3099.0, 8168.0, 32572.0, 233002.0, 664593.0, 78964.0, 15060.0, 4823.0, 2052.0, 1084.0, 568.0, 336.0, 219.0, 145.0, 128.0, 66.0, 38.0, 39.0, 31.0, 30.0, 16.0, 10.0, 10.0, 7.0, 7.0, 5.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.49609375, -0.48021697998046875, -0.4643402099609375, -0.44846343994140625, -0.432586669921875, -0.41670989990234375, -0.4008331298828125, -0.38495635986328125, -0.36907958984375, -0.35320281982421875, -0.3373260498046875, -0.32144927978515625, -0.305572509765625, -0.28969573974609375, -0.2738189697265625, -0.25794219970703125, -0.2420654296875, -0.22618865966796875, -0.2103118896484375, -0.19443511962890625, -0.178558349609375, -0.16268157958984375, -0.1468048095703125, -0.13092803955078125, -0.11505126953125, -0.09917449951171875, -0.0832977294921875, -0.06742095947265625, -0.051544189453125, -0.03566741943359375, -0.0197906494140625, -0.00391387939453125, 0.011962890625, 0.02783966064453125, 0.0437164306640625, 0.05959320068359375, 0.075469970703125, 0.09134674072265625, 0.1072235107421875, 0.12310028076171875, 0.13897705078125, 0.15485382080078125, 0.1707305908203125, 0.18660736083984375, 0.202484130859375, 0.21836090087890625, 0.2342376708984375, 0.25011444091796875, 0.2659912109375, 0.28186798095703125, 0.2977447509765625, 0.31362152099609375, 0.329498291015625, 0.34537506103515625, 0.3612518310546875, 0.37712860107421875, 0.39300537109375, 0.40888214111328125, 0.4247589111328125, 0.44063568115234375, 0.456512451171875, 0.47238922119140625, 0.4882659912109375, 0.5041427612304688, 0.52001953125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 2.0, 4.0, 3.0, 3.0, 7.0, 8.0, 12.0, 19.0, 13.0, 14.0, 23.0, 26.0, 21.0, 31.0, 36.0, 33.0, 36.0, 37.0, 45.0, 45.0, 45.0, 32.0, 58.0, 46.0, 54.0, 41.0, 44.0, 39.0, 35.0, 34.0, 31.0, 23.0, 15.0, 16.0, 21.0, 17.0, 7.0, 7.0, 7.0, 4.0, 2.0, 1.0, 3.0, 1.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.417236328125, -0.4026679992675781, -0.38809967041015625, -0.3735313415527344, -0.3589630126953125, -0.3443946838378906, -0.32982635498046875, -0.3152580261230469, -0.300689697265625, -0.2861213684082031, -0.27155303955078125, -0.2569847106933594, -0.2424163818359375, -0.22784805297851562, -0.21327972412109375, -0.19871139526367188, -0.18414306640625, -0.16957473754882812, -0.15500640869140625, -0.14043807983398438, -0.1258697509765625, -0.11130142211914062, -0.09673309326171875, -0.08216476440429688, -0.067596435546875, -0.053028106689453125, -0.03845977783203125, -0.023891448974609375, -0.0093231201171875, 0.005245208740234375, 0.01981353759765625, 0.034381866455078125, 0.0489501953125, 0.06351852416992188, 0.07808685302734375, 0.09265518188476562, 0.1072235107421875, 0.12179183959960938, 0.13636016845703125, 0.15092849731445312, 0.165496826171875, 0.18006515502929688, 0.19463348388671875, 0.20920181274414062, 0.2237701416015625, 0.23833847045898438, 0.25290679931640625, 0.2674751281738281, 0.28204345703125, 0.2966117858886719, 0.31118011474609375, 0.3257484436035156, 0.3403167724609375, 0.3548851013183594, 0.36945343017578125, 0.3840217590332031, 0.398590087890625, 0.4131584167480469, 0.42772674560546875, 0.4422950744628906, 0.4568634033203125, 0.4714317321777344, 0.48600006103515625, 0.5005683898925781, 0.51513671875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 4.0, 1.0, 1.0, 7.0, 6.0, 6.0, 12.0, 15.0, 38.0, 33.0, 63.0, 82.0, 178.0, 227.0, 416.0, 711.0, 1356.0, 2720.0, 6079.0, 15425.0, 47276.0, 186007.0, 575247.0, 149132.0, 39237.0, 13547.0, 5360.0, 2463.0, 1257.0, 668.0, 337.0, 232.0, 127.0, 90.0, 63.0, 44.0, 28.0, 18.0, 11.0, 11.0, 7.0, 4.0, 5.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0], "bins": [-0.167236328125, -0.16251564025878906, -0.15779495239257812, -0.1530742645263672, -0.14835357666015625, -0.1436328887939453, -0.13891220092773438, -0.13419151306152344, -0.1294708251953125, -0.12475013732910156, -0.12002944946289062, -0.11530876159667969, -0.11058807373046875, -0.10586738586425781, -0.10114669799804688, -0.09642601013183594, -0.091705322265625, -0.08698463439941406, -0.08226394653320312, -0.07754325866699219, -0.07282257080078125, -0.06810188293457031, -0.06338119506835938, -0.05866050720214844, -0.0539398193359375, -0.04921913146972656, -0.044498443603515625, -0.03977775573730469, -0.03505706787109375, -0.030336380004882812, -0.025615692138671875, -0.020895004272460938, -0.01617431640625, -0.011453628540039062, -0.006732940673828125, -0.0020122528076171875, 0.00270843505859375, 0.0074291229248046875, 0.012149810791015625, 0.016870498657226562, 0.0215911865234375, 0.026311874389648438, 0.031032562255859375, 0.03575325012207031, 0.04047393798828125, 0.04519462585449219, 0.049915313720703125, 0.05463600158691406, 0.059356689453125, 0.06407737731933594, 0.06879806518554688, 0.07351875305175781, 0.07823944091796875, 0.08296012878417969, 0.08768081665039062, 0.09240150451660156, 0.0971221923828125, 0.10184288024902344, 0.10656356811523438, 0.11128425598144531, 0.11600494384765625, 0.12072563171386719, 0.12544631958007812, 0.13016700744628906, 0.1348876953125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 4.0, 4.0, 4.0, 5.0, 8.0, 6.0, 6.0, 8.0, 16.0, 14.0, 22.0, 15.0, 37.0, 25.0, 33.0, 33.0, 55.0, 74.0, 78.0, 87.0, 88.0, 70.0, 62.0, 40.0, 41.0, 32.0, 22.0, 23.0, 20.0, 13.0, 13.0, 9.0, 10.0, 10.0, 6.0, 2.0, 6.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.2988529205322266e-05, -5.093030631542206e-05, -4.887208342552185e-05, -4.681386053562164e-05, -4.4755637645721436e-05, -4.269741475582123e-05, -4.063919186592102e-05, -3.858096897602081e-05, -3.6522746086120605e-05, -3.44645231962204e-05, -3.240630030632019e-05, -3.0348077416419983e-05, -2.8289854526519775e-05, -2.6231631636619568e-05, -2.417340874671936e-05, -2.2115185856819153e-05, -2.0056962966918945e-05, -1.7998740077018738e-05, -1.594051718711853e-05, -1.3882294297218323e-05, -1.1824071407318115e-05, -9.765848517417908e-06, -7.7076256275177e-06, -5.649402737617493e-06, -3.591179847717285e-06, -1.5329569578170776e-06, 5.252659320831299e-07, 2.5834888219833374e-06, 4.641711711883545e-06, 6.6999346017837524e-06, 8.75815749168396e-06, 1.0816380381584167e-05, 1.2874603271484375e-05, 1.4932826161384583e-05, 1.699104905128479e-05, 1.9049271941184998e-05, 2.1107494831085205e-05, 2.3165717720985413e-05, 2.522394061088562e-05, 2.7282163500785828e-05, 2.9340386390686035e-05, 3.139860928058624e-05, 3.345683217048645e-05, 3.551505506038666e-05, 3.7573277950286865e-05, 3.963150084018707e-05, 4.168972373008728e-05, 4.374794661998749e-05, 4.5806169509887695e-05, 4.78643923997879e-05, 4.992261528968811e-05, 5.198083817958832e-05, 5.4039061069488525e-05, 5.609728395938873e-05, 5.815550684928894e-05, 6.021372973918915e-05, 6.227195262908936e-05, 6.433017551898956e-05, 6.638839840888977e-05, 6.844662129878998e-05, 7.050484418869019e-05, 7.256306707859039e-05, 7.46212899684906e-05, 7.667951285839081e-05, 7.873773574829102e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 3.0, 7.0, 6.0, 8.0, 7.0, 15.0, 33.0, 30.0, 37.0, 88.0, 107.0, 179.0, 296.0, 565.0, 1094.0, 2485.0, 7014.0, 28299.0, 192673.0, 670614.0, 116347.0, 19308.0, 5244.0, 1992.0, 902.0, 465.0, 278.0, 163.0, 105.0, 64.0, 44.0, 27.0, 23.0, 8.0, 10.0, 7.0, 2.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2159423828125, -0.20966148376464844, -0.20338058471679688, -0.1970996856689453, -0.19081878662109375, -0.1845378875732422, -0.17825698852539062, -0.17197608947753906, -0.1656951904296875, -0.15941429138183594, -0.15313339233398438, -0.1468524932861328, -0.14057159423828125, -0.1342906951904297, -0.12800979614257812, -0.12172889709472656, -0.115447998046875, -0.10916709899902344, -0.10288619995117188, -0.09660530090332031, -0.09032440185546875, -0.08404350280761719, -0.07776260375976562, -0.07148170471191406, -0.0652008056640625, -0.05891990661621094, -0.052639007568359375, -0.04635810852050781, -0.04007720947265625, -0.03379631042480469, -0.027515411376953125, -0.021234512329101562, -0.01495361328125, -0.008672714233398438, -0.002391815185546875, 0.0038890838623046875, 0.01016998291015625, 0.016450881958007812, 0.022731781005859375, 0.029012680053710938, 0.0352935791015625, 0.04157447814941406, 0.047855377197265625, 0.05413627624511719, 0.06041717529296875, 0.06669807434082031, 0.07297897338867188, 0.07925987243652344, 0.085540771484375, 0.09182167053222656, 0.09810256958007812, 0.10438346862792969, 0.11066436767578125, 0.11694526672363281, 0.12322616577148438, 0.12950706481933594, 0.1357879638671875, 0.14206886291503906, 0.14834976196289062, 0.1546306610107422, 0.16091156005859375, 0.1671924591064453, 0.17347335815429688, 0.17975425720214844, 0.18603515625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 6.0, 1.0, 12.0, 12.0, 17.0, 17.0, 8.0, 28.0, 22.0, 39.0, 44.0, 50.0, 62.0, 104.0, 114.0, 94.0, 74.0, 69.0, 48.0, 40.0, 31.0, 19.0, 21.0, 21.0, 14.0, 8.0, 8.0, 4.0, 7.0, 3.0, 2.0, 6.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.22900390625, -0.22325706481933594, -0.21751022338867188, -0.2117633819580078, -0.20601654052734375, -0.2002696990966797, -0.19452285766601562, -0.18877601623535156, -0.1830291748046875, -0.17728233337402344, -0.17153549194335938, -0.1657886505126953, -0.16004180908203125, -0.1542949676513672, -0.14854812622070312, -0.14280128479003906, -0.137054443359375, -0.13130760192871094, -0.12556076049804688, -0.11981391906738281, -0.11406707763671875, -0.10832023620605469, -0.10257339477539062, -0.09682655334472656, -0.0910797119140625, -0.08533287048339844, -0.07958602905273438, -0.07383918762207031, -0.06809234619140625, -0.06234550476074219, -0.056598663330078125, -0.05085182189941406, -0.04510498046875, -0.03935813903808594, -0.033611297607421875, -0.027864456176757812, -0.02211761474609375, -0.016370773315429688, -0.010623931884765625, -0.0048770904541015625, 0.0008697509765625, 0.0066165924072265625, 0.012363433837890625, 0.018110275268554688, 0.02385711669921875, 0.029603958129882812, 0.035350799560546875, 0.04109764099121094, 0.046844482421875, 0.05259132385253906, 0.058338165283203125, 0.06408500671386719, 0.06983184814453125, 0.07557868957519531, 0.08132553100585938, 0.08707237243652344, 0.0928192138671875, 0.09856605529785156, 0.10431289672851562, 0.11005973815917969, 0.11580657958984375, 0.12155342102050781, 0.12730026245117188, 0.13304710388183594, 0.1387939453125]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 6.0, 18.0, 23.0, 48.0, 77.0, 136.0, 194.0, 205.0, 145.0, 65.0, 41.0, 27.0, 8.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.366976737976074, -4.2116475105285645, -4.056318283081055, -3.900989294052124, -3.7456603050231934, -3.5903310775756836, -3.435001850128174, -3.279672861099243, -3.1243438720703125, -2.9690146446228027, -2.813685655593872, -2.6583564281463623, -2.5030274391174316, -2.347698211669922, -2.192368984222412, -2.0370399951934814, -1.8817107677459717, -1.7263816595077515, -1.5710525512695312, -1.4157233238220215, -1.2603943347930908, -1.105065107345581, -0.9497359991073608, -0.7944068908691406, -0.6390777826309204, -0.4837486743927002, -0.3284195363521576, -0.173090398311615, -0.017761290073394775, 0.13756781816482544, 0.29289698600769043, 0.44822609424591064, 0.6035552024841309, 0.7588843107223511, 0.9142134189605713, 1.069542646408081, 1.2248716354370117, 1.3802008628845215, 1.5355299711227417, 1.690859079360962, 1.8461881875991821, 2.0015172958374023, 2.156846523284912, 2.3121755123138428, 2.4675047397613525, 2.622833728790283, 2.778162956237793, 2.9334921836853027, 3.0888211727142334, 3.244150400161743, 3.399479389190674, 3.5548086166381836, 3.7101376056671143, 3.865466833114624, 4.020795822143555, 4.1761250495910645, 4.331454277038574, 4.486783504486084, 4.642112731933594, 4.797441482543945, 4.952770709991455, 5.108099937438965, 5.263429164886475, 5.418758392333984, 5.574087142944336]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 4.0, 5.0, 6.0, 11.0, 4.0, 2.0, 17.0, 15.0, 18.0, 26.0, 15.0, 13.0, 28.0, 27.0, 31.0, 38.0, 47.0, 42.0, 56.0, 46.0, 49.0, 48.0, 50.0, 47.0, 41.0, 34.0, 41.0, 36.0, 27.0, 31.0, 22.0, 18.0, 28.0, 26.0, 13.0, 12.0, 5.0, 4.0, 1.0, 7.0, 7.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.0970375537872314, -2.0320422649383545, -1.9670469760894775, -1.9020518064498901, -1.8370565176010132, -1.7720612287521362, -1.7070660591125488, -1.6420707702636719, -1.577075481414795, -1.512080192565918, -1.447084903717041, -1.3820897340774536, -1.3170944452285767, -1.2520991563796997, -1.1871039867401123, -1.1221086978912354, -1.0571134090423584, -0.9921181201934814, -0.9271228909492493, -0.8621276617050171, -0.7971323728561401, -0.7321370840072632, -0.667141854763031, -0.6021466255187988, -0.5371513366699219, -0.4721560776233673, -0.40716081857681274, -0.3421655595302582, -0.2771703004837036, -0.21217504143714905, -0.14717978239059448, -0.08218452334403992, -0.017189502716064453, 0.04780575633049011, 0.11280101537704468, 0.17779627442359924, 0.2427915334701538, 0.3077867925167084, 0.37278205156326294, 0.4377773106098175, 0.5027725696563721, 0.567767858505249, 0.6327630877494812, 0.6977583169937134, 0.7627536058425903, 0.8277488946914673, 0.8927441239356995, 0.9577393531799316, 1.0227346420288086, 1.0877299308776855, 1.1527252197265625, 1.21772038936615, 1.2827156782150269, 1.3477109670639038, 1.4127061367034912, 1.4777014255523682, 1.5426967144012451, 1.607692003250122, 1.672687292098999, 1.7376824617385864, 1.8026777505874634, 1.8676730394363403, 1.9326682090759277, 1.9976634979248047, 2.0626587867736816]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 3.0, 4.0, 5.0, 8.0, 12.0, 12.0, 30.0, 35.0, 48.0, 75.0, 131.0, 188.0, 286.0, 440.0, 732.0, 1249.0, 2080.0, 3813.0, 6995.0, 14310.0, 33195.0, 103630.0, 728891.0, 2868122.0, 314960.0, 66314.0, 24357.0, 11207.0, 5617.0, 3001.0, 1757.0, 1069.0, 638.0, 368.0, 233.0, 163.0, 98.0, 64.0, 51.0, 31.0, 18.0, 14.0, 13.0, 10.0, 7.0, 3.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.247802734375, -0.2405834197998047, -0.23336410522460938, -0.22614479064941406, -0.21892547607421875, -0.21170616149902344, -0.20448684692382812, -0.1972675323486328, -0.1900482177734375, -0.1828289031982422, -0.17560958862304688, -0.16839027404785156, -0.16117095947265625, -0.15395164489746094, -0.14673233032226562, -0.1395130157470703, -0.132293701171875, -0.1250743865966797, -0.11785507202148438, -0.11063575744628906, -0.10341644287109375, -0.09619712829589844, -0.08897781372070312, -0.08175849914550781, -0.0745391845703125, -0.06731986999511719, -0.060100555419921875, -0.05288124084472656, -0.04566192626953125, -0.03844261169433594, -0.031223297119140625, -0.024003982543945312, -0.01678466796875, -0.009565353393554688, -0.002346038818359375, 0.0048732757568359375, 0.01209259033203125, 0.019311904907226562, 0.026531219482421875, 0.03375053405761719, 0.0409698486328125, 0.04818916320800781, 0.055408477783203125, 0.06262779235839844, 0.06984710693359375, 0.07706642150878906, 0.08428573608398438, 0.09150505065917969, 0.098724365234375, 0.10594367980957031, 0.11316299438476562, 0.12038230895996094, 0.12760162353515625, 0.13482093811035156, 0.14204025268554688, 0.1492595672607422, 0.1564788818359375, 0.1636981964111328, 0.17091751098632812, 0.17813682556152344, 0.18535614013671875, 0.19257545471191406, 0.19979476928710938, 0.2070140838623047, 0.2142333984375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 7.0, 7.0, 14.0, 10.0, 20.0, 15.0, 25.0, 27.0, 34.0, 38.0, 35.0, 42.0, 53.0, 58.0, 58.0, 66.0, 74.0, 55.0, 48.0, 43.0, 35.0, 34.0, 32.0, 35.0, 24.0, 25.0, 18.0, 13.0, 12.0, 20.0, 7.0, 12.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1358642578125, -0.1319723129272461, -0.1280803680419922, -0.12418842315673828, -0.12029647827148438, -0.11640453338623047, -0.11251258850097656, -0.10862064361572266, -0.10472869873046875, -0.10083675384521484, -0.09694480895996094, -0.09305286407470703, -0.08916091918945312, -0.08526897430419922, -0.08137702941894531, -0.0774850845336914, -0.0735931396484375, -0.0697011947631836, -0.06580924987792969, -0.06191730499267578, -0.058025360107421875, -0.05413341522216797, -0.05024147033691406, -0.046349525451660156, -0.04245758056640625, -0.038565635681152344, -0.03467369079589844, -0.03078174591064453, -0.026889801025390625, -0.02299785614013672, -0.019105911254882812, -0.015213966369628906, -0.011322021484375, -0.007430076599121094, -0.0035381317138671875, 0.00035381317138671875, 0.004245758056640625, 0.008137702941894531, 0.012029647827148438, 0.015921592712402344, 0.01981353759765625, 0.023705482482910156, 0.027597427368164062, 0.03148937225341797, 0.035381317138671875, 0.03927326202392578, 0.04316520690917969, 0.047057151794433594, 0.0509490966796875, 0.054841041564941406, 0.05873298645019531, 0.06262493133544922, 0.06651687622070312, 0.07040882110595703, 0.07430076599121094, 0.07819271087646484, 0.08208465576171875, 0.08597660064697266, 0.08986854553222656, 0.09376049041748047, 0.09765243530273438, 0.10154438018798828, 0.10543632507324219, 0.1093282699584961, 0.11322021484375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 5.0, 6.0, 10.0, 13.0, 13.0, 31.0, 21.0, 32.0, 53.0, 100.0, 139.0, 223.0, 386.0, 728.0, 1323.0, 2892.0, 6552.0, 16991.0, 54295.0, 275017.0, 3253108.0, 470963.0, 73916.0, 22064.0, 8137.0, 3523.0, 1692.0, 850.0, 445.0, 297.0, 153.0, 94.0, 76.0, 39.0, 35.0, 21.0, 9.0, 11.0, 4.0, 5.0, 2.0, 6.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.344482421875, -0.33322906494140625, -0.3219757080078125, -0.31072235107421875, -0.299468994140625, -0.28821563720703125, -0.2769622802734375, -0.26570892333984375, -0.25445556640625, -0.24320220947265625, -0.2319488525390625, -0.22069549560546875, -0.209442138671875, -0.19818878173828125, -0.1869354248046875, -0.17568206787109375, -0.1644287109375, -0.15317535400390625, -0.1419219970703125, -0.13066864013671875, -0.119415283203125, -0.10816192626953125, -0.0969085693359375, -0.08565521240234375, -0.07440185546875, -0.06314849853515625, -0.0518951416015625, -0.04064178466796875, -0.029388427734375, -0.01813507080078125, -0.0068817138671875, 0.00437164306640625, 0.015625, 0.02687835693359375, 0.0381317138671875, 0.04938507080078125, 0.060638427734375, 0.07189178466796875, 0.0831451416015625, 0.09439849853515625, 0.10565185546875, 0.11690521240234375, 0.1281585693359375, 0.13941192626953125, 0.150665283203125, 0.16191864013671875, 0.1731719970703125, 0.18442535400390625, 0.1956787109375, 0.20693206787109375, 0.2181854248046875, 0.22943878173828125, 0.240692138671875, 0.25194549560546875, 0.2631988525390625, 0.27445220947265625, 0.28570556640625, 0.29695892333984375, 0.3082122802734375, 0.31946563720703125, 0.330718994140625, 0.34197235107421875, 0.3532257080078125, 0.36447906494140625, 0.375732421875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 3.0, 6.0, 5.0, 4.0, 7.0, 16.0, 12.0, 19.0, 18.0, 33.0, 56.0, 75.0, 97.0, 186.0, 308.0, 700.0, 1088.0, 638.0, 286.0, 161.0, 84.0, 63.0, 54.0, 43.0, 19.0, 23.0, 13.0, 10.0, 8.0, 13.0, 5.0, 6.0, 7.0, 5.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.41357421875, -0.40081024169921875, -0.3880462646484375, -0.37528228759765625, -0.362518310546875, -0.34975433349609375, -0.3369903564453125, -0.32422637939453125, -0.31146240234375, -0.29869842529296875, -0.2859344482421875, -0.27317047119140625, -0.260406494140625, -0.24764251708984375, -0.2348785400390625, -0.22211456298828125, -0.2093505859375, -0.19658660888671875, -0.1838226318359375, -0.17105865478515625, -0.158294677734375, -0.14553070068359375, -0.1327667236328125, -0.12000274658203125, -0.10723876953125, -0.09447479248046875, -0.0817108154296875, -0.06894683837890625, -0.056182861328125, -0.04341888427734375, -0.0306549072265625, -0.01789093017578125, -0.005126953125, 0.00763702392578125, 0.0204010009765625, 0.03316497802734375, 0.045928955078125, 0.05869293212890625, 0.0714569091796875, 0.08422088623046875, 0.09698486328125, 0.10974884033203125, 0.1225128173828125, 0.13527679443359375, 0.148040771484375, 0.16080474853515625, 0.1735687255859375, 0.18633270263671875, 0.1990966796875, 0.21186065673828125, 0.2246246337890625, 0.23738861083984375, 0.250152587890625, 0.26291656494140625, 0.2756805419921875, 0.28844451904296875, 0.30120849609375, 0.31397247314453125, 0.3267364501953125, 0.33950042724609375, 0.352264404296875, 0.36502838134765625, 0.3777923583984375, 0.39055633544921875, 0.4033203125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 1.0, 9.0, 12.0, 14.0, 40.0, 67.0, 146.0, 210.0, 222.0, 136.0, 65.0, 33.0, 14.0, 12.0, 2.0, 3.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.339809894561768, -4.179210662841797, -4.018610954284668, -3.858011484146118, -3.6974120140075684, -3.5368127822875977, -3.376213312149048, -3.215613842010498, -3.0550143718719482, -2.8944149017333984, -2.7338154315948486, -2.573215961456299, -2.412616729736328, -2.252017021179199, -2.0914177894592285, -1.9308183193206787, -1.770218849182129, -1.609619379043579, -1.4490199089050293, -1.288420557975769, -1.1278210878372192, -0.9672216176986694, -0.8066222071647644, -0.6460227966308594, -0.48542332649230957, -0.32482388615608215, -0.16422444581985474, -0.0036250054836273193, 0.1569744348526001, 0.3175739049911499, 0.47817331552505493, 0.63877272605896, 0.7993717193603516, 0.9599711894989014, 1.1205706596374512, 1.2811700105667114, 1.4417694807052612, 1.602368950843811, 1.7629683017730713, 1.923567771911621, 2.084167242050171, 2.2447667121887207, 2.4053661823272705, 2.5659656524658203, 2.726564884185791, 2.88716459274292, 3.0477638244628906, 3.2083632946014404, 3.3689627647399902, 3.52956223487854, 3.69016170501709, 3.8507611751556396, 4.0113606452941895, 4.17195987701416, 4.332559585571289, 4.49315881729126, 4.6537580490112305, 4.814357280731201, 4.97495698928833, 5.135556221008301, 5.29615592956543, 5.4567551612854, 5.617354869842529, 5.7779541015625, 5.938553810119629]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 3.0, 2.0, 2.0, 10.0, 7.0, 4.0, 9.0, 11.0, 19.0, 15.0, 21.0, 13.0, 16.0, 22.0, 26.0, 39.0, 19.0, 25.0, 40.0, 39.0, 48.0, 38.0, 39.0, 37.0, 52.0, 49.0, 43.0, 43.0, 36.0, 37.0, 31.0, 33.0, 25.0, 23.0, 23.0, 16.0, 15.0, 16.0, 8.0, 4.0, 10.0, 4.0, 9.0, 6.0, 7.0, 1.0, 1.0, 1.0, 6.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-1.7202401161193848, -1.665005087852478, -1.6097701787948608, -1.554535150527954, -1.4993001222610474, -1.4440650939941406, -1.3888301849365234, -1.3335951566696167, -1.27836012840271, -1.2231251001358032, -1.167890191078186, -1.1126551628112793, -1.0574201345443726, -1.0021851062774658, -0.9469501972198486, -0.8917151689529419, -0.8364802598953247, -0.7812452912330627, -0.726010262966156, -0.670775294303894, -0.6155402660369873, -0.5603052973747253, -0.5050703287124634, -0.44983533024787903, -0.3946003317832947, -0.3393653333187103, -0.284130334854126, -0.228895366191864, -0.17366036772727966, -0.11842536926269531, -0.06319040060043335, -0.007955402135848999, 0.04727959632873535, 0.1025145873427391, 0.15774957835674286, 0.21298456192016602, 0.26821956038475037, 0.3234545588493347, 0.3786895275115967, 0.43392452597618103, 0.4891595244407654, 0.5443944931030273, 0.5996295213699341, 0.654864490032196, 0.710099458694458, 0.7653344869613647, 0.8205694556236267, 0.8758044242858887, 0.9310394525527954, 0.9862744212150574, 1.0415093898773193, 1.096744418144226, 1.1519794464111328, 1.20721435546875, 1.2624493837356567, 1.3176844120025635, 1.3729193210601807, 1.4281543493270874, 1.4833892583847046, 1.5386242866516113, 1.593859314918518, 1.6490943431854248, 1.704329252243042, 1.7595642805099487, 1.8147993087768555]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 6.0, 5.0, 1.0, 9.0, 5.0, 15.0, 13.0, 21.0, 35.0, 60.0, 87.0, 142.0, 241.0, 353.0, 607.0, 1019.0, 1782.0, 3301.0, 6549.0, 13082.0, 29234.0, 75071.0, 307025.0, 437972.0, 102253.0, 36652.0, 16209.0, 7748.0, 4015.0, 2073.0, 1205.0, 695.0, 414.0, 229.0, 153.0, 83.0, 66.0, 41.0, 26.0, 24.0, 14.0, 8.0, 4.0, 5.0, 1.0, 7.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29931640625, -0.2893829345703125, -0.279449462890625, -0.2695159912109375, -0.25958251953125, -0.2496490478515625, -0.239715576171875, -0.2297821044921875, -0.2198486328125, -0.2099151611328125, -0.199981689453125, -0.1900482177734375, -0.18011474609375, -0.1701812744140625, -0.160247802734375, -0.1503143310546875, -0.140380859375, -0.1304473876953125, -0.120513916015625, -0.1105804443359375, -0.10064697265625, -0.0907135009765625, -0.080780029296875, -0.0708465576171875, -0.0609130859375, -0.0509796142578125, -0.041046142578125, -0.0311126708984375, -0.02117919921875, -0.0112457275390625, -0.001312255859375, 0.0086212158203125, 0.0185546875, 0.0284881591796875, 0.038421630859375, 0.0483551025390625, 0.05828857421875, 0.0682220458984375, 0.078155517578125, 0.0880889892578125, 0.0980224609375, 0.1079559326171875, 0.117889404296875, 0.1278228759765625, 0.13775634765625, 0.1476898193359375, 0.157623291015625, 0.1675567626953125, 0.177490234375, 0.1874237060546875, 0.197357177734375, 0.2072906494140625, 0.21722412109375, 0.2271575927734375, 0.237091064453125, 0.2470245361328125, 0.2569580078125, 0.2668914794921875, 0.276824951171875, 0.2867584228515625, 0.29669189453125, 0.3066253662109375, 0.316558837890625, 0.3264923095703125, 0.33642578125]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 10.0, 6.0, 7.0, 13.0, 15.0, 19.0, 21.0, 28.0, 45.0, 36.0, 29.0, 41.0, 60.0, 49.0, 47.0, 56.0, 50.0, 43.0, 52.0, 52.0, 43.0, 49.0, 30.0, 33.0, 29.0, 28.0, 19.0, 26.0, 16.0, 4.0, 10.0, 8.0, 8.0, 7.0, 6.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.126708984375, -0.12279891967773438, -0.11888885498046875, -0.11497879028320312, -0.1110687255859375, -0.10715866088867188, -0.10324859619140625, -0.09933853149414062, -0.095428466796875, -0.09151840209960938, -0.08760833740234375, -0.08369827270507812, -0.0797882080078125, -0.07587814331054688, -0.07196807861328125, -0.06805801391601562, -0.06414794921875, -0.060237884521484375, -0.05632781982421875, -0.052417755126953125, -0.0485076904296875, -0.044597625732421875, -0.04068756103515625, -0.036777496337890625, -0.032867431640625, -0.028957366943359375, -0.02504730224609375, -0.021137237548828125, -0.0172271728515625, -0.013317108154296875, -0.00940704345703125, -0.005496978759765625, -0.0015869140625, 0.002323150634765625, 0.00623321533203125, 0.010143280029296875, 0.0140533447265625, 0.017963409423828125, 0.02187347412109375, 0.025783538818359375, 0.029693603515625, 0.033603668212890625, 0.03751373291015625, 0.041423797607421875, 0.0453338623046875, 0.049243927001953125, 0.05315399169921875, 0.057064056396484375, 0.06097412109375, 0.06488418579101562, 0.06879425048828125, 0.07270431518554688, 0.0766143798828125, 0.08052444458007812, 0.08443450927734375, 0.08834457397460938, 0.092254638671875, 0.09616470336914062, 0.10007476806640625, 0.10398483276367188, 0.1078948974609375, 0.11180496215820312, 0.11571502685546875, 0.11962509155273438, 0.12353515625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 6.0, 6.0, 9.0, 12.0, 18.0, 17.0, 18.0, 43.0, 61.0, 125.0, 192.0, 330.0, 661.0, 1476.0, 4181.0, 19990.0, 529991.0, 465058.0, 19224.0, 4081.0, 1514.0, 645.0, 346.0, 199.0, 113.0, 70.0, 55.0, 40.0, 23.0, 16.0, 9.0, 2.0, 7.0, 3.0, 4.0, 2.0, 1.0, 3.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.01171875, -0.9819564819335938, -0.9521942138671875, -0.9224319458007812, -0.892669677734375, -0.8629074096679688, -0.8331451416015625, -0.8033828735351562, -0.77362060546875, -0.7438583374023438, -0.7140960693359375, -0.6843338012695312, -0.654571533203125, -0.6248092651367188, -0.5950469970703125, -0.5652847290039062, -0.5355224609375, -0.5057601928710938, -0.4759979248046875, -0.44623565673828125, -0.416473388671875, -0.38671112060546875, -0.3569488525390625, -0.32718658447265625, -0.29742431640625, -0.26766204833984375, -0.2378997802734375, -0.20813751220703125, -0.178375244140625, -0.14861297607421875, -0.1188507080078125, -0.08908843994140625, -0.059326171875, -0.02956390380859375, 0.0001983642578125, 0.02996063232421875, 0.059722900390625, 0.08948516845703125, 0.1192474365234375, 0.14900970458984375, 0.17877197265625, 0.20853424072265625, 0.2382965087890625, 0.26805877685546875, 0.297821044921875, 0.32758331298828125, 0.3573455810546875, 0.38710784912109375, 0.4168701171875, 0.44663238525390625, 0.4763946533203125, 0.5061569213867188, 0.535919189453125, 0.5656814575195312, 0.5954437255859375, 0.6252059936523438, 0.65496826171875, 0.6847305297851562, 0.7144927978515625, 0.7442550659179688, 0.774017333984375, 0.8037796020507812, 0.8335418701171875, 0.8633041381835938, 0.89306640625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 4.0, 11.0, 15.0, 15.0, 21.0, 19.0, 26.0, 29.0, 44.0, 48.0, 49.0, 51.0, 67.0, 73.0, 61.0, 69.0, 58.0, 55.0, 46.0, 31.0, 32.0, 33.0, 30.0, 27.0, 22.0, 20.0, 9.0, 14.0, 4.0, 2.0, 3.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.759765625, -0.7371597290039062, -0.7145538330078125, -0.6919479370117188, -0.669342041015625, -0.6467361450195312, -0.6241302490234375, -0.6015243530273438, -0.57891845703125, -0.5563125610351562, -0.5337066650390625, -0.5111007690429688, -0.488494873046875, -0.46588897705078125, -0.4432830810546875, -0.42067718505859375, -0.3980712890625, -0.37546539306640625, -0.3528594970703125, -0.33025360107421875, -0.307647705078125, -0.28504180908203125, -0.2624359130859375, -0.23983001708984375, -0.21722412109375, -0.19461822509765625, -0.1720123291015625, -0.14940643310546875, -0.126800537109375, -0.10419464111328125, -0.0815887451171875, -0.05898284912109375, -0.036376953125, -0.01377105712890625, 0.0088348388671875, 0.03144073486328125, 0.054046630859375, 0.07665252685546875, 0.0992584228515625, 0.12186431884765625, 0.14447021484375, 0.16707611083984375, 0.1896820068359375, 0.21228790283203125, 0.234893798828125, 0.25749969482421875, 0.2801055908203125, 0.30271148681640625, 0.3253173828125, 0.34792327880859375, 0.3705291748046875, 0.39313507080078125, 0.415740966796875, 0.43834686279296875, 0.4609527587890625, 0.48355865478515625, 0.50616455078125, 0.5287704467773438, 0.5513763427734375, 0.5739822387695312, 0.596588134765625, 0.6191940307617188, 0.6417999267578125, 0.6644058227539062, 0.68701171875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 7.0, 8.0, 14.0, 29.0, 62.0, 94.0, 208.0, 434.0, 1466.0, 9392.0, 325334.0, 697010.0, 11833.0, 1760.0, 463.0, 199.0, 106.0, 48.0, 26.0, 19.0, 16.0, 9.0, 5.0, 3.0, 3.0, 1.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.86962890625, -0.8473587036132812, -0.8250885009765625, -0.8028182983398438, -0.780548095703125, -0.7582778930664062, -0.7360076904296875, -0.7137374877929688, -0.69146728515625, -0.6691970825195312, -0.6469268798828125, -0.6246566772460938, -0.602386474609375, -0.5801162719726562, -0.5578460693359375, -0.5355758666992188, -0.5133056640625, -0.49103546142578125, -0.4687652587890625, -0.44649505615234375, -0.424224853515625, -0.40195465087890625, -0.3796844482421875, -0.35741424560546875, -0.33514404296875, -0.31287384033203125, -0.2906036376953125, -0.26833343505859375, -0.246063232421875, -0.22379302978515625, -0.2015228271484375, -0.17925262451171875, -0.156982421875, -0.13471221923828125, -0.1124420166015625, -0.09017181396484375, -0.067901611328125, -0.04563140869140625, -0.0233612060546875, -0.00109100341796875, 0.02117919921875, 0.04344940185546875, 0.0657196044921875, 0.08798980712890625, 0.110260009765625, 0.13253021240234375, 0.1548004150390625, 0.17707061767578125, 0.1993408203125, 0.22161102294921875, 0.2438812255859375, 0.26615142822265625, 0.288421630859375, 0.31069183349609375, 0.3329620361328125, 0.35523223876953125, 0.37750244140625, 0.39977264404296875, 0.4220428466796875, 0.44431304931640625, 0.466583251953125, 0.48885345458984375, 0.5111236572265625, 0.5333938598632812, 0.5556640625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 3.0, 2.0, 8.0, 6.0, 4.0, 10.0, 12.0, 7.0, 21.0, 24.0, 31.0, 38.0, 80.0, 81.0, 108.0, 140.0, 120.0, 83.0, 67.0, 53.0, 22.0, 21.0, 10.0, 16.0, 11.0, 7.0, 5.0, 9.0, 7.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.575750350952148e-05, -7.265154272317886e-05, -6.954558193683624e-05, -6.643962115049362e-05, -6.3333660364151e-05, -6.022769957780838e-05, -5.712173879146576e-05, -5.401577800512314e-05, -5.090981721878052e-05, -4.78038564324379e-05, -4.4697895646095276e-05, -4.1591934859752655e-05, -3.8485974073410034e-05, -3.538001328706741e-05, -3.227405250072479e-05, -2.916809171438217e-05, -2.606213092803955e-05, -2.295617014169693e-05, -1.985020935535431e-05, -1.6744248569011688e-05, -1.3638287782669067e-05, -1.0532326996326447e-05, -7.426366209983826e-06, -4.320405423641205e-06, -1.214444637298584e-06, 1.8915161490440369e-06, 4.997476935386658e-06, 8.103437721729279e-06, 1.12093985080719e-05, 1.431535929441452e-05, 1.742132008075714e-05, 2.0527280867099762e-05, 2.3633241653442383e-05, 2.6739202439785004e-05, 2.9845163226127625e-05, 3.2951124012470245e-05, 3.6057084798812866e-05, 3.916304558515549e-05, 4.226900637149811e-05, 4.537496715784073e-05, 4.848092794418335e-05, 5.158688873052597e-05, 5.469284951686859e-05, 5.779881030321121e-05, 6.090477108955383e-05, 6.401073187589645e-05, 6.711669266223907e-05, 7.02226534485817e-05, 7.332861423492432e-05, 7.643457502126694e-05, 7.954053580760956e-05, 8.264649659395218e-05, 8.57524573802948e-05, 8.885841816663742e-05, 9.196437895298004e-05, 9.507033973932266e-05, 9.817630052566528e-05, 0.0001012822613120079, 0.00010438822209835052, 0.00010749418288469315, 0.00011060014367103577, 0.00011370610445737839, 0.00011681206524372101, 0.00011991802603006363, 0.00012302398681640625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 7.0, 8.0, 15.0, 27.0, 36.0, 72.0, 133.0, 282.0, 713.0, 2223.0, 12798.0, 468271.0, 547174.0, 13196.0, 2266.0, 717.0, 300.0, 123.0, 70.0, 48.0, 23.0, 24.0, 9.0, 3.0, 5.0, 2.0, 5.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5341796875, -0.5169525146484375, -0.499725341796875, -0.4824981689453125, -0.46527099609375, -0.4480438232421875, -0.430816650390625, -0.4135894775390625, -0.3963623046875, -0.3791351318359375, -0.361907958984375, -0.3446807861328125, -0.32745361328125, -0.3102264404296875, -0.292999267578125, -0.2757720947265625, -0.258544921875, -0.2413177490234375, -0.224090576171875, -0.2068634033203125, -0.18963623046875, -0.1724090576171875, -0.155181884765625, -0.1379547119140625, -0.1207275390625, -0.1035003662109375, -0.086273193359375, -0.0690460205078125, -0.05181884765625, -0.0345916748046875, -0.017364501953125, -0.0001373291015625, 0.01708984375, 0.0343170166015625, 0.051544189453125, 0.0687713623046875, 0.08599853515625, 0.1032257080078125, 0.120452880859375, 0.1376800537109375, 0.1549072265625, 0.1721343994140625, 0.189361572265625, 0.2065887451171875, 0.22381591796875, 0.2410430908203125, 0.258270263671875, 0.2754974365234375, 0.292724609375, 0.3099517822265625, 0.327178955078125, 0.3444061279296875, 0.36163330078125, 0.3788604736328125, 0.396087646484375, 0.4133148193359375, 0.4305419921875, 0.4477691650390625, 0.464996337890625, 0.4822235107421875, 0.49945068359375, 0.5166778564453125, 0.533905029296875, 0.5511322021484375, 0.568359375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 8.0, 13.0, 20.0, 23.0, 27.0, 44.0, 46.0, 65.0, 125.0, 149.0, 148.0, 108.0, 50.0, 50.0, 26.0, 25.0, 15.0, 17.0, 12.0, 7.0, 2.0, 5.0, 4.0, 6.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2303466796875, -0.21973609924316406, -0.20912551879882812, -0.1985149383544922, -0.18790435791015625, -0.1772937774658203, -0.16668319702148438, -0.15607261657714844, -0.1454620361328125, -0.13485145568847656, -0.12424087524414062, -0.11363029479980469, -0.10301971435546875, -0.09240913391113281, -0.08179855346679688, -0.07118797302246094, -0.060577392578125, -0.04996681213378906, -0.039356231689453125, -0.028745651245117188, -0.01813507080078125, -0.0075244903564453125, 0.003086090087890625, 0.013696670532226562, 0.0243072509765625, 0.03491783142089844, 0.045528411865234375, 0.05613899230957031, 0.06674957275390625, 0.07736015319824219, 0.08797073364257812, 0.09858131408691406, 0.10919189453125, 0.11980247497558594, 0.13041305541992188, 0.1410236358642578, 0.15163421630859375, 0.1622447967529297, 0.17285537719726562, 0.18346595764160156, 0.1940765380859375, 0.20468711853027344, 0.21529769897460938, 0.2259082794189453, 0.23651885986328125, 0.2471294403076172, 0.2577400207519531, 0.26835060119628906, 0.278961181640625, 0.28957176208496094, 0.3001823425292969, 0.3107929229736328, 0.32140350341796875, 0.3320140838623047, 0.3426246643066406, 0.35323524475097656, 0.3638458251953125, 0.37445640563964844, 0.3850669860839844, 0.3956775665283203, 0.40628814697265625, 0.4168987274169922, 0.4275093078613281, 0.43811988830566406, 0.44873046875]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 6.0, 10.0, 19.0, 25.0, 63.0, 106.0, 205.0, 260.0, 166.0, 82.0, 37.0, 10.0, 10.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.174959182739258, -8.968500137329102, -8.762041091918945, -8.555582046508789, -8.349123001098633, -8.142663955688477, -7.936204433441162, -7.729745388031006, -7.523285865783691, -7.316826820373535, -7.110367774963379, -6.903908729553223, -6.697449207305908, -6.490990161895752, -6.284531116485596, -6.0780720710754395, -5.871613025665283, -5.665153980255127, -5.458694934844971, -5.252235412597656, -5.0457763671875, -4.839317321777344, -4.6328582763671875, -4.426399230957031, -4.219940185546875, -4.013481140136719, -3.8070218563079834, -3.600562810897827, -3.394103527069092, -3.1876444816589355, -2.9811854362487793, -2.774726390838623, -2.5682668685913086, -2.3618078231811523, -2.155348539352417, -1.9488894939422607, -1.742430329322815, -1.5359711647033691, -1.329512119293213, -1.123052954673767, -0.9165937900543213, -0.7101346254348755, -0.5036755204200745, -0.29721641540527344, -0.09075725078582764, 0.11570191383361816, 0.3221609592437744, 0.5286201238632202, 0.735079288482666, 0.9415384531021118, 1.1479976177215576, 1.3544566631317139, 1.5609158277511597, 1.7673749923706055, 1.9738340377807617, 2.180293083190918, 2.3867523670196533, 2.5932114124298096, 2.799670696258545, 3.006129741668701, 3.2125887870788574, 3.4190480709075928, 3.625507116317749, 3.8319664001464844, 4.038425445556641]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 8.0, 7.0, 10.0, 19.0, 16.0, 25.0, 14.0, 30.0, 32.0, 36.0, 40.0, 42.0, 44.0, 56.0, 68.0, 70.0, 72.0, 58.0, 63.0, 49.0, 51.0, 27.0, 21.0, 30.0, 27.0, 24.0, 20.0, 17.0, 9.0, 4.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.09306001663208, -2.0042996406555176, -1.9155393838882446, -1.8267791271209717, -1.7380187511444092, -1.6492584943771362, -1.5604982376098633, -1.4717378616333008, -1.3829776048660278, -1.2942173480987549, -1.2054569721221924, -1.1166967153549194, -1.0279364585876465, -0.939176082611084, -0.850415825843811, -0.7616555094718933, -0.6728951930999756, -0.5841348767280579, -0.4953745901584625, -0.4066143035888672, -0.31785398721694946, -0.22909367084503174, -0.1403334140777588, -0.051573097705841064, 0.03718721866607666, 0.1259475201368332, 0.21470782160758972, 0.30346810817718506, 0.3922284245491028, 0.4809887409210205, 0.5697489976882935, 0.6585093140602112, 0.7472696304321289, 0.8360299468040466, 0.9247902631759644, 1.0135505199432373, 1.1023108959197998, 1.1910711526870728, 1.2798314094543457, 1.3685917854309082, 1.4573520421981812, 1.546112298965454, 1.6348726749420166, 1.7236329317092896, 1.8123931884765625, 1.901153564453125, 1.989913821220398, 2.078674077987671, 2.1674344539642334, 2.256194829940796, 2.3449549674987793, 2.433715343475342, 2.5224757194519043, 2.611236095428467, 2.69999623298645, 2.7887566089630127, 2.877516746520996, 2.9662771224975586, 3.055037260055542, 3.1437976360321045, 3.232558012008667, 3.3213181495666504, 3.410078525543213, 3.4988389015197754, 3.587599277496338]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 5.0, 3.0, 6.0, 2.0, 1.0, 12.0, 8.0, 13.0, 21.0, 25.0, 39.0, 59.0, 80.0, 145.0, 266.0, 593.0, 2033.0, 8883.0, 77177.0, 3804296.0, 277011.0, 18099.0, 3452.0, 1075.0, 411.0, 203.0, 125.0, 76.0, 43.0, 30.0, 25.0, 22.0, 18.0, 11.0, 11.0, 3.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.45068359375, -0.430816650390625, -0.41094970703125, -0.391082763671875, -0.3712158203125, -0.351348876953125, -0.33148193359375, -0.311614990234375, -0.291748046875, -0.271881103515625, -0.25201416015625, -0.232147216796875, -0.2122802734375, -0.192413330078125, -0.17254638671875, -0.152679443359375, -0.1328125, -0.112945556640625, -0.09307861328125, -0.073211669921875, -0.0533447265625, -0.033477783203125, -0.01361083984375, 0.006256103515625, 0.026123046875, 0.045989990234375, 0.06585693359375, 0.085723876953125, 0.1055908203125, 0.125457763671875, 0.14532470703125, 0.165191650390625, 0.18505859375, 0.204925537109375, 0.22479248046875, 0.244659423828125, 0.2645263671875, 0.284393310546875, 0.30426025390625, 0.324127197265625, 0.343994140625, 0.363861083984375, 0.38372802734375, 0.403594970703125, 0.4234619140625, 0.443328857421875, 0.46319580078125, 0.483062744140625, 0.5029296875, 0.522796630859375, 0.54266357421875, 0.562530517578125, 0.5823974609375, 0.602264404296875, 0.62213134765625, 0.641998291015625, 0.661865234375, 0.681732177734375, 0.70159912109375, 0.721466064453125, 0.7413330078125, 0.761199951171875, 0.78106689453125, 0.800933837890625, 0.82080078125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 8.0, 7.0, 9.0, 7.0, 19.0, 21.0, 35.0, 52.0, 52.0, 56.0, 52.0, 61.0, 90.0, 61.0, 74.0, 71.0, 71.0, 52.0, 48.0, 40.0, 27.0, 29.0, 17.0, 16.0, 10.0, 5.0, 8.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1697998046875, -0.1644115447998047, -0.15902328491210938, -0.15363502502441406, -0.14824676513671875, -0.14285850524902344, -0.13747024536132812, -0.1320819854736328, -0.1266937255859375, -0.12130546569824219, -0.11591720581054688, -0.11052894592285156, -0.10514068603515625, -0.09975242614746094, -0.09436416625976562, -0.08897590637207031, -0.083587646484375, -0.07819938659667969, -0.07281112670898438, -0.06742286682128906, -0.06203460693359375, -0.05664634704589844, -0.051258087158203125, -0.04586982727050781, -0.0404815673828125, -0.03509330749511719, -0.029705047607421875, -0.024316787719726562, -0.01892852783203125, -0.013540267944335938, -0.008152008056640625, -0.0027637481689453125, 0.00262451171875, 0.008012771606445312, 0.013401031494140625, 0.018789291381835938, 0.02417755126953125, 0.029565811157226562, 0.034954071044921875, 0.04034233093261719, 0.0457305908203125, 0.05111885070800781, 0.056507110595703125, 0.06189537048339844, 0.06728363037109375, 0.07267189025878906, 0.07806015014648438, 0.08344841003417969, 0.088836669921875, 0.09422492980957031, 0.09961318969726562, 0.10500144958496094, 0.11038970947265625, 0.11577796936035156, 0.12116622924804688, 0.1265544891357422, 0.1319427490234375, 0.1373310089111328, 0.14271926879882812, 0.14810752868652344, 0.15349578857421875, 0.15888404846191406, 0.16427230834960938, 0.1696605682373047, 0.175048828125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 4.0, 9.0, 12.0, 18.0, 23.0, 28.0, 66.0, 82.0, 155.0, 236.0, 328.0, 607.0, 1027.0, 1663.0, 2934.0, 5655.0, 12105.0, 27742.0, 78983.0, 379463.0, 2959374.0, 562480.0, 100407.0, 33431.0, 13867.0, 6274.0, 3221.0, 1748.0, 884.0, 541.0, 337.0, 200.0, 130.0, 96.0, 38.0, 30.0, 27.0, 11.0, 10.0, 9.0, 10.0, 7.0, 4.0, 4.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.3486328125, -0.3382530212402344, -0.32787322998046875, -0.3174934387207031, -0.3071136474609375, -0.2967338562011719, -0.28635406494140625, -0.2759742736816406, -0.265594482421875, -0.2552146911621094, -0.24483489990234375, -0.23445510864257812, -0.2240753173828125, -0.21369552612304688, -0.20331573486328125, -0.19293594360351562, -0.18255615234375, -0.17217636108398438, -0.16179656982421875, -0.15141677856445312, -0.1410369873046875, -0.13065719604492188, -0.12027740478515625, -0.10989761352539062, -0.099517822265625, -0.08913803100585938, -0.07875823974609375, -0.06837844848632812, -0.0579986572265625, -0.047618865966796875, -0.03723907470703125, -0.026859283447265625, -0.0164794921875, -0.006099700927734375, 0.00428009033203125, 0.014659881591796875, 0.0250396728515625, 0.035419464111328125, 0.04579925537109375, 0.056179046630859375, 0.066558837890625, 0.07693862915039062, 0.08731842041015625, 0.09769821166992188, 0.1080780029296875, 0.11845779418945312, 0.12883758544921875, 0.13921737670898438, 0.14959716796875, 0.15997695922851562, 0.17035675048828125, 0.18073654174804688, 0.1911163330078125, 0.20149612426757812, 0.21187591552734375, 0.22225570678710938, 0.232635498046875, 0.24301528930664062, 0.25339508056640625, 0.2637748718261719, 0.2741546630859375, 0.2845344543457031, 0.29491424560546875, 0.3052940368652344, 0.315673828125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 4.0, 6.0, 4.0, 5.0, 5.0, 11.0, 14.0, 12.0, 20.0, 21.0, 32.0, 66.0, 72.0, 126.0, 180.0, 353.0, 659.0, 996.0, 547.0, 323.0, 198.0, 120.0, 72.0, 60.0, 33.0, 27.0, 29.0, 18.0, 18.0, 11.0, 10.0, 6.0, 2.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.423095703125, -0.4096527099609375, -0.396209716796875, -0.3827667236328125, -0.36932373046875, -0.3558807373046875, -0.342437744140625, -0.3289947509765625, -0.3155517578125, -0.3021087646484375, -0.288665771484375, -0.2752227783203125, -0.26177978515625, -0.2483367919921875, -0.234893798828125, -0.2214508056640625, -0.2080078125, -0.1945648193359375, -0.181121826171875, -0.1676788330078125, -0.15423583984375, -0.1407928466796875, -0.127349853515625, -0.1139068603515625, -0.1004638671875, -0.0870208740234375, -0.073577880859375, -0.0601348876953125, -0.04669189453125, -0.0332489013671875, -0.019805908203125, -0.0063629150390625, 0.007080078125, 0.0205230712890625, 0.033966064453125, 0.0474090576171875, 0.06085205078125, 0.0742950439453125, 0.087738037109375, 0.1011810302734375, 0.1146240234375, 0.1280670166015625, 0.141510009765625, 0.1549530029296875, 0.16839599609375, 0.1818389892578125, 0.195281982421875, 0.2087249755859375, 0.22216796875, 0.2356109619140625, 0.249053955078125, 0.2624969482421875, 0.27593994140625, 0.2893829345703125, 0.302825927734375, 0.3162689208984375, 0.3297119140625, 0.3431549072265625, 0.356597900390625, 0.3700408935546875, 0.38348388671875, 0.3969268798828125, 0.410369873046875, 0.4238128662109375, 0.437255859375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 8.0, 12.0, 29.0, 42.0, 178.0, 306.0, 271.0, 99.0, 32.0, 8.0, 6.0, 4.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.499153137207031, -9.260161399841309, -9.021169662475586, -8.782177925109863, -8.543187141418457, -8.304195404052734, -8.065203666687012, -7.826211929321289, -7.587220191955566, -7.348228454589844, -7.109237194061279, -6.870245456695557, -6.631253719329834, -6.3922624588012695, -6.153270721435547, -5.914278984069824, -5.675287246704102, -5.436295509338379, -5.1973042488098145, -4.958312511444092, -4.719320774078369, -4.480329513549805, -4.241337776184082, -4.002346038818359, -3.763354778289795, -3.5243632793426514, -3.2853715419769287, -3.046380043029785, -2.8073883056640625, -2.568396806716919, -2.3294053077697754, -2.0904135704040527, -1.85142183303833, -1.612430214881897, -1.3734385967254639, -1.1344470977783203, -0.8954554200172424, -0.6564638614654541, -0.417472243309021, -0.1784806251525879, 0.060510993003845215, 0.2995026111602783, 0.5384942293167114, 0.7774857878684998, 1.016477346420288, 1.2554689645767212, 1.4944605827331543, 1.7334522008895874, 1.9724438190460205, 2.211435317993164, 2.4504270553588867, 2.6894185543060303, 2.928410291671753, 3.1674017906188965, 3.406393527984619, 3.6453850269317627, 3.8843765258789062, 4.123368263244629, 4.362359523773193, 4.601351261138916, 4.840342998504639, 5.079334259033203, 5.318325996398926, 5.557317733764648, 5.796309471130371]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 9.0, 5.0, 12.0, 15.0, 12.0, 13.0, 23.0, 29.0, 35.0, 62.0, 59.0, 68.0, 62.0, 80.0, 59.0, 59.0, 64.0, 58.0, 40.0, 53.0, 46.0, 33.0, 33.0, 13.0, 19.0, 9.0, 11.0, 9.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5564966201782227, -2.464078187942505, -2.371659517288208, -2.2792410850524902, -2.1868224143981934, -2.0944039821624756, -2.001985549926758, -1.9095669984817505, -1.8171484470367432, -1.7247298955917358, -1.6323113441467285, -1.5398929119110107, -1.4474743604660034, -1.355055809020996, -1.2626373767852783, -1.170218825340271, -1.0778002738952637, -0.9853817224502563, -0.8929632306098938, -0.8005447387695312, -0.7081261873245239, -0.6157076358795166, -0.523289144039154, -0.4308706521987915, -0.3384521007537842, -0.24603357911109924, -0.1536150574684143, -0.06119653582572937, 0.031221985816955566, 0.1236405074596405, 0.21605902910232544, 0.308477520942688, 0.4008963108062744, 0.49331483244895935, 0.5857333540916443, 0.6781518459320068, 0.7705703973770142, 0.8629889488220215, 0.955407440662384, 1.0478259325027466, 1.140244483947754, 1.2326630353927612, 1.3250815868377686, 1.4175000190734863, 1.5099185705184937, 1.602337121963501, 1.6947555541992188, 1.787174105644226, 1.8795926570892334, 1.9720112085342407, 2.064429759979248, 2.156848192214966, 2.2492666244506836, 2.3416852951049805, 2.4341037273406982, 2.526522159576416, 2.618940830230713, 2.7113592624664307, 2.8037779331207275, 2.8961963653564453, 2.988615036010742, 3.08103346824646, 3.1734519004821777, 3.2658705711364746, 3.3582890033721924]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 5.0, 12.0, 19.0, 37.0, 56.0, 107.0, 148.0, 243.0, 541.0, 1071.0, 2190.0, 5138.0, 13142.0, 36656.0, 159192.0, 637367.0, 137821.0, 33915.0, 11933.0, 4761.0, 2031.0, 928.0, 555.0, 275.0, 155.0, 102.0, 52.0, 27.0, 23.0, 10.0, 13.0, 9.0, 5.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.5126953125, -0.49823760986328125, -0.4837799072265625, -0.46932220458984375, -0.454864501953125, -0.44040679931640625, -0.4259490966796875, -0.41149139404296875, -0.39703369140625, -0.38257598876953125, -0.3681182861328125, -0.35366058349609375, -0.339202880859375, -0.32474517822265625, -0.3102874755859375, -0.29582977294921875, -0.2813720703125, -0.26691436767578125, -0.2524566650390625, -0.23799896240234375, -0.223541259765625, -0.20908355712890625, -0.1946258544921875, -0.18016815185546875, -0.16571044921875, -0.15125274658203125, -0.1367950439453125, -0.12233734130859375, -0.107879638671875, -0.09342193603515625, -0.0789642333984375, -0.06450653076171875, -0.050048828125, -0.03559112548828125, -0.0211334228515625, -0.00667572021484375, 0.007781982421875, 0.02223968505859375, 0.0366973876953125, 0.05115509033203125, 0.06561279296875, 0.08007049560546875, 0.0945281982421875, 0.10898590087890625, 0.123443603515625, 0.13790130615234375, 0.1523590087890625, 0.16681671142578125, 0.1812744140625, 0.19573211669921875, 0.2101898193359375, 0.22464752197265625, 0.239105224609375, 0.25356292724609375, 0.2680206298828125, 0.28247833251953125, 0.29693603515625, 0.31139373779296875, 0.3258514404296875, 0.34030914306640625, 0.354766845703125, 0.36922454833984375, 0.3836822509765625, 0.39813995361328125, 0.41259765625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 9.0, 8.0, 10.0, 12.0, 21.0, 20.0, 30.0, 50.0, 40.0, 49.0, 47.0, 71.0, 58.0, 70.0, 54.0, 68.0, 65.0, 51.0, 56.0, 31.0, 42.0, 33.0, 17.0, 23.0, 14.0, 16.0, 8.0, 5.0, 9.0, 5.0, 2.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.2047119140625, -0.198883056640625, -0.19305419921875, -0.187225341796875, -0.181396484375, -0.175567626953125, -0.16973876953125, -0.163909912109375, -0.1580810546875, -0.152252197265625, -0.14642333984375, -0.140594482421875, -0.134765625, -0.128936767578125, -0.12310791015625, -0.117279052734375, -0.1114501953125, -0.105621337890625, -0.09979248046875, -0.093963623046875, -0.088134765625, -0.082305908203125, -0.07647705078125, -0.070648193359375, -0.0648193359375, -0.058990478515625, -0.05316162109375, -0.047332763671875, -0.04150390625, -0.035675048828125, -0.02984619140625, -0.024017333984375, -0.0181884765625, -0.012359619140625, -0.00653076171875, -0.000701904296875, 0.005126953125, 0.010955810546875, 0.01678466796875, 0.022613525390625, 0.0284423828125, 0.034271240234375, 0.04010009765625, 0.045928955078125, 0.0517578125, 0.057586669921875, 0.06341552734375, 0.069244384765625, 0.0750732421875, 0.080902099609375, 0.08673095703125, 0.092559814453125, 0.098388671875, 0.104217529296875, 0.11004638671875, 0.115875244140625, 0.1217041015625, 0.127532958984375, 0.13336181640625, 0.139190673828125, 0.14501953125, 0.150848388671875, 0.15667724609375, 0.162506103515625, 0.1683349609375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 3.0, 5.0, 16.0, 20.0, 26.0, 55.0, 113.0, 190.0, 494.0, 1280.0, 4876.0, 40621.0, 902519.0, 87444.0, 8008.0, 1748.0, 595.0, 259.0, 133.0, 66.0, 38.0, 22.0, 6.0, 6.0, 6.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0634765625, -1.026336669921875, -0.98919677734375, -0.952056884765625, -0.9149169921875, -0.877777099609375, -0.84063720703125, -0.803497314453125, -0.766357421875, -0.729217529296875, -0.69207763671875, -0.654937744140625, -0.6177978515625, -0.580657958984375, -0.54351806640625, -0.506378173828125, -0.46923828125, -0.432098388671875, -0.39495849609375, -0.357818603515625, -0.3206787109375, -0.283538818359375, -0.24639892578125, -0.209259033203125, -0.172119140625, -0.134979248046875, -0.09783935546875, -0.060699462890625, -0.0235595703125, 0.013580322265625, 0.05072021484375, 0.087860107421875, 0.125, 0.162139892578125, 0.19927978515625, 0.236419677734375, 0.2735595703125, 0.310699462890625, 0.34783935546875, 0.384979248046875, 0.422119140625, 0.459259033203125, 0.49639892578125, 0.533538818359375, 0.5706787109375, 0.607818603515625, 0.64495849609375, 0.682098388671875, 0.71923828125, 0.756378173828125, 0.79351806640625, 0.830657958984375, 0.8677978515625, 0.904937744140625, 0.94207763671875, 0.979217529296875, 1.016357421875, 1.053497314453125, 1.09063720703125, 1.127777099609375, 1.1649169921875, 1.202056884765625, 1.23919677734375, 1.276336669921875, 1.3134765625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 6.0, 5.0, 4.0, 8.0, 14.0, 18.0, 25.0, 32.0, 37.0, 43.0, 50.0, 66.0, 82.0, 99.0, 83.0, 70.0, 89.0, 60.0, 60.0, 37.0, 29.0, 20.0, 21.0, 17.0, 12.0, 5.0, 6.0, 6.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1484375, -1.1138153076171875, -1.079193115234375, -1.0445709228515625, -1.00994873046875, -0.9753265380859375, -0.940704345703125, -0.9060821533203125, -0.8714599609375, -0.8368377685546875, -0.802215576171875, -0.7675933837890625, -0.73297119140625, -0.6983489990234375, -0.663726806640625, -0.6291046142578125, -0.594482421875, -0.5598602294921875, -0.525238037109375, -0.4906158447265625, -0.45599365234375, -0.4213714599609375, -0.386749267578125, -0.3521270751953125, -0.3175048828125, -0.2828826904296875, -0.248260498046875, -0.2136383056640625, -0.17901611328125, -0.1443939208984375, -0.109771728515625, -0.0751495361328125, -0.04052734375, -0.0059051513671875, 0.028717041015625, 0.0633392333984375, 0.09796142578125, 0.1325836181640625, 0.167205810546875, 0.2018280029296875, 0.2364501953125, 0.2710723876953125, 0.305694580078125, 0.3403167724609375, 0.37493896484375, 0.4095611572265625, 0.444183349609375, 0.4788055419921875, 0.513427734375, 0.5480499267578125, 0.582672119140625, 0.6172943115234375, 0.65191650390625, 0.6865386962890625, 0.721160888671875, 0.7557830810546875, 0.7904052734375, 0.8250274658203125, 0.859649658203125, 0.8942718505859375, 0.92889404296875, 0.9635162353515625, 0.998138427734375, 1.0327606201171875, 1.0673828125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 5.0, 3.0, 3.0, 3.0, 3.0, 10.0, 14.0, 16.0, 22.0, 18.0, 33.0, 58.0, 86.0, 137.0, 205.0, 367.0, 699.0, 1365.0, 3043.0, 7857.0, 24587.0, 121303.0, 698944.0, 146824.0, 27852.0, 8537.0, 3317.0, 1460.0, 745.0, 408.0, 210.0, 133.0, 84.0, 63.0, 39.0, 21.0, 24.0, 13.0, 12.0, 11.0, 7.0, 6.0, 5.0, 2.0, 2.0, 5.0, 0.0, 1.0, 2.0], "bins": [-0.3330078125, -0.3241386413574219, -0.31526947021484375, -0.3064002990722656, -0.2975311279296875, -0.2886619567871094, -0.27979278564453125, -0.2709236145019531, -0.262054443359375, -0.2531852722167969, -0.24431610107421875, -0.23544692993164062, -0.2265777587890625, -0.21770858764648438, -0.20883941650390625, -0.19997024536132812, -0.19110107421875, -0.18223190307617188, -0.17336273193359375, -0.16449356079101562, -0.1556243896484375, -0.14675521850585938, -0.13788604736328125, -0.12901687622070312, -0.120147705078125, -0.11127853393554688, -0.10240936279296875, -0.09354019165039062, -0.0846710205078125, -0.07580184936523438, -0.06693267822265625, -0.058063507080078125, -0.0491943359375, -0.040325164794921875, -0.03145599365234375, -0.022586822509765625, -0.0137176513671875, -0.004848480224609375, 0.00402069091796875, 0.012889862060546875, 0.021759033203125, 0.030628204345703125, 0.03949737548828125, 0.048366546630859375, 0.0572357177734375, 0.06610488891601562, 0.07497406005859375, 0.08384323120117188, 0.09271240234375, 0.10158157348632812, 0.11045074462890625, 0.11931991577148438, 0.1281890869140625, 0.13705825805664062, 0.14592742919921875, 0.15479660034179688, 0.163665771484375, 0.17253494262695312, 0.18140411376953125, 0.19027328491210938, 0.1991424560546875, 0.20801162719726562, 0.21688079833984375, 0.22574996948242188, 0.234619140625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 6.0, 9.0, 6.0, 16.0, 19.0, 17.0, 25.0, 27.0, 52.0, 61.0, 82.0, 96.0, 123.0, 114.0, 95.0, 54.0, 42.0, 26.0, 30.0, 21.0, 16.0, 14.0, 11.0, 13.0, 8.0, 4.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-8.767843246459961e-05, -8.520111441612244e-05, -8.272379636764526e-05, -8.024647831916809e-05, -7.776916027069092e-05, -7.529184222221375e-05, -7.281452417373657e-05, -7.03372061252594e-05, -6.785988807678223e-05, -6.538257002830505e-05, -6.290525197982788e-05, -6.042793393135071e-05, -5.7950615882873535e-05, -5.547329783439636e-05, -5.299597978591919e-05, -5.0518661737442017e-05, -4.8041343688964844e-05, -4.556402564048767e-05, -4.30867075920105e-05, -4.0609389543533325e-05, -3.813207149505615e-05, -3.565475344657898e-05, -3.317743539810181e-05, -3.0700117349624634e-05, -2.822279930114746e-05, -2.5745481252670288e-05, -2.3268163204193115e-05, -2.0790845155715942e-05, -1.831352710723877e-05, -1.5836209058761597e-05, -1.3358891010284424e-05, -1.0881572961807251e-05, -8.404254913330078e-06, -5.926936864852905e-06, -3.4496188163757324e-06, -9.723007678985596e-07, 1.5050172805786133e-06, 3.982335329055786e-06, 6.459653377532959e-06, 8.936971426010132e-06, 1.1414289474487305e-05, 1.3891607522964478e-05, 1.636892557144165e-05, 1.8846243619918823e-05, 2.1323561668395996e-05, 2.380087971687317e-05, 2.6278197765350342e-05, 2.8755515813827515e-05, 3.123283386230469e-05, 3.371015191078186e-05, 3.618746995925903e-05, 3.8664788007736206e-05, 4.114210605621338e-05, 4.361942410469055e-05, 4.6096742153167725e-05, 4.85740602016449e-05, 5.105137825012207e-05, 5.352869629859924e-05, 5.6006014347076416e-05, 5.848333239555359e-05, 6.096065044403076e-05, 6.343796849250793e-05, 6.591528654098511e-05, 6.839260458946228e-05, 7.086992263793945e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 2.0, 6.0, 7.0, 7.0, 11.0, 17.0, 27.0, 26.0, 26.0, 43.0, 72.0, 90.0, 143.0, 251.0, 413.0, 789.0, 1661.0, 3753.0, 10211.0, 36593.0, 216573.0, 650442.0, 95135.0, 20459.0, 6464.0, 2508.0, 1238.0, 639.0, 351.0, 203.0, 116.0, 92.0, 45.0, 34.0, 30.0, 17.0, 15.0, 16.0, 8.0, 8.0, 7.0, 5.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2705078125, -0.2621307373046875, -0.253753662109375, -0.2453765869140625, -0.23699951171875, -0.2286224365234375, -0.220245361328125, -0.2118682861328125, -0.2034912109375, -0.1951141357421875, -0.186737060546875, -0.1783599853515625, -0.16998291015625, -0.1616058349609375, -0.153228759765625, -0.1448516845703125, -0.136474609375, -0.1280975341796875, -0.119720458984375, -0.1113433837890625, -0.10296630859375, -0.0945892333984375, -0.086212158203125, -0.0778350830078125, -0.0694580078125, -0.0610809326171875, -0.052703857421875, -0.0443267822265625, -0.03594970703125, -0.0275726318359375, -0.019195556640625, -0.0108184814453125, -0.00244140625, 0.0059356689453125, 0.014312744140625, 0.0226898193359375, 0.03106689453125, 0.0394439697265625, 0.047821044921875, 0.0561981201171875, 0.0645751953125, 0.0729522705078125, 0.081329345703125, 0.0897064208984375, 0.09808349609375, 0.1064605712890625, 0.114837646484375, 0.1232147216796875, 0.131591796875, 0.1399688720703125, 0.148345947265625, 0.1567230224609375, 0.16510009765625, 0.1734771728515625, 0.181854248046875, 0.1902313232421875, 0.1986083984375, 0.2069854736328125, 0.215362548828125, 0.2237396240234375, 0.23211669921875, 0.2404937744140625, 0.248870849609375, 0.2572479248046875, 0.265625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 6.0, 4.0, 1.0, 1.0, 3.0, 5.0, 3.0, 2.0, 13.0, 18.0, 21.0, 20.0, 19.0, 42.0, 44.0, 65.0, 85.0, 85.0, 114.0, 100.0, 62.0, 60.0, 54.0, 36.0, 34.0, 27.0, 16.0, 13.0, 10.0, 9.0, 6.0, 4.0, 6.0, 4.0, 6.0, 4.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.26416015625, -0.25655174255371094, -0.24894332885742188, -0.2413349151611328, -0.23372650146484375, -0.2261180877685547, -0.21850967407226562, -0.21090126037597656, -0.2032928466796875, -0.19568443298339844, -0.18807601928710938, -0.1804676055908203, -0.17285919189453125, -0.1652507781982422, -0.15764236450195312, -0.15003395080566406, -0.142425537109375, -0.13481712341308594, -0.12720870971679688, -0.11960029602050781, -0.11199188232421875, -0.10438346862792969, -0.09677505493164062, -0.08916664123535156, -0.0815582275390625, -0.07394981384277344, -0.06634140014648438, -0.05873298645019531, -0.05112457275390625, -0.04351615905761719, -0.035907745361328125, -0.028299331665039062, -0.02069091796875, -0.013082504272460938, -0.005474090576171875, 0.0021343231201171875, 0.00974273681640625, 0.017351150512695312, 0.024959564208984375, 0.03256797790527344, 0.0401763916015625, 0.04778480529785156, 0.055393218994140625, 0.06300163269042969, 0.07061004638671875, 0.07821846008300781, 0.08582687377929688, 0.09343528747558594, 0.101043701171875, 0.10865211486816406, 0.11626052856445312, 0.12386894226074219, 0.13147735595703125, 0.1390857696533203, 0.14669418334960938, 0.15430259704589844, 0.1619110107421875, 0.16951942443847656, 0.17712783813476562, 0.1847362518310547, 0.19234466552734375, 0.1999530792236328, 0.20756149291992188, 0.21516990661621094, 0.2227783203125]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 6.0, 7.0, 12.0, 14.0, 31.0, 61.0, 100.0, 174.0, 225.0, 142.0, 96.0, 55.0, 36.0, 10.0, 14.0, 10.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.719073295593262, -4.558575630187988, -4.398078441619873, -4.2375807762146, -4.077083587646484, -3.916585922241211, -3.7560884952545166, -3.5955910682678223, -3.435093402862549, -3.2745959758758545, -3.11409854888916, -2.9536008834838867, -2.7931034564971924, -2.632606029510498, -2.4721086025238037, -2.3116111755371094, -2.151113748550415, -1.9906163215637207, -1.8301187753677368, -1.6696213483810425, -1.5091238021850586, -1.3486263751983643, -1.18812894821167, -1.027631402015686, -0.8671339750289917, -0.7066364884376526, -0.5461390018463135, -0.38564157485961914, -0.22514408826828003, -0.06464660167694092, 0.09585082530975342, 0.2563483715057373, 0.41684579849243164, 0.5773432850837708, 0.7378407716751099, 0.8983381986618042, 1.058835744857788, 1.2193331718444824, 1.3798305988311768, 1.5403281450271606, 1.700825572013855, 1.8613229990005493, 2.021820545196533, 2.1823179721832275, 2.342815399169922, 2.5033130645751953, 2.6638102531433105, 2.824307918548584, 2.9848053455352783, 3.1453027725219727, 3.305800199508667, 3.4662976264953613, 3.6267952919006348, 3.787292718887329, 3.9477901458740234, 4.108287811279297, 4.268784999847412, 4.4292826652526855, 4.589779853820801, 4.750277519226074, 4.9107747077941895, 5.071272373199463, 5.231769561767578, 5.392267227172852, 5.552764892578125]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 8.0, 2.0, 6.0, 6.0, 5.0, 19.0, 13.0, 14.0, 19.0, 20.0, 30.0, 29.0, 32.0, 49.0, 42.0, 46.0, 55.0, 57.0, 58.0, 63.0, 50.0, 67.0, 38.0, 35.0, 45.0, 28.0, 27.0, 24.0, 29.0, 13.0, 12.0, 14.0, 11.0, 12.0, 9.0, 3.0, 4.0, 2.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.354213237762451, -3.2558159828186035, -3.157418727874756, -3.0590217113494873, -2.9606244564056396, -2.862227201461792, -2.7638301849365234, -2.665432929992676, -2.567035675048828, -2.4686384201049805, -2.370241165161133, -2.2718441486358643, -2.1734468936920166, -2.075049638748169, -1.9766525030136108, -1.8782553672790527, -1.779858112335205, -1.6814608573913574, -1.5830637216567993, -1.4846665859222412, -1.3862693309783936, -1.287872076034546, -1.1894749402999878, -1.0910778045654297, -0.992680549621582, -0.8942833542823792, -0.7958861589431763, -0.6974889636039734, -0.5990917682647705, -0.5006945729255676, -0.40229737758636475, -0.30390018224716187, -0.20550322532653809, -0.1071060299873352, -0.008708834648132324, 0.08968836069107056, 0.18808555603027344, 0.2864827513694763, 0.3848799467086792, 0.4832771420478821, 0.581674337387085, 0.6800715327262878, 0.7784687280654907, 0.8768659234046936, 0.9752631187438965, 1.0736603736877441, 1.1720575094223022, 1.2704546451568604, 1.368851900100708, 1.4672491550445557, 1.5656462907791138, 1.6640434265136719, 1.7624406814575195, 1.8608379364013672, 1.9592350721359253, 2.0576322078704834, 2.156029462814331, 2.2544267177581787, 2.3528237342834473, 2.451220989227295, 2.5496182441711426, 2.6480154991149902, 2.746412754058838, 2.8448097705841064, 2.943207025527954]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 4.0, 2.0, 14.0, 16.0, 26.0, 29.0, 63.0, 121.0, 259.0, 546.0, 1126.0, 2689.0, 6998.0, 21425.0, 86475.0, 757523.0, 2948074.0, 296307.0, 49525.0, 14086.0, 5010.0, 2045.0, 939.0, 488.0, 219.0, 107.0, 54.0, 37.0, 25.0, 16.0, 11.0, 8.0, 4.0, 4.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3291015625, -0.31748199462890625, -0.3058624267578125, -0.29424285888671875, -0.282623291015625, -0.27100372314453125, -0.2593841552734375, -0.24776458740234375, -0.23614501953125, -0.22452545166015625, -0.2129058837890625, -0.20128631591796875, -0.189666748046875, -0.17804718017578125, -0.1664276123046875, -0.15480804443359375, -0.1431884765625, -0.13156890869140625, -0.1199493408203125, -0.10832977294921875, -0.096710205078125, -0.08509063720703125, -0.0734710693359375, -0.06185150146484375, -0.05023193359375, -0.03861236572265625, -0.0269927978515625, -0.01537322998046875, -0.003753662109375, 0.00786590576171875, 0.0194854736328125, 0.03110504150390625, 0.042724609375, 0.05434417724609375, 0.0659637451171875, 0.07758331298828125, 0.089202880859375, 0.10082244873046875, 0.1124420166015625, 0.12406158447265625, 0.13568115234375, 0.14730072021484375, 0.1589202880859375, 0.17053985595703125, 0.182159423828125, 0.19377899169921875, 0.2053985595703125, 0.21701812744140625, 0.2286376953125, 0.24025726318359375, 0.2518768310546875, 0.26349639892578125, 0.275115966796875, 0.28673553466796875, 0.2983551025390625, 0.30997467041015625, 0.32159423828125, 0.33321380615234375, 0.3448333740234375, 0.35645294189453125, 0.368072509765625, 0.37969207763671875, 0.3913116455078125, 0.40293121337890625, 0.41455078125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 6.0, 1.0, 8.0, 14.0, 13.0, 18.0, 27.0, 42.0, 43.0, 34.0, 60.0, 61.0, 64.0, 63.0, 79.0, 77.0, 54.0, 61.0, 61.0, 37.0, 51.0, 37.0, 24.0, 20.0, 12.0, 19.0, 3.0, 6.0, 3.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2034912109375, -0.19742965698242188, -0.19136810302734375, -0.18530654907226562, -0.1792449951171875, -0.17318344116210938, -0.16712188720703125, -0.16106033325195312, -0.154998779296875, -0.14893722534179688, -0.14287567138671875, -0.13681411743164062, -0.1307525634765625, -0.12469100952148438, -0.11862945556640625, -0.11256790161132812, -0.10650634765625, -0.10044479370117188, -0.09438323974609375, -0.08832168579101562, -0.0822601318359375, -0.07619857788085938, -0.07013702392578125, -0.06407546997070312, -0.058013916015625, -0.051952362060546875, -0.04589080810546875, -0.039829254150390625, -0.0337677001953125, -0.027706146240234375, -0.02164459228515625, -0.015583038330078125, -0.009521484375, -0.003459930419921875, 0.00260162353515625, 0.008663177490234375, 0.0147247314453125, 0.020786285400390625, 0.02684783935546875, 0.032909393310546875, 0.038970947265625, 0.045032501220703125, 0.05109405517578125, 0.057155609130859375, 0.0632171630859375, 0.06927871704101562, 0.07534027099609375, 0.08140182495117188, 0.08746337890625, 0.09352493286132812, 0.09958648681640625, 0.10564804077148438, 0.1117095947265625, 0.11777114868164062, 0.12383270263671875, 0.12989425659179688, 0.135955810546875, 0.14201736450195312, 0.14807891845703125, 0.15414047241210938, 0.1602020263671875, 0.16626358032226562, 0.17232513427734375, 0.17838668823242188, 0.1844482421875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 8.0, 8.0, 14.0, 22.0, 49.0, 75.0, 121.0, 243.0, 427.0, 826.0, 1841.0, 4811.0, 16001.0, 83624.0, 1350426.0, 2587599.0, 118068.0, 20355.0, 5583.0, 2107.0, 953.0, 470.0, 278.0, 149.0, 79.0, 42.0, 45.0, 19.0, 11.0, 12.0, 10.0, 4.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75439453125, -0.733489990234375, -0.71258544921875, -0.691680908203125, -0.6707763671875, -0.649871826171875, -0.62896728515625, -0.608062744140625, -0.587158203125, -0.566253662109375, -0.54534912109375, -0.524444580078125, -0.5035400390625, -0.482635498046875, -0.46173095703125, -0.440826416015625, -0.419921875, -0.399017333984375, -0.37811279296875, -0.357208251953125, -0.3363037109375, -0.315399169921875, -0.29449462890625, -0.273590087890625, -0.252685546875, -0.231781005859375, -0.21087646484375, -0.189971923828125, -0.1690673828125, -0.148162841796875, -0.12725830078125, -0.106353759765625, -0.08544921875, -0.064544677734375, -0.04364013671875, -0.022735595703125, -0.0018310546875, 0.019073486328125, 0.03997802734375, 0.060882568359375, 0.081787109375, 0.102691650390625, 0.12359619140625, 0.144500732421875, 0.1654052734375, 0.186309814453125, 0.20721435546875, 0.228118896484375, 0.2490234375, 0.269927978515625, 0.29083251953125, 0.311737060546875, 0.3326416015625, 0.353546142578125, 0.37445068359375, 0.395355224609375, 0.416259765625, 0.437164306640625, 0.45806884765625, 0.478973388671875, 0.4998779296875, 0.520782470703125, 0.54168701171875, 0.562591552734375, 0.58349609375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 10.0, 5.0, 10.0, 17.0, 27.0, 21.0, 55.0, 55.0, 114.0, 143.0, 356.0, 684.0, 1026.0, 711.0, 331.0, 185.0, 108.0, 64.0, 56.0, 28.0, 18.0, 13.0, 9.0, 5.0, 8.0, 5.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.615234375, -0.591156005859375, -0.56707763671875, -0.542999267578125, -0.5189208984375, -0.494842529296875, -0.47076416015625, -0.446685791015625, -0.422607421875, -0.398529052734375, -0.37445068359375, -0.350372314453125, -0.3262939453125, -0.302215576171875, -0.27813720703125, -0.254058837890625, -0.22998046875, -0.205902099609375, -0.18182373046875, -0.157745361328125, -0.1336669921875, -0.109588623046875, -0.08551025390625, -0.061431884765625, -0.037353515625, -0.013275146484375, 0.01080322265625, 0.034881591796875, 0.0589599609375, 0.083038330078125, 0.10711669921875, 0.131195068359375, 0.1552734375, 0.179351806640625, 0.20343017578125, 0.227508544921875, 0.2515869140625, 0.275665283203125, 0.29974365234375, 0.323822021484375, 0.347900390625, 0.371978759765625, 0.39605712890625, 0.420135498046875, 0.4442138671875, 0.468292236328125, 0.49237060546875, 0.516448974609375, 0.54052734375, 0.564605712890625, 0.58868408203125, 0.612762451171875, 0.6368408203125, 0.660919189453125, 0.68499755859375, 0.709075927734375, 0.733154296875, 0.757232666015625, 0.78131103515625, 0.805389404296875, 0.8294677734375, 0.853546142578125, 0.87762451171875, 0.901702880859375, 0.92578125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 6.0, 10.0, 51.0, 163.0, 400.0, 262.0, 82.0, 15.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.1943359375, -9.74473762512207, -9.295138359069824, -8.845540046691895, -8.395941734313965, -7.946342945098877, -7.496744155883789, -7.047145843505859, -6.59754753112793, -6.147948741912842, -5.698350429534912, -5.248751640319824, -4.7991533279418945, -4.349554538726807, -3.899955987930298, -3.450357437133789, -3.000758647918701, -2.5511600971221924, -2.1015615463256836, -1.6519628763198853, -1.2023643255233765, -0.7527656555175781, -0.30316710472106934, 0.14643144607543945, 0.5960299968719482, 1.045628547668457, 1.4952270984649658, 1.9448257684707642, 2.3944244384765625, 2.8440229892730713, 3.29362154006958, 3.743220090866089, 4.192818641662598, 4.6424174308776855, 5.092015743255615, 5.541614532470703, 5.991212844848633, 6.440811634063721, 6.890410423278809, 7.340008735656738, 7.789607048034668, 8.239205360412598, 8.688804626464844, 9.138402938842773, 9.588001251220703, 10.037599563598633, 10.487198829650879, 10.936797142028809, 11.386396408081055, 11.835994720458984, 12.28559398651123, 12.73519229888916, 13.18479061126709, 13.634389877319336, 14.083988189697266, 14.533586502075195, 14.983184814453125, 15.432783126831055, 15.8823823928833, 16.331979751586914, 16.781579971313477, 17.231178283691406, 17.680776596069336, 18.130374908447266, 18.579973220825195]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 3.0, 9.0, 3.0, 10.0, 6.0, 8.0, 12.0, 12.0, 20.0, 19.0, 20.0, 27.0, 19.0, 35.0, 24.0, 39.0, 29.0, 53.0, 52.0, 40.0, 58.0, 49.0, 43.0, 45.0, 43.0, 44.0, 38.0, 44.0, 25.0, 36.0, 19.0, 18.0, 19.0, 14.0, 13.0, 15.0, 7.0, 6.0, 3.0, 8.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.78259015083313, -2.697113275527954, -2.6116366386413574, -2.5261597633361816, -2.440682888031006, -2.35520601272583, -2.2697293758392334, -2.1842525005340576, -2.098775625228882, -2.013298749923706, -1.9278219938278198, -1.8423452377319336, -1.7568683624267578, -1.6713916063308716, -1.5859148502349854, -1.5004379749298096, -1.4149612188339233, -1.329484462738037, -1.2440075874328613, -1.158530831336975, -1.0730539560317993, -0.9875771999359131, -0.9021003842353821, -0.8166235685348511, -0.7311467528343201, -0.6456699371337891, -0.5601931214332581, -0.47471633553504944, -0.38923951983451843, -0.3037627041339874, -0.2182859182357788, -0.1328091025352478, -0.0473322868347168, 0.03814452141523361, 0.12362132966518402, 0.20909813046455383, 0.29457494616508484, 0.38005176186561584, 0.46552854776382446, 0.5510053634643555, 0.6364821791648865, 0.7219589948654175, 0.8074358105659485, 0.8929126262664795, 0.9783893823623657, 1.0638662576675415, 1.1493430137634277, 1.2348198890686035, 1.3202966451644897, 1.405773401260376, 1.4912502765655518, 1.576727032661438, 1.6622039079666138, 1.7476806640625, 1.8331575393676758, 1.918634295463562, 2.0041110515594482, 2.089587926864624, 2.1750645637512207, 2.2605414390563965, 2.3460183143615723, 2.431495189666748, 2.5169718265533447, 2.6024487018585205, 2.6879255771636963]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 2.0, 9.0, 10.0, 7.0, 17.0, 17.0, 42.0, 42.0, 86.0, 168.0, 383.0, 762.0, 1742.0, 4318.0, 12275.0, 39346.0, 154710.0, 585571.0, 181902.0, 45057.0, 13603.0, 4817.0, 1945.0, 878.0, 382.0, 198.0, 96.0, 63.0, 31.0, 30.0, 14.0, 13.0, 6.0, 2.0, 4.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58740234375, -0.56817626953125, -0.5489501953125, -0.52972412109375, -0.510498046875, -0.49127197265625, -0.4720458984375, -0.45281982421875, -0.43359375, -0.41436767578125, -0.3951416015625, -0.37591552734375, -0.356689453125, -0.33746337890625, -0.3182373046875, -0.29901123046875, -0.27978515625, -0.26055908203125, -0.2413330078125, -0.22210693359375, -0.202880859375, -0.18365478515625, -0.1644287109375, -0.14520263671875, -0.1259765625, -0.10675048828125, -0.0875244140625, -0.06829833984375, -0.049072265625, -0.02984619140625, -0.0106201171875, 0.00860595703125, 0.02783203125, 0.04705810546875, 0.0662841796875, 0.08551025390625, 0.104736328125, 0.12396240234375, 0.1431884765625, 0.16241455078125, 0.181640625, 0.20086669921875, 0.2200927734375, 0.23931884765625, 0.258544921875, 0.27777099609375, 0.2969970703125, 0.31622314453125, 0.33544921875, 0.35467529296875, 0.3739013671875, 0.39312744140625, 0.412353515625, 0.43157958984375, 0.4508056640625, 0.47003173828125, 0.4892578125, 0.50848388671875, 0.5277099609375, 0.54693603515625, 0.566162109375, 0.58538818359375, 0.6046142578125, 0.62384033203125, 0.64306640625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 6.0, 10.0, 9.0, 9.0, 13.0, 24.0, 16.0, 27.0, 22.0, 23.0, 41.0, 50.0, 41.0, 35.0, 71.0, 63.0, 64.0, 39.0, 61.0, 50.0, 50.0, 53.0, 41.0, 37.0, 28.0, 21.0, 21.0, 15.0, 14.0, 10.0, 12.0, 1.0, 5.0, 4.0, 4.0, 1.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1705322265625, -0.1647663116455078, -0.15900039672851562, -0.15323448181152344, -0.14746856689453125, -0.14170265197753906, -0.13593673706054688, -0.1301708221435547, -0.1244049072265625, -0.11863899230957031, -0.11287307739257812, -0.10710716247558594, -0.10134124755859375, -0.09557533264160156, -0.08980941772460938, -0.08404350280761719, -0.078277587890625, -0.07251167297363281, -0.06674575805664062, -0.06097984313964844, -0.05521392822265625, -0.04944801330566406, -0.043682098388671875, -0.03791618347167969, -0.0321502685546875, -0.026384353637695312, -0.020618438720703125, -0.014852523803710938, -0.00908660888671875, -0.0033206939697265625, 0.002445220947265625, 0.008211135864257812, 0.01397705078125, 0.019742965698242188, 0.025508880615234375, 0.03127479553222656, 0.03704071044921875, 0.04280662536621094, 0.048572540283203125, 0.05433845520019531, 0.0601043701171875, 0.06587028503417969, 0.07163619995117188, 0.07740211486816406, 0.08316802978515625, 0.08893394470214844, 0.09469985961914062, 0.10046577453613281, 0.106231689453125, 0.11199760437011719, 0.11776351928710938, 0.12352943420410156, 0.12929534912109375, 0.13506126403808594, 0.14082717895507812, 0.1465930938720703, 0.1523590087890625, 0.1581249237060547, 0.16389083862304688, 0.16965675354003906, 0.17542266845703125, 0.18118858337402344, 0.18695449829101562, 0.1927204132080078, 0.198486328125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 6.0, 4.0, 5.0, 13.0, 19.0, 26.0, 33.0, 39.0, 58.0, 94.0, 158.0, 310.0, 443.0, 900.0, 1964.0, 5440.0, 27931.0, 725382.0, 259265.0, 18730.0, 4208.0, 1647.0, 775.0, 440.0, 269.0, 134.0, 84.0, 67.0, 38.0, 17.0, 18.0, 7.0, 8.0, 11.0, 6.0, 3.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4384765625, -1.3919219970703125, -1.345367431640625, -1.2988128662109375, -1.25225830078125, -1.2057037353515625, -1.159149169921875, -1.1125946044921875, -1.0660400390625, -1.0194854736328125, -0.972930908203125, -0.9263763427734375, -0.87982177734375, -0.8332672119140625, -0.786712646484375, -0.7401580810546875, -0.693603515625, -0.6470489501953125, -0.600494384765625, -0.5539398193359375, -0.50738525390625, -0.4608306884765625, -0.414276123046875, -0.3677215576171875, -0.3211669921875, -0.2746124267578125, -0.228057861328125, -0.1815032958984375, -0.13494873046875, -0.0883941650390625, -0.041839599609375, 0.0047149658203125, 0.05126953125, 0.0978240966796875, 0.144378662109375, 0.1909332275390625, 0.23748779296875, 0.2840423583984375, 0.330596923828125, 0.3771514892578125, 0.4237060546875, 0.4702606201171875, 0.516815185546875, 0.5633697509765625, 0.60992431640625, 0.6564788818359375, 0.703033447265625, 0.7495880126953125, 0.796142578125, 0.8426971435546875, 0.889251708984375, 0.9358062744140625, 0.98236083984375, 1.0289154052734375, 1.075469970703125, 1.1220245361328125, 1.1685791015625, 1.2151336669921875, 1.261688232421875, 1.3082427978515625, 1.35479736328125, 1.4013519287109375, 1.447906494140625, 1.4944610595703125, 1.541015625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 10.0, 11.0, 14.0, 15.0, 26.0, 32.0, 50.0, 44.0, 56.0, 65.0, 77.0, 75.0, 59.0, 66.0, 68.0, 63.0, 58.0, 39.0, 40.0, 37.0, 21.0, 24.0, 11.0, 7.0, 8.0, 4.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.125, -1.08551025390625, -1.0460205078125, -1.00653076171875, -0.967041015625, -0.92755126953125, -0.8880615234375, -0.84857177734375, -0.80908203125, -0.76959228515625, -0.7301025390625, -0.69061279296875, -0.651123046875, -0.61163330078125, -0.5721435546875, -0.53265380859375, -0.4931640625, -0.45367431640625, -0.4141845703125, -0.37469482421875, -0.335205078125, -0.29571533203125, -0.2562255859375, -0.21673583984375, -0.17724609375, -0.13775634765625, -0.0982666015625, -0.05877685546875, -0.019287109375, 0.02020263671875, 0.0596923828125, 0.09918212890625, 0.138671875, 0.17816162109375, 0.2176513671875, 0.25714111328125, 0.296630859375, 0.33612060546875, 0.3756103515625, 0.41510009765625, 0.45458984375, 0.49407958984375, 0.5335693359375, 0.57305908203125, 0.612548828125, 0.65203857421875, 0.6915283203125, 0.73101806640625, 0.7705078125, 0.80999755859375, 0.8494873046875, 0.88897705078125, 0.928466796875, 0.96795654296875, 1.0074462890625, 1.04693603515625, 1.08642578125, 1.12591552734375, 1.1654052734375, 1.20489501953125, 1.244384765625, 1.28387451171875, 1.3233642578125, 1.36285400390625, 1.40234375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 5.0, 5.0, 3.0, 7.0, 14.0, 16.0, 28.0, 37.0, 81.0, 118.0, 197.0, 327.0, 704.0, 1431.0, 3460.0, 9912.0, 39140.0, 270045.0, 639983.0, 61049.0, 13916.0, 4425.0, 1847.0, 844.0, 413.0, 210.0, 142.0, 72.0, 50.0, 27.0, 10.0, 14.0, 12.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.34912109375, -0.3382568359375, -0.327392578125, -0.3165283203125, -0.3056640625, -0.2947998046875, -0.283935546875, -0.2730712890625, -0.26220703125, -0.2513427734375, -0.240478515625, -0.2296142578125, -0.21875, -0.2078857421875, -0.197021484375, -0.1861572265625, -0.17529296875, -0.1644287109375, -0.153564453125, -0.1427001953125, -0.1318359375, -0.1209716796875, -0.110107421875, -0.0992431640625, -0.08837890625, -0.0775146484375, -0.066650390625, -0.0557861328125, -0.044921875, -0.0340576171875, -0.023193359375, -0.0123291015625, -0.00146484375, 0.0093994140625, 0.020263671875, 0.0311279296875, 0.0419921875, 0.0528564453125, 0.063720703125, 0.0745849609375, 0.08544921875, 0.0963134765625, 0.107177734375, 0.1180419921875, 0.12890625, 0.1397705078125, 0.150634765625, 0.1614990234375, 0.17236328125, 0.1832275390625, 0.194091796875, 0.2049560546875, 0.2158203125, 0.2266845703125, 0.237548828125, 0.2484130859375, 0.25927734375, 0.2701416015625, 0.281005859375, 0.2918701171875, 0.302734375, 0.3135986328125, 0.324462890625, 0.3353271484375, 0.34619140625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 1.0, 4.0, 5.0, 8.0, 12.0, 8.0, 17.0, 17.0, 26.0, 26.0, 29.0, 54.0, 83.0, 109.0, 152.0, 119.0, 89.0, 61.0, 44.0, 33.0, 24.0, 20.0, 15.0, 12.0, 9.0, 7.0, 6.0, 4.0, 9.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.369850158691406e-05, -8.974969387054443e-05, -8.58008861541748e-05, -8.185207843780518e-05, -7.790327072143555e-05, -7.395446300506592e-05, -7.000565528869629e-05, -6.605684757232666e-05, -6.210803985595703e-05, -5.81592321395874e-05, -5.4210424423217773e-05, -5.0261616706848145e-05, -4.6312808990478516e-05, -4.236400127410889e-05, -3.841519355773926e-05, -3.446638584136963e-05, -3.0517578125e-05, -2.656877040863037e-05, -2.2619962692260742e-05, -1.8671154975891113e-05, -1.4722347259521484e-05, -1.0773539543151855e-05, -6.8247318267822266e-06, -2.8759241104125977e-06, 1.0728836059570312e-06, 5.02169132232666e-06, 8.970499038696289e-06, 1.2919306755065918e-05, 1.6868114471435547e-05, 2.0816922187805176e-05, 2.4765729904174805e-05, 2.8714537620544434e-05, 3.266334533691406e-05, 3.661215305328369e-05, 4.056096076965332e-05, 4.450976848602295e-05, 4.845857620239258e-05, 5.240738391876221e-05, 5.6356191635131836e-05, 6.0304999351501465e-05, 6.42538070678711e-05, 6.820261478424072e-05, 7.215142250061035e-05, 7.610023021697998e-05, 8.004903793334961e-05, 8.399784564971924e-05, 8.794665336608887e-05, 9.18954610824585e-05, 9.584426879882812e-05, 9.979307651519775e-05, 0.00010374188423156738, 0.00010769069194793701, 0.00011163949966430664, 0.00011558830738067627, 0.0001195371150970459, 0.00012348592281341553, 0.00012743473052978516, 0.00013138353824615479, 0.00013533234596252441, 0.00013928115367889404, 0.00014322996139526367, 0.0001471787691116333, 0.00015112757682800293, 0.00015507638454437256, 0.0001590251922607422]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 3.0, 6.0, 7.0, 7.0, 15.0, 34.0, 31.0, 47.0, 83.0, 123.0, 167.0, 258.0, 494.0, 864.0, 1900.0, 4674.0, 17534.0, 140212.0, 773863.0, 87607.0, 13219.0, 3812.0, 1658.0, 822.0, 387.0, 245.0, 136.0, 114.0, 71.0, 46.0, 35.0, 16.0, 17.0, 13.0, 9.0, 6.0, 6.0, 2.0, 3.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.294677734375, -0.2839241027832031, -0.27317047119140625, -0.2624168395996094, -0.2516632080078125, -0.24090957641601562, -0.23015594482421875, -0.21940231323242188, -0.208648681640625, -0.19789505004882812, -0.18714141845703125, -0.17638778686523438, -0.1656341552734375, -0.15488052368164062, -0.14412689208984375, -0.13337326049804688, -0.12261962890625, -0.11186599731445312, -0.10111236572265625, -0.09035873413085938, -0.0796051025390625, -0.06885147094726562, -0.05809783935546875, -0.047344207763671875, -0.036590576171875, -0.025836944580078125, -0.01508331298828125, -0.004329681396484375, 0.0064239501953125, 0.017177581787109375, 0.02793121337890625, 0.038684844970703125, 0.0494384765625, 0.060192108154296875, 0.07094573974609375, 0.08169937133789062, 0.0924530029296875, 0.10320663452148438, 0.11396026611328125, 0.12471389770507812, 0.135467529296875, 0.14622116088867188, 0.15697479248046875, 0.16772842407226562, 0.1784820556640625, 0.18923568725585938, 0.19998931884765625, 0.21074295043945312, 0.22149658203125, 0.23225021362304688, 0.24300384521484375, 0.2537574768066406, 0.2645111083984375, 0.2752647399902344, 0.28601837158203125, 0.2967720031738281, 0.307525634765625, 0.3182792663574219, 0.32903289794921875, 0.3397865295410156, 0.3505401611328125, 0.3612937927246094, 0.37204742431640625, 0.3828010559082031, 0.3935546875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 4.0, 2.0, 4.0, 9.0, 10.0, 16.0, 8.0, 25.0, 23.0, 46.0, 32.0, 62.0, 55.0, 104.0, 101.0, 108.0, 84.0, 63.0, 36.0, 38.0, 35.0, 19.0, 25.0, 21.0, 14.0, 17.0, 10.0, 9.0, 3.0, 2.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.32763671875, -0.3173408508300781, -0.30704498291015625, -0.2967491149902344, -0.2864532470703125, -0.2761573791503906, -0.26586151123046875, -0.2555656433105469, -0.245269775390625, -0.23497390747070312, -0.22467803955078125, -0.21438217163085938, -0.2040863037109375, -0.19379043579101562, -0.18349456787109375, -0.17319869995117188, -0.16290283203125, -0.15260696411132812, -0.14231109619140625, -0.13201522827148438, -0.1217193603515625, -0.11142349243164062, -0.10112762451171875, -0.09083175659179688, -0.080535888671875, -0.07024002075195312, -0.05994415283203125, -0.049648284912109375, -0.0393524169921875, -0.029056549072265625, -0.01876068115234375, -0.008464813232421875, 0.0018310546875, 0.012126922607421875, 0.02242279052734375, 0.032718658447265625, 0.0430145263671875, 0.053310394287109375, 0.06360626220703125, 0.07390213012695312, 0.084197998046875, 0.09449386596679688, 0.10478973388671875, 0.11508560180664062, 0.1253814697265625, 0.13567733764648438, 0.14597320556640625, 0.15626907348632812, 0.16656494140625, 0.17686080932617188, 0.18715667724609375, 0.19745254516601562, 0.2077484130859375, 0.21804428100585938, 0.22834014892578125, 0.23863601684570312, 0.248931884765625, 0.2592277526855469, 0.26952362060546875, 0.2798194885253906, 0.2901153564453125, 0.3004112243652344, 0.31070709228515625, 0.3210029602050781, 0.331298828125]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 3.0, 6.0, 8.0, 20.0, 26.0, 31.0, 77.0, 129.0, 179.0, 221.0, 116.0, 73.0, 46.0, 21.0, 15.0, 11.0, 5.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.029716491699219, -7.819554328918457, -7.6093926429748535, -7.399230480194092, -7.18906831741333, -6.978906631469727, -6.768744468688965, -6.558582305908203, -6.348420143127441, -6.13825798034668, -5.928096294403076, -5.7179341316223145, -5.507771968841553, -5.297610282897949, -5.0874481201171875, -4.877285957336426, -4.667123794555664, -4.456961631774902, -4.246799945831299, -4.036637783050537, -3.8264756202697754, -3.6163136959075928, -3.40615177154541, -3.1959896087646484, -2.985827922821045, -2.7756659984588623, -2.5655038356781006, -2.355341911315918, -2.1451797485351562, -1.9350178241729736, -1.7248557806015015, -1.5146937370300293, -1.3045315742492676, -1.0943695306777954, -0.8842074871063232, -0.6740455031394958, -0.4638834595680237, -0.2537214756011963, -0.04355943202972412, 0.16660261154174805, 0.3767646551132202, 0.5869266986846924, 0.7970887422561646, 1.0072507858276367, 1.2174127101898193, 1.4275747537612915, 1.6377367973327637, 1.8478988409042358, 2.058060884475708, 2.2682228088378906, 2.4783849716186523, 2.688546895980835, 2.8987090587615967, 3.1088709831237793, 3.319033145904541, 3.5291950702667236, 3.7393569946289062, 3.949518918991089, 4.1596808433532715, 4.369843006134033, 4.580005168914795, 4.790166854858398, 5.00032901763916, 5.210491180419922, 5.420653343200684]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 10.0, 3.0, 7.0, 10.0, 13.0, 13.0, 24.0, 25.0, 27.0, 18.0, 32.0, 31.0, 28.0, 37.0, 45.0, 63.0, 42.0, 72.0, 57.0, 67.0, 55.0, 40.0, 37.0, 44.0, 29.0, 19.0, 28.0, 25.0, 19.0, 18.0, 8.0, 16.0, 4.0, 8.0, 9.0, 3.0, 1.0, 2.0, 3.0, 2.0, 0.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.059631824493408, -2.960043430328369, -2.86045503616333, -2.760866641998291, -2.661278009414673, -2.561689615249634, -2.4621012210845947, -2.3625128269195557, -2.2629244327545166, -2.1633360385894775, -2.0637476444244385, -1.9641591310501099, -1.8645707368850708, -1.7649822235107422, -1.6653938293457031, -1.565805435180664, -1.4662169218063354, -1.3666285276412964, -1.2670400142669678, -1.1674516201019287, -1.0678632259368896, -0.9682747721672058, -0.868686318397522, -0.7690979242324829, -0.6695094704627991, -0.5699210166931152, -0.47033262252807617, -0.37074416875839233, -0.2711557447910309, -0.17156732082366943, -0.0719788670539856, 0.027609527111053467, 0.1271979808807373, 0.22678640484809875, 0.3263748288154602, 0.42596328258514404, 0.5255516767501831, 0.6251401305198669, 0.7247285842895508, 0.8243169784545898, 0.9239054322242737, 1.0234938859939575, 1.1230822801589966, 1.2226707935333252, 1.3222591876983643, 1.4218475818634033, 1.5214359760284424, 1.6210243701934814, 1.72061288356781, 1.8202012777328491, 1.9197897911071777, 2.019378185272217, 2.118966579437256, 2.218554973602295, 2.318143367767334, 2.417731761932373, 2.517320394515991, 2.6169087886810303, 2.7164971828460693, 2.8160858154296875, 2.9156742095947266, 3.0152626037597656, 3.1148509979248047, 3.2144393920898438, 3.314027786254883]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 5.0, 4.0, 12.0, 16.0, 19.0, 20.0, 47.0, 67.0, 126.0, 212.0, 396.0, 794.0, 1612.0, 3736.0, 9825.0, 29896.0, 124005.0, 1222867.0, 2507450.0, 226154.0, 44145.0, 13619.0, 5025.0, 2139.0, 969.0, 477.0, 229.0, 158.0, 93.0, 58.0, 36.0, 15.0, 24.0, 7.0, 13.0, 4.0, 5.0, 2.0, 3.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.397705078125, -0.385711669921875, -0.37371826171875, -0.361724853515625, -0.3497314453125, -0.337738037109375, -0.32574462890625, -0.313751220703125, -0.3017578125, -0.289764404296875, -0.27777099609375, -0.265777587890625, -0.2537841796875, -0.241790771484375, -0.22979736328125, -0.217803955078125, -0.205810546875, -0.193817138671875, -0.18182373046875, -0.169830322265625, -0.1578369140625, -0.145843505859375, -0.13385009765625, -0.121856689453125, -0.10986328125, -0.097869873046875, -0.08587646484375, -0.073883056640625, -0.0618896484375, -0.049896240234375, -0.03790283203125, -0.025909423828125, -0.013916015625, -0.001922607421875, 0.01007080078125, 0.022064208984375, 0.0340576171875, 0.046051025390625, 0.05804443359375, 0.070037841796875, 0.08203125, 0.094024658203125, 0.10601806640625, 0.118011474609375, 0.1300048828125, 0.141998291015625, 0.15399169921875, 0.165985107421875, 0.177978515625, 0.189971923828125, 0.20196533203125, 0.213958740234375, 0.2259521484375, 0.237945556640625, 0.24993896484375, 0.261932373046875, 0.27392578125, 0.285919189453125, 0.29791259765625, 0.309906005859375, 0.3218994140625, 0.333892822265625, 0.34588623046875, 0.357879638671875, 0.369873046875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 7.0, 5.0, 9.0, 23.0, 27.0, 32.0, 43.0, 57.0, 51.0, 59.0, 62.0, 61.0, 75.0, 70.0, 80.0, 52.0, 63.0, 48.0, 45.0, 44.0, 29.0, 22.0, 15.0, 10.0, 5.0, 5.0, 3.0, 2.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1563720703125, -0.14855003356933594, -0.14072799682617188, -0.1329059600830078, -0.12508392333984375, -0.11726188659667969, -0.10943984985351562, -0.10161781311035156, -0.0937957763671875, -0.08597373962402344, -0.07815170288085938, -0.07032966613769531, -0.06250762939453125, -0.05468559265136719, -0.046863555908203125, -0.03904151916503906, -0.031219482421875, -0.023397445678710938, -0.015575408935546875, -0.0077533721923828125, 6.866455078125e-05, 0.007890701293945312, 0.015712738037109375, 0.023534774780273438, 0.0313568115234375, 0.03917884826660156, 0.047000885009765625, 0.05482292175292969, 0.06264495849609375, 0.07046699523925781, 0.07828903198242188, 0.08611106872558594, 0.09393310546875, 0.10175514221191406, 0.10957717895507812, 0.11739921569824219, 0.12522125244140625, 0.1330432891845703, 0.14086532592773438, 0.14868736267089844, 0.1565093994140625, 0.16433143615722656, 0.17215347290039062, 0.1799755096435547, 0.18779754638671875, 0.1956195831298828, 0.20344161987304688, 0.21126365661621094, 0.219085693359375, 0.22690773010253906, 0.23472976684570312, 0.2425518035888672, 0.25037384033203125, 0.2581958770751953, 0.2660179138183594, 0.27383995056152344, 0.2816619873046875, 0.28948402404785156, 0.2973060607910156, 0.3051280975341797, 0.31295013427734375, 0.3207721710205078, 0.3285942077636719, 0.33641624450683594, 0.34423828125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 8.0, 10.0, 11.0, 28.0, 53.0, 61.0, 100.0, 207.0, 434.0, 890.0, 2058.0, 5702.0, 19089.0, 94137.0, 1728453.0, 2202695.0, 109415.0, 20560.0, 6207.0, 2240.0, 920.0, 455.0, 227.0, 133.0, 66.0, 50.0, 29.0, 12.0, 11.0, 9.0, 2.0, 5.0, 0.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.79345703125, -0.7701416015625, -0.746826171875, -0.7235107421875, -0.7001953125, -0.6768798828125, -0.653564453125, -0.6302490234375, -0.60693359375, -0.5836181640625, -0.560302734375, -0.5369873046875, -0.513671875, -0.4903564453125, -0.467041015625, -0.4437255859375, -0.42041015625, -0.3970947265625, -0.373779296875, -0.3504638671875, -0.3271484375, -0.3038330078125, -0.280517578125, -0.2572021484375, -0.23388671875, -0.2105712890625, -0.187255859375, -0.1639404296875, -0.140625, -0.1173095703125, -0.093994140625, -0.0706787109375, -0.04736328125, -0.0240478515625, -0.000732421875, 0.0225830078125, 0.0458984375, 0.0692138671875, 0.092529296875, 0.1158447265625, 0.13916015625, 0.1624755859375, 0.185791015625, 0.2091064453125, 0.232421875, 0.2557373046875, 0.279052734375, 0.3023681640625, 0.32568359375, 0.3489990234375, 0.372314453125, 0.3956298828125, 0.4189453125, 0.4422607421875, 0.465576171875, 0.4888916015625, 0.51220703125, 0.5355224609375, 0.558837890625, 0.5821533203125, 0.60546875, 0.6287841796875, 0.652099609375, 0.6754150390625, 0.69873046875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 4.0, 4.0, 7.0, 7.0, 12.0, 8.0, 16.0, 20.0, 24.0, 35.0, 46.0, 54.0, 91.0, 128.0, 208.0, 357.0, 554.0, 718.0, 604.0, 397.0, 255.0, 156.0, 103.0, 64.0, 61.0, 30.0, 23.0, 30.0, 18.0, 13.0, 13.0, 1.0, 4.0, 3.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.537109375, -0.5176544189453125, -0.498199462890625, -0.4787445068359375, -0.45928955078125, -0.4398345947265625, -0.420379638671875, -0.4009246826171875, -0.3814697265625, -0.3620147705078125, -0.342559814453125, -0.3231048583984375, -0.30364990234375, -0.2841949462890625, -0.264739990234375, -0.2452850341796875, -0.225830078125, -0.2063751220703125, -0.186920166015625, -0.1674652099609375, -0.14801025390625, -0.1285552978515625, -0.109100341796875, -0.0896453857421875, -0.0701904296875, -0.0507354736328125, -0.031280517578125, -0.0118255615234375, 0.00762939453125, 0.0270843505859375, 0.046539306640625, 0.0659942626953125, 0.08544921875, 0.1049041748046875, 0.124359130859375, 0.1438140869140625, 0.16326904296875, 0.1827239990234375, 0.202178955078125, 0.2216339111328125, 0.2410888671875, 0.2605438232421875, 0.279998779296875, 0.2994537353515625, 0.31890869140625, 0.3383636474609375, 0.357818603515625, 0.3772735595703125, 0.396728515625, 0.4161834716796875, 0.435638427734375, 0.4550933837890625, 0.47454833984375, 0.4940032958984375, 0.513458251953125, 0.5329132080078125, 0.5523681640625, 0.5718231201171875, 0.591278076171875, 0.6107330322265625, 0.63018798828125, 0.6496429443359375, 0.669097900390625, 0.6885528564453125, 0.7080078125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 10.0, 32.0, 185.0, 479.0, 227.0, 46.0, 13.0, 6.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.713897705078125, -23.113670349121094, -22.513442993164062, -21.91321563720703, -21.31298828125, -20.71276092529297, -20.112533569335938, -19.512306213378906, -18.912078857421875, -18.311851501464844, -17.711624145507812, -17.11139678955078, -16.51116943359375, -15.910942077636719, -15.310713768005371, -14.71048641204834, -14.110258102416992, -13.510030746459961, -12.90980339050293, -12.309576034545898, -11.709348678588867, -11.109121322631836, -10.508893013000488, -9.908665657043457, -9.308438301086426, -8.708210945129395, -8.107983589172363, -7.507755756378174, -6.907528400421143, -6.307301044464111, -5.707073211669922, -5.106845855712891, -4.506616592407227, -3.9063892364501953, -3.306161642074585, -2.7059340476989746, -2.1057066917419434, -1.505479335784912, -0.9052517414093018, -0.3050241470336914, 0.29520320892333984, 0.8954306840896606, 1.4956581592559814, 2.095885753631592, 2.696113109588623, 3.2963404655456543, 3.8965680599212646, 4.496795654296875, 5.097023010253906, 5.6972503662109375, 6.297477722167969, 6.897705554962158, 7.4979329109191895, 8.098159790039062, 8.69838809967041, 9.298615455627441, 9.898842811584473, 10.499070167541504, 11.099297523498535, 11.699524879455566, 12.299753189086914, 12.899980545043945, 13.500207901000977, 14.100435256958008, 14.700662612915039]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 5.0, 6.0, 5.0, 7.0, 10.0, 14.0, 10.0, 20.0, 16.0, 24.0, 25.0, 43.0, 35.0, 47.0, 38.0, 49.0, 54.0, 36.0, 45.0, 51.0, 45.0, 53.0, 53.0, 58.0, 37.0, 32.0, 31.0, 33.0, 23.0, 26.0, 12.0, 12.0, 16.0, 8.0, 5.0, 5.0, 6.0, 3.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4422640800476074, -3.337495803833008, -3.232727289199829, -3.1279587745666504, -3.023190498352051, -2.918422222137451, -2.8136537075042725, -2.7088851928710938, -2.604116916656494, -2.4993486404418945, -2.394580125808716, -2.289811611175537, -2.1850433349609375, -2.080275058746338, -1.9755065441131592, -1.87073814868927, -1.7659697532653809, -1.6612013578414917, -1.5564329624176025, -1.4516645669937134, -1.3468961715698242, -1.242127776145935, -1.137359380722046, -1.0325909852981567, -0.9278225898742676, -0.8230541944503784, -0.7182857990264893, -0.6135174036026001, -0.5087490081787109, -0.4039806127548218, -0.2992122173309326, -0.19444382190704346, -0.0896754264831543, 0.015092968940734863, 0.11986136436462402, 0.22462975978851318, 0.32939815521240234, 0.4341665506362915, 0.5389349460601807, 0.6437033414840698, 0.748471736907959, 0.8532401323318481, 0.9580085277557373, 1.0627769231796265, 1.1675453186035156, 1.2723137140274048, 1.377082109451294, 1.481850504875183, 1.5866189002990723, 1.6913872957229614, 1.7961556911468506, 1.9009240865707397, 2.005692481994629, 2.1104607582092285, 2.2152292728424072, 2.319997787475586, 2.4247660636901855, 2.529534339904785, 2.634302854537964, 2.7390713691711426, 2.843839645385742, 2.948607921600342, 3.0533764362335205, 3.158144950866699, 3.262913227081299]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 11.0, 15.0, 15.0, 27.0, 60.0, 106.0, 193.0, 430.0, 961.0, 2606.0, 7941.0, 31301.0, 206552.0, 681808.0, 90339.0, 18105.0, 5025.0, 1709.0, 712.0, 320.0, 137.0, 77.0, 37.0, 26.0, 14.0, 7.0, 8.0, 5.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.841796875, -0.814910888671875, -0.78802490234375, -0.761138916015625, -0.7342529296875, -0.707366943359375, -0.68048095703125, -0.653594970703125, -0.626708984375, -0.599822998046875, -0.57293701171875, -0.546051025390625, -0.5191650390625, -0.492279052734375, -0.46539306640625, -0.438507080078125, -0.41162109375, -0.384735107421875, -0.35784912109375, -0.330963134765625, -0.3040771484375, -0.277191162109375, -0.25030517578125, -0.223419189453125, -0.196533203125, -0.169647216796875, -0.14276123046875, -0.115875244140625, -0.0889892578125, -0.062103271484375, -0.03521728515625, -0.008331298828125, 0.0185546875, 0.045440673828125, 0.07232666015625, 0.099212646484375, 0.1260986328125, 0.152984619140625, 0.17987060546875, 0.206756591796875, 0.233642578125, 0.260528564453125, 0.28741455078125, 0.314300537109375, 0.3411865234375, 0.368072509765625, 0.39495849609375, 0.421844482421875, 0.44873046875, 0.475616455078125, 0.50250244140625, 0.529388427734375, 0.5562744140625, 0.583160400390625, 0.61004638671875, 0.636932373046875, 0.663818359375, 0.690704345703125, 0.71759033203125, 0.744476318359375, 0.7713623046875, 0.798248291015625, 0.82513427734375, 0.852020263671875, 0.87890625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 9.0, 8.0, 11.0, 18.0, 20.0, 21.0, 43.0, 31.0, 43.0, 49.0, 66.0, 59.0, 77.0, 71.0, 69.0, 76.0, 74.0, 60.0, 52.0, 26.0, 29.0, 25.0, 22.0, 8.0, 14.0, 10.0, 5.0, 1.0, 2.0, 6.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.22998046875, -0.22098541259765625, -0.2119903564453125, -0.20299530029296875, -0.194000244140625, -0.18500518798828125, -0.1760101318359375, -0.16701507568359375, -0.15802001953125, -0.14902496337890625, -0.1400299072265625, -0.13103485107421875, -0.122039794921875, -0.11304473876953125, -0.1040496826171875, -0.09505462646484375, -0.0860595703125, -0.07706451416015625, -0.0680694580078125, -0.05907440185546875, -0.050079345703125, -0.04108428955078125, -0.0320892333984375, -0.02309417724609375, -0.01409912109375, -0.00510406494140625, 0.0038909912109375, 0.01288604736328125, 0.021881103515625, 0.03087615966796875, 0.0398712158203125, 0.04886627197265625, 0.057861328125, 0.06685638427734375, 0.0758514404296875, 0.08484649658203125, 0.093841552734375, 0.10283660888671875, 0.1118316650390625, 0.12082672119140625, 0.12982177734375, 0.13881683349609375, 0.1478118896484375, 0.15680694580078125, 0.165802001953125, 0.17479705810546875, 0.1837921142578125, 0.19278717041015625, 0.2017822265625, 0.21077728271484375, 0.2197723388671875, 0.22876739501953125, 0.237762451171875, 0.24675750732421875, 0.2557525634765625, 0.26474761962890625, 0.27374267578125, 0.28273773193359375, 0.2917327880859375, 0.30072784423828125, 0.309722900390625, 0.31871795654296875, 0.3277130126953125, 0.33670806884765625, 0.345703125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 0.0, 1.0, 3.0, 5.0, 3.0, 3.0, 9.0, 11.0, 9.0, 23.0, 24.0, 29.0, 34.0, 46.0, 73.0, 75.0, 115.0, 160.0, 240.0, 345.0, 579.0, 965.0, 1726.0, 3892.0, 10664.0, 40913.0, 341319.0, 577920.0, 48308.0, 12025.0, 4246.0, 1957.0, 1009.0, 590.0, 357.0, 234.0, 177.0, 117.0, 78.0, 69.0, 41.0, 42.0, 33.0, 18.0, 18.0, 14.0, 15.0, 7.0, 7.0, 7.0, 3.0, 5.0, 2.0, 1.0, 2.0], "bins": [-0.96435546875, -0.9376068115234375, -0.910858154296875, -0.8841094970703125, -0.85736083984375, -0.8306121826171875, -0.803863525390625, -0.7771148681640625, -0.7503662109375, -0.7236175537109375, -0.696868896484375, -0.6701202392578125, -0.64337158203125, -0.6166229248046875, -0.589874267578125, -0.5631256103515625, -0.536376953125, -0.5096282958984375, -0.482879638671875, -0.4561309814453125, -0.42938232421875, -0.4026336669921875, -0.375885009765625, -0.3491363525390625, -0.3223876953125, -0.2956390380859375, -0.268890380859375, -0.2421417236328125, -0.21539306640625, -0.1886444091796875, -0.161895751953125, -0.1351470947265625, -0.1083984375, -0.0816497802734375, -0.054901123046875, -0.0281524658203125, -0.00140380859375, 0.0253448486328125, 0.052093505859375, 0.0788421630859375, 0.1055908203125, 0.1323394775390625, 0.159088134765625, 0.1858367919921875, 0.21258544921875, 0.2393341064453125, 0.266082763671875, 0.2928314208984375, 0.319580078125, 0.3463287353515625, 0.373077392578125, 0.3998260498046875, 0.42657470703125, 0.4533233642578125, 0.480072021484375, 0.5068206787109375, 0.5335693359375, 0.5603179931640625, 0.587066650390625, 0.6138153076171875, 0.64056396484375, 0.6673126220703125, 0.694061279296875, 0.7208099365234375, 0.74755859375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 4.0, 4.0, 5.0, 9.0, 9.0, 9.0, 11.0, 12.0, 24.0, 16.0, 33.0, 35.0, 28.0, 50.0, 60.0, 62.0, 53.0, 71.0, 62.0, 54.0, 57.0, 57.0, 47.0, 41.0, 31.0, 27.0, 35.0, 16.0, 21.0, 21.0, 10.0, 11.0, 7.0, 9.0, 0.0, 3.0, 3.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0205078125, -0.98577880859375, -0.9510498046875, -0.91632080078125, -0.881591796875, -0.84686279296875, -0.8121337890625, -0.77740478515625, -0.74267578125, -0.70794677734375, -0.6732177734375, -0.63848876953125, -0.603759765625, -0.56903076171875, -0.5343017578125, -0.49957275390625, -0.46484375, -0.43011474609375, -0.3953857421875, -0.36065673828125, -0.325927734375, -0.29119873046875, -0.2564697265625, -0.22174072265625, -0.18701171875, -0.15228271484375, -0.1175537109375, -0.08282470703125, -0.048095703125, -0.01336669921875, 0.0213623046875, 0.05609130859375, 0.0908203125, 0.12554931640625, 0.1602783203125, 0.19500732421875, 0.229736328125, 0.26446533203125, 0.2991943359375, 0.33392333984375, 0.36865234375, 0.40338134765625, 0.4381103515625, 0.47283935546875, 0.507568359375, 0.54229736328125, 0.5770263671875, 0.61175537109375, 0.646484375, 0.68121337890625, 0.7159423828125, 0.75067138671875, 0.785400390625, 0.82012939453125, 0.8548583984375, 0.88958740234375, 0.92431640625, 0.95904541015625, 0.9937744140625, 1.02850341796875, 1.063232421875, 1.09796142578125, 1.1326904296875, 1.16741943359375, 1.2021484375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 8.0, 6.0, 11.0, 13.0, 20.0, 28.0, 52.0, 77.0, 162.0, 296.0, 537.0, 1232.0, 3158.0, 9745.0, 43952.0, 307747.0, 599443.0, 62308.0, 13117.0, 3793.0, 1412.0, 670.0, 306.0, 183.0, 100.0, 68.0, 47.0, 17.0, 18.0, 11.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.347412109375, -0.3365898132324219, -0.32576751708984375, -0.3149452209472656, -0.3041229248046875, -0.2933006286621094, -0.28247833251953125, -0.2716560363769531, -0.260833740234375, -0.2500114440917969, -0.23918914794921875, -0.22836685180664062, -0.2175445556640625, -0.20672225952148438, -0.19589996337890625, -0.18507766723632812, -0.17425537109375, -0.16343307495117188, -0.15261077880859375, -0.14178848266601562, -0.1309661865234375, -0.12014389038085938, -0.10932159423828125, -0.09849929809570312, -0.087677001953125, -0.07685470581054688, -0.06603240966796875, -0.055210113525390625, -0.0443878173828125, -0.033565521240234375, -0.02274322509765625, -0.011920928955078125, -0.0010986328125, 0.009723663330078125, 0.02054595947265625, 0.031368255615234375, 0.0421905517578125, 0.053012847900390625, 0.06383514404296875, 0.07465744018554688, 0.085479736328125, 0.09630203247070312, 0.10712432861328125, 0.11794662475585938, 0.1287689208984375, 0.13959121704101562, 0.15041351318359375, 0.16123580932617188, 0.17205810546875, 0.18288040161132812, 0.19370269775390625, 0.20452499389648438, 0.2153472900390625, 0.22616958618164062, 0.23699188232421875, 0.24781417846679688, 0.258636474609375, 0.2694587707519531, 0.28028106689453125, 0.2911033630371094, 0.3019256591796875, 0.3127479553222656, 0.32357025146484375, 0.3343925476074219, 0.34521484375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 4.0, 7.0, 4.0, 7.0, 8.0, 16.0, 6.0, 29.0, 23.0, 34.0, 48.0, 57.0, 77.0, 86.0, 99.0, 105.0, 82.0, 64.0, 51.0, 44.0, 34.0, 29.0, 25.0, 11.0, 13.0, 11.0, 8.0, 8.0, 1.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.334087371826172e-05, -9.02228057384491e-05, -8.710473775863647e-05, -8.398666977882385e-05, -8.086860179901123e-05, -7.775053381919861e-05, -7.463246583938599e-05, -7.151439785957336e-05, -6.839632987976074e-05, -6.527826189994812e-05, -6.21601939201355e-05, -5.9042125940322876e-05, -5.5924057960510254e-05, -5.280598998069763e-05, -4.968792200088501e-05, -4.656985402107239e-05, -4.3451786041259766e-05, -4.0333718061447144e-05, -3.721565008163452e-05, -3.40975821018219e-05, -3.097951412200928e-05, -2.7861446142196655e-05, -2.4743378162384033e-05, -2.162531018257141e-05, -1.850724220275879e-05, -1.5389174222946167e-05, -1.2271106243133545e-05, -9.153038263320923e-06, -6.034970283508301e-06, -2.9169023036956787e-06, 2.0116567611694336e-07, 3.3192336559295654e-06, 6.4373016357421875e-06, 9.55536961555481e-06, 1.2673437595367432e-05, 1.5791505575180054e-05, 1.8909573554992676e-05, 2.2027641534805298e-05, 2.514570951461792e-05, 2.8263777494430542e-05, 3.1381845474243164e-05, 3.4499913454055786e-05, 3.761798143386841e-05, 4.073604941368103e-05, 4.385411739349365e-05, 4.6972185373306274e-05, 5.0090253353118896e-05, 5.320832133293152e-05, 5.632638931274414e-05, 5.944445729255676e-05, 6.256252527236938e-05, 6.568059325218201e-05, 6.879866123199463e-05, 7.191672921180725e-05, 7.503479719161987e-05, 7.81528651714325e-05, 8.127093315124512e-05, 8.438900113105774e-05, 8.750706911087036e-05, 9.062513709068298e-05, 9.37432050704956e-05, 9.686127305030823e-05, 9.997934103012085e-05, 0.00010309740900993347, 0.0001062154769897461]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 4.0, 6.0, 13.0, 14.0, 14.0, 16.0, 29.0, 42.0, 62.0, 86.0, 126.0, 167.0, 302.0, 510.0, 843.0, 1618.0, 3299.0, 8288.0, 28204.0, 147190.0, 680228.0, 136046.0, 26613.0, 7931.0, 3151.0, 1508.0, 872.0, 490.0, 303.0, 178.0, 123.0, 84.0, 59.0, 26.0, 26.0, 17.0, 12.0, 7.0, 8.0, 5.0, 10.0, 3.0, 2.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0], "bins": [-0.27978515625, -0.27089691162109375, -0.2620086669921875, -0.25312042236328125, -0.244232177734375, -0.23534393310546875, -0.2264556884765625, -0.21756744384765625, -0.20867919921875, -0.19979095458984375, -0.1909027099609375, -0.18201446533203125, -0.173126220703125, -0.16423797607421875, -0.1553497314453125, -0.14646148681640625, -0.1375732421875, -0.12868499755859375, -0.1197967529296875, -0.11090850830078125, -0.102020263671875, -0.09313201904296875, -0.0842437744140625, -0.07535552978515625, -0.06646728515625, -0.05757904052734375, -0.0486907958984375, -0.03980255126953125, -0.030914306640625, -0.02202606201171875, -0.0131378173828125, -0.00424957275390625, 0.004638671875, 0.01352691650390625, 0.0224151611328125, 0.03130340576171875, 0.040191650390625, 0.04907989501953125, 0.0579681396484375, 0.06685638427734375, 0.07574462890625, 0.08463287353515625, 0.0935211181640625, 0.10240936279296875, 0.111297607421875, 0.12018585205078125, 0.1290740966796875, 0.13796234130859375, 0.1468505859375, 0.15573883056640625, 0.1646270751953125, 0.17351531982421875, 0.182403564453125, 0.19129180908203125, 0.2001800537109375, 0.20906829833984375, 0.21795654296875, 0.22684478759765625, 0.2357330322265625, 0.24462127685546875, 0.253509521484375, 0.26239776611328125, 0.2712860107421875, 0.28017425537109375, 0.2890625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 3.0, 7.0, 5.0, 1.0, 7.0, 8.0, 10.0, 14.0, 13.0, 21.0, 31.0, 26.0, 37.0, 35.0, 40.0, 52.0, 53.0, 55.0, 66.0, 68.0, 53.0, 57.0, 59.0, 46.0, 33.0, 50.0, 24.0, 27.0, 20.0, 16.0, 13.0, 11.0, 10.0, 4.0, 5.0, 4.0, 5.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2249755859375, -0.2181682586669922, -0.21136093139648438, -0.20455360412597656, -0.19774627685546875, -0.19093894958496094, -0.18413162231445312, -0.1773242950439453, -0.1705169677734375, -0.1637096405029297, -0.15690231323242188, -0.15009498596191406, -0.14328765869140625, -0.13648033142089844, -0.12967300415039062, -0.12286567687988281, -0.116058349609375, -0.10925102233886719, -0.10244369506835938, -0.09563636779785156, -0.08882904052734375, -0.08202171325683594, -0.07521438598632812, -0.06840705871582031, -0.0615997314453125, -0.05479240417480469, -0.047985076904296875, -0.04117774963378906, -0.03437042236328125, -0.027563095092773438, -0.020755767822265625, -0.013948440551757812, -0.00714111328125, -0.0003337860107421875, 0.006473541259765625, 0.013280868530273438, 0.02008819580078125, 0.026895523071289062, 0.033702850341796875, 0.04051017761230469, 0.0473175048828125, 0.05412483215332031, 0.060932159423828125, 0.06773948669433594, 0.07454681396484375, 0.08135414123535156, 0.08816146850585938, 0.09496879577636719, 0.101776123046875, 0.10858345031738281, 0.11539077758789062, 0.12219810485839844, 0.12900543212890625, 0.13581275939941406, 0.14262008666992188, 0.1494274139404297, 0.1562347412109375, 0.1630420684814453, 0.16984939575195312, 0.17665672302246094, 0.18346405029296875, 0.19027137756347656, 0.19707870483398438, 0.2038860321044922, 0.210693359375]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 8.0, 6.0, 9.0, 19.0, 66.0, 155.0, 344.0, 216.0, 102.0, 51.0, 16.0, 11.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.427070617675781, -12.09839916229248, -11.769728660583496, -11.441057205200195, -11.112386703491211, -10.78371524810791, -10.45504379272461, -10.126373291015625, -9.797701835632324, -9.469030380249023, -9.140359878540039, -8.811688423156738, -8.483016967773438, -8.154346466064453, -7.825675010681152, -7.49700403213501, -7.168333053588867, -6.839662075042725, -6.510991096496582, -6.182319641113281, -5.853648662567139, -5.524977684020996, -5.196306228637695, -4.867635250091553, -4.53896427154541, -4.210293292999268, -3.881622076034546, -3.552950859069824, -3.2242798805236816, -2.895608901977539, -2.5669376850128174, -2.2382664680480957, -1.9095964431762695, -1.5809253454208374, -1.2522542476654053, -0.9235831499099731, -0.594912052154541, -0.2662409543991089, 0.06243014335632324, 0.3911013603210449, 0.7197723388671875, 1.0484434366226196, 1.3771145343780518, 1.7057856321334839, 2.034456729888916, 2.3631277084350586, 2.6917989253997803, 3.020470142364502, 3.3491411209106445, 3.677812099456787, 4.00648307800293, 4.3351545333862305, 4.663825511932373, 4.992496490478516, 5.321167945861816, 5.649838924407959, 5.978509902954102, 6.307180881500244, 6.635851860046387, 6.9645233154296875, 7.29319429397583, 7.621865272521973, 7.950536727905273, 8.279207229614258, 8.607878684997559]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 5.0, 14.0, 4.0, 17.0, 10.0, 14.0, 22.0, 17.0, 21.0, 36.0, 22.0, 31.0, 26.0, 31.0, 42.0, 64.0, 75.0, 83.0, 57.0, 55.0, 43.0, 44.0, 29.0, 32.0, 30.0, 28.0, 24.0, 17.0, 13.0, 15.0, 20.0, 11.0, 9.0, 4.0, 4.0, 4.0, 3.0, 4.0, 4.0, 6.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.9810056686401367, -3.8539695739746094, -3.726933717727661, -3.599897861480713, -3.4728617668151855, -3.345825672149658, -3.21878981590271, -3.0917539596557617, -2.9647178649902344, -2.837681770324707, -2.710645914077759, -2.5836100578308105, -2.456573963165283, -2.329537868499756, -2.2025020122528076, -2.0754661560058594, -1.948430061340332, -1.8213940858840942, -1.6943581104278564, -1.5673221349716187, -1.4402861595153809, -1.313250184059143, -1.1862142086029053, -1.0591782331466675, -0.9321422576904297, -0.8051062822341919, -0.6780703067779541, -0.5510343313217163, -0.4239983558654785, -0.2969623804092407, -0.16992640495300293, -0.04289042949676514, 0.08414602279663086, 0.21118199825286865, 0.33821797370910645, 0.46525394916534424, 0.592289924621582, 0.7193259000778198, 0.8463618755340576, 0.9733978509902954, 1.1004338264465332, 1.227469801902771, 1.3545057773590088, 1.4815417528152466, 1.6085777282714844, 1.7356137037277222, 1.86264967918396, 1.9896856546401978, 2.1167216300964355, 2.243757724761963, 2.370793581008911, 2.4978294372558594, 2.6248655319213867, 2.751901626586914, 2.8789374828338623, 3.0059733390808105, 3.133009433746338, 3.2600455284118652, 3.3870813846588135, 3.5141172409057617, 3.641153335571289, 3.7681894302368164, 3.8952252864837646, 4.022261142730713, 4.14929723739624]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 5.0, 4.0, 7.0, 9.0, 9.0, 10.0, 12.0, 20.0, 32.0, 27.0, 46.0, 89.0, 131.0, 183.0, 391.0, 633.0, 1359.0, 2847.0, 6866.0, 20214.0, 84867.0, 1015135.0, 2815578.0, 194165.0, 32717.0, 10593.0, 4193.0, 1864.0, 987.0, 511.0, 280.0, 166.0, 116.0, 61.0, 50.0, 26.0, 24.0, 20.0, 10.0, 8.0, 8.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4326171875, -0.4191856384277344, -0.40575408935546875, -0.3923225402832031, -0.3788909912109375, -0.3654594421386719, -0.35202789306640625, -0.3385963439941406, -0.325164794921875, -0.3117332458496094, -0.29830169677734375, -0.2848701477050781, -0.2714385986328125, -0.2580070495605469, -0.24457550048828125, -0.23114395141601562, -0.21771240234375, -0.20428085327148438, -0.19084930419921875, -0.17741775512695312, -0.1639862060546875, -0.15055465698242188, -0.13712310791015625, -0.12369155883789062, -0.110260009765625, -0.09682846069335938, -0.08339691162109375, -0.06996536254882812, -0.0565338134765625, -0.043102264404296875, -0.02967071533203125, -0.016239166259765625, -0.0028076171875, 0.010623931884765625, 0.02405548095703125, 0.037487030029296875, 0.0509185791015625, 0.06435012817382812, 0.07778167724609375, 0.09121322631835938, 0.104644775390625, 0.11807632446289062, 0.13150787353515625, 0.14493942260742188, 0.1583709716796875, 0.17180252075195312, 0.18523406982421875, 0.19866561889648438, 0.21209716796875, 0.22552871704101562, 0.23896026611328125, 0.2523918151855469, 0.2658233642578125, 0.2792549133300781, 0.29268646240234375, 0.3061180114746094, 0.319549560546875, 0.3329811096191406, 0.34641265869140625, 0.3598442077636719, 0.3732757568359375, 0.3867073059082031, 0.40013885498046875, 0.4135704040527344, 0.427001953125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 6.0, 6.0, 3.0, 6.0, 11.0, 12.0, 17.0, 19.0, 27.0, 19.0, 29.0, 39.0, 43.0, 50.0, 41.0, 49.0, 53.0, 88.0, 56.0, 60.0, 66.0, 59.0, 35.0, 29.0, 32.0, 26.0, 32.0, 19.0, 17.0, 16.0, 13.0, 11.0, 5.0, 7.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.2435302734375, -0.2358570098876953, -0.22818374633789062, -0.22051048278808594, -0.21283721923828125, -0.20516395568847656, -0.19749069213867188, -0.1898174285888672, -0.1821441650390625, -0.1744709014892578, -0.16679763793945312, -0.15912437438964844, -0.15145111083984375, -0.14377784729003906, -0.13610458374023438, -0.1284313201904297, -0.120758056640625, -0.11308479309082031, -0.10541152954101562, -0.09773826599121094, -0.09006500244140625, -0.08239173889160156, -0.07471847534179688, -0.06704521179199219, -0.0593719482421875, -0.05169868469238281, -0.044025421142578125, -0.03635215759277344, -0.02867889404296875, -0.021005630493164062, -0.013332366943359375, -0.0056591033935546875, 0.00201416015625, 0.009687423706054688, 0.017360687255859375, 0.025033950805664062, 0.03270721435546875, 0.04038047790527344, 0.048053741455078125, 0.05572700500488281, 0.0634002685546875, 0.07107353210449219, 0.07874679565429688, 0.08642005920410156, 0.09409332275390625, 0.10176658630371094, 0.10943984985351562, 0.11711311340332031, 0.124786376953125, 0.1324596405029297, 0.14013290405273438, 0.14780616760253906, 0.15547943115234375, 0.16315269470214844, 0.17082595825195312, 0.1784992218017578, 0.1861724853515625, 0.1938457489013672, 0.20151901245117188, 0.20919227600097656, 0.21686553955078125, 0.22453880310058594, 0.23221206665039062, 0.2398853302001953, 0.24755859375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 8.0, 10.0, 11.0, 16.0, 22.0, 30.0, 65.0, 114.0, 167.0, 355.0, 747.0, 1682.0, 4651.0, 17010.0, 114707.0, 3573345.0, 434603.0, 34439.0, 7759.0, 2458.0, 1038.0, 506.0, 228.0, 121.0, 74.0, 40.0, 32.0, 10.0, 13.0, 9.0, 5.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0859375, -1.0555267333984375, -1.025115966796875, -0.9947052001953125, -0.96429443359375, -0.9338836669921875, -0.903472900390625, -0.8730621337890625, -0.8426513671875, -0.8122406005859375, -0.781829833984375, -0.7514190673828125, -0.72100830078125, -0.6905975341796875, -0.660186767578125, -0.6297760009765625, -0.599365234375, -0.5689544677734375, -0.538543701171875, -0.5081329345703125, -0.47772216796875, -0.4473114013671875, -0.416900634765625, -0.3864898681640625, -0.3560791015625, -0.3256683349609375, -0.295257568359375, -0.2648468017578125, -0.23443603515625, -0.2040252685546875, -0.173614501953125, -0.1432037353515625, -0.11279296875, -0.0823822021484375, -0.051971435546875, -0.0215606689453125, 0.00885009765625, 0.0392608642578125, 0.069671630859375, 0.1000823974609375, 0.1304931640625, 0.1609039306640625, 0.191314697265625, 0.2217254638671875, 0.25213623046875, 0.2825469970703125, 0.312957763671875, 0.3433685302734375, 0.373779296875, 0.4041900634765625, 0.434600830078125, 0.4650115966796875, 0.49542236328125, 0.5258331298828125, 0.556243896484375, 0.5866546630859375, 0.6170654296875, 0.6474761962890625, 0.677886962890625, 0.7082977294921875, 0.73870849609375, 0.7691192626953125, 0.799530029296875, 0.8299407958984375, 0.8603515625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 5.0, 4.0, 5.0, 8.0, 7.0, 5.0, 26.0, 27.0, 40.0, 52.0, 87.0, 192.0, 337.0, 828.0, 1157.0, 652.0, 281.0, 131.0, 69.0, 53.0, 26.0, 22.0, 16.0, 15.0, 7.0, 5.0, 9.0, 3.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0625, -1.034027099609375, -1.00555419921875, -0.977081298828125, -0.9486083984375, -0.920135498046875, -0.89166259765625, -0.863189697265625, -0.834716796875, -0.806243896484375, -0.77777099609375, -0.749298095703125, -0.7208251953125, -0.692352294921875, -0.66387939453125, -0.635406494140625, -0.60693359375, -0.578460693359375, -0.54998779296875, -0.521514892578125, -0.4930419921875, -0.464569091796875, -0.43609619140625, -0.407623291015625, -0.379150390625, -0.350677490234375, -0.32220458984375, -0.293731689453125, -0.2652587890625, -0.236785888671875, -0.20831298828125, -0.179840087890625, -0.1513671875, -0.122894287109375, -0.09442138671875, -0.065948486328125, -0.0374755859375, -0.009002685546875, 0.01947021484375, 0.047943115234375, 0.076416015625, 0.104888916015625, 0.13336181640625, 0.161834716796875, 0.1903076171875, 0.218780517578125, 0.24725341796875, 0.275726318359375, 0.30419921875, 0.332672119140625, 0.36114501953125, 0.389617919921875, 0.4180908203125, 0.446563720703125, 0.47503662109375, 0.503509521484375, 0.531982421875, 0.560455322265625, 0.58892822265625, 0.617401123046875, 0.6458740234375, 0.674346923828125, 0.70281982421875, 0.731292724609375, 0.759765625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 3.0, 5.0, 22.0, 52.0, 94.0, 198.0, 261.0, 182.0, 97.0, 45.0, 10.0, 7.0, 11.0, 3.0, 4.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.044780731201172, -6.756098747253418, -6.467416763305664, -6.17873477935791, -5.890052795410156, -5.601370811462402, -5.312688827514648, -5.0240068435668945, -4.735324859619141, -4.446642875671387, -4.157960891723633, -3.869278907775879, -3.580596923828125, -3.291914939880371, -3.0032331943511963, -2.7145512104034424, -2.4258694648742676, -2.1371874809265137, -1.8485054969787598, -1.5598236322402954, -1.2711416482925415, -0.9824596643447876, -0.6937777996063232, -0.40509581565856934, -0.11641383171081543, 0.1722681224346161, 0.4609500765800476, 0.7496320009231567, 1.0383139848709106, 1.3269959688186646, 1.615677833557129, 1.9043598175048828, 2.1930418014526367, 2.4817237854003906, 2.7704057693481445, 3.0590877532958984, 3.3477697372436523, 3.6364517211914062, 3.925133466720581, 4.213815689086914, 4.502497673034668, 4.791179656982422, 5.079861640930176, 5.36854362487793, 5.657225608825684, 5.9459075927734375, 6.234589576721191, 6.523271560668945, 6.811953067779541, 7.100635051727295, 7.389317035675049, 7.677999019622803, 7.966681003570557, 8.255362510681152, 8.544044494628906, 8.83272647857666, 9.121408462524414, 9.410090446472168, 9.698772430419922, 9.987454414367676, 10.27613639831543, 10.564818382263184, 10.853500366210938, 11.142182350158691, 11.430864334106445]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 4.0, 4.0, 0.0, 2.0, 7.0, 5.0, 5.0, 10.0, 11.0, 16.0, 11.0, 18.0, 25.0, 24.0, 27.0, 27.0, 23.0, 32.0, 34.0, 34.0, 40.0, 41.0, 59.0, 46.0, 34.0, 30.0, 51.0, 43.0, 46.0, 36.0, 40.0, 26.0, 20.0, 24.0, 25.0, 20.0, 16.0, 16.0, 10.0, 11.0, 5.0, 8.0, 8.0, 9.0, 6.0, 8.0, 2.0, 4.0, 0.0, 4.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.004866361618042, -2.917200803756714, -2.8295350074768066, -2.7418694496154785, -2.6542038917541504, -2.566538095474243, -2.478872537612915, -2.391206741333008, -2.3035411834716797, -2.2158756256103516, -2.1282098293304443, -2.040544271469116, -1.9528785943984985, -1.8652129173278809, -1.7775473594665527, -1.689881682395935, -1.6022160053253174, -1.5145503282546997, -1.426884651184082, -1.339219093322754, -1.2515534162521362, -1.1638877391815186, -1.0762221813201904, -0.9885565042495728, -0.9008908271789551, -0.8132251501083374, -0.7255595326423645, -0.6378939151763916, -0.5502282381057739, -0.46256259083747864, -0.37489694356918335, -0.28723132610321045, -0.19956541061401367, -0.11189976334571838, -0.024234116077423096, 0.06343153119087219, 0.15109717845916748, 0.23876282572746277, 0.32642847299575806, 0.41409409046173096, 0.5017597675323486, 0.5894254446029663, 0.6770910620689392, 0.7647566795349121, 0.8524223566055298, 0.9400880336761475, 1.0277535915374756, 1.1154192686080933, 1.203084945678711, 1.2907506227493286, 1.3784162998199463, 1.4660818576812744, 1.553747534751892, 1.6414132118225098, 1.729078769683838, 1.8167444467544556, 1.9044101238250732, 1.992075800895691, 2.0797414779663086, 2.1674070358276367, 2.255072593688965, 2.342738389968872, 2.4304039478302, 2.5180697441101074, 2.6057353019714355]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 2.0, 5.0, 9.0, 19.0, 10.0, 23.0, 25.0, 62.0, 114.0, 173.0, 337.0, 595.0, 1080.0, 2300.0, 5124.0, 12856.0, 40604.0, 178505.0, 533546.0, 203795.0, 45007.0, 13837.0, 5421.0, 2472.0, 1227.0, 598.0, 349.0, 198.0, 108.0, 59.0, 39.0, 29.0, 11.0, 9.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.426513671875, -0.4134063720703125, -0.400299072265625, -0.3871917724609375, -0.37408447265625, -0.3609771728515625, -0.347869873046875, -0.3347625732421875, -0.3216552734375, -0.3085479736328125, -0.295440673828125, -0.2823333740234375, -0.26922607421875, -0.2561187744140625, -0.243011474609375, -0.2299041748046875, -0.216796875, -0.2036895751953125, -0.190582275390625, -0.1774749755859375, -0.16436767578125, -0.1512603759765625, -0.138153076171875, -0.1250457763671875, -0.1119384765625, -0.0988311767578125, -0.085723876953125, -0.0726165771484375, -0.05950927734375, -0.0464019775390625, -0.033294677734375, -0.0201873779296875, -0.007080078125, 0.0060272216796875, 0.019134521484375, 0.0322418212890625, 0.04534912109375, 0.0584564208984375, 0.071563720703125, 0.0846710205078125, 0.0977783203125, 0.1108856201171875, 0.123992919921875, 0.1371002197265625, 0.15020751953125, 0.1633148193359375, 0.176422119140625, 0.1895294189453125, 0.20263671875, 0.2157440185546875, 0.228851318359375, 0.2419586181640625, 0.25506591796875, 0.2681732177734375, 0.281280517578125, 0.2943878173828125, 0.3074951171875, 0.3206024169921875, 0.333709716796875, 0.3468170166015625, 0.35992431640625, 0.3730316162109375, 0.386138916015625, 0.3992462158203125, 0.412353515625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 6.0, 3.0, 4.0, 1.0, 5.0, 10.0, 17.0, 11.0, 13.0, 21.0, 19.0, 24.0, 30.0, 36.0, 37.0, 48.0, 36.0, 40.0, 44.0, 56.0, 63.0, 76.0, 56.0, 45.0, 51.0, 50.0, 34.0, 27.0, 33.0, 25.0, 15.0, 13.0, 15.0, 8.0, 7.0, 8.0, 7.0, 2.0, 5.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2406005859375, -0.2329082489013672, -0.22521591186523438, -0.21752357482910156, -0.20983123779296875, -0.20213890075683594, -0.19444656372070312, -0.1867542266845703, -0.1790618896484375, -0.1713695526123047, -0.16367721557617188, -0.15598487854003906, -0.14829254150390625, -0.14060020446777344, -0.13290786743164062, -0.1252155303955078, -0.117523193359375, -0.10983085632324219, -0.10213851928710938, -0.09444618225097656, -0.08675384521484375, -0.07906150817871094, -0.07136917114257812, -0.06367683410644531, -0.0559844970703125, -0.04829216003417969, -0.040599822998046875, -0.03290748596191406, -0.02521514892578125, -0.017522811889648438, -0.009830474853515625, -0.0021381378173828125, 0.00555419921875, 0.013246536254882812, 0.020938873291015625, 0.028631210327148438, 0.03632354736328125, 0.04401588439941406, 0.051708221435546875, 0.05940055847167969, 0.0670928955078125, 0.07478523254394531, 0.08247756958007812, 0.09016990661621094, 0.09786224365234375, 0.10555458068847656, 0.11324691772460938, 0.12093925476074219, 0.128631591796875, 0.1363239288330078, 0.14401626586914062, 0.15170860290527344, 0.15940093994140625, 0.16709327697753906, 0.17478561401367188, 0.1824779510498047, 0.1901702880859375, 0.1978626251220703, 0.20555496215820312, 0.21324729919433594, 0.22093963623046875, 0.22863197326660156, 0.23632431030273438, 0.2440166473388672, 0.251708984375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 5.0, 9.0, 12.0, 21.0, 48.0, 80.0, 141.0, 316.0, 725.0, 2360.0, 11407.0, 169838.0, 819233.0, 37302.0, 4796.0, 1331.0, 473.0, 223.0, 104.0, 49.0, 27.0, 22.0, 15.0, 8.0, 4.0, 2.0, 5.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.046875, -1.017181396484375, -0.98748779296875, -0.957794189453125, -0.9281005859375, -0.898406982421875, -0.86871337890625, -0.839019775390625, -0.809326171875, -0.779632568359375, -0.74993896484375, -0.720245361328125, -0.6905517578125, -0.660858154296875, -0.63116455078125, -0.601470947265625, -0.57177734375, -0.542083740234375, -0.51239013671875, -0.482696533203125, -0.4530029296875, -0.423309326171875, -0.39361572265625, -0.363922119140625, -0.334228515625, -0.304534912109375, -0.27484130859375, -0.245147705078125, -0.2154541015625, -0.185760498046875, -0.15606689453125, -0.126373291015625, -0.0966796875, -0.066986083984375, -0.03729248046875, -0.007598876953125, 0.0220947265625, 0.051788330078125, 0.08148193359375, 0.111175537109375, 0.140869140625, 0.170562744140625, 0.20025634765625, 0.229949951171875, 0.2596435546875, 0.289337158203125, 0.31903076171875, 0.348724365234375, 0.37841796875, 0.408111572265625, 0.43780517578125, 0.467498779296875, 0.4971923828125, 0.526885986328125, 0.55657958984375, 0.586273193359375, 0.615966796875, 0.645660400390625, 0.67535400390625, 0.705047607421875, 0.7347412109375, 0.764434814453125, 0.79412841796875, 0.823822021484375, 0.853515625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 4.0, 1.0, 4.0, 4.0, 7.0, 2.0, 3.0, 13.0, 12.0, 16.0, 25.0, 25.0, 22.0, 28.0, 36.0, 42.0, 53.0, 48.0, 52.0, 51.0, 62.0, 73.0, 57.0, 61.0, 36.0, 40.0, 42.0, 32.0, 33.0, 28.0, 21.0, 19.0, 11.0, 12.0, 8.0, 7.0, 6.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.1220703125, -1.0915908813476562, -1.0611114501953125, -1.0306320190429688, -1.000152587890625, -0.9696731567382812, -0.9391937255859375, -0.9087142944335938, -0.87823486328125, -0.8477554321289062, -0.8172760009765625, -0.7867965698242188, -0.756317138671875, -0.7258377075195312, -0.6953582763671875, -0.6648788452148438, -0.6343994140625, -0.6039199829101562, -0.5734405517578125, -0.5429611206054688, -0.512481689453125, -0.48200225830078125, -0.4515228271484375, -0.42104339599609375, -0.39056396484375, -0.36008453369140625, -0.3296051025390625, -0.29912567138671875, -0.268646240234375, -0.23816680908203125, -0.2076873779296875, -0.17720794677734375, -0.146728515625, -0.11624908447265625, -0.0857696533203125, -0.05529022216796875, -0.024810791015625, 0.00566864013671875, 0.0361480712890625, 0.06662750244140625, 0.09710693359375, 0.12758636474609375, 0.1580657958984375, 0.18854522705078125, 0.219024658203125, 0.24950408935546875, 0.2799835205078125, 0.31046295166015625, 0.3409423828125, 0.37142181396484375, 0.4019012451171875, 0.43238067626953125, 0.462860107421875, 0.49333953857421875, 0.5238189697265625, 0.5542984008789062, 0.58477783203125, 0.6152572631835938, 0.6457366943359375, 0.6762161254882812, 0.706695556640625, 0.7371749877929688, 0.7676544189453125, 0.7981338500976562, 0.82861328125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 5.0, 7.0, 5.0, 12.0, 11.0, 34.0, 44.0, 73.0, 130.0, 247.0, 514.0, 1238.0, 3465.0, 11597.0, 52834.0, 424966.0, 482539.0, 53294.0, 11757.0, 3407.0, 1305.0, 514.0, 243.0, 136.0, 69.0, 37.0, 25.0, 17.0, 8.0, 6.0, 7.0, 2.0, 6.0, 3.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.301513671875, -0.2923774719238281, -0.28324127197265625, -0.2741050720214844, -0.2649688720703125, -0.2558326721191406, -0.24669647216796875, -0.23756027221679688, -0.228424072265625, -0.21928787231445312, -0.21015167236328125, -0.20101547241210938, -0.1918792724609375, -0.18274307250976562, -0.17360687255859375, -0.16447067260742188, -0.15533447265625, -0.14619827270507812, -0.13706207275390625, -0.12792587280273438, -0.1187896728515625, -0.10965347290039062, -0.10051727294921875, -0.09138107299804688, -0.082244873046875, -0.07310867309570312, -0.06397247314453125, -0.054836273193359375, -0.0457000732421875, -0.036563873291015625, -0.02742767333984375, -0.018291473388671875, -0.0091552734375, -1.9073486328125e-05, 0.00911712646484375, 0.018253326416015625, 0.0273895263671875, 0.036525726318359375, 0.04566192626953125, 0.054798126220703125, 0.063934326171875, 0.07307052612304688, 0.08220672607421875, 0.09134292602539062, 0.1004791259765625, 0.10961532592773438, 0.11875152587890625, 0.12788772583007812, 0.13702392578125, 0.14616012573242188, 0.15529632568359375, 0.16443252563476562, 0.1735687255859375, 0.18270492553710938, 0.19184112548828125, 0.20097732543945312, 0.210113525390625, 0.21924972534179688, 0.22838592529296875, 0.23752212524414062, 0.2466583251953125, 0.2557945251464844, 0.26493072509765625, 0.2740669250488281, 0.283203125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 5.0, 4.0, 1.0, 5.0, 6.0, 4.0, 3.0, 14.0, 7.0, 11.0, 22.0, 25.0, 29.0, 50.0, 62.0, 77.0, 92.0, 86.0, 110.0, 76.0, 80.0, 52.0, 40.0, 33.0, 17.0, 17.0, 15.0, 18.0, 13.0, 8.0, 6.0, 2.0, 6.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.112192153930664e-05, -7.88029283285141e-05, -7.648393511772156e-05, -7.416494190692902e-05, -7.184594869613647e-05, -6.952695548534393e-05, -6.720796227455139e-05, -6.488896906375885e-05, -6.256997585296631e-05, -6.025098264217377e-05, -5.7931989431381226e-05, -5.5612996220588684e-05, -5.329400300979614e-05, -5.09750097990036e-05, -4.865601658821106e-05, -4.633702337741852e-05, -4.4018030166625977e-05, -4.1699036955833435e-05, -3.9380043745040894e-05, -3.706105053424835e-05, -3.474205732345581e-05, -3.242306411266327e-05, -3.0104070901870728e-05, -2.7785077691078186e-05, -2.5466084480285645e-05, -2.3147091269493103e-05, -2.082809805870056e-05, -1.850910484790802e-05, -1.619011163711548e-05, -1.3871118426322937e-05, -1.1552125215530396e-05, -9.233132004737854e-06, -6.9141387939453125e-06, -4.595145583152771e-06, -2.2761523723602295e-06, 4.284083843231201e-08, 2.3618340492248535e-06, 4.680827260017395e-06, 6.9998204708099365e-06, 9.318813681602478e-06, 1.163780689239502e-05, 1.3956800103187561e-05, 1.6275793313980103e-05, 1.8594786524772644e-05, 2.0913779735565186e-05, 2.3232772946357727e-05, 2.555176615715027e-05, 2.787075936794281e-05, 3.018975257873535e-05, 3.250874578952789e-05, 3.4827739000320435e-05, 3.7146732211112976e-05, 3.946572542190552e-05, 4.178471863269806e-05, 4.41037118434906e-05, 4.642270505428314e-05, 4.8741698265075684e-05, 5.1060691475868225e-05, 5.3379684686660767e-05, 5.569867789745331e-05, 5.801767110824585e-05, 6.033666431903839e-05, 6.265565752983093e-05, 6.497465074062347e-05, 6.729364395141602e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 6.0, 9.0, 10.0, 12.0, 38.0, 100.0, 257.0, 1092.0, 8605.0, 335008.0, 689936.0, 11670.0, 1307.0, 319.0, 113.0, 37.0, 26.0, 6.0, 9.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0712890625, -1.04852294921875, -1.0257568359375, -1.00299072265625, -0.980224609375, -0.95745849609375, -0.9346923828125, -0.91192626953125, -0.88916015625, -0.86639404296875, -0.8436279296875, -0.82086181640625, -0.798095703125, -0.77532958984375, -0.7525634765625, -0.72979736328125, -0.70703125, -0.68426513671875, -0.6614990234375, -0.63873291015625, -0.615966796875, -0.59320068359375, -0.5704345703125, -0.54766845703125, -0.52490234375, -0.50213623046875, -0.4793701171875, -0.45660400390625, -0.433837890625, -0.41107177734375, -0.3883056640625, -0.36553955078125, -0.3427734375, -0.32000732421875, -0.2972412109375, -0.27447509765625, -0.251708984375, -0.22894287109375, -0.2061767578125, -0.18341064453125, -0.16064453125, -0.13787841796875, -0.1151123046875, -0.09234619140625, -0.069580078125, -0.04681396484375, -0.0240478515625, -0.00128173828125, 0.021484375, 0.04425048828125, 0.0670166015625, 0.08978271484375, 0.112548828125, 0.13531494140625, 0.1580810546875, 0.18084716796875, 0.20361328125, 0.22637939453125, 0.2491455078125, 0.27191162109375, 0.294677734375, 0.31744384765625, 0.3402099609375, 0.36297607421875, 0.3857421875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 8.0, 12.0, 25.0, 30.0, 51.0, 67.0, 94.0, 118.0, 154.0, 117.0, 92.0, 65.0, 47.0, 35.0, 33.0, 25.0, 12.0, 6.0, 0.0, 7.0, 4.0, 4.0, 2.0], "bins": [-0.52392578125, -0.5133724212646484, -0.5028190612792969, -0.4922657012939453, -0.48171234130859375, -0.4711589813232422, -0.4606056213378906, -0.45005226135253906, -0.4394989013671875, -0.42894554138183594, -0.4183921813964844, -0.4078388214111328, -0.39728546142578125, -0.3867321014404297, -0.3761787414550781, -0.36562538146972656, -0.355072021484375, -0.34451866149902344, -0.3339653015136719, -0.3234119415283203, -0.31285858154296875, -0.3023052215576172, -0.2917518615722656, -0.28119850158691406, -0.2706451416015625, -0.26009178161621094, -0.24953842163085938, -0.2389850616455078, -0.22843170166015625, -0.2178783416748047, -0.20732498168945312, -0.19677162170410156, -0.18621826171875, -0.17566490173339844, -0.16511154174804688, -0.1545581817626953, -0.14400482177734375, -0.1334514617919922, -0.12289810180664062, -0.11234474182128906, -0.1017913818359375, -0.09123802185058594, -0.08068466186523438, -0.07013130187988281, -0.05957794189453125, -0.04902458190917969, -0.038471221923828125, -0.027917861938476562, -0.017364501953125, -0.0068111419677734375, 0.003742218017578125, 0.014295578002929688, 0.02484893798828125, 0.03540229797363281, 0.045955657958984375, 0.05650901794433594, 0.0670623779296875, 0.07761573791503906, 0.08816909790039062, 0.09872245788574219, 0.10927581787109375, 0.11982917785644531, 0.13038253784179688, 0.14093589782714844, 0.1514892578125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 5.0, 3.0, 0.0, 2.0, 9.0, 15.0, 23.0, 45.0, 101.0, 178.0, 318.0, 151.0, 98.0, 37.0, 10.0, 8.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6705245971679688, -2.469987154006958, -2.269449472427368, -2.0689120292663574, -1.8683744668960571, -1.6678369045257568, -1.467299461364746, -1.2667618989944458, -1.0662243366241455, -0.8656867742538452, -0.6651492714881897, -0.4646117687225342, -0.2640742063522339, -0.0635366439819336, 0.13700079917907715, 0.33753836154937744, 0.5380759239196777, 0.738613486289978, 0.9391509890556335, 1.139688491821289, 1.3402260541915894, 1.5407636165618896, 1.7413010597229004, 1.9418386220932007, 2.142376184463501, 2.3429136276245117, 2.5434513092041016, 2.7439887523651123, 2.944526195526123, 3.145063877105713, 3.3456013202667236, 3.5461387634277344, 3.746676445007324, 3.947213888168335, 4.147751331329346, 4.3482890129089355, 4.548826694488525, 4.749363899230957, 4.949901580810547, 5.150439262390137, 5.350976943969727, 5.551514625549316, 5.752051830291748, 5.952589511871338, 6.153127193450928, 6.353664398193359, 6.554202079772949, 6.754739761352539, 6.955276966094971, 7.1558146476745605, 7.356351852416992, 7.556889533996582, 7.757427215576172, 7.957964897155762, 8.158502578735352, 8.359039306640625, 8.559576988220215, 8.760114669799805, 8.960652351379395, 9.161190032958984, 9.361726760864258, 9.562264442443848, 9.762802124023438, 9.963339805603027, 10.163877487182617]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 3.0, 3.0, 6.0, 6.0, 8.0, 10.0, 5.0, 11.0, 6.0, 22.0, 16.0, 12.0, 15.0, 12.0, 16.0, 30.0, 39.0, 29.0, 40.0, 62.0, 61.0, 59.0, 64.0, 68.0, 52.0, 45.0, 39.0, 22.0, 35.0, 22.0, 16.0, 26.0, 17.0, 18.0, 18.0, 15.0, 15.0, 7.0, 16.0, 10.0, 7.0, 6.0, 4.0, 4.0, 4.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.089521884918213, -2.991194248199463, -2.892866611480713, -2.794538974761963, -2.696211099624634, -2.597883462905884, -2.499555826187134, -2.401228189468384, -2.3029003143310547, -2.2045726776123047, -2.1062450408935547, -2.0079174041748047, -1.9095895290374756, -1.8112618923187256, -1.7129342555999756, -1.6146066188812256, -1.5162789821624756, -1.4179513454437256, -1.319623589515686, -1.221295952796936, -1.1229681968688965, -1.0246405601501465, -0.9263129234313965, -0.8279852271080017, -0.7296575307846069, -0.6313298344612122, -0.5330021381378174, -0.4346745014190674, -0.3363468050956726, -0.23801910877227783, -0.13969147205352783, -0.04136377573013306, 0.05696392059326172, 0.1552916020154953, 0.2536192834377289, 0.35194694995880127, 0.45027464628219604, 0.5486023426055908, 0.6469299793243408, 0.7452576756477356, 0.8435853719711304, 0.9419130682945251, 1.04024076461792, 1.13856840133667, 1.23689603805542, 1.3352237939834595, 1.4335514307022095, 1.531879186630249, 1.630206823348999, 1.728534460067749, 1.8268622159957886, 1.9251898527145386, 2.023517608642578, 2.121845245361328, 2.220172882080078, 2.318500518798828, 2.416828155517578, 2.515155792236328, 2.613483428955078, 2.711811065673828, 2.8101389408111572, 2.9084665775299072, 3.0067942142486572, 3.1051218509674072, 3.2034497261047363]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 5.0, 6.0, 14.0, 18.0, 22.0, 39.0, 70.0, 94.0, 158.0, 272.0, 453.0, 937.0, 2060.0, 5025.0, 15836.0, 89592.0, 2605879.0, 1391981.0, 61222.0, 12782.0, 4265.0, 1723.0, 825.0, 367.0, 255.0, 146.0, 96.0, 46.0, 35.0, 22.0, 12.0, 9.0, 8.0, 4.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.68701171875, -0.6693572998046875, -0.651702880859375, -0.6340484619140625, -0.61639404296875, -0.5987396240234375, -0.581085205078125, -0.5634307861328125, -0.5457763671875, -0.5281219482421875, -0.510467529296875, -0.4928131103515625, -0.47515869140625, -0.4575042724609375, -0.439849853515625, -0.4221954345703125, -0.404541015625, -0.3868865966796875, -0.369232177734375, -0.3515777587890625, -0.33392333984375, -0.3162689208984375, -0.298614501953125, -0.2809600830078125, -0.2633056640625, -0.2456512451171875, -0.227996826171875, -0.2103424072265625, -0.19268798828125, -0.1750335693359375, -0.157379150390625, -0.1397247314453125, -0.1220703125, -0.1044158935546875, -0.086761474609375, -0.0691070556640625, -0.05145263671875, -0.0337982177734375, -0.016143798828125, 0.0015106201171875, 0.0191650390625, 0.0368194580078125, 0.054473876953125, 0.0721282958984375, 0.08978271484375, 0.1074371337890625, 0.125091552734375, 0.1427459716796875, 0.160400390625, 0.1780548095703125, 0.195709228515625, 0.2133636474609375, 0.23101806640625, 0.2486724853515625, 0.266326904296875, 0.2839813232421875, 0.3016357421875, 0.3192901611328125, 0.336944580078125, 0.3545989990234375, 0.37225341796875, 0.3899078369140625, 0.407562255859375, 0.4252166748046875, 0.44287109375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 0.0, 9.0, 5.0, 7.0, 9.0, 23.0, 15.0, 18.0, 31.0, 32.0, 38.0, 35.0, 38.0, 35.0, 45.0, 49.0, 56.0, 56.0, 41.0, 48.0, 67.0, 70.0, 47.0, 41.0, 40.0, 29.0, 22.0, 20.0, 18.0, 12.0, 16.0, 7.0, 5.0, 10.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2247314453125, -0.2176380157470703, -0.21054458618164062, -0.20345115661621094, -0.19635772705078125, -0.18926429748535156, -0.18217086791992188, -0.1750774383544922, -0.1679840087890625, -0.1608905792236328, -0.15379714965820312, -0.14670372009277344, -0.13961029052734375, -0.13251686096191406, -0.12542343139648438, -0.11833000183105469, -0.111236572265625, -0.10414314270019531, -0.09704971313476562, -0.08995628356933594, -0.08286285400390625, -0.07576942443847656, -0.06867599487304688, -0.06158256530761719, -0.0544891357421875, -0.04739570617675781, -0.040302276611328125, -0.03320884704589844, -0.02611541748046875, -0.019021987915039062, -0.011928558349609375, -0.0048351287841796875, 0.00225830078125, 0.009351730346679688, 0.016445159912109375, 0.023538589477539062, 0.03063201904296875, 0.03772544860839844, 0.044818878173828125, 0.05191230773925781, 0.0590057373046875, 0.06609916687011719, 0.07319259643554688, 0.08028602600097656, 0.08737945556640625, 0.09447288513183594, 0.10156631469726562, 0.10865974426269531, 0.115753173828125, 0.12284660339355469, 0.12994003295898438, 0.13703346252441406, 0.14412689208984375, 0.15122032165527344, 0.15831375122070312, 0.1654071807861328, 0.1725006103515625, 0.1795940399169922, 0.18668746948242188, 0.19378089904785156, 0.20087432861328125, 0.20796775817871094, 0.21506118774414062, 0.2221546173095703, 0.229248046875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 7.0, 5.0, 5.0, 14.0, 16.0, 24.0, 30.0, 55.0, 73.0, 114.0, 184.0, 339.0, 617.0, 1250.0, 2951.0, 9668.0, 49829.0, 1488156.0, 2561913.0, 61725.0, 11316.0, 3279.0, 1257.0, 644.0, 311.0, 199.0, 94.0, 80.0, 45.0, 30.0, 16.0, 14.0, 6.0, 3.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.99609375, -0.9676742553710938, -0.9392547607421875, -0.9108352661132812, -0.882415771484375, -0.8539962768554688, -0.8255767822265625, -0.7971572875976562, -0.76873779296875, -0.7403182983398438, -0.7118988037109375, -0.6834793090820312, -0.655059814453125, -0.6266403198242188, -0.5982208251953125, -0.5698013305664062, -0.5413818359375, -0.5129623413085938, -0.4845428466796875, -0.45612335205078125, -0.427703857421875, -0.39928436279296875, -0.3708648681640625, -0.34244537353515625, -0.31402587890625, -0.28560638427734375, -0.2571868896484375, -0.22876739501953125, -0.200347900390625, -0.17192840576171875, -0.1435089111328125, -0.11508941650390625, -0.086669921875, -0.05825042724609375, -0.0298309326171875, -0.00141143798828125, 0.027008056640625, 0.05542755126953125, 0.0838470458984375, 0.11226654052734375, 0.14068603515625, 0.16910552978515625, 0.1975250244140625, 0.22594451904296875, 0.254364013671875, 0.28278350830078125, 0.3112030029296875, 0.33962249755859375, 0.3680419921875, 0.39646148681640625, 0.4248809814453125, 0.45330047607421875, 0.481719970703125, 0.5101394653320312, 0.5385589599609375, 0.5669784545898438, 0.59539794921875, 0.6238174438476562, 0.6522369384765625, 0.6806564331054688, 0.709075927734375, 0.7374954223632812, 0.7659149169921875, 0.7943344116210938, 0.82275390625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 7.0, 9.0, 9.0, 16.0, 14.0, 27.0, 36.0, 63.0, 109.0, 185.0, 482.0, 1192.0, 1013.0, 445.0, 174.0, 102.0, 60.0, 45.0, 28.0, 21.0, 17.0, 5.0, 7.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.96533203125, -0.9376983642578125, -0.910064697265625, -0.8824310302734375, -0.85479736328125, -0.8271636962890625, -0.799530029296875, -0.7718963623046875, -0.7442626953125, -0.7166290283203125, -0.688995361328125, -0.6613616943359375, -0.63372802734375, -0.6060943603515625, -0.578460693359375, -0.5508270263671875, -0.523193359375, -0.4955596923828125, -0.467926025390625, -0.4402923583984375, -0.41265869140625, -0.3850250244140625, -0.357391357421875, -0.3297576904296875, -0.3021240234375, -0.2744903564453125, -0.246856689453125, -0.2192230224609375, -0.19158935546875, -0.1639556884765625, -0.136322021484375, -0.1086883544921875, -0.0810546875, -0.0534210205078125, -0.025787353515625, 0.0018463134765625, 0.02947998046875, 0.0571136474609375, 0.084747314453125, 0.1123809814453125, 0.1400146484375, 0.1676483154296875, 0.195281982421875, 0.2229156494140625, 0.25054931640625, 0.2781829833984375, 0.305816650390625, 0.3334503173828125, 0.361083984375, 0.3887176513671875, 0.416351318359375, 0.4439849853515625, 0.47161865234375, 0.4992523193359375, 0.526885986328125, 0.5545196533203125, 0.5821533203125, 0.6097869873046875, 0.637420654296875, 0.6650543212890625, 0.69268798828125, 0.7203216552734375, 0.747955322265625, 0.7755889892578125, 0.80322265625]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 5.0, 7.0, 14.0, 19.0, 35.0, 72.0, 95.0, 164.0, 172.0, 147.0, 113.0, 64.0, 38.0, 20.0, 7.0, 14.0, 7.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3345320224761963, -3.163228988647461, -2.9919261932373047, -2.8206231594085693, -2.649320125579834, -2.4780173301696777, -2.3067142963409424, -2.135411262512207, -1.9641084671020508, -1.792805552482605, -1.6215026378631592, -1.4501996040344238, -1.278896689414978, -1.1075937747955322, -0.9362907409667969, -0.7649878263473511, -0.5936849117279053, -0.4223819673061371, -0.2510790228843689, -0.07977604866027832, 0.09152686595916748, 0.2628297805786133, 0.43413281440734863, 0.6054357290267944, 0.7767386436462402, 0.948041558265686, 1.1193444728851318, 1.2906475067138672, 1.461950421333313, 1.6332533359527588, 1.8045563697814941, 1.97585928440094, 2.147162437438965, 2.3184654712677, 2.4897682666778564, 2.661071300506592, 2.832374095916748, 3.0036771297454834, 3.1749801635742188, 3.346282958984375, 3.5175859928131104, 3.6888890266418457, 3.860191822052002, 4.031495094299316, 4.202797889709473, 4.374100685119629, 4.545403480529785, 4.7167067527771, 4.888009548187256, 5.059312343597412, 5.230615615844727, 5.401918411254883, 5.573221206665039, 5.744524002075195, 5.91582727432251, 6.087130069732666, 6.2584333419799805, 6.429736137390137, 6.601039409637451, 6.772342205047607, 6.943645000457764, 7.114948272705078, 7.286251068115234, 7.457553863525391, 7.628856658935547]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 3.0, 7.0, 5.0, 8.0, 6.0, 13.0, 13.0, 10.0, 13.0, 18.0, 21.0, 28.0, 30.0, 21.0, 31.0, 38.0, 31.0, 41.0, 43.0, 48.0, 40.0, 41.0, 42.0, 45.0, 49.0, 34.0, 27.0, 46.0, 29.0, 32.0, 20.0, 18.0, 28.0, 15.0, 19.0, 18.0, 8.0, 13.0, 5.0, 10.0, 12.0, 4.0, 6.0, 4.0, 7.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.317715644836426, -2.250880718231201, -2.1840457916259766, -2.117211103439331, -2.0503761768341064, -1.9835412502288818, -1.9167064428329468, -1.8498716354370117, -1.783036708831787, -1.7162017822265625, -1.6493669748306274, -1.5825321674346924, -1.5156972408294678, -1.4488623142242432, -1.382027506828308, -1.315192699432373, -1.2483577728271484, -1.1815228462219238, -1.1146880388259888, -1.0478532314300537, -0.9810183048248291, -0.9141834378242493, -0.8473485708236694, -0.7805137038230896, -0.7136788368225098, -0.6468439698219299, -0.5800091028213501, -0.5131742358207703, -0.44633936882019043, -0.3795045018196106, -0.31266963481903076, -0.24583476781845093, -0.17900002002716064, -0.11216515302658081, -0.04533028602600098, 0.021504580974578857, 0.08833944797515869, 0.15517431497573853, 0.22200918197631836, 0.2888440489768982, 0.355678915977478, 0.42251378297805786, 0.4893486499786377, 0.5561835169792175, 0.6230183839797974, 0.6898532509803772, 0.756688117980957, 0.8235229849815369, 0.8903578519821167, 0.9571927189826965, 1.0240275859832764, 1.090862512588501, 1.157697319984436, 1.224532127380371, 1.2913670539855957, 1.3582019805908203, 1.4250367879867554, 1.4918715953826904, 1.558706521987915, 1.6255414485931396, 1.6923762559890747, 1.7592110633850098, 1.8260459899902344, 1.892880916595459, 1.959715723991394]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 8.0, 5.0, 7.0, 9.0, 22.0, 22.0, 32.0, 55.0, 91.0, 140.0, 194.0, 336.0, 488.0, 856.0, 1536.0, 2921.0, 6279.0, 15206.0, 47434.0, 209021.0, 537555.0, 162635.0, 38834.0, 13065.0, 5583.0, 2686.0, 1396.0, 812.0, 471.0, 319.0, 212.0, 130.0, 69.0, 47.0, 29.0, 17.0, 14.0, 12.0, 7.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.385986328125, -0.37329864501953125, -0.3606109619140625, -0.34792327880859375, -0.335235595703125, -0.32254791259765625, -0.3098602294921875, -0.29717254638671875, -0.28448486328125, -0.27179718017578125, -0.2591094970703125, -0.24642181396484375, -0.233734130859375, -0.22104644775390625, -0.2083587646484375, -0.19567108154296875, -0.1829833984375, -0.17029571533203125, -0.1576080322265625, -0.14492034912109375, -0.132232666015625, -0.11954498291015625, -0.1068572998046875, -0.09416961669921875, -0.08148193359375, -0.06879425048828125, -0.0561065673828125, -0.04341888427734375, -0.030731201171875, -0.01804351806640625, -0.0053558349609375, 0.00733184814453125, 0.02001953125, 0.03270721435546875, 0.0453948974609375, 0.05808258056640625, 0.070770263671875, 0.08345794677734375, 0.0961456298828125, 0.10883331298828125, 0.12152099609375, 0.13420867919921875, 0.1468963623046875, 0.15958404541015625, 0.172271728515625, 0.18495941162109375, 0.1976470947265625, 0.21033477783203125, 0.2230224609375, 0.23571014404296875, 0.2483978271484375, 0.26108551025390625, 0.273773193359375, 0.28646087646484375, 0.2991485595703125, 0.31183624267578125, 0.32452392578125, 0.33721160888671875, 0.3498992919921875, 0.36258697509765625, 0.375274658203125, 0.38796234130859375, 0.4006500244140625, 0.41333770751953125, 0.426025390625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 6.0, 2.0, 2.0, 12.0, 11.0, 10.0, 13.0, 14.0, 20.0, 26.0, 26.0, 28.0, 42.0, 40.0, 37.0, 51.0, 39.0, 46.0, 55.0, 60.0, 52.0, 60.0, 35.0, 49.0, 33.0, 44.0, 39.0, 30.0, 21.0, 21.0, 15.0, 15.0, 12.0, 11.0, 5.0, 6.0, 8.0, 2.0, 5.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2098388671875, -0.2024402618408203, -0.19504165649414062, -0.18764305114746094, -0.18024444580078125, -0.17284584045410156, -0.16544723510742188, -0.1580486297607422, -0.1506500244140625, -0.1432514190673828, -0.13585281372070312, -0.12845420837402344, -0.12105560302734375, -0.11365699768066406, -0.10625839233398438, -0.09885978698730469, -0.091461181640625, -0.08406257629394531, -0.07666397094726562, -0.06926536560058594, -0.06186676025390625, -0.05446815490722656, -0.047069549560546875, -0.03967094421386719, -0.0322723388671875, -0.024873733520507812, -0.017475128173828125, -0.010076522827148438, -0.00267791748046875, 0.0047206878662109375, 0.012119293212890625, 0.019517898559570312, 0.02691650390625, 0.03431510925292969, 0.041713714599609375, 0.04911231994628906, 0.05651092529296875, 0.06390953063964844, 0.07130813598632812, 0.07870674133300781, 0.0861053466796875, 0.09350395202636719, 0.10090255737304688, 0.10830116271972656, 0.11569976806640625, 0.12309837341308594, 0.13049697875976562, 0.1378955841064453, 0.145294189453125, 0.1526927947998047, 0.16009140014648438, 0.16749000549316406, 0.17488861083984375, 0.18228721618652344, 0.18968582153320312, 0.1970844268798828, 0.2044830322265625, 0.2118816375732422, 0.21928024291992188, 0.22667884826660156, 0.23407745361328125, 0.24147605895996094, 0.24887466430664062, 0.2562732696533203, 0.263671875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 3.0, 11.0, 8.0, 15.0, 25.0, 23.0, 39.0, 54.0, 69.0, 107.0, 196.0, 307.0, 486.0, 945.0, 1959.0, 4911.0, 17334.0, 110206.0, 770731.0, 113931.0, 17967.0, 4965.0, 1952.0, 897.0, 509.0, 299.0, 189.0, 133.0, 91.0, 58.0, 42.0, 23.0, 15.0, 16.0, 10.0, 10.0, 4.0, 3.0, 3.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.62841796875, -0.6102066040039062, -0.5919952392578125, -0.5737838745117188, -0.555572509765625, -0.5373611450195312, -0.5191497802734375, -0.5009384155273438, -0.48272705078125, -0.46451568603515625, -0.4463043212890625, -0.42809295654296875, -0.409881591796875, -0.39167022705078125, -0.3734588623046875, -0.35524749755859375, -0.3370361328125, -0.31882476806640625, -0.3006134033203125, -0.28240203857421875, -0.264190673828125, -0.24597930908203125, -0.2277679443359375, -0.20955657958984375, -0.19134521484375, -0.17313385009765625, -0.1549224853515625, -0.13671112060546875, -0.118499755859375, -0.10028839111328125, -0.0820770263671875, -0.06386566162109375, -0.045654296875, -0.02744293212890625, -0.0092315673828125, 0.00897979736328125, 0.027191162109375, 0.04540252685546875, 0.0636138916015625, 0.08182525634765625, 0.10003662109375, 0.11824798583984375, 0.1364593505859375, 0.15467071533203125, 0.172882080078125, 0.19109344482421875, 0.2093048095703125, 0.22751617431640625, 0.2457275390625, 0.26393890380859375, 0.2821502685546875, 0.30036163330078125, 0.318572998046875, 0.33678436279296875, 0.3549957275390625, 0.37320709228515625, 0.39141845703125, 0.40962982177734375, 0.4278411865234375, 0.44605255126953125, 0.464263916015625, 0.48247528076171875, 0.5006866455078125, 0.5188980102539062, 0.537109375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 7.0, 4.0, 5.0, 6.0, 13.0, 13.0, 16.0, 21.0, 23.0, 26.0, 37.0, 36.0, 49.0, 49.0, 54.0, 49.0, 52.0, 64.0, 78.0, 54.0, 61.0, 58.0, 42.0, 45.0, 32.0, 18.0, 23.0, 12.0, 18.0, 8.0, 13.0, 6.0, 5.0, 4.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.80810546875, -0.7766189575195312, -0.7451324462890625, -0.7136459350585938, -0.682159423828125, -0.6506729125976562, -0.6191864013671875, -0.5876998901367188, -0.55621337890625, -0.5247268676757812, -0.4932403564453125, -0.46175384521484375, -0.430267333984375, -0.39878082275390625, -0.3672943115234375, -0.33580780029296875, -0.3043212890625, -0.27283477783203125, -0.2413482666015625, -0.20986175537109375, -0.178375244140625, -0.14688873291015625, -0.1154022216796875, -0.08391571044921875, -0.05242919921875, -0.02094268798828125, 0.0105438232421875, 0.04203033447265625, 0.073516845703125, 0.10500335693359375, 0.1364898681640625, 0.16797637939453125, 0.199462890625, 0.23094940185546875, 0.2624359130859375, 0.29392242431640625, 0.325408935546875, 0.35689544677734375, 0.3883819580078125, 0.41986846923828125, 0.45135498046875, 0.48284149169921875, 0.5143280029296875, 0.5458145141601562, 0.577301025390625, 0.6087875366210938, 0.6402740478515625, 0.6717605590820312, 0.7032470703125, 0.7347335815429688, 0.7662200927734375, 0.7977066040039062, 0.829193115234375, 0.8606796264648438, 0.8921661376953125, 0.9236526489257812, 0.95513916015625, 0.9866256713867188, 1.0181121826171875, 1.0495986938476562, 1.081085205078125, 1.1125717163085938, 1.1440582275390625, 1.1755447387695312, 1.20703125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 12.0, 15.0, 14.0, 30.0, 41.0, 74.0, 104.0, 179.0, 244.0, 520.0, 925.0, 1690.0, 3826.0, 10480.0, 39133.0, 264791.0, 644464.0, 58713.0, 13860.0, 4850.0, 2096.0, 1020.0, 585.0, 334.0, 196.0, 106.0, 91.0, 47.0, 31.0, 25.0, 16.0, 13.0, 8.0, 3.0, 0.0, 6.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.255859375, -0.24813461303710938, -0.24040985107421875, -0.23268508911132812, -0.2249603271484375, -0.21723556518554688, -0.20951080322265625, -0.20178604125976562, -0.194061279296875, -0.18633651733398438, -0.17861175537109375, -0.17088699340820312, -0.1631622314453125, -0.15543746948242188, -0.14771270751953125, -0.13998794555664062, -0.13226318359375, -0.12453842163085938, -0.11681365966796875, -0.10908889770507812, -0.1013641357421875, -0.09363937377929688, -0.08591461181640625, -0.07818984985351562, -0.070465087890625, -0.06274032592773438, -0.05501556396484375, -0.047290802001953125, -0.0395660400390625, -0.031841278076171875, -0.02411651611328125, -0.016391754150390625, -0.0086669921875, -0.000942230224609375, 0.00678253173828125, 0.014507293701171875, 0.0222320556640625, 0.029956817626953125, 0.03768157958984375, 0.045406341552734375, 0.053131103515625, 0.060855865478515625, 0.06858062744140625, 0.07630538940429688, 0.0840301513671875, 0.09175491333007812, 0.09947967529296875, 0.10720443725585938, 0.11492919921875, 0.12265396118164062, 0.13037872314453125, 0.13810348510742188, 0.1458282470703125, 0.15355300903320312, 0.16127777099609375, 0.16900253295898438, 0.176727294921875, 0.18445205688476562, 0.19217681884765625, 0.19990158081054688, 0.2076263427734375, 0.21535110473632812, 0.22307586669921875, 0.23080062866210938, 0.238525390625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 3.0, 7.0, 18.0, 19.0, 38.0, 76.0, 134.0, 203.0, 244.0, 128.0, 57.0, 31.0, 23.0, 12.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014257431030273438, -0.0001376532018184662, -0.000132732093334198, -0.0001278109848499298, -0.00012288987636566162, -0.00011796876788139343, -0.00011304765939712524, -0.00010812655091285706, -0.00010320544242858887, -9.828433394432068e-05, -9.336322546005249e-05, -8.84421169757843e-05, -8.352100849151611e-05, -7.859990000724792e-05, -7.367879152297974e-05, -6.875768303871155e-05, -6.383657455444336e-05, -5.891546607017517e-05, -5.399435758590698e-05, -4.9073249101638794e-05, -4.4152140617370605e-05, -3.923103213310242e-05, -3.430992364883423e-05, -2.938881516456604e-05, -2.446770668029785e-05, -1.9546598196029663e-05, -1.4625489711761475e-05, -9.704381227493286e-06, -4.783272743225098e-06, 1.3783574104309082e-07, 5.058944225311279e-06, 9.980052709579468e-06, 1.4901161193847656e-05, 1.9822269678115845e-05, 2.4743378162384033e-05, 2.966448664665222e-05, 3.458559513092041e-05, 3.95067036151886e-05, 4.442781209945679e-05, 4.9348920583724976e-05, 5.4270029067993164e-05, 5.919113755226135e-05, 6.411224603652954e-05, 6.903335452079773e-05, 7.395446300506592e-05, 7.88755714893341e-05, 8.37966799736023e-05, 8.871778845787048e-05, 9.363889694213867e-05, 9.856000542640686e-05, 0.00010348111391067505, 0.00010840222239494324, 0.00011332333087921143, 0.00011824443936347961, 0.0001231655478477478, 0.000128086656332016, 0.00013300776481628418, 0.00013792887330055237, 0.00014284998178482056, 0.00014777109026908875, 0.00015269219875335693, 0.00015761330723762512, 0.0001625344157218933, 0.0001674555242061615, 0.0001723766326904297]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 4.0, 7.0, 14.0, 11.0, 21.0, 34.0, 41.0, 56.0, 109.0, 223.0, 434.0, 767.0, 1638.0, 4120.0, 11799.0, 54211.0, 647900.0, 275270.0, 36777.0, 9034.0, 3280.0, 1281.0, 681.0, 319.0, 189.0, 108.0, 62.0, 46.0, 35.0, 21.0, 12.0, 12.0, 9.0, 7.0, 7.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.27587890625, -0.2672271728515625, -0.258575439453125, -0.2499237060546875, -0.24127197265625, -0.2326202392578125, -0.223968505859375, -0.2153167724609375, -0.2066650390625, -0.1980133056640625, -0.189361572265625, -0.1807098388671875, -0.17205810546875, -0.1634063720703125, -0.154754638671875, -0.1461029052734375, -0.137451171875, -0.1287994384765625, -0.120147705078125, -0.1114959716796875, -0.10284423828125, -0.0941925048828125, -0.085540771484375, -0.0768890380859375, -0.0682373046875, -0.0595855712890625, -0.050933837890625, -0.0422821044921875, -0.03363037109375, -0.0249786376953125, -0.016326904296875, -0.0076751708984375, 0.0009765625, 0.0096282958984375, 0.018280029296875, 0.0269317626953125, 0.03558349609375, 0.0442352294921875, 0.052886962890625, 0.0615386962890625, 0.0701904296875, 0.0788421630859375, 0.087493896484375, 0.0961456298828125, 0.10479736328125, 0.1134490966796875, 0.122100830078125, 0.1307525634765625, 0.139404296875, 0.1480560302734375, 0.156707763671875, 0.1653594970703125, 0.17401123046875, 0.1826629638671875, 0.191314697265625, 0.1999664306640625, 0.2086181640625, 0.2172698974609375, 0.225921630859375, 0.2345733642578125, 0.24322509765625, 0.2518768310546875, 0.260528564453125, 0.2691802978515625, 0.27783203125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 8.0, 12.0, 16.0, 11.0, 18.0, 34.0, 45.0, 58.0, 51.0, 67.0, 89.0, 122.0, 110.0, 78.0, 60.0, 61.0, 43.0, 22.0, 25.0, 10.0, 14.0, 7.0, 10.0, 9.0, 4.0, 1.0, 7.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.2181396484375, -0.21148109436035156, -0.20482254028320312, -0.1981639862060547, -0.19150543212890625, -0.1848468780517578, -0.17818832397460938, -0.17152976989746094, -0.1648712158203125, -0.15821266174316406, -0.15155410766601562, -0.1448955535888672, -0.13823699951171875, -0.1315784454345703, -0.12491989135742188, -0.11826133728027344, -0.111602783203125, -0.10494422912597656, -0.09828567504882812, -0.09162712097167969, -0.08496856689453125, -0.07831001281738281, -0.07165145874023438, -0.06499290466308594, -0.0583343505859375, -0.05167579650878906, -0.045017242431640625, -0.03835868835449219, -0.03170013427734375, -0.025041580200195312, -0.018383026123046875, -0.011724472045898438, -0.00506591796875, 0.0015926361083984375, 0.008251190185546875, 0.014909744262695312, 0.02156829833984375, 0.028226852416992188, 0.034885406494140625, 0.04154396057128906, 0.0482025146484375, 0.05486106872558594, 0.061519622802734375, 0.06817817687988281, 0.07483673095703125, 0.08149528503417969, 0.08815383911132812, 0.09481239318847656, 0.101470947265625, 0.10812950134277344, 0.11478805541992188, 0.12144660949707031, 0.12810516357421875, 0.1347637176513672, 0.14142227172851562, 0.14808082580566406, 0.1547393798828125, 0.16139793395996094, 0.16805648803710938, 0.1747150421142578, 0.18137359619140625, 0.1880321502685547, 0.19469070434570312, 0.20134925842285156, 0.2080078125]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 7.0, 9.0, 15.0, 31.0, 66.0, 120.0, 273.0, 246.0, 104.0, 55.0, 32.0, 19.0, 6.0, 7.0, 6.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.099287509918213, -6.9066619873046875, -6.714036464691162, -6.521410942077637, -6.328784942626953, -6.136159420013428, -5.943533897399902, -5.750908374786377, -5.558282852172852, -5.365657329559326, -5.173031806945801, -4.980405807495117, -4.787780284881592, -4.595154762268066, -4.402529239654541, -4.209903717041016, -4.017277717590332, -3.8246521949768066, -3.632026433944702, -3.4394009113311768, -3.2467751502990723, -3.054149627685547, -2.8615241050720215, -2.668898582458496, -2.4762728214263916, -2.283647298812866, -2.0910215377807617, -1.8983960151672363, -1.7057703733444214, -1.5131447315216064, -1.320519208908081, -1.1278935670852661, -0.9352684020996094, -0.7426427602767944, -0.5500171780586243, -0.3573915958404541, -0.16476595401763916, 0.02785968780517578, 0.22048521041870117, 0.4131108522415161, 0.605736494064331, 0.798362135887146, 0.9909877181053162, 1.1836133003234863, 1.3762389421463013, 1.5688645839691162, 1.7614901065826416, 1.9541157484054565, 2.1467413902282715, 2.339366912841797, 2.5319926738739014, 2.7246181964874268, 2.9172439575195312, 3.1098694801330566, 3.302495002746582, 3.4951205253601074, 3.687746286392212, 3.8803718090057373, 4.072997570037842, 4.265623092651367, 4.458248615264893, 4.650874137878418, 4.843500137329102, 5.036125659942627, 5.228751182556152]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 5.0, 7.0, 5.0, 11.0, 12.0, 9.0, 22.0, 13.0, 16.0, 24.0, 19.0, 34.0, 28.0, 25.0, 40.0, 32.0, 42.0, 69.0, 81.0, 80.0, 67.0, 56.0, 37.0, 34.0, 25.0, 24.0, 29.0, 24.0, 19.0, 14.0, 16.0, 8.0, 9.0, 12.0, 10.0, 8.0, 2.0, 5.0, 5.0, 4.0, 4.0, 4.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.056497573852539, -2.963557004928589, -2.8706164360046387, -2.7776756286621094, -2.684735059738159, -2.591794490814209, -2.498853921890259, -2.4059133529663086, -2.3129725456237793, -2.220031976699829, -2.127091407775879, -2.0341506004333496, -1.9412100315093994, -1.8482694625854492, -1.755328893661499, -1.6623883247375488, -1.5694477558135986, -1.4765071868896484, -1.3835664987564087, -1.2906259298324585, -1.1976852416992188, -1.1047446727752686, -1.0118041038513184, -0.9188634753227234, -0.8259228467941284, -0.7329822182655334, -0.6400415897369385, -0.5471010208129883, -0.4541603922843933, -0.36121976375579834, -0.26827919483184814, -0.17533856630325317, -0.0823979377746582, 0.010542675852775574, 0.10348328948020935, 0.19642388820648193, 0.2893645167350769, 0.3823051452636719, 0.47524571418762207, 0.568186342716217, 0.661126971244812, 0.754067599773407, 0.847008228302002, 0.9399487972259521, 1.0328893661499023, 1.125830054283142, 1.2187706232070923, 1.311711311340332, 1.4046518802642822, 1.4975924491882324, 1.5905331373214722, 1.6834737062454224, 1.776414394378662, 1.8693549633026123, 1.9622955322265625, 2.0552361011505127, 2.148176670074463, 2.241117238998413, 2.3340578079223633, 2.4269986152648926, 2.5199391841888428, 2.612879753112793, 2.705820322036743, 2.7987608909606934, 2.8917016983032227]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 4.0, 7.0, 8.0, 15.0, 12.0, 25.0, 26.0, 48.0, 48.0, 74.0, 161.0, 257.0, 364.0, 635.0, 1187.0, 2219.0, 4743.0, 11355.0, 36733.0, 252261.0, 3059696.0, 728159.0, 66239.0, 17043.0, 6646.0, 2894.0, 1503.0, 797.0, 425.0, 237.0, 147.0, 100.0, 65.0, 38.0, 33.0, 11.0, 20.0, 10.0, 14.0, 2.0, 5.0, 4.0, 3.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.53515625, -0.5197296142578125, -0.504302978515625, -0.4888763427734375, -0.47344970703125, -0.4580230712890625, -0.442596435546875, -0.4271697998046875, -0.4117431640625, -0.3963165283203125, -0.380889892578125, -0.3654632568359375, -0.35003662109375, -0.3346099853515625, -0.319183349609375, -0.3037567138671875, -0.288330078125, -0.2729034423828125, -0.257476806640625, -0.2420501708984375, -0.22662353515625, -0.2111968994140625, -0.195770263671875, -0.1803436279296875, -0.1649169921875, -0.1494903564453125, -0.134063720703125, -0.1186370849609375, -0.10321044921875, -0.0877838134765625, -0.072357177734375, -0.0569305419921875, -0.04150390625, -0.0260772705078125, -0.010650634765625, 0.0047760009765625, 0.02020263671875, 0.0356292724609375, 0.051055908203125, 0.0664825439453125, 0.0819091796875, 0.0973358154296875, 0.112762451171875, 0.1281890869140625, 0.14361572265625, 0.1590423583984375, 0.174468994140625, 0.1898956298828125, 0.205322265625, 0.2207489013671875, 0.236175537109375, 0.2516021728515625, 0.26702880859375, 0.2824554443359375, 0.297882080078125, 0.3133087158203125, 0.3287353515625, 0.3441619873046875, 0.359588623046875, 0.3750152587890625, 0.39044189453125, 0.4058685302734375, 0.421295166015625, 0.4367218017578125, 0.4521484375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 7.0, 7.0, 8.0, 5.0, 3.0, 3.0, 17.0, 19.0, 20.0, 20.0, 23.0, 30.0, 23.0, 32.0, 43.0, 45.0, 43.0, 49.0, 56.0, 42.0, 49.0, 49.0, 36.0, 41.0, 45.0, 43.0, 37.0, 29.0, 27.0, 23.0, 21.0, 17.0, 16.0, 11.0, 17.0, 9.0, 8.0, 7.0, 7.0, 5.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.2210693359375, -0.2144031524658203, -0.20773696899414062, -0.20107078552246094, -0.19440460205078125, -0.18773841857910156, -0.18107223510742188, -0.1744060516357422, -0.1677398681640625, -0.1610736846923828, -0.15440750122070312, -0.14774131774902344, -0.14107513427734375, -0.13440895080566406, -0.12774276733398438, -0.12107658386230469, -0.114410400390625, -0.10774421691894531, -0.10107803344726562, -0.09441184997558594, -0.08774566650390625, -0.08107948303222656, -0.07441329956054688, -0.06774711608886719, -0.0610809326171875, -0.05441474914550781, -0.047748565673828125, -0.04108238220214844, -0.03441619873046875, -0.027750015258789062, -0.021083831787109375, -0.014417648315429688, -0.00775146484375, -0.0010852813720703125, 0.005580902099609375, 0.012247085571289062, 0.01891326904296875, 0.025579452514648438, 0.032245635986328125, 0.03891181945800781, 0.0455780029296875, 0.05224418640136719, 0.058910369873046875, 0.06557655334472656, 0.07224273681640625, 0.07890892028808594, 0.08557510375976562, 0.09224128723144531, 0.098907470703125, 0.10557365417480469, 0.11223983764648438, 0.11890602111816406, 0.12557220458984375, 0.13223838806152344, 0.13890457153320312, 0.1455707550048828, 0.1522369384765625, 0.1589031219482422, 0.16556930541992188, 0.17223548889160156, 0.17890167236328125, 0.18556785583496094, 0.19223403930664062, 0.1989002227783203, 0.20556640625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 3.0, 7.0, 11.0, 23.0, 12.0, 28.0, 25.0, 61.0, 97.0, 178.0, 340.0, 768.0, 2063.0, 7441.0, 37254.0, 835962.0, 3226505.0, 67247.0, 11355.0, 2930.0, 992.0, 457.0, 198.0, 128.0, 64.0, 35.0, 32.0, 19.0, 15.0, 10.0, 9.0, 6.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0986328125, -1.0690536499023438, -1.0394744873046875, -1.0098953247070312, -0.980316162109375, -0.9507369995117188, -0.9211578369140625, -0.8915786743164062, -0.86199951171875, -0.8324203491210938, -0.8028411865234375, -0.7732620239257812, -0.743682861328125, -0.7141036987304688, -0.6845245361328125, -0.6549453735351562, -0.6253662109375, -0.5957870483398438, -0.5662078857421875, -0.5366287231445312, -0.507049560546875, -0.47747039794921875, -0.4478912353515625, -0.41831207275390625, -0.38873291015625, -0.35915374755859375, -0.3295745849609375, -0.29999542236328125, -0.270416259765625, -0.24083709716796875, -0.2112579345703125, -0.18167877197265625, -0.152099609375, -0.12252044677734375, -0.0929412841796875, -0.06336212158203125, -0.033782958984375, -0.00420379638671875, 0.0253753662109375, 0.05495452880859375, 0.08453369140625, 0.11411285400390625, 0.1436920166015625, 0.17327117919921875, 0.202850341796875, 0.23242950439453125, 0.2620086669921875, 0.29158782958984375, 0.3211669921875, 0.35074615478515625, 0.3803253173828125, 0.40990447998046875, 0.439483642578125, 0.46906280517578125, 0.4986419677734375, 0.5282211303710938, 0.55780029296875, 0.5873794555664062, 0.6169586181640625, 0.6465377807617188, 0.676116943359375, 0.7056961059570312, 0.7352752685546875, 0.7648544311523438, 0.79443359375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 6.0, 6.0, 6.0, 14.0, 13.0, 14.0, 21.0, 23.0, 35.0, 100.0, 113.0, 197.0, 423.0, 839.0, 987.0, 569.0, 263.0, 162.0, 81.0, 54.0, 37.0, 31.0, 17.0, 13.0, 10.0, 8.0, 3.0, 6.0, 8.0, 5.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.91259765625, -0.889892578125, -0.8671875, -0.844482421875, -0.82177734375, -0.799072265625, -0.7763671875, -0.753662109375, -0.73095703125, -0.708251953125, -0.685546875, -0.662841796875, -0.64013671875, -0.617431640625, -0.5947265625, -0.572021484375, -0.54931640625, -0.526611328125, -0.50390625, -0.481201171875, -0.45849609375, -0.435791015625, -0.4130859375, -0.390380859375, -0.36767578125, -0.344970703125, -0.322265625, -0.299560546875, -0.27685546875, -0.254150390625, -0.2314453125, -0.208740234375, -0.18603515625, -0.163330078125, -0.140625, -0.117919921875, -0.09521484375, -0.072509765625, -0.0498046875, -0.027099609375, -0.00439453125, 0.018310546875, 0.041015625, 0.063720703125, 0.08642578125, 0.109130859375, 0.1318359375, 0.154541015625, 0.17724609375, 0.199951171875, 0.22265625, 0.245361328125, 0.26806640625, 0.290771484375, 0.3134765625, 0.336181640625, 0.35888671875, 0.381591796875, 0.404296875, 0.427001953125, 0.44970703125, 0.472412109375, 0.4951171875, 0.517822265625, 0.54052734375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 5.0, 3.0, 15.0, 28.0, 38.0, 126.0, 227.0, 283.0, 150.0, 78.0, 24.0, 10.0, 5.0, 5.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.307458877563477, -9.035744667053223, -8.764031410217285, -8.492317199707031, -8.220603942871094, -7.94888973236084, -7.677175998687744, -7.405462265014648, -7.133748531341553, -6.862034797668457, -6.590321063995361, -6.318607330322266, -6.046893119812012, -5.775179862976074, -5.50346565246582, -5.231751918792725, -4.960038185119629, -4.688324451446533, -4.4166107177734375, -4.144896984100342, -3.873183012008667, -3.6014692783355713, -3.3297553062438965, -3.058041572570801, -2.786327838897705, -2.5146141052246094, -2.2429003715515137, -1.9711863994598389, -1.6994726657867432, -1.4277589321136475, -1.1560450792312622, -0.884331226348877, -0.6126184463500977, -0.3409046530723572, -0.0691908597946167, 0.20252293348312378, 0.47423672676086426, 0.74595046043396, 1.0176643133163452, 1.2893781661987305, 1.5610918998718262, 1.8328056335449219, 2.1045193672180176, 2.3762333393096924, 2.647947072982788, 2.919660806655884, 3.1913747787475586, 3.4630885124206543, 3.73480224609375, 4.006515979766846, 4.278229713439941, 4.549943447113037, 4.821657180786133, 5.093371391296387, 5.365085124969482, 5.636798858642578, 5.908512592315674, 6.1802263259887695, 6.451940059661865, 6.723653793334961, 6.995368003845215, 7.267081260681152, 7.538795471191406, 7.810509204864502, 8.082222938537598]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 5.0, 6.0, 5.0, 5.0, 2.0, 4.0, 12.0, 9.0, 16.0, 18.0, 24.0, 13.0, 18.0, 23.0, 26.0, 36.0, 35.0, 44.0, 59.0, 53.0, 63.0, 72.0, 39.0, 60.0, 46.0, 35.0, 50.0, 36.0, 29.0, 21.0, 21.0, 21.0, 22.0, 18.0, 6.0, 10.0, 8.0, 10.0, 4.0, 6.0, 6.0, 4.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.665886878967285, -2.577211618423462, -2.4885363578796387, -2.3998610973358154, -2.311185836791992, -2.222510576248169, -2.1338353157043457, -2.0451598167419434, -1.9564846754074097, -1.8678094148635864, -1.7791341543197632, -1.6904587745666504, -1.6017835140228271, -1.513108253479004, -1.4244329929351807, -1.3357577323913574, -1.2470824718475342, -1.158407211303711, -1.0697319507598877, -0.9810566306114197, -0.8923813700675964, -0.8037061095237732, -0.7150307893753052, -0.6263555288314819, -0.5376802682876587, -0.44900500774383545, -0.3603297173976898, -0.2716544270515442, -0.18297916650772095, -0.0943039059638977, -0.0056285858154296875, 0.08304667472839355, 0.1717219352722168, 0.26039719581604004, 0.34907248616218567, 0.4377477765083313, 0.5264230370521545, 0.6150982975959778, 0.7037736177444458, 0.792448878288269, 0.8811241388320923, 0.9697993993759155, 1.0584746599197388, 1.1471500396728516, 1.2358253002166748, 1.324500560760498, 1.4131758213043213, 1.5018510818481445, 1.5905263423919678, 1.679201602935791, 1.7678768634796143, 1.8565521240234375, 1.9452273845672607, 2.033902645111084, 2.1225781440734863, 2.2112531661987305, 2.299928665161133, 2.388603925704956, 2.4772791862487793, 2.5659544467926025, 2.654629707336426, 2.743304967880249, 2.8319802284240723, 2.9206557273864746, 3.0093307495117188]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 12.0, 10.0, 27.0, 45.0, 76.0, 114.0, 236.0, 476.0, 1010.0, 2666.0, 8751.0, 37710.0, 297251.0, 607624.0, 72036.0, 13894.0, 3991.0, 1363.0, 606.0, 291.0, 155.0, 94.0, 49.0, 33.0, 13.0, 9.0, 2.0, 1.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.60107421875, -0.579742431640625, -0.55841064453125, -0.537078857421875, -0.5157470703125, -0.494415283203125, -0.47308349609375, -0.451751708984375, -0.430419921875, -0.409088134765625, -0.38775634765625, -0.366424560546875, -0.3450927734375, -0.323760986328125, -0.30242919921875, -0.281097412109375, -0.259765625, -0.238433837890625, -0.21710205078125, -0.195770263671875, -0.1744384765625, -0.153106689453125, -0.13177490234375, -0.110443115234375, -0.089111328125, -0.067779541015625, -0.04644775390625, -0.025115966796875, -0.0037841796875, 0.017547607421875, 0.03887939453125, 0.060211181640625, 0.08154296875, 0.102874755859375, 0.12420654296875, 0.145538330078125, 0.1668701171875, 0.188201904296875, 0.20953369140625, 0.230865478515625, 0.252197265625, 0.273529052734375, 0.29486083984375, 0.316192626953125, 0.3375244140625, 0.358856201171875, 0.38018798828125, 0.401519775390625, 0.4228515625, 0.444183349609375, 0.46551513671875, 0.486846923828125, 0.5081787109375, 0.529510498046875, 0.55084228515625, 0.572174072265625, 0.593505859375, 0.614837646484375, 0.63616943359375, 0.657501220703125, 0.6788330078125, 0.700164794921875, 0.72149658203125, 0.742828369140625, 0.76416015625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 4.0, 1.0, 9.0, 5.0, 4.0, 8.0, 7.0, 14.0, 15.0, 18.0, 25.0, 18.0, 21.0, 27.0, 28.0, 35.0, 45.0, 45.0, 47.0, 43.0, 46.0, 49.0, 68.0, 38.0, 50.0, 36.0, 38.0, 47.0, 28.0, 43.0, 25.0, 22.0, 21.0, 16.0, 12.0, 12.0, 8.0, 8.0, 2.0, 6.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2423095703125, -0.2343158721923828, -0.22632217407226562, -0.21832847595214844, -0.21033477783203125, -0.20234107971191406, -0.19434738159179688, -0.1863536834716797, -0.1783599853515625, -0.1703662872314453, -0.16237258911132812, -0.15437889099121094, -0.14638519287109375, -0.13839149475097656, -0.13039779663085938, -0.12240409851074219, -0.114410400390625, -0.10641670227050781, -0.09842300415039062, -0.09042930603027344, -0.08243560791015625, -0.07444190979003906, -0.06644821166992188, -0.05845451354980469, -0.0504608154296875, -0.04246711730957031, -0.034473419189453125, -0.026479721069335938, -0.01848602294921875, -0.010492324829101562, -0.002498626708984375, 0.0054950714111328125, 0.01348876953125, 0.021482467651367188, 0.029476165771484375, 0.03746986389160156, 0.04546356201171875, 0.05345726013183594, 0.061450958251953125, 0.06944465637207031, 0.0774383544921875, 0.08543205261230469, 0.09342575073242188, 0.10141944885253906, 0.10941314697265625, 0.11740684509277344, 0.12540054321289062, 0.1333942413330078, 0.141387939453125, 0.1493816375732422, 0.15737533569335938, 0.16536903381347656, 0.17336273193359375, 0.18135643005371094, 0.18935012817382812, 0.1973438262939453, 0.2053375244140625, 0.2133312225341797, 0.22132492065429688, 0.22931861877441406, 0.23731231689453125, 0.24530601501464844, 0.2532997131347656, 0.2612934112548828, 0.269287109375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 2.0, 6.0, 10.0, 16.0, 23.0, 23.0, 57.0, 111.0, 170.0, 346.0, 775.0, 1937.0, 7581.0, 70968.0, 909237.0, 48087.0, 6099.0, 1715.0, 639.0, 303.0, 183.0, 115.0, 54.0, 44.0, 18.0, 11.0, 8.0, 9.0, 6.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1669921875, -1.1331024169921875, -1.099212646484375, -1.0653228759765625, -1.03143310546875, -0.9975433349609375, -0.963653564453125, -0.9297637939453125, -0.8958740234375, -0.8619842529296875, -0.828094482421875, -0.7942047119140625, -0.76031494140625, -0.7264251708984375, -0.692535400390625, -0.6586456298828125, -0.624755859375, -0.5908660888671875, -0.556976318359375, -0.5230865478515625, -0.48919677734375, -0.4553070068359375, -0.421417236328125, -0.3875274658203125, -0.3536376953125, -0.3197479248046875, -0.285858154296875, -0.2519683837890625, -0.21807861328125, -0.1841888427734375, -0.150299072265625, -0.1164093017578125, -0.08251953125, -0.0486297607421875, -0.014739990234375, 0.0191497802734375, 0.05303955078125, 0.0869293212890625, 0.120819091796875, 0.1547088623046875, 0.1885986328125, 0.2224884033203125, 0.256378173828125, 0.2902679443359375, 0.32415771484375, 0.3580474853515625, 0.391937255859375, 0.4258270263671875, 0.459716796875, 0.4936065673828125, 0.527496337890625, 0.5613861083984375, 0.59527587890625, 0.6291656494140625, 0.663055419921875, 0.6969451904296875, 0.7308349609375, 0.7647247314453125, 0.798614501953125, 0.8325042724609375, 0.86639404296875, 0.9002838134765625, 0.934173583984375, 0.9680633544921875, 1.001953125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 3.0, 3.0, 8.0, 6.0, 15.0, 15.0, 20.0, 21.0, 28.0, 34.0, 41.0, 41.0, 52.0, 62.0, 67.0, 68.0, 68.0, 75.0, 55.0, 52.0, 49.0, 48.0, 38.0, 22.0, 23.0, 22.0, 9.0, 10.0, 11.0, 4.0, 5.0, 6.0, 1.0, 4.0, 5.0, 4.0, 0.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0224609375, -0.9862060546875, -0.949951171875, -0.9136962890625, -0.87744140625, -0.8411865234375, -0.804931640625, -0.7686767578125, -0.732421875, -0.6961669921875, -0.659912109375, -0.6236572265625, -0.58740234375, -0.5511474609375, -0.514892578125, -0.4786376953125, -0.4423828125, -0.4061279296875, -0.369873046875, -0.3336181640625, -0.29736328125, -0.2611083984375, -0.224853515625, -0.1885986328125, -0.15234375, -0.1160888671875, -0.079833984375, -0.0435791015625, -0.00732421875, 0.0289306640625, 0.065185546875, 0.1014404296875, 0.1376953125, 0.1739501953125, 0.210205078125, 0.2464599609375, 0.28271484375, 0.3189697265625, 0.355224609375, 0.3914794921875, 0.427734375, 0.4639892578125, 0.500244140625, 0.5364990234375, 0.57275390625, 0.6090087890625, 0.645263671875, 0.6815185546875, 0.7177734375, 0.7540283203125, 0.790283203125, 0.8265380859375, 0.86279296875, 0.8990478515625, 0.935302734375, 0.9715576171875, 1.0078125, 1.0440673828125, 1.080322265625, 1.1165771484375, 1.15283203125, 1.1890869140625, 1.225341796875, 1.2615966796875, 1.2978515625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 4.0, 4.0, 10.0, 7.0, 11.0, 12.0, 25.0, 51.0, 94.0, 160.0, 315.0, 640.0, 1292.0, 3246.0, 9664.0, 45116.0, 726713.0, 222726.0, 27022.0, 6884.0, 2452.0, 1034.0, 473.0, 254.0, 134.0, 76.0, 42.0, 30.0, 25.0, 13.0, 11.0, 4.0, 6.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2379150390625, -0.23044586181640625, -0.2229766845703125, -0.21550750732421875, -0.208038330078125, -0.20056915283203125, -0.1930999755859375, -0.18563079833984375, -0.17816162109375, -0.17069244384765625, -0.1632232666015625, -0.15575408935546875, -0.148284912109375, -0.14081573486328125, -0.1333465576171875, -0.12587738037109375, -0.118408203125, -0.11093902587890625, -0.1034698486328125, -0.09600067138671875, -0.088531494140625, -0.08106231689453125, -0.0735931396484375, -0.06612396240234375, -0.05865478515625, -0.05118560791015625, -0.0437164306640625, -0.03624725341796875, -0.028778076171875, -0.02130889892578125, -0.0138397216796875, -0.00637054443359375, 0.0010986328125, 0.00856781005859375, 0.0160369873046875, 0.02350616455078125, 0.030975341796875, 0.03844451904296875, 0.0459136962890625, 0.05338287353515625, 0.06085205078125, 0.06832122802734375, 0.0757904052734375, 0.08325958251953125, 0.090728759765625, 0.09819793701171875, 0.1056671142578125, 0.11313629150390625, 0.12060546875, 0.12807464599609375, 0.1355438232421875, 0.14301300048828125, 0.150482177734375, 0.15795135498046875, 0.1654205322265625, 0.17288970947265625, 0.18035888671875, 0.18782806396484375, 0.1952972412109375, 0.20276641845703125, 0.210235595703125, 0.21770477294921875, 0.2251739501953125, 0.23264312744140625, 0.2401123046875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 3.0, 4.0, 10.0, 11.0, 12.0, 20.0, 47.0, 64.0, 129.0, 184.0, 194.0, 132.0, 73.0, 42.0, 21.0, 22.0, 12.0, 7.0, 4.0, 3.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00011986494064331055, -0.00011652708053588867, -0.0001131892204284668, -0.00010985136032104492, -0.00010651350021362305, -0.00010317564010620117, -9.98377799987793e-05, -9.649991989135742e-05, -9.316205978393555e-05, -8.982419967651367e-05, -8.64863395690918e-05, -8.314847946166992e-05, -7.981061935424805e-05, -7.647275924682617e-05, -7.31348991394043e-05, -6.979703903198242e-05, -6.645917892456055e-05, -6.312131881713867e-05, -5.97834587097168e-05, -5.644559860229492e-05, -5.310773849487305e-05, -4.976987838745117e-05, -4.64320182800293e-05, -4.309415817260742e-05, -3.975629806518555e-05, -3.641843795776367e-05, -3.30805778503418e-05, -2.9742717742919922e-05, -2.6404857635498047e-05, -2.3066997528076172e-05, -1.9729137420654297e-05, -1.6391277313232422e-05, -1.3053417205810547e-05, -9.715557098388672e-06, -6.377696990966797e-06, -3.039836883544922e-06, 2.980232238769531e-07, 3.635883331298828e-06, 6.973743438720703e-06, 1.0311603546142578e-05, 1.3649463653564453e-05, 1.6987323760986328e-05, 2.0325183868408203e-05, 2.3663043975830078e-05, 2.7000904083251953e-05, 3.0338764190673828e-05, 3.36766242980957e-05, 3.701448440551758e-05, 4.035234451293945e-05, 4.369020462036133e-05, 4.70280647277832e-05, 5.036592483520508e-05, 5.370378494262695e-05, 5.704164505004883e-05, 6.03795051574707e-05, 6.371736526489258e-05, 6.705522537231445e-05, 7.039308547973633e-05, 7.37309455871582e-05, 7.706880569458008e-05, 8.040666580200195e-05, 8.374452590942383e-05, 8.70823860168457e-05, 9.042024612426758e-05, 9.375810623168945e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 1.0, 5.0, 14.0, 14.0, 14.0, 29.0, 39.0, 45.0, 93.0, 155.0, 261.0, 472.0, 912.0, 1952.0, 5136.0, 16400.0, 69463.0, 692184.0, 208173.0, 36897.0, 10003.0, 3342.0, 1435.0, 708.0, 327.0, 170.0, 115.0, 74.0, 46.0, 29.0, 18.0, 12.0, 7.0, 7.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.2080078125, -0.20185279846191406, -0.19569778442382812, -0.1895427703857422, -0.18338775634765625, -0.1772327423095703, -0.17107772827148438, -0.16492271423339844, -0.1587677001953125, -0.15261268615722656, -0.14645767211914062, -0.1403026580810547, -0.13414764404296875, -0.1279926300048828, -0.12183761596679688, -0.11568260192871094, -0.109527587890625, -0.10337257385253906, -0.09721755981445312, -0.09106254577636719, -0.08490753173828125, -0.07875251770019531, -0.07259750366210938, -0.06644248962402344, -0.0602874755859375, -0.05413246154785156, -0.047977447509765625, -0.04182243347167969, -0.03566741943359375, -0.029512405395507812, -0.023357391357421875, -0.017202377319335938, -0.01104736328125, -0.0048923492431640625, 0.001262664794921875, 0.0074176788330078125, 0.01357269287109375, 0.019727706909179688, 0.025882720947265625, 0.03203773498535156, 0.0381927490234375, 0.04434776306152344, 0.050502777099609375, 0.05665779113769531, 0.06281280517578125, 0.06896781921386719, 0.07512283325195312, 0.08127784729003906, 0.087432861328125, 0.09358787536621094, 0.09974288940429688, 0.10589790344238281, 0.11205291748046875, 0.11820793151855469, 0.12436294555664062, 0.13051795959472656, 0.1366729736328125, 0.14282798767089844, 0.14898300170898438, 0.1551380157470703, 0.16129302978515625, 0.1674480438232422, 0.17360305786132812, 0.17975807189941406, 0.1859130859375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 5.0, 4.0, 4.0, 7.0, 3.0, 3.0, 9.0, 6.0, 15.0, 17.0, 26.0, 24.0, 33.0, 38.0, 42.0, 78.0, 76.0, 92.0, 98.0, 77.0, 72.0, 51.0, 44.0, 28.0, 30.0, 27.0, 18.0, 20.0, 13.0, 9.0, 6.0, 7.0, 4.0, 4.0, 3.0, 2.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.199462890625, -0.19395065307617188, -0.18843841552734375, -0.18292617797851562, -0.1774139404296875, -0.17190170288085938, -0.16638946533203125, -0.16087722778320312, -0.155364990234375, -0.14985275268554688, -0.14434051513671875, -0.13882827758789062, -0.1333160400390625, -0.12780380249023438, -0.12229156494140625, -0.11677932739257812, -0.11126708984375, -0.10575485229492188, -0.10024261474609375, -0.09473037719726562, -0.0892181396484375, -0.08370590209960938, -0.07819366455078125, -0.07268142700195312, -0.067169189453125, -0.061656951904296875, -0.05614471435546875, -0.050632476806640625, -0.0451202392578125, -0.039608001708984375, -0.03409576416015625, -0.028583526611328125, -0.0230712890625, -0.017559051513671875, -0.01204681396484375, -0.006534576416015625, -0.0010223388671875, 0.004489898681640625, 0.01000213623046875, 0.015514373779296875, 0.021026611328125, 0.026538848876953125, 0.03205108642578125, 0.037563323974609375, 0.0430755615234375, 0.048587799072265625, 0.05410003662109375, 0.059612274169921875, 0.06512451171875, 0.07063674926757812, 0.07614898681640625, 0.08166122436523438, 0.0871734619140625, 0.09268569946289062, 0.09819793701171875, 0.10371017456054688, 0.109222412109375, 0.11473464965820312, 0.12024688720703125, 0.12575912475585938, 0.1312713623046875, 0.13678359985351562, 0.14229583740234375, 0.14780807495117188, 0.1533203125]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 11.0, 45.0, 157.0, 592.0, 146.0, 34.0, 14.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.593036651611328, -10.14123821258545, -9.689438819885254, -9.237640380859375, -8.78584098815918, -8.3340425491333, -7.882243633270264, -7.430444717407227, -6.9786458015441895, -6.526846885681152, -6.075047969818115, -5.623249053955078, -5.171450614929199, -4.719651222229004, -4.267852783203125, -3.816053867340088, -3.364254951477051, -2.9124560356140137, -2.4606571197509766, -2.0088584423065186, -1.5570595264434814, -1.1052606105804443, -0.6534619331359863, -0.20166301727294922, 0.2501358985900879, 0.7019347548484802, 1.1537336111068726, 1.6055324077606201, 2.0573313236236572, 2.5091302394866943, 2.9609289169311523, 3.4127278327941895, 3.8645267486572266, 4.316325664520264, 4.768124580383301, 5.21992301940918, 5.671722412109375, 6.123520851135254, 6.575319766998291, 7.027118682861328, 7.478917598724365, 7.930716514587402, 8.382514953613281, 8.834314346313477, 9.286112785339355, 9.73791217803955, 10.18971061706543, 10.641510009765625, 11.093308448791504, 11.545106887817383, 11.996906280517578, 12.448704719543457, 12.900504112243652, 13.352302551269531, 13.804101943969727, 14.255900382995605, 14.707698822021484, 15.159497261047363, 15.611296653747559, 16.063095092773438, 16.514894485473633, 16.966693878173828, 17.41849136352539, 17.870290756225586, 18.32209014892578]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 3.0, 3.0, 6.0, 9.0, 2.0, 6.0, 10.0, 10.0, 8.0, 15.0, 10.0, 17.0, 19.0, 24.0, 15.0, 19.0, 18.0, 33.0, 30.0, 45.0, 57.0, 94.0, 98.0, 94.0, 42.0, 42.0, 42.0, 27.0, 25.0, 33.0, 13.0, 22.0, 19.0, 17.0, 11.0, 13.0, 8.0, 8.0, 10.0, 6.0, 4.0, 3.0, 6.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.9598214626312256, -2.856128692626953, -2.7524359226226807, -2.648743152618408, -2.5450501441955566, -2.4413576126098633, -2.3376646041870117, -2.2339718341827393, -2.130279064178467, -2.0265862941741943, -1.9228935241699219, -1.8192006349563599, -1.7155078649520874, -1.611815094947815, -1.508122205734253, -1.4044294357299805, -1.300736665725708, -1.1970438957214355, -1.093351125717163, -0.9896582365036011, -0.8859654664993286, -0.7822726964950562, -0.6785798668861389, -0.5748870372772217, -0.4711942672729492, -0.36750146746635437, -0.2638086676597595, -0.16011586785316467, -0.056423068046569824, 0.04726970195770264, 0.15096253156661987, 0.2546553611755371, 0.35834813117980957, 0.4620409309864044, 0.5657337307929993, 0.6694265604019165, 0.773119330406189, 0.8768121004104614, 0.9805049300193787, 1.084197759628296, 1.1878905296325684, 1.2915832996368408, 1.3952760696411133, 1.4989689588546753, 1.6026617288589478, 1.7063544988632202, 1.8100473880767822, 1.9137401580810547, 2.017432928085327, 2.1211256980895996, 2.224818468093872, 2.3285112380981445, 2.432204246520996, 2.5358967781066895, 2.639589786529541, 2.7432825565338135, 2.846975326538086, 2.9506680965423584, 3.054360866546631, 3.1580536365509033, 3.261746406555176, 3.3654394149780273, 3.4691321849823, 3.5728249549865723, 3.6765177249908447]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 5.0, 2.0, 8.0, 7.0, 18.0, 17.0, 28.0, 28.0, 45.0, 78.0, 138.0, 182.0, 308.0, 494.0, 888.0, 1599.0, 3143.0, 6636.0, 15870.0, 45026.0, 182115.0, 1208707.0, 2244944.0, 369189.0, 73977.0, 22901.0, 9238.0, 4152.0, 2001.0, 1040.0, 611.0, 312.0, 214.0, 130.0, 89.0, 48.0, 35.0, 25.0, 16.0, 9.0, 8.0, 3.0, 7.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.6845703125, -0.6666450500488281, -0.6487197875976562, -0.6307945251464844, -0.6128692626953125, -0.5949440002441406, -0.5770187377929688, -0.5590934753417969, -0.541168212890625, -0.5232429504394531, -0.5053176879882812, -0.4873924255371094, -0.4694671630859375, -0.4515419006347656, -0.43361663818359375, -0.4156913757324219, -0.39776611328125, -0.3798408508300781, -0.36191558837890625, -0.3439903259277344, -0.3260650634765625, -0.3081398010253906, -0.29021453857421875, -0.2722892761230469, -0.254364013671875, -0.23643875122070312, -0.21851348876953125, -0.20058822631835938, -0.1826629638671875, -0.16473770141601562, -0.14681243896484375, -0.12888717651367188, -0.1109619140625, -0.09303665161132812, -0.07511138916015625, -0.057186126708984375, -0.0392608642578125, -0.021335601806640625, -0.00341033935546875, 0.014514923095703125, 0.032440185546875, 0.050365447998046875, 0.06829071044921875, 0.08621597290039062, 0.1041412353515625, 0.12206649780273438, 0.13999176025390625, 0.15791702270507812, 0.17584228515625, 0.19376754760742188, 0.21169281005859375, 0.22961807250976562, 0.2475433349609375, 0.2654685974121094, 0.28339385986328125, 0.3013191223144531, 0.319244384765625, 0.3371696472167969, 0.35509490966796875, 0.3730201721191406, 0.3909454345703125, 0.4088706970214844, 0.42679595947265625, 0.4447212219238281, 0.462646484375]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 1.0, 2.0, 2.0, 3.0, 5.0, 4.0, 3.0, 8.0, 12.0, 12.0, 29.0, 19.0, 15.0, 26.0, 36.0, 45.0, 33.0, 39.0, 48.0, 52.0, 55.0, 54.0, 48.0, 59.0, 52.0, 49.0, 35.0, 41.0, 31.0, 33.0, 25.0, 25.0, 24.0, 18.0, 15.0, 8.0, 10.0, 10.0, 8.0, 8.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.288818359375, -0.2806072235107422, -0.2723960876464844, -0.26418495178222656, -0.25597381591796875, -0.24776268005371094, -0.23955154418945312, -0.2313404083251953, -0.2231292724609375, -0.2149181365966797, -0.20670700073242188, -0.19849586486816406, -0.19028472900390625, -0.18207359313964844, -0.17386245727539062, -0.1656513214111328, -0.157440185546875, -0.1492290496826172, -0.14101791381835938, -0.13280677795410156, -0.12459564208984375, -0.11638450622558594, -0.10817337036132812, -0.09996223449707031, -0.0917510986328125, -0.08353996276855469, -0.07532882690429688, -0.06711769104003906, -0.05890655517578125, -0.05069541931152344, -0.042484283447265625, -0.03427314758300781, -0.02606201171875, -0.017850875854492188, -0.009639739990234375, -0.0014286041259765625, 0.00678253173828125, 0.014993667602539062, 0.023204803466796875, 0.03141593933105469, 0.0396270751953125, 0.04783821105957031, 0.056049346923828125, 0.06426048278808594, 0.07247161865234375, 0.08068275451660156, 0.08889389038085938, 0.09710502624511719, 0.105316162109375, 0.11352729797363281, 0.12173843383789062, 0.12994956970214844, 0.13816070556640625, 0.14637184143066406, 0.15458297729492188, 0.1627941131591797, 0.1710052490234375, 0.1792163848876953, 0.18742752075195312, 0.19563865661621094, 0.20384979248046875, 0.21206092834472656, 0.22027206420898438, 0.2284832000732422, 0.2366943359375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 2.0, 7.0, 10.0, 18.0, 19.0, 19.0, 37.0, 51.0, 100.0, 174.0, 310.0, 633.0, 1838.0, 10403.0, 413517.0, 3737307.0, 25095.0, 3013.0, 864.0, 347.0, 182.0, 118.0, 54.0, 56.0, 36.0, 21.0, 11.0, 11.0, 7.0, 4.0, 6.0, 4.0, 5.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.98046875, -2.8980712890625, -2.815673828125, -2.7332763671875, -2.65087890625, -2.5684814453125, -2.486083984375, -2.4036865234375, -2.3212890625, -2.2388916015625, -2.156494140625, -2.0740966796875, -1.99169921875, -1.9093017578125, -1.826904296875, -1.7445068359375, -1.662109375, -1.5797119140625, -1.497314453125, -1.4149169921875, -1.33251953125, -1.2501220703125, -1.167724609375, -1.0853271484375, -1.0029296875, -0.9205322265625, -0.838134765625, -0.7557373046875, -0.67333984375, -0.5909423828125, -0.508544921875, -0.4261474609375, -0.34375, -0.2613525390625, -0.178955078125, -0.0965576171875, -0.01416015625, 0.0682373046875, 0.150634765625, 0.2330322265625, 0.3154296875, 0.3978271484375, 0.480224609375, 0.5626220703125, 0.64501953125, 0.7274169921875, 0.809814453125, 0.8922119140625, 0.974609375, 1.0570068359375, 1.139404296875, 1.2218017578125, 1.30419921875, 1.3865966796875, 1.468994140625, 1.5513916015625, 1.6337890625, 1.7161865234375, 1.798583984375, 1.8809814453125, 1.96337890625, 2.0457763671875, 2.128173828125, 2.2105712890625, 2.29296875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 9.0, 5.0, 11.0, 16.0, 26.0, 24.0, 36.0, 50.0, 80.0, 138.0, 196.0, 284.0, 475.0, 820.0, 730.0, 440.0, 231.0, 159.0, 96.0, 70.0, 56.0, 42.0, 14.0, 13.0, 16.0, 14.0, 9.0, 2.0, 4.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1298828125, -1.0906524658203125, -1.051422119140625, -1.0121917724609375, -0.97296142578125, -0.9337310791015625, -0.894500732421875, -0.8552703857421875, -0.8160400390625, -0.7768096923828125, -0.737579345703125, -0.6983489990234375, -0.65911865234375, -0.6198883056640625, -0.580657958984375, -0.5414276123046875, -0.502197265625, -0.4629669189453125, -0.423736572265625, -0.3845062255859375, -0.34527587890625, -0.3060455322265625, -0.266815185546875, -0.2275848388671875, -0.1883544921875, -0.1491241455078125, -0.109893798828125, -0.0706634521484375, -0.03143310546875, 0.0077972412109375, 0.047027587890625, 0.0862579345703125, 0.12548828125, 0.1647186279296875, 0.203948974609375, 0.2431793212890625, 0.28240966796875, 0.3216400146484375, 0.360870361328125, 0.4001007080078125, 0.4393310546875, 0.4785614013671875, 0.517791748046875, 0.5570220947265625, 0.59625244140625, 0.6354827880859375, 0.674713134765625, 0.7139434814453125, 0.753173828125, 0.7924041748046875, 0.831634521484375, 0.8708648681640625, 0.91009521484375, 0.9493255615234375, 0.988555908203125, 1.0277862548828125, 1.0670166015625, 1.1062469482421875, 1.145477294921875, 1.1847076416015625, 1.22393798828125, 1.2631683349609375, 1.302398681640625, 1.3416290283203125, 1.380859375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 8.0, 3.0, 6.0, 20.0, 27.0, 62.0, 106.0, 177.0, 202.0, 175.0, 100.0, 50.0, 27.0, 22.0, 11.0, 7.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.979576110839844, -20.517967224121094, -20.056358337402344, -19.594751358032227, -19.133142471313477, -18.671533584594727, -18.209924697875977, -17.748315811157227, -17.28670883178711, -16.82509994506836, -16.36349105834961, -15.901883125305176, -15.440275192260742, -14.978666305541992, -14.517057418823242, -14.055448532104492, -13.593839645385742, -13.132230758666992, -12.670622825622559, -12.209013938903809, -11.747406005859375, -11.285797119140625, -10.824188232421875, -10.362579345703125, -9.900971412658691, -9.439362525939941, -8.977754592895508, -8.516145706176758, -8.054536819458008, -7.592928886413574, -7.131319999694824, -6.669711589813232, -6.208104133605957, -5.746495723724365, -5.284887313842773, -4.823278427124023, -4.361670017242432, -3.90006160736084, -3.438452959060669, -2.976844310760498, -2.5152359008789062, -2.0536274909973145, -1.5920188426971436, -1.1304103136062622, -0.6688017845153809, -0.20719337463378906, 0.25441527366638184, 0.7160239219665527, 1.1776323318481445, 1.6392408609390259, 2.1008493900299072, 2.562458038330078, 3.02406644821167, 3.4856748580932617, 3.9472835063934326, 4.4088921546936035, 4.870500564575195, 5.332108974456787, 5.793717384338379, 6.255326271057129, 6.716934680938721, 7.1785430908203125, 7.6401519775390625, 8.101760864257812, 8.563368797302246]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 6.0, 2.0, 5.0, 6.0, 8.0, 21.0, 21.0, 26.0, 18.0, 30.0, 26.0, 39.0, 39.0, 44.0, 42.0, 59.0, 58.0, 59.0, 72.0, 67.0, 45.0, 48.0, 33.0, 31.0, 35.0, 38.0, 27.0, 23.0, 17.0, 8.0, 6.0, 7.0, 10.0, 4.0, 6.0, 6.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.653155326843262, -5.467251300811768, -5.281346797943115, -5.095442771911621, -4.909538745880127, -4.723634719848633, -4.5377302169799805, -4.351826190948486, -4.165922164916992, -3.980017900466919, -3.794113874435425, -3.6082096099853516, -3.4223055839538574, -3.236401319503784, -3.050497055053711, -2.864593029022217, -2.6786885261535645, -2.492784261703491, -2.306880235671997, -2.120975971221924, -1.9350718259811401, -1.7491676807403564, -1.5632634162902832, -1.3773592710494995, -1.1914551258087158, -1.0055509805679321, -0.8196467757225037, -0.6337425708770752, -0.4478384256362915, -0.2619342803955078, -0.07603001594543457, 0.10987412929534912, 0.2957782745361328, 0.4816824495792389, 0.667586624622345, 0.8534908294677734, 1.0393949747085571, 1.2252991199493408, 1.411203384399414, 1.5971075296401978, 1.7830116748809814, 1.9689158201217651, 2.154819965362549, 2.340724229812622, 2.5266284942626953, 2.7125325202941895, 2.8984367847442627, 3.084341049194336, 3.27024507522583, 3.4561493396759033, 3.6420533657073975, 3.8279576301574707, 4.013861656188965, 4.199766159057617, 4.385670185089111, 4.5715742111206055, 4.757478713989258, 4.943382740020752, 5.129287242889404, 5.315191268920898, 5.501095294952393, 5.686999320983887, 5.872903823852539, 6.058807849884033, 6.244711875915527]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 7.0, 15.0, 12.0, 34.0, 33.0, 57.0, 56.0, 100.0, 130.0, 209.0, 321.0, 538.0, 1011.0, 1940.0, 4139.0, 9740.0, 29186.0, 131376.0, 688092.0, 133679.0, 29251.0, 10021.0, 4147.0, 1917.0, 1010.0, 569.0, 302.0, 198.0, 129.0, 113.0, 55.0, 47.0, 36.0, 21.0, 13.0, 13.0, 8.0, 10.0, 5.0, 4.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.517578125, -0.499420166015625, -0.48126220703125, -0.463104248046875, -0.4449462890625, -0.426788330078125, -0.40863037109375, -0.390472412109375, -0.372314453125, -0.354156494140625, -0.33599853515625, -0.317840576171875, -0.2996826171875, -0.281524658203125, -0.26336669921875, -0.245208740234375, -0.22705078125, -0.208892822265625, -0.19073486328125, -0.172576904296875, -0.1544189453125, -0.136260986328125, -0.11810302734375, -0.099945068359375, -0.081787109375, -0.063629150390625, -0.04547119140625, -0.027313232421875, -0.0091552734375, 0.009002685546875, 0.02716064453125, 0.045318603515625, 0.0634765625, 0.081634521484375, 0.09979248046875, 0.117950439453125, 0.1361083984375, 0.154266357421875, 0.17242431640625, 0.190582275390625, 0.208740234375, 0.226898193359375, 0.24505615234375, 0.263214111328125, 0.2813720703125, 0.299530029296875, 0.31768798828125, 0.335845947265625, 0.35400390625, 0.372161865234375, 0.39031982421875, 0.408477783203125, 0.4266357421875, 0.444793701171875, 0.46295166015625, 0.481109619140625, 0.499267578125, 0.517425537109375, 0.53558349609375, 0.553741455078125, 0.5718994140625, 0.590057373046875, 0.60821533203125, 0.626373291015625, 0.64453125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 5.0, 7.0, 6.0, 6.0, 6.0, 9.0, 11.0, 13.0, 17.0, 13.0, 29.0, 35.0, 33.0, 45.0, 31.0, 52.0, 48.0, 71.0, 58.0, 55.0, 55.0, 58.0, 52.0, 40.0, 38.0, 37.0, 29.0, 31.0, 23.0, 15.0, 11.0, 12.0, 14.0, 12.0, 6.0, 6.0, 0.0, 7.0, 2.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.393310546875, -0.3789405822753906, -0.36457061767578125, -0.3502006530761719, -0.3358306884765625, -0.3214607238769531, -0.30709075927734375, -0.2927207946777344, -0.278350830078125, -0.2639808654785156, -0.24961090087890625, -0.23524093627929688, -0.2208709716796875, -0.20650100708007812, -0.19213104248046875, -0.17776107788085938, -0.16339111328125, -0.14902114868164062, -0.13465118408203125, -0.12028121948242188, -0.1059112548828125, -0.09154129028320312, -0.07717132568359375, -0.06280136108398438, -0.048431396484375, -0.034061431884765625, -0.01969146728515625, -0.005321502685546875, 0.0090484619140625, 0.023418426513671875, 0.03778839111328125, 0.052158355712890625, 0.0665283203125, 0.08089828491210938, 0.09526824951171875, 0.10963821411132812, 0.1240081787109375, 0.13837814331054688, 0.15274810791015625, 0.16711807250976562, 0.181488037109375, 0.19585800170898438, 0.21022796630859375, 0.22459793090820312, 0.2389678955078125, 0.2533378601074219, 0.26770782470703125, 0.2820777893066406, 0.29644775390625, 0.3108177185058594, 0.32518768310546875, 0.3395576477050781, 0.3539276123046875, 0.3682975769042969, 0.38266754150390625, 0.3970375061035156, 0.411407470703125, 0.4257774353027344, 0.44014739990234375, 0.4545173645019531, 0.4688873291015625, 0.4832572937011719, 0.49762725830078125, 0.5119972229003906, 0.5263671875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 8.0, 8.0, 11.0, 13.0, 19.0, 42.0, 38.0, 84.0, 228.0, 638.0, 2904.0, 30249.0, 980712.0, 29747.0, 2765.0, 657.0, 218.0, 77.0, 50.0, 31.0, 24.0, 10.0, 8.0, 6.0, 5.0, 2.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7041015625, -1.6598358154296875, -1.615570068359375, -1.5713043212890625, -1.52703857421875, -1.4827728271484375, -1.438507080078125, -1.3942413330078125, -1.3499755859375, -1.3057098388671875, -1.261444091796875, -1.2171783447265625, -1.17291259765625, -1.1286468505859375, -1.084381103515625, -1.0401153564453125, -0.995849609375, -0.9515838623046875, -0.907318115234375, -0.8630523681640625, -0.81878662109375, -0.7745208740234375, -0.730255126953125, -0.6859893798828125, -0.6417236328125, -0.5974578857421875, -0.553192138671875, -0.5089263916015625, -0.46466064453125, -0.4203948974609375, -0.376129150390625, -0.3318634033203125, -0.28759765625, -0.2433319091796875, -0.199066162109375, -0.1548004150390625, -0.11053466796875, -0.0662689208984375, -0.022003173828125, 0.0222625732421875, 0.0665283203125, 0.1107940673828125, 0.155059814453125, 0.1993255615234375, 0.24359130859375, 0.2878570556640625, 0.332122802734375, 0.3763885498046875, 0.420654296875, 0.4649200439453125, 0.509185791015625, 0.5534515380859375, 0.59771728515625, 0.6419830322265625, 0.686248779296875, 0.7305145263671875, 0.7747802734375, 0.8190460205078125, 0.863311767578125, 0.9075775146484375, 0.95184326171875, 0.9961090087890625, 1.040374755859375, 1.0846405029296875, 1.12890625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 4.0, 4.0, 6.0, 8.0, 10.0, 9.0, 17.0, 10.0, 22.0, 27.0, 22.0, 27.0, 40.0, 45.0, 63.0, 79.0, 104.0, 98.0, 86.0, 62.0, 41.0, 41.0, 32.0, 24.0, 20.0, 20.0, 11.0, 15.0, 12.0, 8.0, 10.0, 2.0, 6.0, 6.0, 6.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.001953125, -1.9429473876953125, -1.883941650390625, -1.8249359130859375, -1.76593017578125, -1.7069244384765625, -1.647918701171875, -1.5889129638671875, -1.5299072265625, -1.4709014892578125, -1.411895751953125, -1.3528900146484375, -1.29388427734375, -1.2348785400390625, -1.175872802734375, -1.1168670654296875, -1.057861328125, -0.9988555908203125, -0.939849853515625, -0.8808441162109375, -0.82183837890625, -0.7628326416015625, -0.703826904296875, -0.6448211669921875, -0.5858154296875, -0.5268096923828125, -0.467803955078125, -0.4087982177734375, -0.34979248046875, -0.2907867431640625, -0.231781005859375, -0.1727752685546875, -0.11376953125, -0.0547637939453125, 0.004241943359375, 0.0632476806640625, 0.12225341796875, 0.1812591552734375, 0.240264892578125, 0.2992706298828125, 0.3582763671875, 0.4172821044921875, 0.476287841796875, 0.5352935791015625, 0.59429931640625, 0.6533050537109375, 0.712310791015625, 0.7713165283203125, 0.830322265625, 0.8893280029296875, 0.948333740234375, 1.0073394775390625, 1.06634521484375, 1.1253509521484375, 1.184356689453125, 1.2433624267578125, 1.3023681640625, 1.3613739013671875, 1.420379638671875, 1.4793853759765625, 1.53839111328125, 1.5973968505859375, 1.656402587890625, 1.7154083251953125, 1.7744140625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 6.0, 0.0, 1.0, 8.0, 3.0, 5.0, 7.0, 13.0, 17.0, 27.0, 46.0, 48.0, 93.0, 179.0, 291.0, 586.0, 1343.0, 3772.0, 12277.0, 58427.0, 867423.0, 80781.0, 15338.0, 4656.0, 1630.0, 716.0, 377.0, 184.0, 78.0, 67.0, 40.0, 23.0, 17.0, 18.0, 11.0, 10.0, 8.0, 7.0, 5.0, 2.0, 6.0, 3.0, 4.0, 2.0, 4.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.13916015625, -0.13460922241210938, -0.13005828857421875, -0.12550735473632812, -0.1209564208984375, -0.11640548706054688, -0.11185455322265625, -0.10730361938476562, -0.102752685546875, -0.09820175170898438, -0.09365081787109375, -0.08909988403320312, -0.0845489501953125, -0.07999801635742188, -0.07544708251953125, -0.07089614868164062, -0.06634521484375, -0.061794281005859375, -0.05724334716796875, -0.052692413330078125, -0.0481414794921875, -0.043590545654296875, -0.03903961181640625, -0.034488677978515625, -0.029937744140625, -0.025386810302734375, -0.02083587646484375, -0.016284942626953125, -0.0117340087890625, -0.007183074951171875, -0.00263214111328125, 0.001918792724609375, 0.0064697265625, 0.011020660400390625, 0.01557159423828125, 0.020122528076171875, 0.0246734619140625, 0.029224395751953125, 0.03377532958984375, 0.038326263427734375, 0.042877197265625, 0.047428131103515625, 0.05197906494140625, 0.056529998779296875, 0.0610809326171875, 0.06563186645507812, 0.07018280029296875, 0.07473373413085938, 0.07928466796875, 0.08383560180664062, 0.08838653564453125, 0.09293746948242188, 0.0974884033203125, 0.10203933715820312, 0.10659027099609375, 0.11114120483398438, 0.115692138671875, 0.12024307250976562, 0.12479400634765625, 0.12934494018554688, 0.1338958740234375, 0.13844680786132812, 0.14299774169921875, 0.14754867553710938, 0.152099609375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 5.0, 3.0, 2.0, 4.0, 2.0, 1.0, 5.0, 6.0, 4.0, 9.0, 14.0, 10.0, 14.0, 14.0, 18.0, 33.0, 34.0, 49.0, 60.0, 59.0, 83.0, 85.0, 94.0, 85.0, 55.0, 54.0, 28.0, 22.0, 22.0, 30.0, 22.0, 15.0, 9.0, 10.0, 12.0, 9.0, 9.0, 5.0, 1.0, 5.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.510713577270508e-05, -3.388896584510803e-05, -3.2670795917510986e-05, -3.145262598991394e-05, -3.0234456062316895e-05, -2.901628613471985e-05, -2.7798116207122803e-05, -2.6579946279525757e-05, -2.536177635192871e-05, -2.4143606424331665e-05, -2.292543649673462e-05, -2.1707266569137573e-05, -2.0489096641540527e-05, -1.927092671394348e-05, -1.8052756786346436e-05, -1.683458685874939e-05, -1.5616416931152344e-05, -1.4398247003555298e-05, -1.3180077075958252e-05, -1.1961907148361206e-05, -1.074373722076416e-05, -9.525567293167114e-06, -8.307397365570068e-06, -7.0892274379730225e-06, -5.8710575103759766e-06, -4.652887582778931e-06, -3.4347176551818848e-06, -2.216547727584839e-06, -9.98377799987793e-07, 2.1979212760925293e-07, 1.4379620552062988e-06, 2.6561319828033447e-06, 3.874301910400391e-06, 5.0924718379974365e-06, 6.310641765594482e-06, 7.528811693191528e-06, 8.746981620788574e-06, 9.96515154838562e-06, 1.1183321475982666e-05, 1.2401491403579712e-05, 1.3619661331176758e-05, 1.4837831258773804e-05, 1.605600118637085e-05, 1.7274171113967896e-05, 1.849234104156494e-05, 1.9710510969161987e-05, 2.0928680896759033e-05, 2.214685082435608e-05, 2.3365020751953125e-05, 2.458319067955017e-05, 2.5801360607147217e-05, 2.7019530534744263e-05, 2.823770046234131e-05, 2.9455870389938354e-05, 3.06740403175354e-05, 3.1892210245132446e-05, 3.311038017272949e-05, 3.432855010032654e-05, 3.5546720027923584e-05, 3.676488995552063e-05, 3.7983059883117676e-05, 3.920122981071472e-05, 4.041939973831177e-05, 4.1637569665908813e-05, 4.285573959350586e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 8.0, 4.0, 10.0, 5.0, 10.0, 12.0, 29.0, 36.0, 37.0, 62.0, 89.0, 158.0, 259.0, 501.0, 1000.0, 2051.0, 4773.0, 12185.0, 37991.0, 239707.0, 684373.0, 42333.0, 13201.0, 5101.0, 2240.0, 1059.0, 511.0, 288.0, 167.0, 108.0, 64.0, 53.0, 43.0, 24.0, 17.0, 12.0, 11.0, 5.0, 3.0, 6.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1300048828125, -0.12552833557128906, -0.12105178833007812, -0.11657524108886719, -0.11209869384765625, -0.10762214660644531, -0.10314559936523438, -0.09866905212402344, -0.0941925048828125, -0.08971595764160156, -0.08523941040039062, -0.08076286315917969, -0.07628631591796875, -0.07180976867675781, -0.06733322143554688, -0.06285667419433594, -0.058380126953125, -0.05390357971191406, -0.049427032470703125, -0.04495048522949219, -0.04047393798828125, -0.03599739074707031, -0.031520843505859375, -0.027044296264648438, -0.0225677490234375, -0.018091201782226562, -0.013614654541015625, -0.009138107299804688, -0.00466156005859375, -0.0001850128173828125, 0.004291534423828125, 0.008768081665039062, 0.01324462890625, 0.017721176147460938, 0.022197723388671875, 0.026674270629882812, 0.03115081787109375, 0.03562736511230469, 0.040103912353515625, 0.04458045959472656, 0.0490570068359375, 0.05353355407714844, 0.058010101318359375, 0.06248664855957031, 0.06696319580078125, 0.07143974304199219, 0.07591629028320312, 0.08039283752441406, 0.084869384765625, 0.08934593200683594, 0.09382247924804688, 0.09829902648925781, 0.10277557373046875, 0.10725212097167969, 0.11172866821289062, 0.11620521545410156, 0.1206817626953125, 0.12515830993652344, 0.12963485717773438, 0.1341114044189453, 0.13858795166015625, 0.1430644989013672, 0.14754104614257812, 0.15201759338378906, 0.156494140625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 7.0, 5.0, 5.0, 7.0, 3.0, 6.0, 9.0, 6.0, 18.0, 16.0, 26.0, 43.0, 50.0, 51.0, 69.0, 80.0, 105.0, 82.0, 78.0, 65.0, 53.0, 45.0, 29.0, 28.0, 24.0, 21.0, 13.0, 9.0, 7.0, 7.0, 7.0, 0.0, 4.0, 7.0, 1.0, 4.0, 0.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1595458984375, -0.1541919708251953, -0.14883804321289062, -0.14348411560058594, -0.13813018798828125, -0.13277626037597656, -0.12742233276367188, -0.12206840515136719, -0.1167144775390625, -0.11136054992675781, -0.10600662231445312, -0.10065269470214844, -0.09529876708984375, -0.08994483947753906, -0.08459091186523438, -0.07923698425292969, -0.073883056640625, -0.06852912902832031, -0.06317520141601562, -0.05782127380371094, -0.05246734619140625, -0.04711341857910156, -0.041759490966796875, -0.03640556335449219, -0.0310516357421875, -0.025697708129882812, -0.020343780517578125, -0.014989852905273438, -0.00963592529296875, -0.0042819976806640625, 0.001071929931640625, 0.0064258575439453125, 0.01177978515625, 0.017133712768554688, 0.022487640380859375, 0.027841567993164062, 0.03319549560546875, 0.03854942321777344, 0.043903350830078125, 0.04925727844238281, 0.0546112060546875, 0.05996513366699219, 0.06531906127929688, 0.07067298889160156, 0.07602691650390625, 0.08138084411621094, 0.08673477172851562, 0.09208869934082031, 0.097442626953125, 0.10279655456542969, 0.10815048217773438, 0.11350440979003906, 0.11885833740234375, 0.12421226501464844, 0.12956619262695312, 0.1349201202392578, 0.1402740478515625, 0.1456279754638672, 0.15098190307617188, 0.15633583068847656, 0.16168975830078125, 0.16704368591308594, 0.17239761352539062, 0.1777515411376953, 0.18310546875]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 6.0, 17.0, 45.0, 164.0, 622.0, 118.0, 21.0, 5.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.1596999168396, -5.701000213623047, -5.242300033569336, -4.783600330352783, -4.3249006271362305, -3.8662004470825195, -3.407500743865967, -2.948800802230835, -2.490100860595703, -2.0314009189605713, -1.572701096534729, -1.1140012741088867, -0.6553013324737549, -0.19660139083862305, 0.2620983123779297, 0.7207982540130615, 1.1794981956481934, 1.6381981372833252, 2.096898078918457, 2.5555977821350098, 3.0142977237701416, 3.4729976654052734, 3.931697368621826, 4.390397071838379, 4.84909725189209, 5.307796955108643, 5.7664971351623535, 6.225196838378906, 6.683897018432617, 7.14259672164917, 7.601296424865723, 8.059996604919434, 8.518695831298828, 8.977396011352539, 9.436095237731934, 9.894795417785645, 10.353495597839355, 10.81219482421875, 11.270895004272461, 11.729595184326172, 12.188295364379883, 12.646995544433594, 13.105694770812988, 13.5643949508667, 14.02309513092041, 14.481794357299805, 14.940494537353516, 15.399194717407227, 15.857893943786621, 16.316593170166016, 16.775293350219727, 17.233993530273438, 17.69269371032715, 18.15139389038086, 18.610092163085938, 19.06879234313965, 19.52749252319336, 19.98619270324707, 20.44489288330078, 20.90359115600586, 21.36229133605957, 21.82099151611328, 22.279691696166992, 22.738391876220703, 23.197092056274414]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 3.0, 4.0, 7.0, 7.0, 12.0, 5.0, 16.0, 8.0, 14.0, 13.0, 23.0, 15.0, 18.0, 24.0, 51.0, 65.0, 95.0, 88.0, 85.0, 82.0, 102.0, 74.0, 31.0, 20.0, 20.0, 14.0, 17.0, 10.0, 7.0, 12.0, 6.0, 9.0, 11.0, 7.0, 8.0, 2.0, 3.0, 6.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.58046293258667, -4.4399027824401855, -4.299342632293701, -4.158782005310059, -4.018221855163574, -3.87766170501709, -3.7371015548706055, -3.596541404724121, -3.4559810161590576, -3.3154208660125732, -3.1748604774475098, -3.0343003273010254, -2.893740177154541, -2.7531797885894775, -2.612619638442993, -2.4720592498779297, -2.3314990997314453, -2.190938949584961, -2.0503785610198975, -1.909818410873413, -1.7692581415176392, -1.6286978721618652, -1.4881377220153809, -1.347577452659607, -1.207017183303833, -1.066456913948059, -0.9258967041969299, -0.7853364944458008, -0.6447762250900269, -0.5042159557342529, -0.3636557459831238, -0.22309553623199463, -0.0825347900390625, 0.05802544951438904, 0.19858568906784058, 0.3391459286212921, 0.47970616817474365, 0.6202664375305176, 0.7608266472816467, 0.9013868570327759, 1.0419471263885498, 1.1825073957443237, 1.3230676651000977, 1.463627815246582, 1.604188084602356, 1.7447483539581299, 1.8853085041046143, 2.0258688926696777, 2.166429042816162, 2.3069891929626465, 2.44754958152771, 2.5881097316741943, 2.728670120239258, 2.869230270385742, 3.0097904205322266, 3.150350570678711, 3.2909109592437744, 3.431471109390259, 3.5720314979553223, 3.7125916481018066, 3.853151798248291, 3.9937121868133545, 4.134272575378418, 4.274832725524902, 4.415392875671387]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 3.0, 3.0, 8.0, 3.0, 10.0, 1.0, 6.0, 12.0, 11.0, 16.0, 20.0, 23.0, 28.0, 40.0, 43.0, 38.0, 68.0, 163.0, 177.0, 57.0, 48.0, 37.0, 33.0, 27.0, 25.0, 21.0, 24.0, 12.0, 8.0, 8.0, 5.0, 7.0, 4.0, 3.0, 4.0, 3.0, 3.0, 0.0, 2.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4521484375, -0.43602752685546875, -0.4199066162109375, -0.40378570556640625, -0.387664794921875, -0.37154388427734375, -0.3554229736328125, -0.33930206298828125, -0.32318115234375, -0.30706024169921875, -0.2909393310546875, -0.27481842041015625, -0.258697509765625, -0.24257659912109375, -0.2264556884765625, -0.21033477783203125, -0.1942138671875, -0.17809295654296875, -0.1619720458984375, -0.14585113525390625, -0.129730224609375, -0.11360931396484375, -0.0974884033203125, -0.08136749267578125, -0.06524658203125, -0.04912567138671875, -0.0330047607421875, -0.01688385009765625, -0.000762939453125, 0.01535797119140625, 0.0314788818359375, 0.04759979248046875, 0.063720703125, 0.07984161376953125, 0.0959625244140625, 0.11208343505859375, 0.128204345703125, 0.14432525634765625, 0.1604461669921875, 0.17656707763671875, 0.19268798828125, 0.20880889892578125, 0.2249298095703125, 0.24105072021484375, 0.257171630859375, 0.27329254150390625, 0.2894134521484375, 0.30553436279296875, 0.3216552734375, 0.33777618408203125, 0.3538970947265625, 0.37001800537109375, 0.386138916015625, 0.40225982666015625, 0.4183807373046875, 0.43450164794921875, 0.45062255859375, 0.46674346923828125, 0.4828643798828125, 0.49898529052734375, 0.515106201171875, 0.5312271118164062, 0.5473480224609375, 0.5634689331054688, 0.57958984375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 7.0, 14.0, 6.0, 14.0, 12.0, 28.0, 28.0, 38.0, 57.0, 111.0, 210.0, 376.0, 757.0, 1657.0, 4257.0, 16392.0, 8268546.0, 82626.0, 8231.0, 2829.0, 1082.0, 554.0, 294.0, 199.0, 88.0, 55.0, 35.0, 22.0, 16.0, 16.0, 7.0, 4.0, 5.0, 6.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.2332375049591064, -2.167112350463867, -2.100986957550049, -2.0348615646362305, -1.9687364101409912, -1.9026111364364624, -1.8364858627319336, -1.7703605890274048, -1.704235315322876, -1.6381100416183472, -1.5719847679138184, -1.5058594942092896, -1.4397342205047607, -1.373608946800232, -1.3074836730957031, -1.2413583993911743, -1.1752331256866455, -1.1091078519821167, -1.042982578277588, -0.9768573045730591, -0.9107320308685303, -0.8446067571640015, -0.7784814834594727, -0.7123562097549438, -0.646230936050415, -0.5801056623458862, -0.5139803886413574, -0.4478551149368286, -0.3817298412322998, -0.315604567527771, -0.2494792938232422, -0.18335402011871338, -0.11722874641418457, -0.05110347270965576, 0.015021800994873047, 0.08114707469940186, 0.14727234840393066, 0.21339762210845947, 0.2795228958129883, 0.3456481695175171, 0.4117734432220459, 0.4778987169265747, 0.5440239906311035, 0.6101492643356323, 0.6762745380401611, 0.7423998117446899, 0.8085250854492188, 0.8746503591537476, 0.9407756328582764, 1.0069009065628052, 1.073026180267334, 1.1391514539718628, 1.2052767276763916, 1.2714020013809204, 1.3375272750854492, 1.403652548789978, 1.4697778224945068, 1.5359030961990356, 1.6020283699035645, 1.6681536436080933, 1.734278917312622, 1.8004041910171509, 1.8665294647216797, 1.9326547384262085, 1.9987800121307373]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 6.0, 3.0, 2.0, 4.0, 1.0, 8.0, 4.0, 3.0, 1.0, 3.0, 4.0, 6.0, 5.0, 1.0, 1.0, 8.0, 1.0, 6.0, 2.0, 3.0, 8.0, 2.0, 1.0, 2.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-4.284852504730225, -4.190340042114258, -4.095828056335449, -4.001315593719482, -3.9068031311035156, -3.812290668487549, -3.717778444290161, -3.6232662200927734, -3.5287537574768066, -3.43424129486084, -3.339729070663452, -3.2452168464660645, -3.1507043838500977, -3.056191921234131, -2.961679697036743, -2.8671674728393555, -2.7726550102233887, -2.678142547607422, -2.583630323410034, -2.4891180992126465, -2.3946056365966797, -2.300093173980713, -2.205580949783325, -2.1110687255859375, -2.0165562629699707, -1.9220439195632935, -1.8275315761566162, -1.733019232749939, -1.6385068893432617, -1.5439945459365845, -1.4494822025299072, -1.35496985912323, -1.2604575157165527, -1.1659451723098755, -1.0714328289031982, -0.976920485496521, -0.8824081420898438, -0.7878957986831665, -0.6933834552764893, -0.598871111869812, -0.5043587684631348, -0.4098464250564575, -0.3153340816497803, -0.22082173824310303, -0.12630939483642578, -0.031797051429748535, 0.06271529197692871, 0.15722763538360596, 0.2517399787902832, 0.34625232219696045, 0.4407646656036377, 0.5352770090103149, 0.6297893524169922, 0.7243016958236694, 0.8188140392303467, 0.9133263826370239, 1.0078387260437012, 1.1023510694503784, 1.1968634128570557, 1.291375756263733, 1.3858880996704102, 1.4804004430770874, 1.5749127864837646, 1.669425129890442, 1.7639374732971191]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 3.0, 4.0, 7.0, 9.0, 16.0, 24.0, 33.0, 36.0, 39.0, 56.0, 59.0, 82.0, 90.0, 98.0, 67.0, 68.0, 67.0, 58.0, 41.0, 37.0, 17.0, 18.0, 13.0, 17.0, 8.0, 9.0, 6.0, 4.0, 3.0, 7.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.40966796875, -0.394439697265625, -0.37921142578125, -0.363983154296875, -0.3487548828125, -0.333526611328125, -0.31829833984375, -0.303070068359375, -0.287841796875, -0.272613525390625, -0.25738525390625, -0.242156982421875, -0.2269287109375, -0.211700439453125, -0.19647216796875, -0.181243896484375, -0.166015625, -0.150787353515625, -0.13555908203125, -0.120330810546875, -0.1051025390625, -0.089874267578125, -0.07464599609375, -0.059417724609375, -0.044189453125, -0.028961181640625, -0.01373291015625, 0.001495361328125, 0.0167236328125, 0.031951904296875, 0.04718017578125, 0.062408447265625, 0.07763671875, 0.092864990234375, 0.10809326171875, 0.123321533203125, 0.1385498046875, 0.153778076171875, 0.16900634765625, 0.184234619140625, 0.199462890625, 0.214691162109375, 0.22991943359375, 0.245147705078125, 0.2603759765625, 0.275604248046875, 0.29083251953125, 0.306060791015625, 0.3212890625, 0.336517333984375, 0.35174560546875, 0.366973876953125, 0.3822021484375, 0.397430419921875, 0.41265869140625, 0.427886962890625, 0.443115234375, 0.458343505859375, 0.47357177734375, 0.488800048828125, 0.5040283203125, 0.519256591796875, 0.53448486328125, 0.549713134765625, 0.56494140625]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 6.0, 3.0, 5.0, 12.0, 18.0, 20.0, 55.0, 71.0, 98.0, 204.0, 418.0, 920.0, 2864.0, 15039.0, 141244.0, 317268.0, 37609.0, 5707.0, 1481.0, 562.0, 261.0, 153.0, 84.0, 64.0, 35.0, 21.0, 16.0, 15.0, 5.0, 3.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.623046875, -3.443878173828125, -3.26470947265625, -3.085540771484375, -2.9063720703125, -2.727203369140625, -2.54803466796875, -2.368865966796875, -2.189697265625, -2.010528564453125, -1.83135986328125, -1.652191162109375, -1.4730224609375, -1.293853759765625, -1.11468505859375, -0.935516357421875, -0.75634765625, -0.577178955078125, -0.39801025390625, -0.218841552734375, -0.0396728515625, 0.139495849609375, 0.31866455078125, 0.497833251953125, 0.677001953125, 0.856170654296875, 1.03533935546875, 1.214508056640625, 1.3936767578125, 1.572845458984375, 1.75201416015625, 1.931182861328125, 2.1103515625, 2.289520263671875, 2.46868896484375, 2.647857666015625, 2.8270263671875, 3.006195068359375, 3.18536376953125, 3.364532470703125, 3.543701171875, 3.722869873046875, 3.90203857421875, 4.081207275390625, 4.2603759765625, 4.439544677734375, 4.61871337890625, 4.797882080078125, 4.97705078125, 5.156219482421875, 5.33538818359375, 5.514556884765625, 5.6937255859375, 5.872894287109375, 6.05206298828125, 6.231231689453125, 6.410400390625, 6.589569091796875, 6.76873779296875, 6.947906494140625, 7.1270751953125, 7.306243896484375, 7.48541259765625, 7.664581298828125, 7.84375]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 1.0, 2.0, 8.0, 8.0, 7.0, 11.0, 18.0, 21.0, 23.0, 27.0, 32.0, 69.0, 54.0, 60.0, 66.0, 85.0, 73.0, 64.0, 58.0, 61.0, 52.0, 45.0, 38.0, 25.0, 26.0, 14.0, 17.0, 8.0, 8.0, 6.0, 4.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.456787109375, -0.4421653747558594, -0.42754364013671875, -0.4129219055175781, -0.3983001708984375, -0.3836784362792969, -0.36905670166015625, -0.3544349670410156, -0.339813232421875, -0.3251914978027344, -0.31056976318359375, -0.2959480285644531, -0.2813262939453125, -0.2667045593261719, -0.25208282470703125, -0.23746109008789062, -0.22283935546875, -0.20821762084960938, -0.19359588623046875, -0.17897415161132812, -0.1643524169921875, -0.14973068237304688, -0.13510894775390625, -0.12048721313476562, -0.105865478515625, -0.09124374389648438, -0.07662200927734375, -0.062000274658203125, -0.0473785400390625, -0.032756805419921875, -0.01813507080078125, -0.003513336181640625, 0.0111083984375, 0.025730133056640625, 0.04035186767578125, 0.054973602294921875, 0.0695953369140625, 0.08421707153320312, 0.09883880615234375, 0.11346054077148438, 0.128082275390625, 0.14270401000976562, 0.15732574462890625, 0.17194747924804688, 0.1865692138671875, 0.20119094848632812, 0.21581268310546875, 0.23043441772460938, 0.24505615234375, 0.2596778869628906, 0.27429962158203125, 0.2889213562011719, 0.3035430908203125, 0.3181648254394531, 0.33278656005859375, 0.3474082946777344, 0.362030029296875, 0.3766517639160156, 0.39127349853515625, 0.4058952331542969, 0.4205169677734375, 0.4351387023925781, 0.44976043701171875, 0.4643821716308594, 0.47900390625]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 7.0, 4.0, 4.0, 6.0, 11.0, 13.0, 21.0, 40.0, 74.0, 102.0, 86.0, 40.0, 21.0, 7.0, 9.0, 2.0, 5.0, 4.0, 6.0, 2.0, 6.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.2655529975891113, -3.1731772422790527, -3.080801486968994, -2.9884257316589355, -2.896049976348877, -2.8036742210388184, -2.7112984657287598, -2.618922710418701, -2.5265469551086426, -2.434171199798584, -2.3417954444885254, -2.249419689178467, -2.157043933868408, -2.0646681785583496, -1.972292423248291, -1.8799166679382324, -1.7875409126281738, -1.6951651573181152, -1.6027894020080566, -1.510413646697998, -1.4180378913879395, -1.3256621360778809, -1.2332863807678223, -1.1409106254577637, -1.048534870147705, -0.9561591148376465, -0.8637833595275879, -0.7714076042175293, -0.6790318489074707, -0.5866560935974121, -0.4942803382873535, -0.4019045829772949, -0.3095285892486572, -0.21715283393859863, -0.12477707862854004, -0.032401323318481445, 0.05997443199157715, 0.15235018730163574, 0.24472594261169434, 0.33710169792175293, 0.4294774532318115, 0.5218532085418701, 0.6142289638519287, 0.7066047191619873, 0.7989804744720459, 0.8913562297821045, 0.9837319850921631, 1.0761077404022217, 1.1684834957122803, 1.2608592510223389, 1.3532350063323975, 1.445610761642456, 1.5379865169525146, 1.6303622722625732, 1.7227380275726318, 1.8151137828826904, 1.907489538192749, 1.9998652935028076, 2.092241048812866, 2.184616804122925, 2.2769925594329834, 2.369368314743042, 2.4617440700531006, 2.554119825363159, 2.6464955806732178]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 6.0, 5.0, 6.0, 1.0, 5.0, 4.0, 11.0, 6.0, 11.0, 28.0, 58.0, 84.0, 94.0, 77.0, 25.0, 9.0, 8.0, 6.0, 6.0, 4.0, 5.0, 4.0, 1.0, 4.0, 1.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-2.5647969245910645, -2.487628936767578, -2.4104607105255127, -2.3332927227020264, -2.256124496459961, -2.1789565086364746, -2.101788282394409, -2.024620294570923, -1.947452187538147, -1.870284080505371, -1.7931159734725952, -1.7159478664398193, -1.638779878616333, -1.5616116523742676, -1.4844436645507812, -1.4072755575180054, -1.3301074504852295, -1.2529393434524536, -1.1757712364196777, -1.0986031293869019, -1.021435022354126, -0.9442669749259949, -0.8670989274978638, -0.7899308204650879, -0.712762713432312, -0.6355946063995361, -0.5584264993667603, -0.48125845193862915, -0.40409034490585327, -0.3269222378730774, -0.2497541606426239, -0.1725860834121704, -0.09541773796081543, -0.018249645829200745, 0.05891844630241394, 0.13608653843402863, 0.2132546305656433, 0.2904227375984192, 0.3675908148288727, 0.44475889205932617, 0.521926999092102, 0.5990951061248779, 0.6762632131576538, 0.7534312605857849, 0.8305993676185608, 0.9077674746513367, 0.9849355220794678, 1.0621036291122437, 1.1392717361450195, 1.2164398431777954, 1.2936079502105713, 1.3707760572433472, 1.447944164276123, 1.5251121520996094, 1.6022802591323853, 1.6794483661651611, 1.756616473197937, 1.833784580230713, 1.9109526872634888, 1.9881207942962646, 2.065288782119751, 2.1424570083618164, 2.2196249961853027, 2.296792984008789, 2.3739612102508545]}, "eval/loss": 0.3589690625667572, "eval/wer": 0.09641015470051567, "eval/runtime": 570.6282, "eval/samples_per_second": 4.63, "eval/steps_per_second": 0.58} \ No newline at end of file +{"train/loss": 0.0134, "train/learning_rate": 6.936416184971098e-07, "train/epoch": 10.0, "train/global_step": 2230, "_runtime": 51756, "_timestamp": 1648366446, "_step": 2234, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 9.0, 30.0, 111.0, 200.0, 305.0, 216.0, 87.0, 40.0, 11.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3592593669891357, -2.3074288368225098, -2.255598545074463, -2.203768014907837, -2.151937484741211, -2.100106954574585, -2.048276662826538, -1.996446132659912, -1.9446156024932861, -1.8927851915359497, -1.8409546613693237, -1.7891242504119873, -1.7372937202453613, -1.685463309288025, -1.633632779121399, -1.5818023681640625, -1.5299718379974365, -1.4781414270401, -1.4263108968734741, -1.3744804859161377, -1.3226499557495117, -1.2708195447921753, -1.2189890146255493, -1.167158603668213, -1.1153281927108765, -1.06349778175354, -1.011667251586914, -0.9598367810249329, -0.9080063104629517, -0.8561758995056152, -0.8043453693389893, -0.7525149583816528, -0.7006843686103821, -0.6488538980484009, -0.5970234274864197, -0.5451929569244385, -0.4933624863624573, -0.44153204560279846, -0.38970157504081726, -0.33787110447883606, -0.28604063391685486, -0.23421016335487366, -0.18237969279289246, -0.13054923713207245, -0.07871876657009125, -0.02688831090927124, 0.02494215965270996, 0.07677263021469116, 0.12860310077667236, 0.18043357133865356, 0.23226404190063477, 0.28409451246261597, 0.33592498302459717, 0.387755423784256, 0.4395858943462372, 0.4914163649082184, 0.543246865272522, 0.5950773358345032, 0.6469078063964844, 0.6987382769584656, 0.7505687475204468, 0.8023991584777832, 0.8542296886444092, 0.9060600996017456, 0.9578905701637268]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 7.0, 10.0, 11.0, 15.0, 19.0, 22.0, 24.0, 39.0, 22.0, 38.0, 43.0, 41.0, 48.0, 48.0, 49.0, 51.0, 56.0, 44.0, 49.0, 42.0, 36.0, 39.0, 35.0, 28.0, 34.0, 18.0, 24.0, 25.0, 18.0, 17.0, 13.0, 6.0, 10.0, 4.0, 3.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4530882239341736, -0.4375229775905609, -0.42195773124694824, -0.40639248490333557, -0.3908272385597229, -0.37526199221611023, -0.35969674587249756, -0.3441315293312073, -0.3285662531852722, -0.31300100684165955, -0.2974357604980469, -0.2818705141544342, -0.26630526781082153, -0.25074002146720886, -0.23517479002475739, -0.21960954368114471, -0.20404431223869324, -0.18847906589508057, -0.1729138195514679, -0.15734857320785522, -0.14178332686424255, -0.12621808052062988, -0.1106528490781784, -0.09508760273456573, -0.07952235639095306, -0.0639571100473404, -0.04839186742901802, -0.03282662481069565, -0.017261378467082977, -0.0016961321234703064, 0.013869106769561768, 0.02943435311317444, 0.04499959945678711, 0.06056484580039978, 0.07613009214401245, 0.09169533103704453, 0.1072605773806572, 0.12282582372426987, 0.13839106261730194, 0.1539563089609146, 0.16952155530452728, 0.18508680164813995, 0.20065204799175262, 0.2162172794342041, 0.23178252577781677, 0.24734777212142944, 0.2629130184650421, 0.2784782648086548, 0.29404351115226746, 0.3096087574958801, 0.3251740038394928, 0.34073925018310547, 0.35630449652671814, 0.3718697428703308, 0.3874349594116211, 0.40300023555755615, 0.41856545209884644, 0.4341306984424591, 0.4496959447860718, 0.46526119112968445, 0.4808264374732971, 0.4963916838169098, 0.5119569301605225, 0.5275221467018127, 0.5430874228477478]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 14.0, 13.0, 14.0, 21.0, 30.0, 36.0, 48.0, 62.0, 98.0, 147.0, 212.0, 322.0, 507.0, 747.0, 1173.0, 1811.0, 3182.0, 6017.0, 12088.0, 30614.0, 128466.0, 602238.0, 2024053.0, 1052782.0, 239315.0, 55238.0, 17617.0, 7380.0, 3974.0, 2237.0, 1354.0, 854.0, 546.0, 349.0, 221.0, 154.0, 102.0, 71.0, 47.0, 35.0, 37.0, 16.0, 14.0, 7.0, 6.0, 6.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.86083984375, -0.835296630859375, -0.80975341796875, -0.784210205078125, -0.7586669921875, -0.733123779296875, -0.70758056640625, -0.682037353515625, -0.656494140625, -0.630950927734375, -0.60540771484375, -0.579864501953125, -0.5543212890625, -0.528778076171875, -0.50323486328125, -0.477691650390625, -0.4521484375, -0.426605224609375, -0.40106201171875, -0.375518798828125, -0.3499755859375, -0.324432373046875, -0.29888916015625, -0.273345947265625, -0.247802734375, -0.222259521484375, -0.19671630859375, -0.171173095703125, -0.1456298828125, -0.120086669921875, -0.09454345703125, -0.069000244140625, -0.04345703125, -0.017913818359375, 0.00762939453125, 0.033172607421875, 0.0587158203125, 0.084259033203125, 0.10980224609375, 0.135345458984375, 0.160888671875, 0.186431884765625, 0.21197509765625, 0.237518310546875, 0.2630615234375, 0.288604736328125, 0.31414794921875, 0.339691162109375, 0.365234375, 0.390777587890625, 0.41632080078125, 0.441864013671875, 0.4674072265625, 0.492950439453125, 0.51849365234375, 0.544036865234375, 0.569580078125, 0.595123291015625, 0.62066650390625, 0.646209716796875, 0.6717529296875, 0.697296142578125, 0.72283935546875, 0.748382568359375, 0.77392578125]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 2.0, 9.0, 5.0, 2.0, 5.0, 15.0, 16.0, 10.0, 27.0, 24.0, 27.0, 25.0, 40.0, 51.0, 38.0, 33.0, 52.0, 66.0, 52.0, 44.0, 41.0, 41.0, 56.0, 35.0, 50.0, 41.0, 25.0, 27.0, 22.0, 25.0, 16.0, 19.0, 12.0, 14.0, 16.0, 9.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.69384765625, -0.668426513671875, -0.64300537109375, -0.617584228515625, -0.5921630859375, -0.566741943359375, -0.54132080078125, -0.515899658203125, -0.490478515625, -0.465057373046875, -0.43963623046875, -0.414215087890625, -0.3887939453125, -0.363372802734375, -0.33795166015625, -0.312530517578125, -0.287109375, -0.261688232421875, -0.23626708984375, -0.210845947265625, -0.1854248046875, -0.160003662109375, -0.13458251953125, -0.109161376953125, -0.083740234375, -0.058319091796875, -0.03289794921875, -0.007476806640625, 0.0179443359375, 0.043365478515625, 0.06878662109375, 0.094207763671875, 0.11962890625, 0.145050048828125, 0.17047119140625, 0.195892333984375, 0.2213134765625, 0.246734619140625, 0.27215576171875, 0.297576904296875, 0.322998046875, 0.348419189453125, 0.37384033203125, 0.399261474609375, 0.4246826171875, 0.450103759765625, 0.47552490234375, 0.500946044921875, 0.5263671875, 0.551788330078125, 0.57720947265625, 0.602630615234375, 0.6280517578125, 0.653472900390625, 0.67889404296875, 0.704315185546875, 0.729736328125, 0.755157470703125, 0.78057861328125, 0.805999755859375, 0.8314208984375, 0.856842041015625, 0.88226318359375, 0.907684326171875, 0.93310546875]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 5.0, 19.0, 37.0, 79.0, 590.0, 4178993.0, 14102.0, 338.0, 69.0, 27.0, 10.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.078125, -17.251220703125, -16.42431640625, -15.597412109375, -14.7705078125, -13.943603515625, -13.11669921875, -12.289794921875, -11.462890625, -10.635986328125, -9.80908203125, -8.982177734375, -8.1552734375, -7.328369140625, -6.50146484375, -5.674560546875, -4.84765625, -4.020751953125, -3.19384765625, -2.366943359375, -1.5400390625, -0.713134765625, 0.11376953125, 0.940673828125, 1.767578125, 2.594482421875, 3.42138671875, 4.248291015625, 5.0751953125, 5.902099609375, 6.72900390625, 7.555908203125, 8.3828125, 9.209716796875, 10.03662109375, 10.863525390625, 11.6904296875, 12.517333984375, 13.34423828125, 14.171142578125, 14.998046875, 15.824951171875, 16.65185546875, 17.478759765625, 18.3056640625, 19.132568359375, 19.95947265625, 20.786376953125, 21.61328125, 22.440185546875, 23.26708984375, 24.093994140625, 24.9208984375, 25.747802734375, 26.57470703125, 27.401611328125, 28.228515625, 29.055419921875, 29.88232421875, 30.709228515625, 31.5361328125, 32.363037109375, 33.18994140625, 34.016845703125, 34.84375]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 4.0, 4.0, 29.0, 38.0, 139.0, 570.0, 2697.0, 421.0, 114.0, 35.0, 13.0, 6.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.96533203125, -0.9287796020507812, -0.8922271728515625, -0.8556747436523438, -0.819122314453125, -0.7825698852539062, -0.7460174560546875, -0.7094650268554688, -0.67291259765625, -0.6363601684570312, -0.5998077392578125, -0.5632553100585938, -0.526702880859375, -0.49015045166015625, -0.4535980224609375, -0.41704559326171875, -0.3804931640625, -0.34394073486328125, -0.3073883056640625, -0.27083587646484375, -0.234283447265625, -0.19773101806640625, -0.1611785888671875, -0.12462615966796875, -0.08807373046875, -0.05152130126953125, -0.0149688720703125, 0.02158355712890625, 0.058135986328125, 0.09468841552734375, 0.1312408447265625, 0.16779327392578125, 0.204345703125, 0.24089813232421875, 0.2774505615234375, 0.31400299072265625, 0.350555419921875, 0.38710784912109375, 0.4236602783203125, 0.46021270751953125, 0.49676513671875, 0.5333175659179688, 0.5698699951171875, 0.6064224243164062, 0.642974853515625, 0.6795272827148438, 0.7160797119140625, 0.7526321411132812, 0.7891845703125, 0.8257369995117188, 0.8622894287109375, 0.8988418579101562, 0.935394287109375, 0.9719467163085938, 1.0084991455078125, 1.0450515747070312, 1.08160400390625, 1.1181564331054688, 1.1547088623046875, 1.1912612915039062, 1.227813720703125, 1.2643661499023438, 1.3009185791015625, 1.3374710083007812, 1.3740234375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 6.0, 9.0, 11.0, 13.0, 15.0, 18.0, 31.0, 30.0, 35.0, 51.0, 69.0, 69.0, 78.0, 91.0, 106.0, 73.0, 57.0, 56.0, 46.0, 29.0, 34.0, 18.0, 14.0, 14.0, 6.0, 7.0, 4.0, 5.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.1353092193603516, -1.1050784587860107, -1.0748478174209595, -1.0446170568466187, -1.0143862962722778, -0.9841555953025818, -0.9539248943328857, -0.9236941337585449, -0.8934634327888489, -0.8632327318191528, -0.833001971244812, -0.802771270275116, -0.7725405693054199, -0.7423098087310791, -0.7120791077613831, -0.681848406791687, -0.6516176462173462, -0.6213869452476501, -0.5911561846733093, -0.5609254837036133, -0.5306947231292725, -0.5004640221595764, -0.47023332118988037, -0.44000259041786194, -0.4097718596458435, -0.3795411288738251, -0.34931039810180664, -0.3190796971321106, -0.28884896636009216, -0.25861823558807373, -0.2283875197172165, -0.19815680384635925, -0.16792601346969604, -0.1376952826976776, -0.10746456682682037, -0.07723384350538254, -0.0470031201839447, -0.01677238941192627, 0.01345832645893097, 0.04368904232978821, 0.07391977310180664, 0.10415049642324448, 0.1343812197446823, 0.16461193561553955, 0.19484266638755798, 0.22507339715957642, 0.25530409812927246, 0.2855348289012909, 0.3157655596733093, 0.34599629044532776, 0.3762270212173462, 0.40645772218704224, 0.43668845295906067, 0.4669191837310791, 0.49714988470077515, 0.5273805856704712, 0.557611346244812, 0.5878420472145081, 0.6180728077888489, 0.6483035087585449, 0.6785342693328857, 0.7087649703025818, 0.7389956712722778, 0.7692264318466187, 0.7994571328163147]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 6.0, 2.0, 4.0, 8.0, 10.0, 8.0, 11.0, 26.0, 22.0, 29.0, 32.0, 23.0, 43.0, 37.0, 45.0, 41.0, 28.0, 50.0, 45.0, 46.0, 40.0, 44.0, 47.0, 35.0, 44.0, 53.0, 28.0, 36.0, 24.0, 25.0, 21.0, 9.0, 17.0, 11.0, 20.0, 9.0, 7.0, 7.0, 3.0, 6.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6483617424964905, -0.6281723380088806, -0.607982873916626, -0.5877934694290161, -0.5676040053367615, -0.5474146008491516, -0.527225136756897, -0.5070357322692871, -0.48684626817703247, -0.4666568338871002, -0.44646739959716797, -0.4262779653072357, -0.40608853101730347, -0.3858990967273712, -0.36570966243743896, -0.3455202579498291, -0.32533082365989685, -0.3051413893699646, -0.28495195508003235, -0.2647625207901001, -0.24457308650016785, -0.2243836522102356, -0.20419423282146454, -0.1840047985315323, -0.16381536424160004, -0.14362592995166779, -0.12343649566173553, -0.10324706882238388, -0.08305763453245163, -0.06286820024251938, -0.042678773403167725, -0.022489339113235474, -0.0022999048233032227, 0.01788952760398388, 0.03807896003127098, 0.05826839059591293, 0.07845782488584518, 0.09864725917577744, 0.11883668601512909, 0.13902612030506134, 0.1592155545949936, 0.17940498888492584, 0.1995944231748581, 0.21978384256362915, 0.2399732768535614, 0.26016271114349365, 0.2803521454334259, 0.30054157972335815, 0.3207310140132904, 0.34092044830322266, 0.3611098825931549, 0.38129931688308716, 0.4014887511730194, 0.42167818546295166, 0.4418675899505615, 0.46205705404281616, 0.482246458530426, 0.5024358630180359, 0.5226253271102905, 0.5428147315979004, 0.563004195690155, 0.5831936001777649, 0.6033830642700195, 0.6235724687576294, 0.643761932849884]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 9.0, 1.0, 7.0, 12.0, 21.0, 28.0, 34.0, 58.0, 73.0, 147.0, 208.0, 310.0, 539.0, 842.0, 1393.0, 2397.0, 4277.0, 7140.0, 12779.0, 23155.0, 42211.0, 77846.0, 141425.0, 236640.0, 218332.0, 125422.0, 68411.0, 37037.0, 20560.0, 11411.0, 6471.0, 3693.0, 2276.0, 1323.0, 760.0, 479.0, 308.0, 183.0, 101.0, 86.0, 43.0, 35.0, 21.0, 19.0, 14.0, 15.0, 6.0, 5.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.2308349609375, -0.22359848022460938, -0.21636199951171875, -0.20912551879882812, -0.2018890380859375, -0.19465255737304688, -0.18741607666015625, -0.18017959594726562, -0.172943115234375, -0.16570663452148438, -0.15847015380859375, -0.15123367309570312, -0.1439971923828125, -0.13676071166992188, -0.12952423095703125, -0.12228775024414062, -0.11505126953125, -0.10781478881835938, -0.10057830810546875, -0.09334182739257812, -0.0861053466796875, -0.07886886596679688, -0.07163238525390625, -0.06439590454101562, -0.057159423828125, -0.049922943115234375, -0.04268646240234375, -0.035449981689453125, -0.0282135009765625, -0.020977020263671875, -0.01374053955078125, -0.006504058837890625, 0.000732421875, 0.007968902587890625, 0.01520538330078125, 0.022441864013671875, 0.0296783447265625, 0.036914825439453125, 0.04415130615234375, 0.051387786865234375, 0.058624267578125, 0.06586074829101562, 0.07309722900390625, 0.08033370971679688, 0.0875701904296875, 0.09480667114257812, 0.10204315185546875, 0.10927963256835938, 0.11651611328125, 0.12375259399414062, 0.13098907470703125, 0.13822555541992188, 0.1454620361328125, 0.15269851684570312, 0.15993499755859375, 0.16717147827148438, 0.174407958984375, 0.18164443969726562, 0.18888092041015625, 0.19611740112304688, 0.2033538818359375, 0.21059036254882812, 0.21782684326171875, 0.22506332397460938, 0.2322998046875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 7.0, 5.0, 9.0, 13.0, 32.0, 21.0, 24.0, 29.0, 40.0, 30.0, 44.0, 37.0, 49.0, 35.0, 50.0, 51.0, 61.0, 40.0, 49.0, 45.0, 45.0, 35.0, 30.0, 40.0, 32.0, 22.0, 25.0, 19.0, 9.0, 11.0, 13.0, 11.0, 9.0, 6.0, 9.0, 1.0, 0.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.45654296875, -0.4424400329589844, -0.42833709716796875, -0.4142341613769531, -0.4001312255859375, -0.3860282897949219, -0.37192535400390625, -0.3578224182128906, -0.343719482421875, -0.3296165466308594, -0.31551361083984375, -0.3014106750488281, -0.2873077392578125, -0.2732048034667969, -0.25910186767578125, -0.24499893188476562, -0.23089599609375, -0.21679306030273438, -0.20269012451171875, -0.18858718872070312, -0.1744842529296875, -0.16038131713867188, -0.14627838134765625, -0.13217544555664062, -0.118072509765625, -0.10396957397460938, -0.08986663818359375, -0.07576370239257812, -0.0616607666015625, -0.047557830810546875, -0.03345489501953125, -0.019351959228515625, -0.0052490234375, 0.008853912353515625, 0.02295684814453125, 0.037059783935546875, 0.0511627197265625, 0.06526565551757812, 0.07936859130859375, 0.09347152709960938, 0.107574462890625, 0.12167739868164062, 0.13578033447265625, 0.14988327026367188, 0.1639862060546875, 0.17808914184570312, 0.19219207763671875, 0.20629501342773438, 0.22039794921875, 0.23450088500976562, 0.24860382080078125, 0.2627067565917969, 0.2768096923828125, 0.2909126281738281, 0.30501556396484375, 0.3191184997558594, 0.333221435546875, 0.3473243713378906, 0.36142730712890625, 0.3755302429199219, 0.3896331787109375, 0.4037361145019531, 0.41783905029296875, 0.4319419860839844, 0.446044921875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 9.0, 16.0, 13.0, 30.0, 28.0, 52.0, 66.0, 109.0, 234.0, 364.0, 769.0, 1422.0, 3143.0, 8148.0, 23704.0, 77312.0, 283738.0, 445985.0, 140916.0, 40421.0, 13068.0, 4750.0, 2090.0, 991.0, 468.0, 267.0, 173.0, 94.0, 56.0, 43.0, 23.0, 16.0, 12.0, 7.0, 3.0, 6.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.38720703125, -0.37480926513671875, -0.3624114990234375, -0.35001373291015625, -0.337615966796875, -0.32521820068359375, -0.3128204345703125, -0.30042266845703125, -0.28802490234375, -0.27562713623046875, -0.2632293701171875, -0.25083160400390625, -0.238433837890625, -0.22603607177734375, -0.2136383056640625, -0.20124053955078125, -0.1888427734375, -0.17644500732421875, -0.1640472412109375, -0.15164947509765625, -0.139251708984375, -0.12685394287109375, -0.1144561767578125, -0.10205841064453125, -0.08966064453125, -0.07726287841796875, -0.0648651123046875, -0.05246734619140625, -0.040069580078125, -0.02767181396484375, -0.0152740478515625, -0.00287628173828125, 0.009521484375, 0.02191925048828125, 0.0343170166015625, 0.04671478271484375, 0.059112548828125, 0.07151031494140625, 0.0839080810546875, 0.09630584716796875, 0.10870361328125, 0.12110137939453125, 0.1334991455078125, 0.14589691162109375, 0.158294677734375, 0.17069244384765625, 0.1830902099609375, 0.19548797607421875, 0.2078857421875, 0.22028350830078125, 0.2326812744140625, 0.24507904052734375, 0.257476806640625, 0.26987457275390625, 0.2822723388671875, 0.29467010498046875, 0.30706787109375, 0.31946563720703125, 0.3318634033203125, 0.34426116943359375, 0.356658935546875, 0.36905670166015625, 0.3814544677734375, 0.39385223388671875, 0.40625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 7.0, 1.0, 6.0, 6.0, 5.0, 8.0, 11.0, 11.0, 11.0, 17.0, 12.0, 15.0, 14.0, 26.0, 29.0, 25.0, 29.0, 35.0, 21.0, 31.0, 49.0, 43.0, 46.0, 48.0, 44.0, 34.0, 36.0, 34.0, 32.0, 41.0, 32.0, 34.0, 25.0, 29.0, 26.0, 15.0, 24.0, 18.0, 17.0, 13.0, 12.0, 7.0, 14.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7392578125, -0.7140655517578125, -0.688873291015625, -0.6636810302734375, -0.63848876953125, -0.6132965087890625, -0.588104248046875, -0.5629119873046875, -0.5377197265625, -0.5125274658203125, -0.487335205078125, -0.4621429443359375, -0.43695068359375, -0.4117584228515625, -0.386566162109375, -0.3613739013671875, -0.336181640625, -0.3109893798828125, -0.285797119140625, -0.2606048583984375, -0.23541259765625, -0.2102203369140625, -0.185028076171875, -0.1598358154296875, -0.1346435546875, -0.1094512939453125, -0.084259033203125, -0.0590667724609375, -0.03387451171875, -0.0086822509765625, 0.016510009765625, 0.0417022705078125, 0.06689453125, 0.0920867919921875, 0.117279052734375, 0.1424713134765625, 0.16766357421875, 0.1928558349609375, 0.218048095703125, 0.2432403564453125, 0.2684326171875, 0.2936248779296875, 0.318817138671875, 0.3440093994140625, 0.36920166015625, 0.3943939208984375, 0.419586181640625, 0.4447784423828125, 0.469970703125, 0.4951629638671875, 0.520355224609375, 0.5455474853515625, 0.57073974609375, 0.5959320068359375, 0.621124267578125, 0.6463165283203125, 0.6715087890625, 0.6967010498046875, 0.721893310546875, 0.7470855712890625, 0.77227783203125, 0.7974700927734375, 0.822662353515625, 0.8478546142578125, 0.873046875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 6.0, 7.0, 5.0, 18.0, 31.0, 34.0, 57.0, 87.0, 134.0, 254.0, 420.0, 728.0, 1376.0, 2871.0, 5907.0, 13614.0, 37320.0, 123114.0, 424889.0, 309507.0, 81611.0, 26653.0, 10439.0, 4590.0, 2218.0, 1147.0, 629.0, 348.0, 219.0, 110.0, 88.0, 46.0, 32.0, 17.0, 12.0, 8.0, 7.0, 5.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.062347412109375, -0.06044912338256836, -0.05855083465576172, -0.05665254592895508, -0.05475425720214844, -0.0528559684753418, -0.050957679748535156, -0.049059391021728516, -0.047161102294921875, -0.045262813568115234, -0.043364524841308594, -0.04146623611450195, -0.03956794738769531, -0.03766965866088867, -0.03577136993408203, -0.03387308120727539, -0.03197479248046875, -0.03007650375366211, -0.02817821502685547, -0.026279926300048828, -0.024381637573242188, -0.022483348846435547, -0.020585060119628906, -0.018686771392822266, -0.016788482666015625, -0.014890193939208984, -0.012991905212402344, -0.011093616485595703, -0.009195327758789062, -0.007297039031982422, -0.005398750305175781, -0.0035004615783691406, -0.0016021728515625, 0.0002961158752441406, 0.0021944046020507812, 0.004092693328857422, 0.0059909820556640625, 0.007889270782470703, 0.009787559509277344, 0.011685848236083984, 0.013584136962890625, 0.015482425689697266, 0.017380714416503906, 0.019279003143310547, 0.021177291870117188, 0.023075580596923828, 0.02497386932373047, 0.02687215805053711, 0.02877044677734375, 0.03066873550415039, 0.03256702423095703, 0.03446531295776367, 0.03636360168457031, 0.03826189041137695, 0.040160179138183594, 0.042058467864990234, 0.043956756591796875, 0.045855045318603516, 0.047753334045410156, 0.0496516227722168, 0.05154991149902344, 0.05344820022583008, 0.05534648895263672, 0.05724477767944336, 0.05914306640625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 2.0, 1.0, 4.0, 4.0, 9.0, 10.0, 22.0, 22.0, 14.0, 27.0, 43.0, 65.0, 87.0, 124.0, 128.0, 106.0, 103.0, 56.0, 58.0, 25.0, 28.0, 16.0, 13.0, 9.0, 4.0, 9.0, 6.0, 4.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.76837158203125e-05, -4.5666471123695374e-05, -4.364922642707825e-05, -4.163198173046112e-05, -3.9614737033843994e-05, -3.759749233722687e-05, -3.558024764060974e-05, -3.3563002943992615e-05, -3.154575824737549e-05, -2.9528513550758362e-05, -2.7511268854141235e-05, -2.549402415752411e-05, -2.3476779460906982e-05, -2.1459534764289856e-05, -1.944229006767273e-05, -1.7425045371055603e-05, -1.5407800674438477e-05, -1.339055597782135e-05, -1.1373311281204224e-05, -9.356066584587097e-06, -7.338821887969971e-06, -5.321577191352844e-06, -3.3043324947357178e-06, -1.2870877981185913e-06, 7.301568984985352e-07, 2.7474015951156616e-06, 4.764646291732788e-06, 6.7818909883499146e-06, 8.799135684967041e-06, 1.0816380381584167e-05, 1.2833625078201294e-05, 1.485086977481842e-05, 1.6868114471435547e-05, 1.8885359168052673e-05, 2.09026038646698e-05, 2.2919848561286926e-05, 2.4937093257904053e-05, 2.695433795452118e-05, 2.8971582651138306e-05, 3.098882734775543e-05, 3.300607204437256e-05, 3.5023316740989685e-05, 3.704056143760681e-05, 3.905780613422394e-05, 4.1075050830841064e-05, 4.309229552745819e-05, 4.510954022407532e-05, 4.7126784920692444e-05, 4.914402961730957e-05, 5.11612743139267e-05, 5.317851901054382e-05, 5.519576370716095e-05, 5.7213008403778076e-05, 5.92302531003952e-05, 6.124749779701233e-05, 6.326474249362946e-05, 6.528198719024658e-05, 6.729923188686371e-05, 6.931647658348083e-05, 7.133372128009796e-05, 7.335096597671509e-05, 7.536821067333221e-05, 7.738545536994934e-05, 7.940270006656647e-05, 8.14199447631836e-05]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 0.0, 3.0, 5.0, 2.0, 7.0, 4.0, 8.0, 18.0, 15.0, 24.0, 30.0, 33.0, 62.0, 62.0, 156.0, 288.0, 586.0, 1592.0, 4758.0, 17727.0, 106463.0, 641518.0, 232467.0, 31445.0, 7188.0, 2350.0, 918.0, 338.0, 174.0, 99.0, 63.0, 47.0, 32.0, 20.0, 11.0, 13.0, 6.0, 5.0, 3.0, 2.0, 3.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10296630859375, -0.09949684143066406, -0.09602737426757812, -0.09255790710449219, -0.08908843994140625, -0.08561897277832031, -0.08214950561523438, -0.07868003845214844, -0.0752105712890625, -0.07174110412597656, -0.06827163696289062, -0.06480216979980469, -0.06133270263671875, -0.05786323547363281, -0.054393768310546875, -0.05092430114746094, -0.047454833984375, -0.04398536682128906, -0.040515899658203125, -0.03704643249511719, -0.03357696533203125, -0.030107498168945312, -0.026638031005859375, -0.023168563842773438, -0.0196990966796875, -0.016229629516601562, -0.012760162353515625, -0.009290695190429688, -0.00582122802734375, -0.0023517608642578125, 0.001117706298828125, 0.0045871734619140625, 0.008056640625, 0.011526107788085938, 0.014995574951171875, 0.018465042114257812, 0.02193450927734375, 0.025403976440429688, 0.028873443603515625, 0.03234291076660156, 0.0358123779296875, 0.03928184509277344, 0.042751312255859375, 0.04622077941894531, 0.04969024658203125, 0.05315971374511719, 0.056629180908203125, 0.06009864807128906, 0.063568115234375, 0.06703758239746094, 0.07050704956054688, 0.07397651672363281, 0.07744598388671875, 0.08091545104980469, 0.08438491821289062, 0.08785438537597656, 0.0913238525390625, 0.09479331970214844, 0.09826278686523438, 0.10173225402832031, 0.10520172119140625, 0.10867118835449219, 0.11214065551757812, 0.11561012268066406, 0.11907958984375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 4.0, 6.0, 8.0, 7.0, 5.0, 7.0, 11.0, 18.0, 15.0, 19.0, 21.0, 26.0, 30.0, 36.0, 51.0, 53.0, 56.0, 66.0, 68.0, 59.0, 71.0, 45.0, 57.0, 43.0, 45.0, 42.0, 28.0, 27.0, 17.0, 8.0, 5.0, 20.0, 7.0, 1.0, 7.0, 1.0, 3.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0179901123046875, -0.0174102783203125, -0.0168304443359375, -0.0162506103515625, -0.0156707763671875, -0.0150909423828125, -0.0145111083984375, -0.0139312744140625, -0.0133514404296875, -0.0127716064453125, -0.0121917724609375, -0.0116119384765625, -0.0110321044921875, -0.0104522705078125, -0.0098724365234375, -0.0092926025390625, -0.0087127685546875, -0.0081329345703125, -0.0075531005859375, -0.0069732666015625, -0.0063934326171875, -0.0058135986328125, -0.0052337646484375, -0.0046539306640625, -0.0040740966796875, -0.0034942626953125, -0.0029144287109375, -0.0023345947265625, -0.0017547607421875, -0.0011749267578125, -0.0005950927734375, -1.52587890625e-05, 0.0005645751953125, 0.0011444091796875, 0.0017242431640625, 0.0023040771484375, 0.0028839111328125, 0.0034637451171875, 0.0040435791015625, 0.0046234130859375, 0.0052032470703125, 0.0057830810546875, 0.0063629150390625, 0.0069427490234375, 0.0075225830078125, 0.0081024169921875, 0.0086822509765625, 0.0092620849609375, 0.0098419189453125, 0.0104217529296875, 0.0110015869140625, 0.0115814208984375, 0.0121612548828125, 0.0127410888671875, 0.0133209228515625, 0.0139007568359375, 0.0144805908203125, 0.0150604248046875, 0.0156402587890625, 0.0162200927734375, 0.0167999267578125, 0.0173797607421875, 0.0179595947265625, 0.0185394287109375, 0.0191192626953125]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 8.0, 16.0, 23.0, 64.0, 117.0, 210.0, 237.0, 164.0, 92.0, 37.0, 24.0, 9.0, 4.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1237847805023193, -2.073493719100952, -2.023202896118164, -1.9729118347167969, -1.9226207733154297, -1.872329831123352, -1.8220388889312744, -1.7717478275299072, -1.7214568853378296, -1.671165943145752, -1.6208748817443848, -1.5705839395523071, -1.5202929973602295, -1.4700019359588623, -1.4197109937667847, -1.369420051574707, -1.3191289901733398, -1.2688380479812622, -1.218546986579895, -1.1682560443878174, -1.1179649829864502, -1.0676740407943726, -1.017383098602295, -0.9670920968055725, -0.9168010950088501, -0.8665100932121277, -0.8162190914154053, -0.7659281492233276, -0.7156371474266052, -0.6653461456298828, -0.6150552034378052, -0.5647642016410828, -0.5144731998443604, -0.46418219804763794, -0.4138912260532379, -0.3636002540588379, -0.3133092522621155, -0.26301825046539307, -0.21272727847099304, -0.16243630647659302, -0.1121453046798706, -0.06185431778430939, -0.011563330888748169, 0.03872765600681305, 0.08901864290237427, 0.13930964469909668, 0.1896006166934967, 0.23989158868789673, 0.29018259048461914, 0.34047359228134155, 0.3907645642757416, 0.4410555362701416, 0.491346538066864, 0.5416375398635864, 0.5919284820556641, 0.6422194838523865, 0.6925104856491089, 0.7428014874458313, 0.7930924892425537, 0.8433834314346313, 0.8936744332313538, 0.9439654350280762, 0.9942563772201538, 1.0445473194122314, 1.0948383808135986]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 3.0, 1.0, 6.0, 5.0, 10.0, 14.0, 13.0, 13.0, 21.0, 32.0, 25.0, 25.0, 43.0, 35.0, 39.0, 36.0, 36.0, 37.0, 44.0, 45.0, 39.0, 41.0, 40.0, 43.0, 40.0, 40.0, 40.0, 35.0, 34.0, 24.0, 21.0, 24.0, 17.0, 15.0, 11.0, 9.0, 11.0, 9.0, 7.0, 3.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0], "bins": [-0.4222990870475769, -0.41003358364105225, -0.3977680802345276, -0.38550257682800293, -0.37323707342147827, -0.3609715700149536, -0.34870606660842896, -0.3364405632019043, -0.32417505979537964, -0.311909556388855, -0.2996440529823303, -0.28737854957580566, -0.275113046169281, -0.26284754276275635, -0.2505820393562317, -0.23831652104854584, -0.22605100274085999, -0.21378549933433533, -0.20151999592781067, -0.189254492521286, -0.17698898911476135, -0.1647234857082367, -0.15245796740055084, -0.14019246399402618, -0.12792696058750153, -0.11566145718097687, -0.10339595377445221, -0.09113044291734695, -0.0788649395108223, -0.06659943610429764, -0.05433392524719238, -0.042068421840667725, -0.02980288863182068, -0.01753738336265087, -0.005271878093481064, 0.006993629038333893, 0.01925913244485855, 0.03152463585138321, 0.043790146708488464, 0.05605565011501312, 0.06832115352153778, 0.08058665692806244, 0.0928521603345871, 0.10511767119169235, 0.11738317459821701, 0.12964868545532227, 0.14191418886184692, 0.15417969226837158, 0.16644519567489624, 0.1787106990814209, 0.19097620248794556, 0.20324170589447021, 0.21550720930099487, 0.22777271270751953, 0.24003823101520538, 0.25230371952056885, 0.2645692229270935, 0.27683472633361816, 0.2891002297401428, 0.3013657331466675, 0.31363123655319214, 0.3258967399597168, 0.33816224336624146, 0.3504277467727661, 0.36269327998161316]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 0.0, 2.0, 4.0, 7.0, 15.0, 20.0, 26.0, 55.0, 78.0, 114.0, 155.0, 246.0, 389.0, 573.0, 1034.0, 1737.0, 3066.0, 5587.0, 10471.0, 22530.0, 57423.0, 212048.0, 499490.0, 149416.0, 45008.0, 18690.0, 9018.0, 4624.0, 2624.0, 1553.0, 992.0, 551.0, 370.0, 211.0, 143.0, 99.0, 59.0, 41.0, 36.0, 19.0, 15.0, 3.0, 6.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1705322265625, -0.16472816467285156, -0.15892410278320312, -0.1531200408935547, -0.14731597900390625, -0.1415119171142578, -0.13570785522460938, -0.12990379333496094, -0.1240997314453125, -0.11829566955566406, -0.11249160766601562, -0.10668754577636719, -0.10088348388671875, -0.09507942199707031, -0.08927536010742188, -0.08347129821777344, -0.077667236328125, -0.07186317443847656, -0.06605911254882812, -0.06025505065917969, -0.05445098876953125, -0.04864692687988281, -0.042842864990234375, -0.03703880310058594, -0.0312347412109375, -0.025430679321289062, -0.019626617431640625, -0.013822555541992188, -0.00801849365234375, -0.0022144317626953125, 0.003589630126953125, 0.009393692016601562, 0.01519775390625, 0.021001815795898438, 0.026805877685546875, 0.03260993957519531, 0.03841400146484375, 0.04421806335449219, 0.050022125244140625, 0.05582618713378906, 0.0616302490234375, 0.06743431091308594, 0.07323837280273438, 0.07904243469238281, 0.08484649658203125, 0.09065055847167969, 0.09645462036132812, 0.10225868225097656, 0.108062744140625, 0.11386680603027344, 0.11967086791992188, 0.1254749298095703, 0.13127899169921875, 0.1370830535888672, 0.14288711547851562, 0.14869117736816406, 0.1544952392578125, 0.16029930114746094, 0.16610336303710938, 0.1719074249267578, 0.17771148681640625, 0.1835155487060547, 0.18931961059570312, 0.19512367248535156, 0.200927734375]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 8.0, 10.0, 18.0, 15.0, 9.0, 27.0, 25.0, 19.0, 23.0, 33.0, 33.0, 37.0, 33.0, 53.0, 38.0, 44.0, 32.0, 49.0, 47.0, 55.0, 28.0, 51.0, 46.0, 27.0, 40.0, 19.0, 34.0, 18.0, 23.0, 20.0, 14.0, 14.0, 13.0, 6.0, 12.0, 1.0, 5.0, 9.0, 0.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.6416015625, -0.6213302612304688, -0.6010589599609375, -0.5807876586914062, -0.560516357421875, -0.5402450561523438, -0.5199737548828125, -0.49970245361328125, -0.47943115234375, -0.45915985107421875, -0.4388885498046875, -0.41861724853515625, -0.398345947265625, -0.37807464599609375, -0.3578033447265625, -0.33753204345703125, -0.3172607421875, -0.29698944091796875, -0.2767181396484375, -0.25644683837890625, -0.236175537109375, -0.21590423583984375, -0.1956329345703125, -0.17536163330078125, -0.15509033203125, -0.13481903076171875, -0.1145477294921875, -0.09427642822265625, -0.074005126953125, -0.05373382568359375, -0.0334625244140625, -0.01319122314453125, 0.007080078125, 0.02735137939453125, 0.0476226806640625, 0.06789398193359375, 0.088165283203125, 0.10843658447265625, 0.1287078857421875, 0.14897918701171875, 0.16925048828125, 0.18952178955078125, 0.2097930908203125, 0.23006439208984375, 0.250335693359375, 0.27060699462890625, 0.2908782958984375, 0.31114959716796875, 0.3314208984375, 0.35169219970703125, 0.3719635009765625, 0.39223480224609375, 0.412506103515625, 0.43277740478515625, 0.4530487060546875, 0.47332000732421875, 0.49359130859375, 0.5138626098632812, 0.5341339111328125, 0.5544052124023438, 0.574676513671875, 0.5949478149414062, 0.6152191162109375, 0.6354904174804688, 0.65576171875]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 5.0, 5.0, 5.0, 7.0, 7.0, 11.0, 20.0, 20.0, 31.0, 45.0, 35.0, 64.0, 63.0, 105.0, 140.0, 230.0, 399.0, 907.0, 2536.0, 8960.0, 50186.0, 777342.0, 182263.0, 17903.0, 4347.0, 1399.0, 565.0, 298.0, 182.0, 116.0, 78.0, 53.0, 47.0, 47.0, 28.0, 34.0, 18.0, 17.0, 13.0, 5.0, 5.0, 6.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.51806640625, -0.5035667419433594, -0.48906707763671875, -0.4745674133300781, -0.4600677490234375, -0.4455680847167969, -0.43106842041015625, -0.4165687561035156, -0.402069091796875, -0.3875694274902344, -0.37306976318359375, -0.3585700988769531, -0.3440704345703125, -0.3295707702636719, -0.31507110595703125, -0.3005714416503906, -0.28607177734375, -0.2715721130371094, -0.25707244873046875, -0.24257278442382812, -0.2280731201171875, -0.21357345581054688, -0.19907379150390625, -0.18457412719726562, -0.170074462890625, -0.15557479858398438, -0.14107513427734375, -0.12657546997070312, -0.1120758056640625, -0.09757614135742188, -0.08307647705078125, -0.06857681274414062, -0.0540771484375, -0.039577484130859375, -0.02507781982421875, -0.010578155517578125, 0.0039215087890625, 0.018421173095703125, 0.03292083740234375, 0.047420501708984375, 0.061920166015625, 0.07641983032226562, 0.09091949462890625, 0.10541915893554688, 0.1199188232421875, 0.13441848754882812, 0.14891815185546875, 0.16341781616210938, 0.17791748046875, 0.19241714477539062, 0.20691680908203125, 0.22141647338867188, 0.2359161376953125, 0.2504158020019531, 0.26491546630859375, 0.2794151306152344, 0.293914794921875, 0.3084144592285156, 0.32291412353515625, 0.3374137878417969, 0.3519134521484375, 0.3664131164550781, 0.38091278076171875, 0.3954124450683594, 0.409912109375]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 1.0, 7.0, 3.0, 7.0, 8.0, 12.0, 12.0, 16.0, 28.0, 24.0, 14.0, 23.0, 31.0, 29.0, 35.0, 37.0, 33.0, 51.0, 57.0, 47.0, 51.0, 57.0, 47.0, 36.0, 50.0, 50.0, 36.0, 29.0, 27.0, 23.0, 30.0, 26.0, 10.0, 20.0, 7.0, 8.0, 7.0, 6.0, 0.0, 3.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.79541015625, -0.7721786499023438, -0.7489471435546875, -0.7257156372070312, -0.702484130859375, -0.6792526245117188, -0.6560211181640625, -0.6327896118164062, -0.60955810546875, -0.5863265991210938, -0.5630950927734375, -0.5398635864257812, -0.516632080078125, -0.49340057373046875, -0.4701690673828125, -0.44693756103515625, -0.4237060546875, -0.40047454833984375, -0.3772430419921875, -0.35401153564453125, -0.330780029296875, -0.30754852294921875, -0.2843170166015625, -0.26108551025390625, -0.23785400390625, -0.21462249755859375, -0.1913909912109375, -0.16815948486328125, -0.144927978515625, -0.12169647216796875, -0.0984649658203125, -0.07523345947265625, -0.052001953125, -0.02877044677734375, -0.0055389404296875, 0.01769256591796875, 0.040924072265625, 0.06415557861328125, 0.0873870849609375, 0.11061859130859375, 0.13385009765625, 0.15708160400390625, 0.1803131103515625, 0.20354461669921875, 0.226776123046875, 0.25000762939453125, 0.2732391357421875, 0.29647064208984375, 0.3197021484375, 0.34293365478515625, 0.3661651611328125, 0.38939666748046875, 0.412628173828125, 0.43585968017578125, 0.4590911865234375, 0.48232269287109375, 0.50555419921875, 0.5287857055664062, 0.5520172119140625, 0.5752487182617188, 0.598480224609375, 0.6217117309570312, 0.6449432373046875, 0.6681747436523438, 0.69140625]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 6.0, 6.0, 2.0, 9.0, 12.0, 24.0, 27.0, 50.0, 88.0, 114.0, 242.0, 440.0, 1079.0, 2847.0, 10486.0, 65506.0, 848404.0, 99958.0, 13405.0, 3406.0, 1276.0, 535.0, 269.0, 148.0, 73.0, 55.0, 26.0, 18.0, 10.0, 10.0, 5.0, 5.0, 5.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.1649169921875, -0.1607503890991211, -0.1565837860107422, -0.15241718292236328, -0.14825057983398438, -0.14408397674560547, -0.13991737365722656, -0.13575077056884766, -0.13158416748046875, -0.12741756439208984, -0.12325096130371094, -0.11908435821533203, -0.11491775512695312, -0.11075115203857422, -0.10658454895019531, -0.1024179458618164, -0.0982513427734375, -0.0940847396850586, -0.08991813659667969, -0.08575153350830078, -0.08158493041992188, -0.07741832733154297, -0.07325172424316406, -0.06908512115478516, -0.06491851806640625, -0.060751914978027344, -0.05658531188964844, -0.05241870880126953, -0.048252105712890625, -0.04408550262451172, -0.03991889953613281, -0.035752296447753906, -0.031585693359375, -0.027419090270996094, -0.023252487182617188, -0.01908588409423828, -0.014919281005859375, -0.010752677917480469, -0.0065860748291015625, -0.0024194717407226562, 0.00174713134765625, 0.005913734436035156, 0.010080337524414062, 0.014246940612792969, 0.018413543701171875, 0.02258014678955078, 0.026746749877929688, 0.030913352966308594, 0.0350799560546875, 0.039246559143066406, 0.04341316223144531, 0.04757976531982422, 0.051746368408203125, 0.05591297149658203, 0.06007957458496094, 0.06424617767333984, 0.06841278076171875, 0.07257938385009766, 0.07674598693847656, 0.08091259002685547, 0.08507919311523438, 0.08924579620361328, 0.09341239929199219, 0.0975790023803711, 0.10174560546875]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 2.0, 10.0, 10.0, 12.0, 16.0, 19.0, 28.0, 44.0, 75.0, 152.0, 149.0, 176.0, 83.0, 64.0, 38.0, 23.0, 27.0, 23.0, 7.0, 10.0, 3.0, 3.0, 3.0, 4.0, 3.0, 0.0, 3.0, 0.0, 3.0, 5.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.8656253814697266e-05, -1.815054565668106e-05, -1.7644837498664856e-05, -1.713912934064865e-05, -1.6633421182632446e-05, -1.612771302461624e-05, -1.5622004866600037e-05, -1.5116296708583832e-05, -1.4610588550567627e-05, -1.4104880392551422e-05, -1.3599172234535217e-05, -1.3093464076519012e-05, -1.2587755918502808e-05, -1.2082047760486603e-05, -1.1576339602470398e-05, -1.1070631444454193e-05, -1.0564923286437988e-05, -1.0059215128421783e-05, -9.553506970405579e-06, -9.047798812389374e-06, -8.542090654373169e-06, -8.036382496356964e-06, -7.530674338340759e-06, -7.0249661803245544e-06, -6.51925802230835e-06, -6.013549864292145e-06, -5.50784170627594e-06, -5.002133548259735e-06, -4.49642539024353e-06, -3.9907172322273254e-06, -3.4850090742111206e-06, -2.9793009161949158e-06, -2.473592758178711e-06, -1.967884600162506e-06, -1.4621764421463013e-06, -9.564682841300964e-07, -4.507601261138916e-07, 5.494803190231323e-08, 5.606561899185181e-07, 1.066364347934723e-06, 1.5720725059509277e-06, 2.0777806639671326e-06, 2.5834888219833374e-06, 3.0891969799995422e-06, 3.594905138015747e-06, 4.100613296031952e-06, 4.606321454048157e-06, 5.1120296120643616e-06, 5.617737770080566e-06, 6.123445928096771e-06, 6.629154086112976e-06, 7.134862244129181e-06, 7.640570402145386e-06, 8.14627856016159e-06, 8.651986718177795e-06, 9.157694876194e-06, 9.663403034210205e-06, 1.016911119222641e-05, 1.0674819350242615e-05, 1.118052750825882e-05, 1.1686235666275024e-05, 1.219194382429123e-05, 1.2697651982307434e-05, 1.3203360140323639e-05, 1.3709068298339844e-05]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 2.0, 5.0, 4.0, 3.0, 2.0, 13.0, 8.0, 19.0, 37.0, 35.0, 71.0, 133.0, 259.0, 518.0, 1150.0, 3111.0, 9861.0, 45615.0, 672559.0, 275747.0, 28397.0, 6984.0, 2262.0, 848.0, 396.0, 192.0, 120.0, 70.0, 40.0, 23.0, 21.0, 8.0, 11.0, 7.0, 5.0, 8.0, 3.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.101806640625, -0.09839725494384766, -0.09498786926269531, -0.09157848358154297, -0.08816909790039062, -0.08475971221923828, -0.08135032653808594, -0.0779409408569336, -0.07453155517578125, -0.0711221694946289, -0.06771278381347656, -0.06430339813232422, -0.060894012451171875, -0.05748462677001953, -0.05407524108886719, -0.050665855407714844, -0.0472564697265625, -0.043847084045410156, -0.04043769836425781, -0.03702831268310547, -0.033618927001953125, -0.03020954132080078, -0.026800155639648438, -0.023390769958496094, -0.01998138427734375, -0.016571998596191406, -0.013162612915039062, -0.009753227233886719, -0.006343841552734375, -0.0029344558715820312, 0.0004749298095703125, 0.0038843154907226562, 0.007293701171875, 0.010703086853027344, 0.014112472534179688, 0.01752185821533203, 0.020931243896484375, 0.02434062957763672, 0.027750015258789062, 0.031159400939941406, 0.03456878662109375, 0.037978172302246094, 0.04138755798339844, 0.04479694366455078, 0.048206329345703125, 0.05161571502685547, 0.05502510070800781, 0.058434486389160156, 0.0618438720703125, 0.06525325775146484, 0.06866264343261719, 0.07207202911376953, 0.07548141479492188, 0.07889080047607422, 0.08230018615722656, 0.0857095718383789, 0.08911895751953125, 0.0925283432006836, 0.09593772888183594, 0.09934711456298828, 0.10275650024414062, 0.10616588592529297, 0.10957527160644531, 0.11298465728759766, 0.11639404296875]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 8.0, 5.0, 7.0, 7.0, 9.0, 20.0, 24.0, 39.0, 44.0, 70.0, 94.0, 139.0, 147.0, 114.0, 70.0, 47.0, 38.0, 27.0, 18.0, 16.0, 11.0, 13.0, 9.0, 3.0, 3.0, 4.0, 4.0, 2.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.037109375, -0.03587675094604492, -0.034644126892089844, -0.033411502838134766, -0.03217887878417969, -0.03094625473022461, -0.02971363067626953, -0.028481006622314453, -0.027248382568359375, -0.026015758514404297, -0.02478313446044922, -0.02355051040649414, -0.022317886352539062, -0.021085262298583984, -0.019852638244628906, -0.018620014190673828, -0.01738739013671875, -0.016154766082763672, -0.014922142028808594, -0.013689517974853516, -0.012456893920898438, -0.01122426986694336, -0.009991645812988281, -0.008759021759033203, -0.007526397705078125, -0.006293773651123047, -0.005061149597167969, -0.0038285255432128906, -0.0025959014892578125, -0.0013632774353027344, -0.00013065338134765625, 0.0011019706726074219, 0.0023345947265625, 0.003567218780517578, 0.004799842834472656, 0.006032466888427734, 0.0072650909423828125, 0.00849771499633789, 0.009730339050292969, 0.010962963104248047, 0.012195587158203125, 0.013428211212158203, 0.014660835266113281, 0.01589345932006836, 0.017126083374023438, 0.018358707427978516, 0.019591331481933594, 0.020823955535888672, 0.02205657958984375, 0.023289203643798828, 0.024521827697753906, 0.025754451751708984, 0.026987075805664062, 0.02821969985961914, 0.02945232391357422, 0.030684947967529297, 0.031917572021484375, 0.03315019607543945, 0.03438282012939453, 0.03561544418334961, 0.03684806823730469, 0.038080692291259766, 0.039313316345214844, 0.04054594039916992, 0.041778564453125]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 10.0, 23.0, 50.0, 110.0, 205.0, 255.0, 197.0, 95.0, 37.0, 19.0, 6.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.405527591705322, -4.316229820251465, -4.226932048797607, -4.13763427734375, -4.048336505889893, -3.959038734436035, -3.8697409629821777, -3.780442953109741, -3.691145181655884, -3.6018474102020264, -3.512549638748169, -3.4232518672943115, -3.333954095840454, -3.2446560859680176, -3.15535831451416, -3.0660605430603027, -2.9767627716064453, -2.887465000152588, -2.7981672286987305, -2.708869457244873, -2.6195716857910156, -2.530273914337158, -2.440976142883301, -2.3516781330108643, -2.262380599975586, -2.1730828285217285, -2.083785057067871, -1.9944872856140137, -1.9051893949508667, -1.8158916234970093, -1.7265938520431519, -1.6372959613800049, -1.547998070716858, -1.4587002992630005, -1.369402527809143, -1.280104637145996, -1.1908068656921387, -1.1015090942382812, -1.0122113227844238, -0.9229134917259216, -0.8336157202720642, -0.7443179488182068, -0.6550201177597046, -0.5657223463058472, -0.47642454504966736, -0.38712674379348755, -0.2978289723396301, -0.20853114128112793, -0.11923336982727051, -0.029935576021671295, 0.05936221778392792, 0.14866000413894653, 0.23795780539512634, 0.32725560665130615, 0.4165533781051636, 0.5058512091636658, 0.5951489806175232, 0.6844467520713806, 0.7737445831298828, 0.8630423545837402, 0.9523401260375977, 1.041637897491455, 1.1309356689453125, 1.2202335596084595, 1.309531331062317]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 6.0, 6.0, 2.0, 6.0, 12.0, 8.0, 7.0, 11.0, 10.0, 23.0, 15.0, 15.0, 23.0, 26.0, 38.0, 32.0, 45.0, 34.0, 37.0, 41.0, 34.0, 48.0, 40.0, 47.0, 47.0, 38.0, 29.0, 31.0, 35.0, 23.0, 21.0, 33.0, 28.0, 24.0, 20.0, 22.0, 13.0, 11.0, 12.0, 10.0, 8.0, 5.0, 7.0, 4.0, 10.0, 0.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-1.0377143621444702, -1.0079102516174316, -0.9781060218811035, -0.9483018517494202, -0.9184976816177368, -0.8886935710906982, -0.8588893413543701, -0.8290852308273315, -0.7992810606956482, -0.7694768905639648, -0.7396727204322815, -0.7098685503005981, -0.6800643801689148, -0.6502602100372314, -0.6204560995101929, -0.5906519293785095, -0.5608477592468262, -0.5310435891151428, -0.5012394189834595, -0.4714352488517761, -0.44163110852241516, -0.4118269383907318, -0.38202276825904846, -0.3522186279296875, -0.3224143981933594, -0.292610228061676, -0.2628060579299927, -0.23300190269947052, -0.20319774746894836, -0.17339357733726501, -0.14358940720558167, -0.11378525197505951, -0.08398109674453735, -0.0541769340634346, -0.02437276765704155, 0.0054313987493515015, 0.035235561430454254, 0.065039724111557, 0.09484389424324036, 0.12464804947376251, 0.15445221960544586, 0.1842563897371292, 0.21406054496765137, 0.24386471509933472, 0.27366888523101807, 0.3034730553627014, 0.33327722549438477, 0.3630813658237457, 0.3928855359554291, 0.4226897060871124, 0.4524938762187958, 0.48229801654815674, 0.5121021866798401, 0.5419063568115234, 0.5717105269432068, 0.6015146970748901, 0.6313188672065735, 0.6611230373382568, 0.6909272074699402, 0.7207313776016235, 0.7505355477333069, 0.7803397178649902, 0.8101438283920288, 0.8399479985237122, 0.8697521686553955]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 7.0, 4.0, 7.0, 6.0, 11.0, 12.0, 20.0, 28.0, 38.0, 52.0, 101.0, 191.0, 368.0, 665.0, 1303.0, 2569.0, 5659.0, 14074.0, 48434.0, 298387.0, 2137336.0, 1473472.0, 161060.0, 30380.0, 10894.0, 4602.0, 2203.0, 1074.0, 563.0, 309.0, 161.0, 112.0, 62.0, 42.0, 22.0, 13.0, 17.0, 16.0, 4.0, 3.0, 3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.66943359375, -0.6462478637695312, -0.6230621337890625, -0.5998764038085938, -0.576690673828125, -0.5535049438476562, -0.5303192138671875, -0.5071334838867188, -0.48394775390625, -0.46076202392578125, -0.4375762939453125, -0.41439056396484375, -0.391204833984375, -0.36801910400390625, -0.3448333740234375, -0.32164764404296875, -0.2984619140625, -0.27527618408203125, -0.2520904541015625, -0.22890472412109375, -0.205718994140625, -0.18253326416015625, -0.1593475341796875, -0.13616180419921875, -0.11297607421875, -0.08979034423828125, -0.0666046142578125, -0.04341888427734375, -0.020233154296875, 0.00295257568359375, 0.0261383056640625, 0.04932403564453125, 0.072509765625, 0.09569549560546875, 0.1188812255859375, 0.14206695556640625, 0.165252685546875, 0.18843841552734375, 0.2116241455078125, 0.23480987548828125, 0.25799560546875, 0.28118133544921875, 0.3043670654296875, 0.32755279541015625, 0.350738525390625, 0.37392425537109375, 0.3971099853515625, 0.42029571533203125, 0.4434814453125, 0.46666717529296875, 0.4898529052734375, 0.5130386352539062, 0.536224365234375, 0.5594100952148438, 0.5825958251953125, 0.6057815551757812, 0.62896728515625, 0.6521530151367188, 0.6753387451171875, 0.6985244750976562, 0.721710205078125, 0.7448959350585938, 0.7680816650390625, 0.7912673950195312, 0.814453125]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 9.0, 8.0, 8.0, 6.0, 12.0, 17.0, 36.0, 21.0, 36.0, 31.0, 43.0, 45.0, 47.0, 51.0, 50.0, 48.0, 64.0, 46.0, 59.0, 51.0, 44.0, 53.0, 45.0, 28.0, 23.0, 24.0, 21.0, 18.0, 12.0, 12.0, 11.0, 4.0, 5.0, 2.0, 1.0, 7.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.482177734375, -0.4658851623535156, -0.44959259033203125, -0.4333000183105469, -0.4170074462890625, -0.4007148742675781, -0.38442230224609375, -0.3681297302246094, -0.351837158203125, -0.3355445861816406, -0.31925201416015625, -0.3029594421386719, -0.2866668701171875, -0.2703742980957031, -0.25408172607421875, -0.23778915405273438, -0.22149658203125, -0.20520401000976562, -0.18891143798828125, -0.17261886596679688, -0.1563262939453125, -0.14003372192382812, -0.12374114990234375, -0.10744857788085938, -0.091156005859375, -0.07486343383789062, -0.05857086181640625, -0.042278289794921875, -0.0259857177734375, -0.009693145751953125, 0.00659942626953125, 0.022891998291015625, 0.0391845703125, 0.055477142333984375, 0.07176971435546875, 0.08806228637695312, 0.1043548583984375, 0.12064743041992188, 0.13694000244140625, 0.15323257446289062, 0.169525146484375, 0.18581771850585938, 0.20211029052734375, 0.21840286254882812, 0.2346954345703125, 0.2509880065917969, 0.26728057861328125, 0.2835731506347656, 0.29986572265625, 0.3161582946777344, 0.33245086669921875, 0.3487434387207031, 0.3650360107421875, 0.3813285827636719, 0.39762115478515625, 0.4139137268066406, 0.430206298828125, 0.4464988708496094, 0.46279144287109375, 0.4790840148925781, 0.4953765869140625, 0.5116691589355469, 0.5279617309570312, 0.5442543029785156, 0.560546875]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 5.0, 4.0, 2.0, 11.0, 10.0, 20.0, 57.0, 127.0, 377.0, 2546.0, 721511.0, 3465932.0, 2991.0, 436.0, 130.0, 60.0, 23.0, 17.0, 10.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-7.04296875, -6.871368408203125, -6.69976806640625, -6.528167724609375, -6.3565673828125, -6.184967041015625, -6.01336669921875, -5.841766357421875, -5.670166015625, -5.498565673828125, -5.32696533203125, -5.155364990234375, -4.9837646484375, -4.812164306640625, -4.64056396484375, -4.468963623046875, -4.29736328125, -4.125762939453125, -3.95416259765625, -3.782562255859375, -3.6109619140625, -3.439361572265625, -3.26776123046875, -3.096160888671875, -2.924560546875, -2.752960205078125, -2.58135986328125, -2.409759521484375, -2.2381591796875, -2.066558837890625, -1.89495849609375, -1.723358154296875, -1.5517578125, -1.380157470703125, -1.20855712890625, -1.036956787109375, -0.8653564453125, -0.693756103515625, -0.52215576171875, -0.350555419921875, -0.178955078125, -0.007354736328125, 0.16424560546875, 0.335845947265625, 0.5074462890625, 0.679046630859375, 0.85064697265625, 1.022247314453125, 1.19384765625, 1.365447998046875, 1.53704833984375, 1.708648681640625, 1.8802490234375, 2.051849365234375, 2.22344970703125, 2.395050048828125, 2.566650390625, 2.738250732421875, 2.90985107421875, 3.081451416015625, 3.2530517578125, 3.424652099609375, 3.59625244140625, 3.767852783203125, 3.939453125]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 2.0, 1.0, 1.0, 4.0, 8.0, 7.0, 8.0, 11.0, 21.0, 39.0, 69.0, 104.0, 168.0, 361.0, 755.0, 1198.0, 629.0, 297.0, 147.0, 83.0, 63.0, 29.0, 23.0, 12.0, 14.0, 6.0, 3.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.415283203125, -0.4035491943359375, -0.391815185546875, -0.3800811767578125, -0.36834716796875, -0.3566131591796875, -0.344879150390625, -0.3331451416015625, -0.3214111328125, -0.3096771240234375, -0.297943115234375, -0.2862091064453125, -0.27447509765625, -0.2627410888671875, -0.251007080078125, -0.2392730712890625, -0.2275390625, -0.2158050537109375, -0.204071044921875, -0.1923370361328125, -0.18060302734375, -0.1688690185546875, -0.157135009765625, -0.1454010009765625, -0.1336669921875, -0.1219329833984375, -0.110198974609375, -0.0984649658203125, -0.08673095703125, -0.0749969482421875, -0.063262939453125, -0.0515289306640625, -0.039794921875, -0.0280609130859375, -0.016326904296875, -0.0045928955078125, 0.00714111328125, 0.0188751220703125, 0.030609130859375, 0.0423431396484375, 0.0540771484375, 0.0658111572265625, 0.077545166015625, 0.0892791748046875, 0.10101318359375, 0.1127471923828125, 0.124481201171875, 0.1362152099609375, 0.14794921875, 0.1596832275390625, 0.171417236328125, 0.1831512451171875, 0.19488525390625, 0.2066192626953125, 0.218353271484375, 0.2300872802734375, 0.2418212890625, 0.2535552978515625, 0.265289306640625, 0.2770233154296875, 0.28875732421875, 0.3004913330078125, 0.312225341796875, 0.3239593505859375, 0.335693359375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 3.0, 6.0, 13.0, 15.0, 23.0, 34.0, 37.0, 67.0, 96.0, 103.0, 117.0, 106.0, 96.0, 81.0, 77.0, 39.0, 31.0, 21.0, 19.0, 9.0, 4.0, 7.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.5571964979171753, -1.5232477188110352, -1.4892988204956055, -1.4553499221801758, -1.4214011430740356, -1.3874523639678955, -1.3535034656524658, -1.3195545673370361, -1.285605788230896, -1.2516570091247559, -1.2177081108093262, -1.1837592124938965, -1.1498104333877563, -1.1158616542816162, -1.0819127559661865, -1.0479638576507568, -1.0140150785446167, -0.9800662398338318, -0.9461174011230469, -0.912168562412262, -0.878219723701477, -0.8442708849906921, -0.8103220462799072, -0.7763732075691223, -0.7424243688583374, -0.7084755301475525, -0.6745266914367676, -0.6405778527259827, -0.6066290140151978, -0.5726801753044128, -0.5387313365936279, -0.504782497882843, -0.47083377838134766, -0.43688493967056274, -0.40293610095977783, -0.3689872622489929, -0.335038423538208, -0.3010895848274231, -0.2671407461166382, -0.23319190740585327, -0.19924306869506836, -0.16529422998428345, -0.13134539127349854, -0.09739655256271362, -0.06344771385192871, -0.0294988751411438, 0.004449963569641113, 0.038398802280426025, 0.07234764099121094, 0.10629647970199585, 0.14024531841278076, 0.17419415712356567, 0.20814299583435059, 0.2420918345451355, 0.2760406732559204, 0.3099895119667053, 0.34393835067749023, 0.37788718938827515, 0.41183602809906006, 0.44578486680984497, 0.4797337055206299, 0.5136825442314148, 0.5476313829421997, 0.5815802216529846, 0.6155290603637695]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 4.0, 4.0, 7.0, 10.0, 10.0, 9.0, 18.0, 20.0, 17.0, 18.0, 28.0, 32.0, 41.0, 41.0, 33.0, 36.0, 41.0, 51.0, 58.0, 51.0, 48.0, 40.0, 44.0, 42.0, 41.0, 32.0, 35.0, 24.0, 30.0, 14.0, 20.0, 15.0, 22.0, 23.0, 14.0, 8.0, 8.0, 8.0, 10.0, 0.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5627540349960327, -0.5461817383766174, -0.5296093821525574, -0.5130370855331421, -0.4964647889137268, -0.47989246249198914, -0.46332013607025146, -0.4467478394508362, -0.4301755130290985, -0.41360318660736084, -0.39703088998794556, -0.3804585635662079, -0.3638862371444702, -0.34731394052505493, -0.33074161410331726, -0.3141692876815796, -0.2975969910621643, -0.28102466464042664, -0.26445236802101135, -0.24788004159927368, -0.2313077300786972, -0.21473541855812073, -0.19816309213638306, -0.18159078061580658, -0.1650184690952301, -0.14844615757465363, -0.13187384605407715, -0.11530151963233948, -0.098729208111763, -0.08215689659118652, -0.06558457762002945, -0.049012258648872375, -0.03243991732597351, -0.015867602080106735, 0.0007047131657600403, 0.017277028411626816, 0.03384934365749359, 0.05042165517807007, 0.06699397414922714, 0.08356629312038422, 0.1001386046409607, 0.11671091616153717, 0.13328322768211365, 0.14985555410385132, 0.1664278656244278, 0.18300017714500427, 0.19957250356674194, 0.21614481508731842, 0.2327171266078949, 0.24928943812847137, 0.26586174964904785, 0.2824340760707855, 0.2990064024925232, 0.3155786991119385, 0.33215102553367615, 0.3487233519554138, 0.3652956485748291, 0.3818679749965668, 0.39844027161598206, 0.4150125980377197, 0.431584894657135, 0.4481572210788727, 0.46472954750061035, 0.48130184412002563, 0.4978741705417633]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 3.0, 8.0, 6.0, 22.0, 34.0, 77.0, 107.0, 210.0, 367.0, 718.0, 1344.0, 2875.0, 5810.0, 13400.0, 31588.0, 76092.0, 184385.0, 356732.0, 217726.0, 90977.0, 37119.0, 15361.0, 7021.0, 3207.0, 1602.0, 818.0, 409.0, 243.0, 134.0, 63.0, 37.0, 23.0, 15.0, 11.0, 5.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2568359375, -0.24895668029785156, -0.24107742309570312, -0.2331981658935547, -0.22531890869140625, -0.2174396514892578, -0.20956039428710938, -0.20168113708496094, -0.1938018798828125, -0.18592262268066406, -0.17804336547851562, -0.1701641082763672, -0.16228485107421875, -0.1544055938720703, -0.14652633666992188, -0.13864707946777344, -0.130767822265625, -0.12288856506347656, -0.11500930786132812, -0.10713005065917969, -0.09925079345703125, -0.09137153625488281, -0.08349227905273438, -0.07561302185058594, -0.0677337646484375, -0.05985450744628906, -0.051975250244140625, -0.04409599304199219, -0.03621673583984375, -0.028337478637695312, -0.020458221435546875, -0.012578964233398438, -0.00469970703125, 0.0031795501708984375, 0.011058807373046875, 0.018938064575195312, 0.02681732177734375, 0.03469657897949219, 0.042575836181640625, 0.05045509338378906, 0.0583343505859375, 0.06621360778808594, 0.07409286499023438, 0.08197212219238281, 0.08985137939453125, 0.09773063659667969, 0.10560989379882812, 0.11348915100097656, 0.121368408203125, 0.12924766540527344, 0.13712692260742188, 0.1450061798095703, 0.15288543701171875, 0.1607646942138672, 0.16864395141601562, 0.17652320861816406, 0.1844024658203125, 0.19228172302246094, 0.20016098022460938, 0.2080402374267578, 0.21591949462890625, 0.2237987518310547, 0.23167800903320312, 0.23955726623535156, 0.2474365234375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 7.0, 2.0, 14.0, 16.0, 17.0, 17.0, 29.0, 29.0, 38.0, 32.0, 42.0, 41.0, 48.0, 56.0, 55.0, 64.0, 58.0, 48.0, 52.0, 45.0, 54.0, 42.0, 26.0, 30.0, 28.0, 19.0, 19.0, 23.0, 14.0, 10.0, 15.0, 7.0, 4.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.434326171875, -0.42119598388671875, -0.4080657958984375, -0.39493560791015625, -0.381805419921875, -0.36867523193359375, -0.3555450439453125, -0.34241485595703125, -0.32928466796875, -0.31615447998046875, -0.3030242919921875, -0.28989410400390625, -0.276763916015625, -0.26363372802734375, -0.2505035400390625, -0.23737335205078125, -0.2242431640625, -0.21111297607421875, -0.1979827880859375, -0.18485260009765625, -0.171722412109375, -0.15859222412109375, -0.1454620361328125, -0.13233184814453125, -0.11920166015625, -0.10607147216796875, -0.0929412841796875, -0.07981109619140625, -0.066680908203125, -0.05355072021484375, -0.0404205322265625, -0.02729034423828125, -0.01416015625, -0.00102996826171875, 0.0121002197265625, 0.02523040771484375, 0.038360595703125, 0.05149078369140625, 0.0646209716796875, 0.07775115966796875, 0.09088134765625, 0.10401153564453125, 0.1171417236328125, 0.13027191162109375, 0.143402099609375, 0.15653228759765625, 0.1696624755859375, 0.18279266357421875, 0.1959228515625, 0.20905303955078125, 0.2221832275390625, 0.23531341552734375, 0.248443603515625, 0.26157379150390625, 0.2747039794921875, 0.28783416748046875, 0.30096435546875, 0.31409454345703125, 0.3272247314453125, 0.34035491943359375, 0.353485107421875, 0.36661529541015625, 0.3797454833984375, 0.39287567138671875, 0.406005859375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 5.0, 12.0, 16.0, 27.0, 43.0, 70.0, 176.0, 423.0, 959.0, 3360.0, 13699.0, 78940.0, 528683.0, 358609.0, 50168.0, 9350.0, 2519.0, 848.0, 325.0, 137.0, 68.0, 44.0, 21.0, 24.0, 5.0, 7.0, 3.0, 0.0, 1.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.5400390625, -0.5245552062988281, -0.5090713500976562, -0.4935874938964844, -0.4781036376953125, -0.4626197814941406, -0.44713592529296875, -0.4316520690917969, -0.416168212890625, -0.4006843566894531, -0.38520050048828125, -0.3697166442871094, -0.3542327880859375, -0.3387489318847656, -0.32326507568359375, -0.3077812194824219, -0.29229736328125, -0.2768135070800781, -0.26132965087890625, -0.24584579467773438, -0.2303619384765625, -0.21487808227539062, -0.19939422607421875, -0.18391036987304688, -0.168426513671875, -0.15294265747070312, -0.13745880126953125, -0.12197494506835938, -0.1064910888671875, -0.09100723266601562, -0.07552337646484375, -0.060039520263671875, -0.0445556640625, -0.029071807861328125, -0.01358795166015625, 0.001895904541015625, 0.0173797607421875, 0.032863616943359375, 0.04834747314453125, 0.06383132934570312, 0.079315185546875, 0.09479904174804688, 0.11028289794921875, 0.12576675415039062, 0.1412506103515625, 0.15673446655273438, 0.17221832275390625, 0.18770217895507812, 0.20318603515625, 0.21866989135742188, 0.23415374755859375, 0.24963760375976562, 0.2651214599609375, 0.2806053161621094, 0.29608917236328125, 0.3115730285644531, 0.327056884765625, 0.3425407409667969, 0.35802459716796875, 0.3735084533691406, 0.3889923095703125, 0.4044761657714844, 0.41996002197265625, 0.4354438781738281, 0.450927734375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 9.0, 3.0, 7.0, 11.0, 7.0, 12.0, 17.0, 25.0, 20.0, 22.0, 24.0, 35.0, 27.0, 35.0, 35.0, 24.0, 32.0, 35.0, 46.0, 37.0, 31.0, 44.0, 42.0, 39.0, 39.0, 37.0, 33.0, 46.0, 32.0, 29.0, 21.0, 22.0, 16.0, 18.0, 25.0, 7.0, 12.0, 9.0, 8.0, 8.0, 5.0, 3.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.59521484375, -0.5749588012695312, -0.5547027587890625, -0.5344467163085938, -0.514190673828125, -0.49393463134765625, -0.4736785888671875, -0.45342254638671875, -0.43316650390625, -0.41291046142578125, -0.3926544189453125, -0.37239837646484375, -0.352142333984375, -0.33188629150390625, -0.3116302490234375, -0.29137420654296875, -0.2711181640625, -0.25086212158203125, -0.2306060791015625, -0.21035003662109375, -0.190093994140625, -0.16983795166015625, -0.1495819091796875, -0.12932586669921875, -0.10906982421875, -0.08881378173828125, -0.0685577392578125, -0.04830169677734375, -0.028045654296875, -0.00778961181640625, 0.0124664306640625, 0.03272247314453125, 0.052978515625, 0.07323455810546875, 0.0934906005859375, 0.11374664306640625, 0.134002685546875, 0.15425872802734375, 0.1745147705078125, 0.19477081298828125, 0.21502685546875, 0.23528289794921875, 0.2555389404296875, 0.27579498291015625, 0.296051025390625, 0.31630706787109375, 0.3365631103515625, 0.35681915283203125, 0.3770751953125, 0.39733123779296875, 0.4175872802734375, 0.43784332275390625, 0.458099365234375, 0.47835540771484375, 0.4986114501953125, 0.5188674926757812, 0.53912353515625, 0.5593795776367188, 0.5796356201171875, 0.5998916625976562, 0.620147705078125, 0.6404037475585938, 0.6606597900390625, 0.6809158325195312, 0.701171875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 7.0, 9.0, 15.0, 29.0, 51.0, 75.0, 135.0, 225.0, 364.0, 649.0, 1301.0, 2535.0, 5617.0, 13629.0, 40155.0, 158484.0, 516153.0, 224654.0, 53934.0, 17226.0, 6829.0, 3153.0, 1475.0, 788.0, 446.0, 255.0, 131.0, 96.0, 50.0, 28.0, 23.0, 14.0, 9.0, 5.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05572509765625, -0.0540165901184082, -0.052308082580566406, -0.05059957504272461, -0.04889106750488281, -0.047182559967041016, -0.04547405242919922, -0.04376554489135742, -0.042057037353515625, -0.04034852981567383, -0.03864002227783203, -0.036931514739990234, -0.03522300720214844, -0.03351449966430664, -0.031805992126464844, -0.030097484588623047, -0.02838897705078125, -0.026680469512939453, -0.024971961975097656, -0.02326345443725586, -0.021554946899414062, -0.019846439361572266, -0.01813793182373047, -0.016429424285888672, -0.014720916748046875, -0.013012409210205078, -0.011303901672363281, -0.009595394134521484, -0.007886886596679688, -0.006178379058837891, -0.004469871520996094, -0.002761363983154297, -0.0010528564453125, 0.0006556510925292969, 0.0023641586303710938, 0.004072666168212891, 0.0057811737060546875, 0.007489681243896484, 0.009198188781738281, 0.010906696319580078, 0.012615203857421875, 0.014323711395263672, 0.01603221893310547, 0.017740726470947266, 0.019449234008789062, 0.02115774154663086, 0.022866249084472656, 0.024574756622314453, 0.02628326416015625, 0.027991771697998047, 0.029700279235839844, 0.03140878677368164, 0.03311729431152344, 0.034825801849365234, 0.03653430938720703, 0.03824281692504883, 0.039951324462890625, 0.04165983200073242, 0.04336833953857422, 0.045076847076416016, 0.04678535461425781, 0.04849386215209961, 0.050202369689941406, 0.0519108772277832, 0.053619384765625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 4.0, 4.0, 4.0, 9.0, 6.0, 15.0, 25.0, 29.0, 54.0, 97.0, 152.0, 173.0, 130.0, 108.0, 70.0, 31.0, 34.0, 17.0, 11.0, 6.0, 7.0, 2.0, 1.0, 1.0, 3.0, 3.0, 0.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.838010787963867e-05, -7.603969424962997e-05, -7.369928061962128e-05, -7.135886698961258e-05, -6.901845335960388e-05, -6.667803972959518e-05, -6.433762609958649e-05, -6.199721246957779e-05, -5.965679883956909e-05, -5.7316385209560394e-05, -5.49759715795517e-05, -5.2635557949543e-05, -5.02951443195343e-05, -4.7954730689525604e-05, -4.561431705951691e-05, -4.327390342950821e-05, -4.093348979949951e-05, -3.8593076169490814e-05, -3.625266253948212e-05, -3.391224890947342e-05, -3.157183527946472e-05, -2.9231421649456024e-05, -2.6891008019447327e-05, -2.455059438943863e-05, -2.221018075942993e-05, -1.9869767129421234e-05, -1.7529353499412537e-05, -1.5188939869403839e-05, -1.2848526239395142e-05, -1.0508112609386444e-05, -8.167698979377747e-06, -5.827285349369049e-06, -3.4868717193603516e-06, -1.146458089351654e-06, 1.1939555406570435e-06, 3.534369170665741e-06, 5.8747828006744385e-06, 8.215196430683136e-06, 1.0555610060691833e-05, 1.2896023690700531e-05, 1.5236437320709229e-05, 1.7576850950717926e-05, 1.9917264580726624e-05, 2.225767821073532e-05, 2.459809184074402e-05, 2.6938505470752716e-05, 2.9278919100761414e-05, 3.161933273077011e-05, 3.395974636077881e-05, 3.6300159990787506e-05, 3.8640573620796204e-05, 4.09809872508049e-05, 4.33214008808136e-05, 4.5661814510822296e-05, 4.8002228140830994e-05, 5.034264177083969e-05, 5.268305540084839e-05, 5.5023469030857086e-05, 5.7363882660865784e-05, 5.970429629087448e-05, 6.204470992088318e-05, 6.438512355089188e-05, 6.672553718090057e-05, 6.906595081090927e-05, 7.140636444091797e-05]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 4.0, 3.0, 5.0, 8.0, 9.0, 15.0, 18.0, 27.0, 50.0, 78.0, 125.0, 231.0, 385.0, 850.0, 1974.0, 5439.0, 16495.0, 63447.0, 292651.0, 494909.0, 127484.0, 30042.0, 8807.0, 3065.0, 1239.0, 549.0, 283.0, 137.0, 77.0, 37.0, 37.0, 21.0, 22.0, 7.0, 9.0, 7.0, 1.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.051788330078125, -0.04995393753051758, -0.048119544982910156, -0.046285152435302734, -0.04445075988769531, -0.04261636734008789, -0.04078197479248047, -0.03894758224487305, -0.037113189697265625, -0.0352787971496582, -0.03344440460205078, -0.03161001205444336, -0.029775619506835938, -0.027941226959228516, -0.026106834411621094, -0.024272441864013672, -0.02243804931640625, -0.020603656768798828, -0.018769264221191406, -0.016934871673583984, -0.015100479125976562, -0.01326608657836914, -0.011431694030761719, -0.009597301483154297, -0.007762908935546875, -0.005928516387939453, -0.004094123840332031, -0.0022597312927246094, -0.0004253387451171875, 0.0014090538024902344, 0.0032434463500976562, 0.005077838897705078, 0.0069122314453125, 0.008746623992919922, 0.010581016540527344, 0.012415409088134766, 0.014249801635742188, 0.01608419418334961, 0.01791858673095703, 0.019752979278564453, 0.021587371826171875, 0.023421764373779297, 0.02525615692138672, 0.02709054946899414, 0.028924942016601562, 0.030759334564208984, 0.032593727111816406, 0.03442811965942383, 0.03626251220703125, 0.03809690475463867, 0.039931297302246094, 0.041765689849853516, 0.04360008239746094, 0.04543447494506836, 0.04726886749267578, 0.0491032600402832, 0.050937652587890625, 0.05277204513549805, 0.05460643768310547, 0.05644083023071289, 0.05827522277832031, 0.060109615325927734, 0.061944007873535156, 0.06377840042114258, 0.06561279296875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 1.0, 6.0, 4.0, 13.0, 7.0, 10.0, 10.0, 16.0, 18.0, 17.0, 23.0, 28.0, 35.0, 46.0, 63.0, 69.0, 84.0, 90.0, 78.0, 87.0, 68.0, 48.0, 42.0, 25.0, 34.0, 21.0, 14.0, 11.0, 8.0, 8.0, 6.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01470947265625, -0.014224767684936523, -0.013740062713623047, -0.01325535774230957, -0.012770652770996094, -0.012285947799682617, -0.01180124282836914, -0.011316537857055664, -0.010831832885742188, -0.010347127914428711, -0.009862422943115234, -0.009377717971801758, -0.008893013000488281, -0.008408308029174805, -0.007923603057861328, -0.0074388980865478516, -0.006954193115234375, -0.0064694881439208984, -0.005984783172607422, -0.005500078201293945, -0.005015373229980469, -0.004530668258666992, -0.004045963287353516, -0.003561258316040039, -0.0030765533447265625, -0.002591848373413086, -0.0021071434020996094, -0.0016224384307861328, -0.0011377334594726562, -0.0006530284881591797, -0.00016832351684570312, 0.00031638145446777344, 0.00080108642578125, 0.0012857913970947266, 0.0017704963684082031, 0.0022552013397216797, 0.0027399063110351562, 0.003224611282348633, 0.0037093162536621094, 0.004194021224975586, 0.0046787261962890625, 0.005163431167602539, 0.005648136138916016, 0.006132841110229492, 0.006617546081542969, 0.007102251052856445, 0.007586956024169922, 0.008071660995483398, 0.008556365966796875, 0.009041070938110352, 0.009525775909423828, 0.010010480880737305, 0.010495185852050781, 0.010979890823364258, 0.011464595794677734, 0.011949300765991211, 0.012434005737304688, 0.012918710708618164, 0.01340341567993164, 0.013888120651245117, 0.014372825622558594, 0.01485753059387207, 0.015342235565185547, 0.015826940536499023, 0.0163116455078125]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 3.0, 2.0, 4.0, 7.0, 9.0, 11.0, 23.0, 39.0, 34.0, 76.0, 93.0, 108.0, 110.0, 120.0, 96.0, 72.0, 74.0, 31.0, 26.0, 23.0, 11.0, 12.0, 3.0, 4.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.8066639304161072, -0.7877929210662842, -0.768921971321106, -0.750050961971283, -0.7311800122261047, -0.7123090028762817, -0.6934380531311035, -0.6745670437812805, -0.6556960344314575, -0.6368250250816345, -0.6179540753364563, -0.5990830659866333, -0.5802121162414551, -0.5613411068916321, -0.5424701571464539, -0.5235991477966309, -0.5047281980514526, -0.485857218503952, -0.4669862389564514, -0.4481152594089508, -0.4292442798614502, -0.4103732705116272, -0.3915022909641266, -0.372631311416626, -0.35376033186912537, -0.33488935232162476, -0.31601837277412415, -0.29714739322662354, -0.27827638387680054, -0.2594054341316223, -0.24053442478179932, -0.2216634452342987, -0.20279240608215332, -0.1839214265346527, -0.1650504469871521, -0.1461794525384903, -0.12730847299098969, -0.10843749344348907, -0.08956650644540787, -0.07069551944732666, -0.05182453989982605, -0.03295355662703514, -0.014082573354244232, 0.004788409918546677, 0.023659393191337585, 0.042530372738838196, 0.0614013597369194, 0.08027234673500061, 0.09914332628250122, 0.11801430583000183, 0.13688528537750244, 0.15575627982616425, 0.17462725937366486, 0.19349823892116547, 0.21236923336982727, 0.23124021291732788, 0.2501111924648285, 0.2689821720123291, 0.2878531515598297, 0.3067241311073303, 0.3255951404571533, 0.34446609020233154, 0.36333709955215454, 0.38220807909965515, 0.40107905864715576]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 10.0, 5.0, 10.0, 14.0, 17.0, 21.0, 17.0, 23.0, 26.0, 46.0, 42.0, 36.0, 40.0, 46.0, 42.0, 57.0, 59.0, 51.0, 46.0, 54.0, 40.0, 42.0, 35.0, 39.0, 29.0, 19.0, 17.0, 29.0, 15.0, 20.0, 11.0, 11.0, 11.0, 12.0, 3.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3913864493370056, -0.3797988295555115, -0.36821120977401733, -0.3566235899925232, -0.34503600001335144, -0.3334483802318573, -0.32186076045036316, -0.310273140668869, -0.2986855208873749, -0.28709790110588074, -0.2755102813243866, -0.26392269134521484, -0.2523350715637207, -0.24074745178222656, -0.22915983200073242, -0.21757221221923828, -0.20598460733890533, -0.1943969875574112, -0.18280938267707825, -0.1712217628955841, -0.15963414311408997, -0.14804652333259583, -0.13645891845226288, -0.12487129867076874, -0.1132836863398552, -0.10169607400894165, -0.09010845422744751, -0.07852084189653397, -0.06693322956562042, -0.05534560978412628, -0.04375799745321274, -0.0321703776717186, -0.020582765340805054, -0.008995150215923786, 0.0025924649089574814, 0.014180079102516174, 0.025767695158720016, 0.03735531121492386, 0.0489429235458374, 0.06053054332733154, 0.07211815565824509, 0.08370576798915863, 0.09529338777065277, 0.10688100010156631, 0.11846861243247986, 0.130056232213974, 0.14164385199546814, 0.15323147177696228, 0.16481907665729523, 0.17640669643878937, 0.18799430131912231, 0.19958192110061646, 0.2111695408821106, 0.22275716066360474, 0.23434476554393768, 0.24593238532543182, 0.25751999020576477, 0.2691076099872589, 0.28069522976875305, 0.2922828197479248, 0.30387043952941895, 0.3154580593109131, 0.3270456790924072, 0.33863329887390137, 0.3502209186553955]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 8.0, 6.0, 10.0, 18.0, 23.0, 41.0, 65.0, 82.0, 124.0, 199.0, 296.0, 416.0, 618.0, 918.0, 1441.0, 2015.0, 3241.0, 5295.0, 8581.0, 14935.0, 27754.0, 57524.0, 145658.0, 393674.0, 224425.0, 78790.0, 35759.0, 18661.0, 10564.0, 6178.0, 3891.0, 2531.0, 1609.0, 1058.0, 703.0, 448.0, 317.0, 203.0, 144.0, 98.0, 71.0, 60.0, 34.0, 23.0, 27.0, 11.0, 5.0, 4.0, 3.0, 1.0, 2.0], "bins": [-0.20263671875, -0.197113037109375, -0.19158935546875, -0.186065673828125, -0.1805419921875, -0.175018310546875, -0.16949462890625, -0.163970947265625, -0.158447265625, -0.152923583984375, -0.14739990234375, -0.141876220703125, -0.1363525390625, -0.130828857421875, -0.12530517578125, -0.119781494140625, -0.1142578125, -0.108734130859375, -0.10321044921875, -0.097686767578125, -0.0921630859375, -0.086639404296875, -0.08111572265625, -0.075592041015625, -0.070068359375, -0.064544677734375, -0.05902099609375, -0.053497314453125, -0.0479736328125, -0.042449951171875, -0.03692626953125, -0.031402587890625, -0.02587890625, -0.020355224609375, -0.01483154296875, -0.009307861328125, -0.0037841796875, 0.001739501953125, 0.00726318359375, 0.012786865234375, 0.018310546875, 0.023834228515625, 0.02935791015625, 0.034881591796875, 0.0404052734375, 0.045928955078125, 0.05145263671875, 0.056976318359375, 0.0625, 0.068023681640625, 0.07354736328125, 0.079071044921875, 0.0845947265625, 0.090118408203125, 0.09564208984375, 0.101165771484375, 0.106689453125, 0.112213134765625, 0.11773681640625, 0.123260498046875, 0.1287841796875, 0.134307861328125, 0.13983154296875, 0.145355224609375, 0.15087890625]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 4.0, 6.0, 7.0, 9.0, 16.0, 11.0, 16.0, 26.0, 20.0, 18.0, 34.0, 34.0, 41.0, 35.0, 40.0, 40.0, 57.0, 47.0, 55.0, 50.0, 46.0, 48.0, 52.0, 47.0, 25.0, 35.0, 30.0, 27.0, 26.0, 16.0, 17.0, 8.0, 12.0, 11.0, 12.0, 7.0, 5.0, 3.0, 7.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.74853515625, -0.7275390625, -0.70654296875, -0.685546875, -0.66455078125, -0.6435546875, -0.62255859375, -0.6015625, -0.58056640625, -0.5595703125, -0.53857421875, -0.517578125, -0.49658203125, -0.4755859375, -0.45458984375, -0.43359375, -0.41259765625, -0.3916015625, -0.37060546875, -0.349609375, -0.32861328125, -0.3076171875, -0.28662109375, -0.265625, -0.24462890625, -0.2236328125, -0.20263671875, -0.181640625, -0.16064453125, -0.1396484375, -0.11865234375, -0.09765625, -0.07666015625, -0.0556640625, -0.03466796875, -0.013671875, 0.00732421875, 0.0283203125, 0.04931640625, 0.0703125, 0.09130859375, 0.1123046875, 0.13330078125, 0.154296875, 0.17529296875, 0.1962890625, 0.21728515625, 0.23828125, 0.25927734375, 0.2802734375, 0.30126953125, 0.322265625, 0.34326171875, 0.3642578125, 0.38525390625, 0.40625, 0.42724609375, 0.4482421875, 0.46923828125, 0.490234375, 0.51123046875, 0.5322265625, 0.55322265625, 0.57421875, 0.59521484375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 1.0, 3.0, 3.0, 2.0, 14.0, 18.0, 9.0, 9.0, 25.0, 26.0, 40.0, 60.0, 61.0, 74.0, 100.0, 223.0, 2284.0, 1000399.0, 44165.0, 484.0, 139.0, 87.0, 69.0, 59.0, 39.0, 42.0, 27.0, 26.0, 16.0, 15.0, 10.0, 7.0, 7.0, 2.0, 8.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.2421875, -2.173736572265625, -2.10528564453125, -2.036834716796875, -1.9683837890625, -1.899932861328125, -1.83148193359375, -1.763031005859375, -1.694580078125, -1.626129150390625, -1.55767822265625, -1.489227294921875, -1.4207763671875, -1.352325439453125, -1.28387451171875, -1.215423583984375, -1.14697265625, -1.078521728515625, -1.01007080078125, -0.941619873046875, -0.8731689453125, -0.804718017578125, -0.73626708984375, -0.667816162109375, -0.599365234375, -0.530914306640625, -0.46246337890625, -0.394012451171875, -0.3255615234375, -0.257110595703125, -0.18865966796875, -0.120208740234375, -0.0517578125, 0.016693115234375, 0.08514404296875, 0.153594970703125, 0.2220458984375, 0.290496826171875, 0.35894775390625, 0.427398681640625, 0.495849609375, 0.564300537109375, 0.63275146484375, 0.701202392578125, 0.7696533203125, 0.838104248046875, 0.90655517578125, 0.975006103515625, 1.04345703125, 1.111907958984375, 1.18035888671875, 1.248809814453125, 1.3172607421875, 1.385711669921875, 1.45416259765625, 1.522613525390625, 1.591064453125, 1.659515380859375, 1.72796630859375, 1.796417236328125, 1.8648681640625, 1.933319091796875, 2.00177001953125, 2.070220947265625, 2.138671875]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 0.0, 2.0, 4.0, 3.0, 10.0, 16.0, 12.0, 11.0, 15.0, 14.0, 28.0, 30.0, 52.0, 51.0, 48.0, 41.0, 54.0, 57.0, 57.0, 65.0, 50.0, 47.0, 46.0, 47.0, 38.0, 38.0, 34.0, 26.0, 27.0, 18.0, 16.0, 15.0, 9.0, 5.0, 7.0, 3.0, 3.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.90185546875, -0.8743362426757812, -0.8468170166015625, -0.8192977905273438, -0.791778564453125, -0.7642593383789062, -0.7367401123046875, -0.7092208862304688, -0.68170166015625, -0.6541824340820312, -0.6266632080078125, -0.5991439819335938, -0.571624755859375, -0.5441055297851562, -0.5165863037109375, -0.48906707763671875, -0.4615478515625, -0.43402862548828125, -0.4065093994140625, -0.37899017333984375, -0.351470947265625, -0.32395172119140625, -0.2964324951171875, -0.26891326904296875, -0.24139404296875, -0.21387481689453125, -0.1863555908203125, -0.15883636474609375, -0.131317138671875, -0.10379791259765625, -0.0762786865234375, -0.04875946044921875, -0.021240234375, 0.00627899169921875, 0.0337982177734375, 0.06131744384765625, 0.088836669921875, 0.11635589599609375, 0.1438751220703125, 0.17139434814453125, 0.19891357421875, 0.22643280029296875, 0.2539520263671875, 0.28147125244140625, 0.308990478515625, 0.33650970458984375, 0.3640289306640625, 0.39154815673828125, 0.4190673828125, 0.44658660888671875, 0.4741058349609375, 0.5016250610351562, 0.529144287109375, 0.5566635131835938, 0.5841827392578125, 0.6117019653320312, 0.63922119140625, 0.6667404174804688, 0.6942596435546875, 0.7217788696289062, 0.749298095703125, 0.7768173217773438, 0.8043365478515625, 0.8318557739257812, 0.859375]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 1.0, 5.0, 6.0, 4.0, 5.0, 6.0, 9.0, 20.0, 25.0, 30.0, 50.0, 80.0, 170.0, 472.0, 1888.0, 12088.0, 718777.0, 302768.0, 9614.0, 1701.0, 451.0, 163.0, 82.0, 40.0, 28.0, 15.0, 13.0, 9.0, 11.0, 5.0, 5.0, 4.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.434326171875, -0.41982269287109375, -0.4053192138671875, -0.39081573486328125, -0.376312255859375, -0.36180877685546875, -0.3473052978515625, -0.33280181884765625, -0.31829833984375, -0.30379486083984375, -0.2892913818359375, -0.27478790283203125, -0.260284423828125, -0.24578094482421875, -0.2312774658203125, -0.21677398681640625, -0.2022705078125, -0.18776702880859375, -0.1732635498046875, -0.15876007080078125, -0.144256591796875, -0.12975311279296875, -0.1152496337890625, -0.10074615478515625, -0.08624267578125, -0.07173919677734375, -0.0572357177734375, -0.04273223876953125, -0.028228759765625, -0.01372528076171875, 0.0007781982421875, 0.01528167724609375, 0.02978515625, 0.04428863525390625, 0.0587921142578125, 0.07329559326171875, 0.087799072265625, 0.10230255126953125, 0.1168060302734375, 0.13130950927734375, 0.14581298828125, 0.16031646728515625, 0.1748199462890625, 0.18932342529296875, 0.203826904296875, 0.21833038330078125, 0.2328338623046875, 0.24733734130859375, 0.2618408203125, 0.27634429931640625, 0.2908477783203125, 0.30535125732421875, 0.319854736328125, 0.33435821533203125, 0.3488616943359375, 0.36336517333984375, 0.37786865234375, 0.39237213134765625, 0.4068756103515625, 0.42137908935546875, 0.435882568359375, 0.45038604736328125, 0.4648895263671875, 0.47939300537109375, 0.493896484375]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 6.0, 6.0, 5.0, 8.0, 10.0, 22.0, 28.0, 31.0, 64.0, 194.0, 343.0, 131.0, 58.0, 26.0, 23.0, 16.0, 7.0, 7.0, 1.0, 1.0, 5.0, 3.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2498111724853516e-05, -4.1048042476177216e-05, -3.9597973227500916e-05, -3.8147903978824615e-05, -3.6697834730148315e-05, -3.5247765481472015e-05, -3.3797696232795715e-05, -3.2347626984119415e-05, -3.0897557735443115e-05, -2.9447488486766815e-05, -2.7997419238090515e-05, -2.6547349989414215e-05, -2.5097280740737915e-05, -2.3647211492061615e-05, -2.2197142243385315e-05, -2.0747072994709015e-05, -1.9297003746032715e-05, -1.7846934497356415e-05, -1.6396865248680115e-05, -1.4946796000003815e-05, -1.3496726751327515e-05, -1.2046657502651215e-05, -1.0596588253974915e-05, -9.146519005298615e-06, -7.696449756622314e-06, -6.246380507946014e-06, -4.796311259269714e-06, -3.3462420105934143e-06, -1.8961727619171143e-06, -4.461035132408142e-07, 1.0039657354354858e-06, 2.454034984111786e-06, 3.904104232788086e-06, 5.354173481464386e-06, 6.804242730140686e-06, 8.254311978816986e-06, 9.704381227493286e-06, 1.1154450476169586e-05, 1.2604519724845886e-05, 1.4054588973522186e-05, 1.5504658222198486e-05, 1.6954727470874786e-05, 1.8404796719551086e-05, 1.9854865968227386e-05, 2.1304935216903687e-05, 2.2755004465579987e-05, 2.4205073714256287e-05, 2.5655142962932587e-05, 2.7105212211608887e-05, 2.8555281460285187e-05, 3.0005350708961487e-05, 3.145541995763779e-05, 3.290548920631409e-05, 3.435555845499039e-05, 3.580562770366669e-05, 3.725569695234299e-05, 3.870576620101929e-05, 4.015583544969559e-05, 4.160590469837189e-05, 4.305597394704819e-05, 4.450604319572449e-05, 4.595611244440079e-05, 4.740618169307709e-05, 4.885625094175339e-05, 5.030632019042969e-05]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 5.0, 11.0, 13.0, 11.0, 58.0, 116.0, 452.0, 3053.0, 166903.0, 872791.0, 4281.0, 585.0, 147.0, 54.0, 26.0, 21.0, 5.0, 6.0, 6.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.76220703125, -0.7360000610351562, -0.7097930908203125, -0.6835861206054688, -0.657379150390625, -0.6311721801757812, -0.6049652099609375, -0.5787582397460938, -0.55255126953125, -0.5263442993164062, -0.5001373291015625, -0.47393035888671875, -0.447723388671875, -0.42151641845703125, -0.3953094482421875, -0.36910247802734375, -0.3428955078125, -0.31668853759765625, -0.2904815673828125, -0.26427459716796875, -0.238067626953125, -0.21186065673828125, -0.1856536865234375, -0.15944671630859375, -0.13323974609375, -0.10703277587890625, -0.0808258056640625, -0.05461883544921875, -0.028411865234375, -0.00220489501953125, 0.0240020751953125, 0.05020904541015625, 0.076416015625, 0.10262298583984375, 0.1288299560546875, 0.15503692626953125, 0.181243896484375, 0.20745086669921875, 0.2336578369140625, 0.25986480712890625, 0.28607177734375, 0.31227874755859375, 0.3384857177734375, 0.36469268798828125, 0.390899658203125, 0.41710662841796875, 0.4433135986328125, 0.46952056884765625, 0.4957275390625, 0.5219345092773438, 0.5481414794921875, 0.5743484497070312, 0.600555419921875, 0.6267623901367188, 0.6529693603515625, 0.6791763305664062, 0.70538330078125, 0.7315902709960938, 0.7577972412109375, 0.7840042114257812, 0.810211181640625, 0.8364181518554688, 0.8626251220703125, 0.8888320922851562, 0.9150390625]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 3.0, 0.0, 2.0, 3.0, 5.0, 5.0, 15.0, 11.0, 21.0, 20.0, 47.0, 83.0, 164.0, 297.0, 132.0, 76.0, 42.0, 27.0, 11.0, 15.0, 7.0, 3.0, 6.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12371826171875, -0.11989498138427734, -0.11607170104980469, -0.11224842071533203, -0.10842514038085938, -0.10460186004638672, -0.10077857971191406, -0.0969552993774414, -0.09313201904296875, -0.0893087387084961, -0.08548545837402344, -0.08166217803955078, -0.07783889770507812, -0.07401561737060547, -0.07019233703613281, -0.06636905670166016, -0.0625457763671875, -0.058722496032714844, -0.05489921569824219, -0.05107593536376953, -0.047252655029296875, -0.04342937469482422, -0.03960609436035156, -0.035782814025878906, -0.03195953369140625, -0.028136253356933594, -0.024312973022460938, -0.02048969268798828, -0.016666412353515625, -0.012843132019042969, -0.009019851684570312, -0.005196571350097656, -0.001373291015625, 0.0024499893188476562, 0.0062732696533203125, 0.010096549987792969, 0.013919830322265625, 0.01774311065673828, 0.021566390991210938, 0.025389671325683594, 0.02921295166015625, 0.033036231994628906, 0.03685951232910156, 0.04068279266357422, 0.044506072998046875, 0.04832935333251953, 0.05215263366699219, 0.055975914001464844, 0.0597991943359375, 0.06362247467041016, 0.06744575500488281, 0.07126903533935547, 0.07509231567382812, 0.07891559600830078, 0.08273887634277344, 0.0865621566772461, 0.09038543701171875, 0.0942087173461914, 0.09803199768066406, 0.10185527801513672, 0.10567855834960938, 0.10950183868408203, 0.11332511901855469, 0.11714839935302734, 0.1209716796875]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [19.0, 374.0, 585.0, 39.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6702286005020142, -0.35472747683525085, -0.03922635316848755, 0.27627480030059814, 0.5917758941650391, 0.90727698802948, 1.2227782011032104, 1.5382791757583618, 1.8537803888320923, 2.169281482696533, 2.4847826957702637, 2.800283908843994, 3.1157848834991455, 3.431285858154297, 3.7467870712280273, 4.062288284301758, 4.377789497375488, 4.693290710449219, 5.008791923522949, 5.32429313659668, 5.639793872833252, 5.955295085906982, 6.270796298980713, 6.586297035217285, 6.901798248291016, 7.217299461364746, 7.532800674438477, 7.848301887512207, 8.163803100585938, 8.479303359985352, 8.794805526733398, 9.110305786132812, 9.425806999206543, 9.741308212280273, 10.056809425354004, 10.372310638427734, 10.687811851501465, 11.003313064575195, 11.31881332397461, 11.63431453704834, 11.94981575012207, 12.2653169631958, 12.580818176269531, 12.896319389343262, 13.211820602416992, 13.527320861816406, 13.842823028564453, 14.158323287963867, 14.473825454711914, 14.789326667785645, 15.104827880859375, 15.420329093933105, 15.735830307006836, 16.05133056640625, 16.366832733154297, 16.68233299255371, 16.997833251953125, 17.31333351135254, 17.628835678100586, 17.9443359375, 18.259838104248047, 18.57533836364746, 18.890840530395508, 19.206340789794922, 19.52184295654297]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 4.0, 3.0, 2.0, 4.0, 6.0, 13.0, 11.0, 12.0, 7.0, 10.0, 18.0, 27.0, 20.0, 28.0, 29.0, 24.0, 35.0, 28.0, 31.0, 45.0, 41.0, 49.0, 50.0, 34.0, 34.0, 37.0, 52.0, 44.0, 39.0, 39.0, 33.0, 25.0, 29.0, 25.0, 21.0, 14.0, 17.0, 16.0, 12.0, 10.0, 8.0, 4.0, 8.0, 4.0, 5.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.803426206111908, -0.7724162340164185, -0.7414062023162842, -0.7103962302207947, -0.6793862581253052, -0.6483762264251709, -0.6173662543296814, -0.5863562822341919, -0.5553462505340576, -0.5243362784385681, -0.49332624673843384, -0.46231627464294434, -0.43130627274513245, -0.40029627084732056, -0.36928629875183105, -0.33827629685401917, -0.3072662949562073, -0.2762562930583954, -0.2452463060617447, -0.214236319065094, -0.1832263171672821, -0.15221631526947021, -0.12120632827281952, -0.09019634127616882, -0.059186339378356934, -0.02817634493112564, 0.002833649516105652, 0.033843643963336945, 0.06485363841056824, 0.09586364030838013, 0.12687362730503082, 0.15788361430168152, 0.18889367580413818, 0.21990367770195007, 0.25091367959976196, 0.28192365169525146, 0.31293365359306335, 0.34394365549087524, 0.37495362758636475, 0.40596362948417664, 0.4369736313819885, 0.4679836332798004, 0.4989936351776123, 0.5300036072731018, 0.5610135793685913, 0.5920236110687256, 0.6230335831642151, 0.6540435552597046, 0.6850535869598389, 0.7160635590553284, 0.7470735907554626, 0.7780835628509521, 0.8090935945510864, 0.8401035666465759, 0.8711135387420654, 0.9021235704421997, 0.9331335425376892, 0.9641435146331787, 0.995153546333313, 1.0261635780334473, 1.057173490524292, 1.0881835222244263, 1.1191935539245605, 1.1502034664154053, 1.1812134981155396]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 5.0, 9.0, 12.0, 13.0, 24.0, 25.0, 26.0, 53.0, 60.0, 93.0, 160.0, 195.0, 295.0, 579.0, 948.0, 1631.0, 3216.0, 6991.0, 18275.0, 64984.0, 407807.0, 2128040.0, 1307615.0, 192519.0, 37977.0, 11951.0, 4904.0, 2497.0, 1314.0, 775.0, 475.0, 256.0, 172.0, 127.0, 65.0, 57.0, 46.0, 24.0, 23.0, 18.0, 6.0, 7.0, 5.0, 5.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.59375, -0.5744781494140625, -0.555206298828125, -0.5359344482421875, -0.51666259765625, -0.4973907470703125, -0.478118896484375, -0.4588470458984375, -0.4395751953125, -0.4203033447265625, -0.401031494140625, -0.3817596435546875, -0.36248779296875, -0.3432159423828125, -0.323944091796875, -0.3046722412109375, -0.285400390625, -0.2661285400390625, -0.246856689453125, -0.2275848388671875, -0.20831298828125, -0.1890411376953125, -0.169769287109375, -0.1504974365234375, -0.1312255859375, -0.1119537353515625, -0.092681884765625, -0.0734100341796875, -0.05413818359375, -0.0348663330078125, -0.015594482421875, 0.0036773681640625, 0.02294921875, 0.0422210693359375, 0.061492919921875, 0.0807647705078125, 0.10003662109375, 0.1193084716796875, 0.138580322265625, 0.1578521728515625, 0.1771240234375, 0.1963958740234375, 0.215667724609375, 0.2349395751953125, 0.25421142578125, 0.2734832763671875, 0.292755126953125, 0.3120269775390625, 0.331298828125, 0.3505706787109375, 0.369842529296875, 0.3891143798828125, 0.40838623046875, 0.4276580810546875, 0.446929931640625, 0.4662017822265625, 0.4854736328125, 0.5047454833984375, 0.524017333984375, 0.5432891845703125, 0.56256103515625, 0.5818328857421875, 0.601104736328125, 0.6203765869140625, 0.6396484375]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 1.0, 1.0, 2.0, 4.0, 9.0, 7.0, 9.0, 17.0, 14.0, 18.0, 29.0, 19.0, 27.0, 37.0, 30.0, 49.0, 42.0, 44.0, 38.0, 39.0, 53.0, 46.0, 53.0, 57.0, 46.0, 43.0, 53.0, 37.0, 27.0, 29.0, 23.0, 25.0, 16.0, 16.0, 11.0, 11.0, 2.0, 6.0, 5.0, 3.0, 4.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.438720703125, -0.42501068115234375, -0.4113006591796875, -0.39759063720703125, -0.383880615234375, -0.37017059326171875, -0.3564605712890625, -0.34275054931640625, -0.32904052734375, -0.31533050537109375, -0.3016204833984375, -0.28791046142578125, -0.274200439453125, -0.26049041748046875, -0.2467803955078125, -0.23307037353515625, -0.2193603515625, -0.20565032958984375, -0.1919403076171875, -0.17823028564453125, -0.164520263671875, -0.15081024169921875, -0.1371002197265625, -0.12339019775390625, -0.10968017578125, -0.09597015380859375, -0.0822601318359375, -0.06855010986328125, -0.054840087890625, -0.04113006591796875, -0.0274200439453125, -0.01371002197265625, 0.0, 0.01371002197265625, 0.0274200439453125, 0.04113006591796875, 0.054840087890625, 0.06855010986328125, 0.0822601318359375, 0.09597015380859375, 0.10968017578125, 0.12339019775390625, 0.1371002197265625, 0.15081024169921875, 0.164520263671875, 0.17823028564453125, 0.1919403076171875, 0.20565032958984375, 0.2193603515625, 0.23307037353515625, 0.2467803955078125, 0.26049041748046875, 0.274200439453125, 0.28791046142578125, 0.3016204833984375, 0.31533050537109375, 0.32904052734375, 0.34275054931640625, 0.3564605712890625, 0.37017059326171875, 0.383880615234375, 0.39759063720703125, 0.4113006591796875, 0.42501068115234375, 0.438720703125]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 8.0, 12.0, 14.0, 15.0, 34.0, 55.0, 122.0, 252.0, 713.0, 2180.0, 24322.0, 4040277.0, 120257.0, 4402.0, 924.0, 353.0, 166.0, 80.0, 42.0, 15.0, 15.0, 5.0, 9.0, 5.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.326171875, -2.24212646484375, -2.1580810546875, -2.07403564453125, -1.989990234375, -1.90594482421875, -1.8218994140625, -1.73785400390625, -1.65380859375, -1.56976318359375, -1.4857177734375, -1.40167236328125, -1.317626953125, -1.23358154296875, -1.1495361328125, -1.06549072265625, -0.9814453125, -0.89739990234375, -0.8133544921875, -0.72930908203125, -0.645263671875, -0.56121826171875, -0.4771728515625, -0.39312744140625, -0.30908203125, -0.22503662109375, -0.1409912109375, -0.05694580078125, 0.027099609375, 0.11114501953125, 0.1951904296875, 0.27923583984375, 0.36328125, 0.44732666015625, 0.5313720703125, 0.61541748046875, 0.699462890625, 0.78350830078125, 0.8675537109375, 0.95159912109375, 1.03564453125, 1.11968994140625, 1.2037353515625, 1.28778076171875, 1.371826171875, 1.45587158203125, 1.5399169921875, 1.62396240234375, 1.7080078125, 1.79205322265625, 1.8760986328125, 1.96014404296875, 2.044189453125, 2.12823486328125, 2.2122802734375, 2.29632568359375, 2.38037109375, 2.46441650390625, 2.5484619140625, 2.63250732421875, 2.716552734375, 2.80059814453125, 2.8846435546875, 2.96868896484375, 3.052734375]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 9.0, 15.0, 21.0, 44.0, 90.0, 170.0, 389.0, 1061.0, 1315.0, 513.0, 208.0, 115.0, 58.0, 30.0, 15.0, 11.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5400390625, -0.5242156982421875, -0.508392333984375, -0.4925689697265625, -0.47674560546875, -0.4609222412109375, -0.445098876953125, -0.4292755126953125, -0.4134521484375, -0.3976287841796875, -0.381805419921875, -0.3659820556640625, -0.35015869140625, -0.3343353271484375, -0.318511962890625, -0.3026885986328125, -0.286865234375, -0.2710418701171875, -0.255218505859375, -0.2393951416015625, -0.22357177734375, -0.2077484130859375, -0.191925048828125, -0.1761016845703125, -0.1602783203125, -0.1444549560546875, -0.128631591796875, -0.1128082275390625, -0.09698486328125, -0.0811614990234375, -0.065338134765625, -0.0495147705078125, -0.03369140625, -0.0178680419921875, -0.002044677734375, 0.0137786865234375, 0.02960205078125, 0.0454254150390625, 0.061248779296875, 0.0770721435546875, 0.0928955078125, 0.1087188720703125, 0.124542236328125, 0.1403656005859375, 0.15618896484375, 0.1720123291015625, 0.187835693359375, 0.2036590576171875, 0.219482421875, 0.2353057861328125, 0.251129150390625, 0.2669525146484375, 0.28277587890625, 0.2985992431640625, 0.314422607421875, 0.3302459716796875, 0.3460693359375, 0.3618927001953125, 0.377716064453125, 0.3935394287109375, 0.40936279296875, 0.4251861572265625, 0.441009521484375, 0.4568328857421875, 0.47265625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 7.0, 8.0, 9.0, 12.0, 13.0, 16.0, 26.0, 34.0, 59.0, 51.0, 63.0, 95.0, 93.0, 92.0, 83.0, 72.0, 51.0, 61.0, 42.0, 28.0, 19.0, 11.0, 17.0, 10.0, 8.0, 2.0, 4.0, 2.0, 4.0, 0.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.699211597442627, -0.6760556697845459, -0.6528997421264648, -0.6297438144683838, -0.6065878868103027, -0.5834318995475769, -0.5602759718894958, -0.5371200442314148, -0.5139641165733337, -0.4908081889152527, -0.46765226125717163, -0.4444963037967682, -0.42134037613868713, -0.3981844484806061, -0.37502849102020264, -0.3518725633621216, -0.3287166357040405, -0.3055607080459595, -0.2824047803878784, -0.259248822927475, -0.23609289526939392, -0.21293696761131287, -0.18978102505207062, -0.16662508249282837, -0.14346915483474731, -0.12031321972608566, -0.09715728461742401, -0.07400134950876236, -0.05084541440010071, -0.027689479291439056, -0.004533544182777405, 0.018622398376464844, 0.04177826642990112, 0.06493420153856277, 0.08809013664722443, 0.11124607175588608, 0.13440200686454773, 0.15755793452262878, 0.18071387708187103, 0.20386981964111328, 0.22702574729919434, 0.2501816749572754, 0.27333760261535645, 0.2964935600757599, 0.31964948773384094, 0.342805415391922, 0.36596137285232544, 0.3891173005104065, 0.41227322816848755, 0.4354291558265686, 0.45858508348464966, 0.4817410409450531, 0.5048969984054565, 0.5280529260635376, 0.5512088537216187, 0.5743647813796997, 0.5975207090377808, 0.6206766366958618, 0.6438325643539429, 0.6669884920120239, 0.690144419670105, 0.7133004069328308, 0.7364563345909119, 0.7596122622489929, 0.782768189907074]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 4.0, 7.0, 18.0, 17.0, 13.0, 20.0, 19.0, 27.0, 22.0, 26.0, 42.0, 40.0, 39.0, 38.0, 52.0, 40.0, 44.0, 44.0, 35.0, 49.0, 47.0, 43.0, 48.0, 30.0, 41.0, 33.0, 30.0, 16.0, 23.0, 23.0, 12.0, 18.0, 7.0, 9.0, 6.0, 0.0, 2.0, 7.0, 1.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5059067606925964, -0.4903792440891266, -0.47485169768333435, -0.4593241810798645, -0.44379663467407227, -0.4282691180706024, -0.41274160146713257, -0.39721405506134033, -0.3816865384578705, -0.36615902185440063, -0.3506314754486084, -0.33510395884513855, -0.3195764422416687, -0.30404889583587646, -0.2885213792324066, -0.27299386262893677, -0.25746631622314453, -0.2419387847185135, -0.22641125321388245, -0.2108837366104126, -0.19535620510578156, -0.1798286736011505, -0.16430115699768066, -0.14877362549304962, -0.13324609398841858, -0.11771856248378754, -0.10219103842973709, -0.08666351437568665, -0.0711359828710556, -0.05560845136642456, -0.040080927312374115, -0.02455340325832367, -0.009025901556015015, 0.006501626223325729, 0.022029154002666473, 0.03755668178200722, 0.05308420956134796, 0.068611741065979, 0.08413926512002945, 0.0996667891740799, 0.11519432067871094, 0.13072185218334198, 0.14624938368797302, 0.16177690029144287, 0.1773044317960739, 0.19283196330070496, 0.2083594799041748, 0.22388701140880585, 0.2394145429134369, 0.25494205951690674, 0.270469605922699, 0.2859971225261688, 0.30152463912963867, 0.3170521855354309, 0.33257970213890076, 0.3481072187423706, 0.36363476514816284, 0.3791622817516327, 0.3946898281574249, 0.4102173447608948, 0.425744891166687, 0.44127240777015686, 0.4567999243736267, 0.47232747077941895, 0.4878549873828888]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 1.0, 11.0, 28.0, 30.0, 43.0, 61.0, 84.0, 140.0, 201.0, 417.0, 671.0, 1205.0, 2156.0, 3900.0, 7597.0, 15276.0, 33023.0, 79385.0, 218782.0, 389526.0, 174699.0, 65599.0, 27926.0, 13227.0, 6635.0, 3494.0, 1833.0, 1033.0, 582.0, 398.0, 227.0, 119.0, 91.0, 53.0, 42.0, 21.0, 8.0, 7.0, 8.0, 2.0, 5.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2176513671875, -0.2111339569091797, -0.20461654663085938, -0.19809913635253906, -0.19158172607421875, -0.18506431579589844, -0.17854690551757812, -0.1720294952392578, -0.1655120849609375, -0.1589946746826172, -0.15247726440429688, -0.14595985412597656, -0.13944244384765625, -0.13292503356933594, -0.12640762329101562, -0.11989021301269531, -0.113372802734375, -0.10685539245605469, -0.10033798217773438, -0.09382057189941406, -0.08730316162109375, -0.08078575134277344, -0.07426834106445312, -0.06775093078613281, -0.0612335205078125, -0.05471611022949219, -0.048198699951171875, -0.04168128967285156, -0.03516387939453125, -0.028646469116210938, -0.022129058837890625, -0.015611648559570312, -0.00909423828125, -0.0025768280029296875, 0.003940582275390625, 0.010457992553710938, 0.01697540283203125, 0.023492813110351562, 0.030010223388671875, 0.03652763366699219, 0.0430450439453125, 0.04956245422363281, 0.056079864501953125, 0.06259727478027344, 0.06911468505859375, 0.07563209533691406, 0.08214950561523438, 0.08866691589355469, 0.095184326171875, 0.10170173645019531, 0.10821914672851562, 0.11473655700683594, 0.12125396728515625, 0.12777137756347656, 0.13428878784179688, 0.1408061981201172, 0.1473236083984375, 0.1538410186767578, 0.16035842895507812, 0.16687583923339844, 0.17339324951171875, 0.17991065979003906, 0.18642807006835938, 0.1929454803466797, 0.199462890625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 9.0, 7.0, 15.0, 11.0, 15.0, 21.0, 20.0, 21.0, 21.0, 43.0, 31.0, 45.0, 48.0, 60.0, 52.0, 61.0, 54.0, 48.0, 49.0, 46.0, 53.0, 35.0, 40.0, 35.0, 32.0, 25.0, 21.0, 21.0, 15.0, 16.0, 6.0, 8.0, 5.0, 1.0, 6.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.310791015625, -0.3002510070800781, -0.28971099853515625, -0.2791709899902344, -0.2686309814453125, -0.2580909729003906, -0.24755096435546875, -0.23701095581054688, -0.226470947265625, -0.21593093872070312, -0.20539093017578125, -0.19485092163085938, -0.1843109130859375, -0.17377090454101562, -0.16323089599609375, -0.15269088745117188, -0.14215087890625, -0.13161087036132812, -0.12107086181640625, -0.11053085327148438, -0.0999908447265625, -0.08945083618164062, -0.07891082763671875, -0.06837081909179688, -0.057830810546875, -0.047290802001953125, -0.03675079345703125, -0.026210784912109375, -0.0156707763671875, -0.005130767822265625, 0.00540924072265625, 0.015949249267578125, 0.0264892578125, 0.037029266357421875, 0.04756927490234375, 0.058109283447265625, 0.0686492919921875, 0.07918930053710938, 0.08972930908203125, 0.10026931762695312, 0.110809326171875, 0.12134933471679688, 0.13188934326171875, 0.14242935180664062, 0.1529693603515625, 0.16350936889648438, 0.17404937744140625, 0.18458938598632812, 0.19512939453125, 0.20566940307617188, 0.21620941162109375, 0.22674942016601562, 0.2372894287109375, 0.24782943725585938, 0.25836944580078125, 0.2689094543457031, 0.279449462890625, 0.2899894714355469, 0.30052947998046875, 0.3110694885253906, 0.3216094970703125, 0.3321495056152344, 0.34268951416015625, 0.3532295227050781, 0.36376953125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 4.0, 5.0, 2.0, 4.0, 7.0, 12.0, 11.0, 24.0, 28.0, 45.0, 54.0, 97.0, 164.0, 241.0, 348.0, 599.0, 1003.0, 1881.0, 3519.0, 7202.0, 16436.0, 39745.0, 112087.0, 337862.0, 341775.0, 113687.0, 40159.0, 16202.0, 7314.0, 3657.0, 1779.0, 1077.0, 555.0, 333.0, 211.0, 140.0, 96.0, 62.0, 41.0, 35.0, 25.0, 11.0, 13.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2132568359375, -0.20764541625976562, -0.20203399658203125, -0.19642257690429688, -0.1908111572265625, -0.18519973754882812, -0.17958831787109375, -0.17397689819335938, -0.168365478515625, -0.16275405883789062, -0.15714263916015625, -0.15153121948242188, -0.1459197998046875, -0.14030838012695312, -0.13469696044921875, -0.12908554077148438, -0.12347412109375, -0.11786270141601562, -0.11225128173828125, -0.10663986206054688, -0.1010284423828125, -0.09541702270507812, -0.08980560302734375, -0.08419418334960938, -0.078582763671875, -0.07297134399414062, -0.06735992431640625, -0.061748504638671875, -0.0561370849609375, -0.050525665283203125, -0.04491424560546875, -0.039302825927734375, -0.03369140625, -0.028079986572265625, -0.02246856689453125, -0.016857147216796875, -0.0112457275390625, -0.005634307861328125, -2.288818359375e-05, 0.005588531494140625, 0.011199951171875, 0.016811370849609375, 0.02242279052734375, 0.028034210205078125, 0.0336456298828125, 0.039257049560546875, 0.04486846923828125, 0.050479888916015625, 0.05609130859375, 0.061702728271484375, 0.06731414794921875, 0.07292556762695312, 0.0785369873046875, 0.08414840698242188, 0.08975982666015625, 0.09537124633789062, 0.100982666015625, 0.10659408569335938, 0.11220550537109375, 0.11781692504882812, 0.1234283447265625, 0.12903976440429688, 0.13465118408203125, 0.14026260375976562, 0.1458740234375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 4.0, 4.0, 5.0, 8.0, 11.0, 8.0, 17.0, 10.0, 24.0, 22.0, 35.0, 29.0, 39.0, 47.0, 39.0, 45.0, 48.0, 58.0, 54.0, 49.0, 52.0, 48.0, 52.0, 57.0, 36.0, 32.0, 36.0, 32.0, 24.0, 13.0, 15.0, 14.0, 19.0, 5.0, 4.0, 4.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.74072265625, -0.7204437255859375, -0.700164794921875, -0.6798858642578125, -0.65960693359375, -0.6393280029296875, -0.619049072265625, -0.5987701416015625, -0.5784912109375, -0.5582122802734375, -0.537933349609375, -0.5176544189453125, -0.49737548828125, -0.4770965576171875, -0.456817626953125, -0.4365386962890625, -0.416259765625, -0.3959808349609375, -0.375701904296875, -0.3554229736328125, -0.33514404296875, -0.3148651123046875, -0.294586181640625, -0.2743072509765625, -0.2540283203125, -0.2337493896484375, -0.213470458984375, -0.1931915283203125, -0.17291259765625, -0.1526336669921875, -0.132354736328125, -0.1120758056640625, -0.091796875, -0.0715179443359375, -0.051239013671875, -0.0309600830078125, -0.01068115234375, 0.0095977783203125, 0.029876708984375, 0.0501556396484375, 0.0704345703125, 0.0907135009765625, 0.110992431640625, 0.1312713623046875, 0.15155029296875, 0.1718292236328125, 0.192108154296875, 0.2123870849609375, 0.232666015625, 0.2529449462890625, 0.273223876953125, 0.2935028076171875, 0.31378173828125, 0.3340606689453125, 0.354339599609375, 0.3746185302734375, 0.3948974609375, 0.4151763916015625, 0.435455322265625, 0.4557342529296875, 0.47601318359375, 0.4962921142578125, 0.516571044921875, 0.5368499755859375, 0.55712890625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 6.0, 6.0, 11.0, 12.0, 25.0, 26.0, 35.0, 73.0, 129.0, 255.0, 559.0, 1359.0, 4002.0, 16515.0, 123834.0, 791252.0, 91163.0, 13523.0, 3487.0, 1230.0, 487.0, 265.0, 113.0, 64.0, 53.0, 24.0, 9.0, 14.0, 7.0, 10.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.18115234375, -0.17678070068359375, -0.1724090576171875, -0.16803741455078125, -0.163665771484375, -0.15929412841796875, -0.1549224853515625, -0.15055084228515625, -0.14617919921875, -0.14180755615234375, -0.1374359130859375, -0.13306427001953125, -0.128692626953125, -0.12432098388671875, -0.1199493408203125, -0.11557769775390625, -0.1112060546875, -0.10683441162109375, -0.1024627685546875, -0.09809112548828125, -0.093719482421875, -0.08934783935546875, -0.0849761962890625, -0.08060455322265625, -0.07623291015625, -0.07186126708984375, -0.0674896240234375, -0.06311798095703125, -0.058746337890625, -0.05437469482421875, -0.0500030517578125, -0.04563140869140625, -0.041259765625, -0.03688812255859375, -0.0325164794921875, -0.02814483642578125, -0.023773193359375, -0.01940155029296875, -0.0150299072265625, -0.01065826416015625, -0.00628662109375, -0.00191497802734375, 0.0024566650390625, 0.00682830810546875, 0.011199951171875, 0.01557159423828125, 0.0199432373046875, 0.02431488037109375, 0.0286865234375, 0.03305816650390625, 0.0374298095703125, 0.04180145263671875, 0.046173095703125, 0.05054473876953125, 0.0549163818359375, 0.05928802490234375, 0.06365966796875, 0.06803131103515625, 0.0724029541015625, 0.07677459716796875, 0.081146240234375, 0.08551788330078125, 0.0898895263671875, 0.09426116943359375, 0.0986328125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 4.0, 4.0, 8.0, 7.0, 8.0, 11.0, 15.0, 20.0, 33.0, 26.0, 40.0, 74.0, 106.0, 164.0, 154.0, 105.0, 58.0, 37.0, 21.0, 29.0, 13.0, 12.0, 8.0, 10.0, 3.0, 7.0, 3.0, 6.0, 5.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.103515625e-05, -5.9118494391441345e-05, -5.720183253288269e-05, -5.5285170674324036e-05, -5.336850881576538e-05, -5.1451846957206726e-05, -4.953518509864807e-05, -4.7618523240089417e-05, -4.570186138153076e-05, -4.378519952297211e-05, -4.186853766441345e-05, -3.99518758058548e-05, -3.803521394729614e-05, -3.611855208873749e-05, -3.420189023017883e-05, -3.228522837162018e-05, -3.0368566513061523e-05, -2.845190465450287e-05, -2.6535242795944214e-05, -2.461858093738556e-05, -2.2701919078826904e-05, -2.078525722026825e-05, -1.8868595361709595e-05, -1.695193350315094e-05, -1.5035271644592285e-05, -1.311860978603363e-05, -1.1201947927474976e-05, -9.28528606891632e-06, -7.368624210357666e-06, -5.451962351799011e-06, -3.5353004932403564e-06, -1.6186386346817017e-06, 2.980232238769531e-07, 2.214685082435608e-06, 4.131346940994263e-06, 6.0480087995529175e-06, 7.964670658111572e-06, 9.881332516670227e-06, 1.1797994375228882e-05, 1.3714656233787537e-05, 1.563131809234619e-05, 1.7547979950904846e-05, 1.94646418094635e-05, 2.1381303668022156e-05, 2.329796552658081e-05, 2.5214627385139465e-05, 2.713128924369812e-05, 2.9047951102256775e-05, 3.096461296081543e-05, 3.2881274819374084e-05, 3.479793667793274e-05, 3.6714598536491394e-05, 3.863126039505005e-05, 4.0547922253608704e-05, 4.246458411216736e-05, 4.438124597072601e-05, 4.629790782928467e-05, 4.821456968784332e-05, 5.013123154640198e-05, 5.204789340496063e-05, 5.396455526351929e-05, 5.588121712207794e-05, 5.77978789806366e-05, 5.971454083919525e-05, 6.16312026977539e-05]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 5.0, 5.0, 3.0, 8.0, 8.0, 13.0, 21.0, 25.0, 37.0, 43.0, 77.0, 118.0, 232.0, 377.0, 647.0, 1354.0, 3065.0, 10284.0, 61848.0, 773106.0, 170673.0, 18286.0, 4558.0, 1747.0, 892.0, 416.0, 254.0, 152.0, 97.0, 67.0, 42.0, 24.0, 26.0, 18.0, 11.0, 8.0, 6.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0], "bins": [-0.15673828125, -0.1522197723388672, -0.14770126342773438, -0.14318275451660156, -0.13866424560546875, -0.13414573669433594, -0.12962722778320312, -0.1251087188720703, -0.1205902099609375, -0.11607170104980469, -0.11155319213867188, -0.10703468322753906, -0.10251617431640625, -0.09799766540527344, -0.09347915649414062, -0.08896064758300781, -0.084442138671875, -0.07992362976074219, -0.07540512084960938, -0.07088661193847656, -0.06636810302734375, -0.06184959411621094, -0.057331085205078125, -0.05281257629394531, -0.0482940673828125, -0.04377555847167969, -0.039257049560546875, -0.03473854064941406, -0.03022003173828125, -0.025701522827148438, -0.021183013916015625, -0.016664505004882812, -0.01214599609375, -0.0076274871826171875, -0.003108978271484375, 0.0014095306396484375, 0.00592803955078125, 0.010446548461914062, 0.014965057373046875, 0.019483566284179688, 0.0240020751953125, 0.028520584106445312, 0.033039093017578125, 0.03755760192871094, 0.04207611083984375, 0.04659461975097656, 0.051113128662109375, 0.05563163757324219, 0.060150146484375, 0.06466865539550781, 0.06918716430664062, 0.07370567321777344, 0.07822418212890625, 0.08274269104003906, 0.08726119995117188, 0.09177970886230469, 0.0962982177734375, 0.10081672668457031, 0.10533523559570312, 0.10985374450683594, 0.11437225341796875, 0.11889076232910156, 0.12340927124023438, 0.1279277801513672, 0.1324462890625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 5.0, 9.0, 19.0, 19.0, 37.0, 38.0, 55.0, 105.0, 131.0, 189.0, 124.0, 87.0, 47.0, 45.0, 21.0, 17.0, 19.0, 10.0, 3.0, 10.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.0301666259765625, -0.029288768768310547, -0.028410911560058594, -0.02753305435180664, -0.026655197143554688, -0.025777339935302734, -0.02489948272705078, -0.024021625518798828, -0.023143768310546875, -0.022265911102294922, -0.02138805389404297, -0.020510196685791016, -0.019632339477539062, -0.01875448226928711, -0.017876625061035156, -0.016998767852783203, -0.01612091064453125, -0.015243053436279297, -0.014365196228027344, -0.01348733901977539, -0.012609481811523438, -0.011731624603271484, -0.010853767395019531, -0.009975910186767578, -0.009098052978515625, -0.008220195770263672, -0.007342338562011719, -0.006464481353759766, -0.0055866241455078125, -0.004708766937255859, -0.0038309097290039062, -0.002953052520751953, -0.0020751953125, -0.0011973381042480469, -0.00031948089599609375, 0.0005583763122558594, 0.0014362335205078125, 0.0023140907287597656, 0.0031919479370117188, 0.004069805145263672, 0.004947662353515625, 0.005825519561767578, 0.006703376770019531, 0.007581233978271484, 0.008459091186523438, 0.00933694839477539, 0.010214805603027344, 0.011092662811279297, 0.01197052001953125, 0.012848377227783203, 0.013726234436035156, 0.01460409164428711, 0.015481948852539062, 0.016359806060791016, 0.01723766326904297, 0.018115520477294922, 0.018993377685546875, 0.019871234893798828, 0.02074909210205078, 0.021626949310302734, 0.022504806518554688, 0.02338266372680664, 0.024260520935058594, 0.025138378143310547, 0.0260162353515625]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 7.0, 9.0, 16.0, 20.0, 27.0, 37.0, 44.0, 44.0, 59.0, 89.0, 73.0, 115.0, 107.0, 78.0, 61.0, 50.0, 39.0, 32.0, 25.0, 13.0, 9.0, 6.0, 4.0, 8.0, 6.0, 5.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.45680394768714905, -0.44278910756111145, -0.42877423763275146, -0.41475939750671387, -0.40074455738067627, -0.3867296874523163, -0.3727148473262787, -0.3586999773979187, -0.3446851372718811, -0.3306702971458435, -0.3166554272174835, -0.3026405870914459, -0.28862571716308594, -0.27461087703704834, -0.26059603691101074, -0.24658118188381195, -0.23256632685661316, -0.21855147182941437, -0.20453661680221558, -0.19052177667617798, -0.1765069216489792, -0.1624920666217804, -0.1484772264957428, -0.134462371468544, -0.12044751644134521, -0.10643266141414642, -0.09241781383752823, -0.07840296626091003, -0.06438811123371124, -0.05037325620651245, -0.03635840862989426, -0.022343561053276062, -0.008328676223754883, 0.00568617507815361, 0.019701026380062103, 0.033715877681970596, 0.04773072898387909, 0.06174558401107788, 0.07576043158769608, 0.08977527916431427, 0.10379013419151306, 0.11780498921871185, 0.13181984424591064, 0.14583468437194824, 0.15984953939914703, 0.17386439442634583, 0.18787923455238342, 0.20189408957958221, 0.215908944606781, 0.2299237996339798, 0.2439386546611786, 0.2579534947872162, 0.27196836471557617, 0.28598320484161377, 0.29999804496765137, 0.31401288509368896, 0.32802775502204895, 0.34204259514808655, 0.35605746507644653, 0.37007230520248413, 0.38408714532852173, 0.3981020152568817, 0.4121168553829193, 0.4261317253112793, 0.4401465654373169]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 9.0, 7.0, 19.0, 24.0, 28.0, 22.0, 33.0, 34.0, 47.0, 45.0, 51.0, 53.0, 58.0, 54.0, 68.0, 53.0, 58.0, 52.0, 51.0, 36.0, 41.0, 32.0, 23.0, 23.0, 24.0, 20.0, 9.0, 4.0, 3.0, 5.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3513355851173401, -0.34003373980522156, -0.328731894493103, -0.3174300789833069, -0.30612823367118835, -0.2948263883590698, -0.2835245728492737, -0.27222272753715515, -0.2609208822250366, -0.2496190369129181, -0.23831720650196075, -0.22701537609100342, -0.2157135307788849, -0.20441168546676636, -0.19310985505580902, -0.18180802464485168, -0.17050617933273315, -0.15920433402061462, -0.1479025036096573, -0.13660067319869995, -0.12529882788658142, -0.11399699002504349, -0.10269515216350555, -0.09139331430196762, -0.08009147644042969, -0.06878963857889175, -0.05748780071735382, -0.04618596285581589, -0.034884124994277954, -0.02358228713274002, -0.012280449271202087, -0.000978611409664154, 0.010323196649551392, 0.021625034511089325, 0.03292687237262726, 0.04422871023416519, 0.055530548095703125, 0.06683238595724106, 0.07813422381877899, 0.08943606168031693, 0.10073789954185486, 0.11203973740339279, 0.12334157526493073, 0.13464340567588806, 0.1459452509880066, 0.15724709630012512, 0.16854892671108246, 0.1798507571220398, 0.19115260243415833, 0.20245444774627686, 0.2137562781572342, 0.22505810856819153, 0.23635995388031006, 0.2476617991924286, 0.2589636445045471, 0.27026546001434326, 0.2815673053264618, 0.2928691506385803, 0.30417096614837646, 0.315472811460495, 0.3267746567726135, 0.33807650208473206, 0.3493783473968506, 0.36068016290664673, 0.37198200821876526]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 5.0, 5.0, 5.0, 10.0, 14.0, 18.0, 54.0, 52.0, 110.0, 148.0, 262.0, 445.0, 807.0, 1521.0, 3102.0, 6527.0, 14966.0, 37959.0, 134551.0, 658078.0, 125997.0, 36655.0, 14495.0, 6435.0, 2963.0, 1481.0, 799.0, 419.0, 261.0, 142.0, 94.0, 64.0, 34.0, 18.0, 14.0, 16.0, 17.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 4.0, 1.0], "bins": [-0.537109375, -0.5231513977050781, -0.5091934204101562, -0.4952354431152344, -0.4812774658203125, -0.4673194885253906, -0.45336151123046875, -0.4394035339355469, -0.425445556640625, -0.4114875793457031, -0.39752960205078125, -0.3835716247558594, -0.3696136474609375, -0.3556556701660156, -0.34169769287109375, -0.3277397155761719, -0.31378173828125, -0.2998237609863281, -0.28586578369140625, -0.2719078063964844, -0.2579498291015625, -0.24399185180664062, -0.23003387451171875, -0.21607589721679688, -0.202117919921875, -0.18815994262695312, -0.17420196533203125, -0.16024398803710938, -0.1462860107421875, -0.13232803344726562, -0.11837005615234375, -0.10441207885742188, -0.0904541015625, -0.07649612426757812, -0.06253814697265625, -0.048580169677734375, -0.0346221923828125, -0.020664215087890625, -0.00670623779296875, 0.007251739501953125, 0.021209716796875, 0.035167694091796875, 0.04912567138671875, 0.06308364868164062, 0.0770416259765625, 0.09099960327148438, 0.10495758056640625, 0.11891555786132812, 0.13287353515625, 0.14683151245117188, 0.16078948974609375, 0.17474746704101562, 0.1887054443359375, 0.20266342163085938, 0.21662139892578125, 0.23057937622070312, 0.244537353515625, 0.2584953308105469, 0.27245330810546875, 0.2864112854003906, 0.3003692626953125, 0.3143272399902344, 0.32828521728515625, 0.3422431945800781, 0.356201171875]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 4.0, 7.0, 3.0, 9.0, 12.0, 16.0, 18.0, 28.0, 38.0, 33.0, 23.0, 43.0, 45.0, 60.0, 50.0, 55.0, 60.0, 62.0, 67.0, 50.0, 46.0, 44.0, 51.0, 35.0, 28.0, 22.0, 21.0, 16.0, 20.0, 15.0, 8.0, 4.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.744140625, -0.7214736938476562, -0.6988067626953125, -0.6761398315429688, -0.653472900390625, -0.6308059692382812, -0.6081390380859375, -0.5854721069335938, -0.56280517578125, -0.5401382446289062, -0.5174713134765625, -0.49480438232421875, -0.472137451171875, -0.44947052001953125, -0.4268035888671875, -0.40413665771484375, -0.3814697265625, -0.35880279541015625, -0.3361358642578125, -0.31346893310546875, -0.290802001953125, -0.26813507080078125, -0.2454681396484375, -0.22280120849609375, -0.20013427734375, -0.17746734619140625, -0.1548004150390625, -0.13213348388671875, -0.109466552734375, -0.08679962158203125, -0.0641326904296875, -0.04146575927734375, -0.018798828125, 0.00386810302734375, 0.0265350341796875, 0.04920196533203125, 0.071868896484375, 0.09453582763671875, 0.1172027587890625, 0.13986968994140625, 0.16253662109375, 0.18520355224609375, 0.2078704833984375, 0.23053741455078125, 0.253204345703125, 0.27587127685546875, 0.2985382080078125, 0.32120513916015625, 0.3438720703125, 0.36653900146484375, 0.3892059326171875, 0.41187286376953125, 0.434539794921875, 0.45720672607421875, 0.4798736572265625, 0.5025405883789062, 0.52520751953125, 0.5478744506835938, 0.5705413818359375, 0.5932083129882812, 0.615875244140625, 0.6385421752929688, 0.6612091064453125, 0.6838760375976562, 0.70654296875]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 0.0, 5.0, 3.0, 7.0, 5.0, 13.0, 5.0, 13.0, 16.0, 17.0, 17.0, 16.0, 26.0, 24.0, 35.0, 52.0, 57.0, 75.0, 187.0, 957.0, 26887.0, 1009751.0, 9382.0, 533.0, 128.0, 74.0, 42.0, 43.0, 31.0, 24.0, 20.0, 25.0, 16.0, 15.0, 14.0, 9.0, 13.0, 4.0, 8.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4140625, -2.3345947265625, -2.255126953125, -2.1756591796875, -2.09619140625, -2.0167236328125, -1.937255859375, -1.8577880859375, -1.7783203125, -1.6988525390625, -1.619384765625, -1.5399169921875, -1.46044921875, -1.3809814453125, -1.301513671875, -1.2220458984375, -1.142578125, -1.0631103515625, -0.983642578125, -0.9041748046875, -0.82470703125, -0.7452392578125, -0.665771484375, -0.5863037109375, -0.5068359375, -0.4273681640625, -0.347900390625, -0.2684326171875, -0.18896484375, -0.1094970703125, -0.030029296875, 0.0494384765625, 0.12890625, 0.2083740234375, 0.287841796875, 0.3673095703125, 0.44677734375, 0.5262451171875, 0.605712890625, 0.6851806640625, 0.7646484375, 0.8441162109375, 0.923583984375, 1.0030517578125, 1.08251953125, 1.1619873046875, 1.241455078125, 1.3209228515625, 1.400390625, 1.4798583984375, 1.559326171875, 1.6387939453125, 1.71826171875, 1.7977294921875, 1.877197265625, 1.9566650390625, 2.0361328125, 2.1156005859375, 2.195068359375, 2.2745361328125, 2.35400390625, 2.4334716796875, 2.512939453125, 2.5924072265625, 2.671875]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 8.0, 3.0, 5.0, 5.0, 8.0, 12.0, 15.0, 8.0, 18.0, 16.0, 16.0, 22.0, 31.0, 36.0, 35.0, 34.0, 46.0, 31.0, 37.0, 41.0, 50.0, 33.0, 48.0, 42.0, 45.0, 41.0, 40.0, 30.0, 26.0, 24.0, 31.0, 27.0, 19.0, 21.0, 20.0, 16.0, 12.0, 15.0, 12.0, 7.0, 2.0, 5.0, 2.0, 3.0, 3.0, 5.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.5302734375, -0.5126495361328125, -0.495025634765625, -0.4774017333984375, -0.45977783203125, -0.4421539306640625, -0.424530029296875, -0.4069061279296875, -0.3892822265625, -0.3716583251953125, -0.354034423828125, -0.3364105224609375, -0.31878662109375, -0.3011627197265625, -0.283538818359375, -0.2659149169921875, -0.248291015625, -0.2306671142578125, -0.213043212890625, -0.1954193115234375, -0.17779541015625, -0.1601715087890625, -0.142547607421875, -0.1249237060546875, -0.1072998046875, -0.0896759033203125, -0.072052001953125, -0.0544281005859375, -0.03680419921875, -0.0191802978515625, -0.001556396484375, 0.0160675048828125, 0.03369140625, 0.0513153076171875, 0.068939208984375, 0.0865631103515625, 0.10418701171875, 0.1218109130859375, 0.139434814453125, 0.1570587158203125, 0.1746826171875, 0.1923065185546875, 0.209930419921875, 0.2275543212890625, 0.24517822265625, 0.2628021240234375, 0.280426025390625, 0.2980499267578125, 0.315673828125, 0.3332977294921875, 0.350921630859375, 0.3685455322265625, 0.38616943359375, 0.4037933349609375, 0.421417236328125, 0.4390411376953125, 0.4566650390625, 0.4742889404296875, 0.491912841796875, 0.5095367431640625, 0.52716064453125, 0.5447845458984375, 0.562408447265625, 0.5800323486328125, 0.59765625]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 2.0, 3.0, 9.0, 11.0, 10.0, 14.0, 19.0, 45.0, 78.0, 201.0, 520.0, 1743.0, 7682.0, 165736.0, 855921.0, 12883.0, 2512.0, 710.0, 225.0, 98.0, 41.0, 31.0, 16.0, 9.0, 8.0, 8.0, 6.0, 2.0, 2.0, 5.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.525390625, -0.508514404296875, -0.49163818359375, -0.474761962890625, -0.4578857421875, -0.441009521484375, -0.42413330078125, -0.407257080078125, -0.390380859375, -0.373504638671875, -0.35662841796875, -0.339752197265625, -0.3228759765625, -0.305999755859375, -0.28912353515625, -0.272247314453125, -0.25537109375, -0.238494873046875, -0.22161865234375, -0.204742431640625, -0.1878662109375, -0.170989990234375, -0.15411376953125, -0.137237548828125, -0.120361328125, -0.103485107421875, -0.08660888671875, -0.069732666015625, -0.0528564453125, -0.035980224609375, -0.01910400390625, -0.002227783203125, 0.0146484375, 0.031524658203125, 0.04840087890625, 0.065277099609375, 0.0821533203125, 0.099029541015625, 0.11590576171875, 0.132781982421875, 0.149658203125, 0.166534423828125, 0.18341064453125, 0.200286865234375, 0.2171630859375, 0.234039306640625, 0.25091552734375, 0.267791748046875, 0.28466796875, 0.301544189453125, 0.31842041015625, 0.335296630859375, 0.3521728515625, 0.369049072265625, 0.38592529296875, 0.402801513671875, 0.419677734375, 0.436553955078125, 0.45343017578125, 0.470306396484375, 0.4871826171875, 0.504058837890625, 0.52093505859375, 0.537811279296875, 0.5546875]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 5.0, 5.0, 8.0, 10.0, 12.0, 17.0, 21.0, 32.0, 74.0, 234.0, 339.0, 100.0, 56.0, 30.0, 21.0, 14.0, 5.0, 4.0, 4.0, 0.0, 1.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.40614128112793e-05, -5.2072107791900635e-05, -5.008280277252197e-05, -4.809349775314331e-05, -4.610419273376465e-05, -4.4114887714385986e-05, -4.2125582695007324e-05, -4.013627767562866e-05, -3.814697265625e-05, -3.615766763687134e-05, -3.4168362617492676e-05, -3.2179057598114014e-05, -3.018975257873535e-05, -2.820044755935669e-05, -2.6211142539978027e-05, -2.4221837520599365e-05, -2.2232532501220703e-05, -2.024322748184204e-05, -1.825392246246338e-05, -1.6264617443084717e-05, -1.4275312423706055e-05, -1.2286007404327393e-05, -1.029670238494873e-05, -8.307397365570068e-06, -6.318092346191406e-06, -4.328787326812744e-06, -2.339482307434082e-06, -3.501772880554199e-07, 1.6391277313232422e-06, 3.6284327507019043e-06, 5.617737770080566e-06, 7.6070427894592285e-06, 9.59634780883789e-06, 1.1585652828216553e-05, 1.3574957847595215e-05, 1.5564262866973877e-05, 1.755356788635254e-05, 1.95428729057312e-05, 2.1532177925109863e-05, 2.3521482944488525e-05, 2.5510787963867188e-05, 2.750009298324585e-05, 2.9489398002624512e-05, 3.1478703022003174e-05, 3.3468008041381836e-05, 3.54573130607605e-05, 3.744661808013916e-05, 3.943592309951782e-05, 4.1425228118896484e-05, 4.3414533138275146e-05, 4.540383815765381e-05, 4.739314317703247e-05, 4.938244819641113e-05, 5.1371753215789795e-05, 5.336105823516846e-05, 5.535036325454712e-05, 5.733966827392578e-05, 5.932897329330444e-05, 6.13182783126831e-05, 6.330758333206177e-05, 6.529688835144043e-05, 6.728619337081909e-05, 6.927549839019775e-05, 7.126480340957642e-05, 7.325410842895508e-05]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 2.0, 7.0, 10.0, 18.0, 23.0, 35.0, 60.0, 104.0, 198.0, 463.0, 1233.0, 4783.0, 39781.0, 944849.0, 49509.0, 5241.0, 1321.0, 446.0, 195.0, 117.0, 60.0, 36.0, 30.0, 7.0, 9.0, 5.0, 4.0, 6.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.409423828125, -0.39556121826171875, -0.3816986083984375, -0.36783599853515625, -0.353973388671875, -0.34011077880859375, -0.3262481689453125, -0.31238555908203125, -0.29852294921875, -0.28466033935546875, -0.2707977294921875, -0.25693511962890625, -0.243072509765625, -0.22920989990234375, -0.2153472900390625, -0.20148468017578125, -0.1876220703125, -0.17375946044921875, -0.1598968505859375, -0.14603424072265625, -0.132171630859375, -0.11830902099609375, -0.1044464111328125, -0.09058380126953125, -0.07672119140625, -0.06285858154296875, -0.0489959716796875, -0.03513336181640625, -0.021270751953125, -0.00740814208984375, 0.0064544677734375, 0.02031707763671875, 0.0341796875, 0.04804229736328125, 0.0619049072265625, 0.07576751708984375, 0.089630126953125, 0.10349273681640625, 0.1173553466796875, 0.13121795654296875, 0.14508056640625, 0.15894317626953125, 0.1728057861328125, 0.18666839599609375, 0.200531005859375, 0.21439361572265625, 0.2282562255859375, 0.24211883544921875, 0.2559814453125, 0.26984405517578125, 0.2837066650390625, 0.29756927490234375, 0.311431884765625, 0.32529449462890625, 0.3391571044921875, 0.35301971435546875, 0.36688232421875, 0.38074493408203125, 0.3946075439453125, 0.40847015380859375, 0.422332763671875, 0.43619537353515625, 0.4500579833984375, 0.46392059326171875, 0.477783203125]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 5.0, 3.0, 5.0, 4.0, 8.0, 22.0, 23.0, 43.0, 73.0, 187.0, 348.0, 123.0, 63.0, 42.0, 14.0, 14.0, 9.0, 3.0, 8.0, 7.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.206298828125, -0.20142269134521484, -0.1965465545654297, -0.19167041778564453, -0.18679428100585938, -0.18191814422607422, -0.17704200744628906, -0.1721658706665039, -0.16728973388671875, -0.1624135971069336, -0.15753746032714844, -0.15266132354736328, -0.14778518676757812, -0.14290904998779297, -0.1380329132080078, -0.13315677642822266, -0.1282806396484375, -0.12340450286865234, -0.11852836608886719, -0.11365222930908203, -0.10877609252929688, -0.10389995574951172, -0.09902381896972656, -0.0941476821899414, -0.08927154541015625, -0.0843954086303711, -0.07951927185058594, -0.07464313507080078, -0.06976699829101562, -0.06489086151123047, -0.06001472473144531, -0.055138587951660156, -0.050262451171875, -0.045386314392089844, -0.04051017761230469, -0.03563404083251953, -0.030757904052734375, -0.02588176727294922, -0.021005630493164062, -0.016129493713378906, -0.01125335693359375, -0.006377220153808594, -0.0015010833740234375, 0.0033750534057617188, 0.008251190185546875, 0.013127326965332031, 0.018003463745117188, 0.022879600524902344, 0.0277557373046875, 0.032631874084472656, 0.03750801086425781, 0.04238414764404297, 0.047260284423828125, 0.05213642120361328, 0.05701255798339844, 0.061888694763183594, 0.06676483154296875, 0.0716409683227539, 0.07651710510253906, 0.08139324188232422, 0.08626937866210938, 0.09114551544189453, 0.09602165222167969, 0.10089778900146484, 0.10577392578125]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [4.0, 32.0, 400.0, 524.0, 53.0, 8.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.85219407081604, -0.5773032307624817, -0.30241239070892334, -0.02752155065536499, 0.24736928939819336, 0.5222601890563965, 0.7971509695053101, 1.0720417499542236, 1.3469326496124268, 1.6218235492706299, 1.8967143297195435, 2.171605110168457, 2.44649600982666, 2.7213869094848633, 2.9962778091430664, 3.2711684703826904, 3.5460593700408936, 3.8209502696990967, 4.095840930938721, 4.370731830596924, 4.645622730255127, 4.92051362991333, 5.195404529571533, 5.470294952392578, 5.745185852050781, 6.020076751708984, 6.2949676513671875, 6.569858551025391, 6.844749450683594, 7.119640350341797, 7.394530773162842, 7.669421672821045, 7.944313049316406, 8.21920394897461, 8.494094848632812, 8.768985748291016, 9.043876647949219, 9.318767547607422, 9.593658447265625, 9.868549346923828, 10.143440246582031, 10.418331146240234, 10.693222045898438, 10.96811294555664, 11.243003845214844, 11.517894744873047, 11.79278564453125, 12.067676544189453, 12.34256649017334, 12.617457389831543, 12.892348289489746, 13.16723918914795, 13.442130088806152, 13.717020988464355, 13.991911888122559, 14.266801834106445, 14.541692733764648, 14.816583633422852, 15.091474533081055, 15.366365432739258, 15.641256332397461, 15.916147232055664, 16.191038131713867, 16.46592903137207, 16.740819931030273]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 6.0, 4.0, 12.0, 10.0, 7.0, 17.0, 20.0, 15.0, 29.0, 32.0, 33.0, 40.0, 47.0, 41.0, 46.0, 50.0, 44.0, 61.0, 50.0, 38.0, 57.0, 43.0, 49.0, 28.0, 34.0, 33.0, 25.0, 27.0, 20.0, 19.0, 9.0, 17.0, 10.0, 7.0, 6.0, 4.0, 5.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.9638789892196655, -0.9347702264785767, -0.9056615233421326, -0.8765528202056885, -0.8474440574645996, -0.8183352947235107, -0.7892265915870667, -0.7601178884506226, -0.7310091257095337, -0.7019003629684448, -0.6727916598320007, -0.6436829566955566, -0.6145741939544678, -0.5854654312133789, -0.5563567280769348, -0.5272480249404907, -0.49813926219940186, -0.4690305292606354, -0.4399217963218689, -0.4108130633831024, -0.38170433044433594, -0.35259559750556946, -0.323486864566803, -0.2943781316280365, -0.26526939868927, -0.23616066575050354, -0.20705193281173706, -0.17794319987297058, -0.1488344669342041, -0.11972573399543762, -0.09061700105667114, -0.06150826811790466, -0.032399535179138184, -0.003290802240371704, 0.025817930698394775, 0.054926663637161255, 0.08403539657592773, 0.11314412951469421, 0.1422528624534607, 0.17136159539222717, 0.20047032833099365, 0.22957906126976013, 0.2586877942085266, 0.2877965271472931, 0.31690526008605957, 0.34601399302482605, 0.37512272596359253, 0.404231458902359, 0.4333401918411255, 0.46244892477989197, 0.49155765771865845, 0.5206663608551025, 0.5497751235961914, 0.5788838863372803, 0.6079925894737244, 0.6371012926101685, 0.6662100553512573, 0.6953188180923462, 0.7244275212287903, 0.7535362243652344, 0.7826449871063232, 0.8117537498474121, 0.8408624529838562, 0.8699711561203003, 0.8990799188613892]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 1.0, 5.0, 11.0, 6.0, 9.0, 30.0, 37.0, 48.0, 98.0, 162.0, 312.0, 675.0, 1693.0, 5115.0, 23037.0, 282509.0, 3395522.0, 448645.0, 26894.0, 5934.0, 1939.0, 792.0, 337.0, 196.0, 110.0, 43.0, 43.0, 26.0, 20.0, 15.0, 8.0, 1.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9765625, -0.941131591796875, -0.90570068359375, -0.870269775390625, -0.8348388671875, -0.799407958984375, -0.76397705078125, -0.728546142578125, -0.693115234375, -0.657684326171875, -0.62225341796875, -0.586822509765625, -0.5513916015625, -0.515960693359375, -0.48052978515625, -0.445098876953125, -0.40966796875, -0.374237060546875, -0.33880615234375, -0.303375244140625, -0.2679443359375, -0.232513427734375, -0.19708251953125, -0.161651611328125, -0.126220703125, -0.090789794921875, -0.05535888671875, -0.019927978515625, 0.0155029296875, 0.050933837890625, 0.08636474609375, 0.121795654296875, 0.1572265625, 0.192657470703125, 0.22808837890625, 0.263519287109375, 0.2989501953125, 0.334381103515625, 0.36981201171875, 0.405242919921875, 0.440673828125, 0.476104736328125, 0.51153564453125, 0.546966552734375, 0.5823974609375, 0.617828369140625, 0.65325927734375, 0.688690185546875, 0.72412109375, 0.759552001953125, 0.79498291015625, 0.830413818359375, 0.8658447265625, 0.901275634765625, 0.93670654296875, 0.972137451171875, 1.007568359375, 1.042999267578125, 1.07843017578125, 1.113861083984375, 1.1492919921875, 1.184722900390625, 1.22015380859375, 1.255584716796875, 1.291015625]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 5.0, 3.0, 7.0, 6.0, 9.0, 14.0, 18.0, 22.0, 19.0, 33.0, 32.0, 70.0, 39.0, 60.0, 53.0, 74.0, 84.0, 70.0, 77.0, 42.0, 53.0, 39.0, 38.0, 34.0, 25.0, 25.0, 17.0, 13.0, 8.0, 8.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.453369140625, -0.4363441467285156, -0.41931915283203125, -0.4022941589355469, -0.3852691650390625, -0.3682441711425781, -0.35121917724609375, -0.3341941833496094, -0.317169189453125, -0.3001441955566406, -0.28311920166015625, -0.2660942077636719, -0.2490692138671875, -0.23204421997070312, -0.21501922607421875, -0.19799423217773438, -0.18096923828125, -0.16394424438476562, -0.14691925048828125, -0.12989425659179688, -0.1128692626953125, -0.09584426879882812, -0.07881927490234375, -0.061794281005859375, -0.044769287109375, -0.027744293212890625, -0.01071929931640625, 0.006305694580078125, 0.0233306884765625, 0.040355682373046875, 0.05738067626953125, 0.07440567016601562, 0.0914306640625, 0.10845565795898438, 0.12548065185546875, 0.14250564575195312, 0.1595306396484375, 0.17655563354492188, 0.19358062744140625, 0.21060562133789062, 0.227630615234375, 0.24465560913085938, 0.26168060302734375, 0.2787055969238281, 0.2957305908203125, 0.3127555847167969, 0.32978057861328125, 0.3468055725097656, 0.36383056640625, 0.3808555603027344, 0.39788055419921875, 0.4149055480957031, 0.4319305419921875, 0.4489555358886719, 0.46598052978515625, 0.4830055236816406, 0.500030517578125, 0.5170555114746094, 0.5340805053710938, 0.5511054992675781, 0.5681304931640625, 0.5851554870605469, 0.6021804809570312, 0.6192054748535156, 0.63623046875]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 12.0, 13.0, 18.0, 18.0, 20.0, 44.0, 61.0, 127.0, 252.0, 805.0, 3524.0, 39032.0, 3913388.0, 226365.0, 8401.0, 1383.0, 427.0, 166.0, 87.0, 49.0, 26.0, 17.0, 12.0, 9.0, 8.0, 4.0, 7.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8525390625, -1.79412841796875, -1.7357177734375, -1.67730712890625, -1.618896484375, -1.56048583984375, -1.5020751953125, -1.44366455078125, -1.38525390625, -1.32684326171875, -1.2684326171875, -1.21002197265625, -1.151611328125, -1.09320068359375, -1.0347900390625, -0.97637939453125, -0.91796875, -0.85955810546875, -0.8011474609375, -0.74273681640625, -0.684326171875, -0.62591552734375, -0.5675048828125, -0.50909423828125, -0.45068359375, -0.39227294921875, -0.3338623046875, -0.27545166015625, -0.217041015625, -0.15863037109375, -0.1002197265625, -0.04180908203125, 0.0166015625, 0.07501220703125, 0.1334228515625, 0.19183349609375, 0.250244140625, 0.30865478515625, 0.3670654296875, 0.42547607421875, 0.48388671875, 0.54229736328125, 0.6007080078125, 0.65911865234375, 0.717529296875, 0.77593994140625, 0.8343505859375, 0.89276123046875, 0.951171875, 1.00958251953125, 1.0679931640625, 1.12640380859375, 1.184814453125, 1.24322509765625, 1.3016357421875, 1.36004638671875, 1.41845703125, 1.47686767578125, 1.5352783203125, 1.59368896484375, 1.652099609375, 1.71051025390625, 1.7689208984375, 1.82733154296875, 1.8857421875]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 7.0, 8.0, 9.0, 12.0, 14.0, 32.0, 40.0, 55.0, 82.0, 163.0, 226.0, 403.0, 759.0, 813.0, 606.0, 298.0, 163.0, 124.0, 70.0, 36.0, 42.0, 23.0, 24.0, 17.0, 13.0, 4.0, 7.0, 10.0, 4.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.235595703125, -0.2275390625, -0.219482421875, -0.21142578125, -0.203369140625, -0.1953125, -0.187255859375, -0.17919921875, -0.171142578125, -0.1630859375, -0.155029296875, -0.14697265625, -0.138916015625, -0.130859375, -0.122802734375, -0.11474609375, -0.106689453125, -0.0986328125, -0.090576171875, -0.08251953125, -0.074462890625, -0.06640625, -0.058349609375, -0.05029296875, -0.042236328125, -0.0341796875, -0.026123046875, -0.01806640625, -0.010009765625, -0.001953125, 0.006103515625, 0.01416015625, 0.022216796875, 0.0302734375, 0.038330078125, 0.04638671875, 0.054443359375, 0.0625, 0.070556640625, 0.07861328125, 0.086669921875, 0.0947265625, 0.102783203125, 0.11083984375, 0.118896484375, 0.126953125, 0.135009765625, 0.14306640625, 0.151123046875, 0.1591796875, 0.167236328125, 0.17529296875, 0.183349609375, 0.19140625, 0.199462890625, 0.20751953125, 0.215576171875, 0.2236328125, 0.231689453125, 0.23974609375, 0.247802734375, 0.255859375, 0.263916015625, 0.27197265625, 0.280029296875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 8.0, 11.0, 15.0, 28.0, 38.0, 42.0, 61.0, 70.0, 93.0, 106.0, 99.0, 96.0, 71.0, 69.0, 44.0, 43.0, 25.0, 15.0, 13.0, 10.0, 12.0, 8.0, 9.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7021980285644531, -0.6773347854614258, -0.6524714827537537, -0.6276082396507263, -0.6027449369430542, -0.5778816938400269, -0.5530184507369995, -0.5281551480293274, -0.5032918453216553, -0.47842857241630554, -0.4535652995109558, -0.42870205640792847, -0.40383875370025635, -0.378975510597229, -0.3541122376918793, -0.32924896478652954, -0.3043857216835022, -0.27952244877815247, -0.25465917587280273, -0.2297959178686142, -0.20493264496326447, -0.18006937205791473, -0.1552061140537262, -0.13034284114837646, -0.10547956824302673, -0.080616295337677, -0.05575302988290787, -0.030889764428138733, -0.0060264915227890015, 0.01883678138256073, 0.04370003938674927, 0.068563312292099, 0.09342652559280396, 0.11828979849815369, 0.14315307140350342, 0.16801632940769196, 0.1928796023130417, 0.21774287521839142, 0.24260613322257996, 0.2674694061279297, 0.2923326790332794, 0.31719595193862915, 0.3420592248439789, 0.3669224977493286, 0.39178574085235596, 0.4166490435600281, 0.4415122866630554, 0.46637555956840515, 0.4912388324737549, 0.5161020755767822, 0.5409653782844543, 0.5658286213874817, 0.5906919240951538, 0.6155551671981812, 0.6404184103012085, 0.6652817130088806, 0.6901450157165527, 0.7150082588195801, 0.7398715615272522, 0.7647348046302795, 0.7895981073379517, 0.814461350440979, 0.8393245935440063, 0.8641878962516785, 0.8890511393547058]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 5.0, 12.0, 9.0, 15.0, 18.0, 14.0, 17.0, 19.0, 37.0, 21.0, 38.0, 23.0, 29.0, 40.0, 38.0, 56.0, 50.0, 38.0, 57.0, 46.0, 51.0, 49.0, 32.0, 47.0, 36.0, 24.0, 34.0, 30.0, 25.0, 17.0, 17.0, 10.0, 16.0, 10.0, 5.0, 6.0, 7.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.4636613726615906, -0.44915205240249634, -0.4346427321434021, -0.42013341188430786, -0.4056240916252136, -0.3911147713661194, -0.37660548090934753, -0.3620961606502533, -0.34758684039115906, -0.3330775201320648, -0.3185681998729706, -0.30405887961387634, -0.2895495891571045, -0.27504026889801025, -0.260530948638916, -0.24602162837982178, -0.23151230812072754, -0.2170029878616333, -0.20249366760253906, -0.18798436224460602, -0.17347504198551178, -0.15896572172641754, -0.1444564163684845, -0.12994709610939026, -0.11543777585029602, -0.10092845559120178, -0.08641914278268814, -0.0719098299741745, -0.05740050971508026, -0.04289118945598602, -0.02838187664747238, -0.01387256383895874, 0.0006367862224578857, 0.015146102756261826, 0.029655419290065765, 0.044164735823869705, 0.058674052357673645, 0.07318337261676788, 0.08769268542528152, 0.10220199823379517, 0.1167113184928894, 0.13122063875198364, 0.14572995901107788, 0.16023926436901093, 0.17474858462810516, 0.1892579048871994, 0.20376721024513245, 0.21827653050422668, 0.23278585076332092, 0.24729517102241516, 0.2618044912815094, 0.27631381154060364, 0.2908231019973755, 0.3053324222564697, 0.31984174251556396, 0.3343510627746582, 0.34886038303375244, 0.3633697032928467, 0.3778790235519409, 0.39238834381103516, 0.4068976640701294, 0.42140698432922363, 0.4359162747859955, 0.4504255950450897, 0.46493491530418396]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 8.0, 1.0, 2.0, 3.0, 7.0, 11.0, 13.0, 12.0, 17.0, 23.0, 47.0, 81.0, 127.0, 269.0, 505.0, 1013.0, 2067.0, 4761.0, 11396.0, 31371.0, 162695.0, 670164.0, 119628.0, 26590.0, 9917.0, 4123.0, 1808.0, 901.0, 431.0, 229.0, 129.0, 70.0, 29.0, 34.0, 15.0, 13.0, 7.0, 12.0, 7.0, 3.0, 6.0, 3.0, 7.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0], "bins": [-0.30810546875, -0.29915618896484375, -0.2902069091796875, -0.28125762939453125, -0.272308349609375, -0.26335906982421875, -0.2544097900390625, -0.24546051025390625, -0.23651123046875, -0.22756195068359375, -0.2186126708984375, -0.20966339111328125, -0.200714111328125, -0.19176483154296875, -0.1828155517578125, -0.17386627197265625, -0.1649169921875, -0.15596771240234375, -0.1470184326171875, -0.13806915283203125, -0.129119873046875, -0.12017059326171875, -0.1112213134765625, -0.10227203369140625, -0.09332275390625, -0.08437347412109375, -0.0754241943359375, -0.06647491455078125, -0.057525634765625, -0.04857635498046875, -0.0396270751953125, -0.03067779541015625, -0.021728515625, -0.01277923583984375, -0.0038299560546875, 0.00511932373046875, 0.014068603515625, 0.02301788330078125, 0.0319671630859375, 0.04091644287109375, 0.04986572265625, 0.05881500244140625, 0.0677642822265625, 0.07671356201171875, 0.085662841796875, 0.09461212158203125, 0.1035614013671875, 0.11251068115234375, 0.1214599609375, 0.13040924072265625, 0.1393585205078125, 0.14830780029296875, 0.157257080078125, 0.16620635986328125, 0.1751556396484375, 0.18410491943359375, 0.19305419921875, 0.20200347900390625, 0.2109527587890625, 0.21990203857421875, 0.228851318359375, 0.23780059814453125, 0.2467498779296875, 0.25569915771484375, 0.2646484375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 3.0, 14.0, 7.0, 19.0, 16.0, 15.0, 36.0, 33.0, 33.0, 37.0, 40.0, 59.0, 49.0, 69.0, 66.0, 66.0, 59.0, 61.0, 59.0, 40.0, 46.0, 37.0, 39.0, 27.0, 23.0, 10.0, 11.0, 11.0, 8.0, 6.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.368896484375, -0.3577537536621094, -0.34661102294921875, -0.3354682922363281, -0.3243255615234375, -0.3131828308105469, -0.30204010009765625, -0.2908973693847656, -0.279754638671875, -0.2686119079589844, -0.25746917724609375, -0.24632644653320312, -0.2351837158203125, -0.22404098510742188, -0.21289825439453125, -0.20175552368164062, -0.19061279296875, -0.17947006225585938, -0.16832733154296875, -0.15718460083007812, -0.1460418701171875, -0.13489913940429688, -0.12375640869140625, -0.11261367797851562, -0.101470947265625, -0.09032821655273438, -0.07918548583984375, -0.06804275512695312, -0.0569000244140625, -0.045757293701171875, -0.03461456298828125, -0.023471832275390625, -0.0123291015625, -0.001186370849609375, 0.00995635986328125, 0.021099090576171875, 0.0322418212890625, 0.043384552001953125, 0.05452728271484375, 0.06567001342773438, 0.076812744140625, 0.08795547485351562, 0.09909820556640625, 0.11024093627929688, 0.1213836669921875, 0.13252639770507812, 0.14366912841796875, 0.15481185913085938, 0.16595458984375, 0.17709732055664062, 0.18824005126953125, 0.19938278198242188, 0.2105255126953125, 0.22166824340820312, 0.23281097412109375, 0.24395370483398438, 0.255096435546875, 0.2662391662597656, 0.27738189697265625, 0.2885246276855469, 0.2996673583984375, 0.3108100891113281, 0.32195281982421875, 0.3330955505371094, 0.34423828125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 7.0, 9.0, 8.0, 12.0, 18.0, 12.0, 35.0, 56.0, 68.0, 85.0, 151.0, 248.0, 367.0, 592.0, 1033.0, 1991.0, 3567.0, 7106.0, 15071.0, 34547.0, 96643.0, 310295.0, 373612.0, 124822.0, 42724.0, 17895.0, 8261.0, 4129.0, 2102.0, 1219.0, 677.0, 399.0, 291.0, 151.0, 109.0, 78.0, 52.0, 37.0, 27.0, 15.0, 14.0, 12.0, 6.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.135986328125, -0.1323223114013672, -0.12865829467773438, -0.12499427795410156, -0.12133026123046875, -0.11766624450683594, -0.11400222778320312, -0.11033821105957031, -0.1066741943359375, -0.10301017761230469, -0.09934616088867188, -0.09568214416503906, -0.09201812744140625, -0.08835411071777344, -0.08469009399414062, -0.08102607727050781, -0.077362060546875, -0.07369804382324219, -0.07003402709960938, -0.06637001037597656, -0.06270599365234375, -0.05904197692871094, -0.055377960205078125, -0.05171394348144531, -0.0480499267578125, -0.04438591003417969, -0.040721893310546875, -0.03705787658691406, -0.03339385986328125, -0.029729843139648438, -0.026065826416015625, -0.022401809692382812, -0.01873779296875, -0.015073776245117188, -0.011409759521484375, -0.0077457427978515625, -0.00408172607421875, -0.0004177093505859375, 0.003246307373046875, 0.0069103240966796875, 0.0105743408203125, 0.014238357543945312, 0.017902374267578125, 0.021566390991210938, 0.02523040771484375, 0.028894424438476562, 0.032558441162109375, 0.03622245788574219, 0.039886474609375, 0.04355049133300781, 0.047214508056640625, 0.05087852478027344, 0.05454254150390625, 0.05820655822753906, 0.061870574951171875, 0.06553459167480469, 0.0691986083984375, 0.07286262512207031, 0.07652664184570312, 0.08019065856933594, 0.08385467529296875, 0.08751869201660156, 0.09118270874023438, 0.09484672546386719, 0.0985107421875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0, 13.0, 7.0, 8.0, 9.0, 14.0, 17.0, 16.0, 26.0, 23.0, 24.0, 30.0, 24.0, 20.0, 40.0, 34.0, 39.0, 45.0, 41.0, 33.0, 42.0, 50.0, 67.0, 34.0, 41.0, 36.0, 37.0, 35.0, 23.0, 31.0, 18.0, 26.0, 24.0, 12.0, 10.0, 9.0, 13.0, 5.0, 5.0, 8.0, 4.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.52294921875, -0.50732421875, -0.49169921875, -0.47607421875, -0.46044921875, -0.44482421875, -0.42919921875, -0.41357421875, -0.39794921875, -0.38232421875, -0.36669921875, -0.35107421875, -0.33544921875, -0.31982421875, -0.30419921875, -0.28857421875, -0.27294921875, -0.25732421875, -0.24169921875, -0.22607421875, -0.21044921875, -0.19482421875, -0.17919921875, -0.16357421875, -0.14794921875, -0.13232421875, -0.11669921875, -0.10107421875, -0.08544921875, -0.06982421875, -0.05419921875, -0.03857421875, -0.02294921875, -0.00732421875, 0.00830078125, 0.02392578125, 0.03955078125, 0.05517578125, 0.07080078125, 0.08642578125, 0.10205078125, 0.11767578125, 0.13330078125, 0.14892578125, 0.16455078125, 0.18017578125, 0.19580078125, 0.21142578125, 0.22705078125, 0.24267578125, 0.25830078125, 0.27392578125, 0.28955078125, 0.30517578125, 0.32080078125, 0.33642578125, 0.35205078125, 0.36767578125, 0.38330078125, 0.39892578125, 0.41455078125, 0.43017578125, 0.44580078125, 0.46142578125, 0.47705078125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 6.0, 3.0, 3.0, 7.0, 7.0, 16.0, 21.0, 29.0, 53.0, 89.0, 121.0, 210.0, 327.0, 618.0, 1163.0, 2157.0, 4606.0, 10656.0, 27263.0, 83628.0, 306648.0, 417874.0, 128443.0, 38732.0, 13961.0, 6059.0, 2718.0, 1364.0, 733.0, 400.0, 239.0, 142.0, 93.0, 62.0, 34.0, 28.0, 14.0, 8.0, 6.0, 10.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.035186767578125, -0.03409290313720703, -0.03299903869628906, -0.031905174255371094, -0.030811309814453125, -0.029717445373535156, -0.028623580932617188, -0.02752971649169922, -0.02643585205078125, -0.02534198760986328, -0.024248123168945312, -0.023154258728027344, -0.022060394287109375, -0.020966529846191406, -0.019872665405273438, -0.01877880096435547, -0.0176849365234375, -0.01659107208251953, -0.015497207641601562, -0.014403343200683594, -0.013309478759765625, -0.012215614318847656, -0.011121749877929688, -0.010027885437011719, -0.00893402099609375, -0.007840156555175781, -0.0067462921142578125, -0.005652427673339844, -0.004558563232421875, -0.0034646987915039062, -0.0023708343505859375, -0.0012769699096679688, -0.00018310546875, 0.0009107589721679688, 0.0020046234130859375, 0.0030984878540039062, 0.004192352294921875, 0.005286216735839844, 0.0063800811767578125, 0.007473945617675781, 0.00856781005859375, 0.009661674499511719, 0.010755538940429688, 0.011849403381347656, 0.012943267822265625, 0.014037132263183594, 0.015130996704101562, 0.01622486114501953, 0.0173187255859375, 0.01841259002685547, 0.019506454467773438, 0.020600318908691406, 0.021694183349609375, 0.022788047790527344, 0.023881912231445312, 0.02497577667236328, 0.02606964111328125, 0.02716350555419922, 0.028257369995117188, 0.029351234436035156, 0.030445098876953125, 0.031538963317871094, 0.03263282775878906, 0.03372669219970703, 0.034820556640625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 0.0, 4.0, 3.0, 3.0, 6.0, 7.0, 4.0, 5.0, 11.0, 11.0, 20.0, 16.0, 30.0, 32.0, 43.0, 51.0, 55.0, 63.0, 93.0, 76.0, 84.0, 72.0, 72.0, 37.0, 47.0, 31.0, 26.0, 29.0, 12.0, 13.0, 11.0, 6.0, 7.0, 7.0, 3.0, 6.0, 3.0, 6.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.6702880859375e-05, -2.595502883195877e-05, -2.520717680454254e-05, -2.4459324777126312e-05, -2.3711472749710083e-05, -2.2963620722293854e-05, -2.2215768694877625e-05, -2.1467916667461395e-05, -2.0720064640045166e-05, -1.9972212612628937e-05, -1.9224360585212708e-05, -1.8476508557796478e-05, -1.772865653038025e-05, -1.698080450296402e-05, -1.623295247554779e-05, -1.548510044813156e-05, -1.4737248420715332e-05, -1.3989396393299103e-05, -1.3241544365882874e-05, -1.2493692338466644e-05, -1.1745840311050415e-05, -1.0997988283634186e-05, -1.0250136256217957e-05, -9.502284228801727e-06, -8.754432201385498e-06, -8.006580173969269e-06, -7.2587281465530396e-06, -6.51087611913681e-06, -5.763024091720581e-06, -5.015172064304352e-06, -4.2673200368881226e-06, -3.5194680094718933e-06, -2.771615982055664e-06, -2.023763954639435e-06, -1.2759119272232056e-06, -5.280598998069763e-07, 2.1979212760925293e-07, 9.676441550254822e-07, 1.7154961824417114e-06, 2.4633482098579407e-06, 3.21120023727417e-06, 3.959052264690399e-06, 4.706904292106628e-06, 5.454756319522858e-06, 6.202608346939087e-06, 6.950460374355316e-06, 7.698312401771545e-06, 8.446164429187775e-06, 9.194016456604004e-06, 9.941868484020233e-06, 1.0689720511436462e-05, 1.1437572538852692e-05, 1.2185424566268921e-05, 1.293327659368515e-05, 1.368112862110138e-05, 1.4428980648517609e-05, 1.5176832675933838e-05, 1.5924684703350067e-05, 1.6672536730766296e-05, 1.7420388758182526e-05, 1.8168240785598755e-05, 1.8916092813014984e-05, 1.9663944840431213e-05, 2.0411796867847443e-05, 2.1159648895263672e-05]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 5.0, 7.0, 8.0, 7.0, 19.0, 22.0, 50.0, 77.0, 128.0, 226.0, 413.0, 715.0, 1425.0, 3098.0, 7231.0, 19488.0, 65466.0, 298628.0, 479200.0, 121680.0, 31588.0, 10561.0, 4399.0, 1980.0, 921.0, 555.0, 283.0, 128.0, 76.0, 60.0, 36.0, 18.0, 18.0, 8.0, 9.0, 4.0, 6.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04656982421875, -0.045124053955078125, -0.04367828369140625, -0.042232513427734375, -0.0407867431640625, -0.039340972900390625, -0.03789520263671875, -0.036449432373046875, -0.035003662109375, -0.033557891845703125, -0.03211212158203125, -0.030666351318359375, -0.0292205810546875, -0.027774810791015625, -0.02632904052734375, -0.024883270263671875, -0.0234375, -0.021991729736328125, -0.02054595947265625, -0.019100189208984375, -0.0176544189453125, -0.016208648681640625, -0.01476287841796875, -0.013317108154296875, -0.011871337890625, -0.010425567626953125, -0.00897979736328125, -0.007534027099609375, -0.0060882568359375, -0.004642486572265625, -0.00319671630859375, -0.001750946044921875, -0.00030517578125, 0.001140594482421875, 0.00258636474609375, 0.004032135009765625, 0.0054779052734375, 0.006923675537109375, 0.00836944580078125, 0.009815216064453125, 0.011260986328125, 0.012706756591796875, 0.01415252685546875, 0.015598297119140625, 0.0170440673828125, 0.018489837646484375, 0.01993560791015625, 0.021381378173828125, 0.0228271484375, 0.024272918701171875, 0.02571868896484375, 0.027164459228515625, 0.0286102294921875, 0.030055999755859375, 0.03150177001953125, 0.032947540283203125, 0.034393310546875, 0.035839080810546875, 0.03728485107421875, 0.038730621337890625, 0.0401763916015625, 0.041622161865234375, 0.04306793212890625, 0.044513702392578125, 0.04595947265625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 1.0, 4.0, 7.0, 10.0, 9.0, 10.0, 10.0, 15.0, 24.0, 29.0, 31.0, 49.0, 80.0, 75.0, 79.0, 69.0, 85.0, 82.0, 65.0, 65.0, 51.0, 29.0, 30.0, 26.0, 15.0, 8.0, 14.0, 8.0, 7.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.01165008544921875, -0.01130533218383789, -0.010960578918457031, -0.010615825653076172, -0.010271072387695312, -0.009926319122314453, -0.009581565856933594, -0.009236812591552734, -0.008892059326171875, -0.008547306060791016, -0.008202552795410156, -0.007857799530029297, -0.0075130462646484375, -0.007168292999267578, -0.006823539733886719, -0.006478786468505859, -0.006134033203125, -0.005789279937744141, -0.005444526672363281, -0.005099773406982422, -0.0047550201416015625, -0.004410266876220703, -0.004065513610839844, -0.0037207603454589844, -0.003376007080078125, -0.0030312538146972656, -0.0026865005493164062, -0.002341747283935547, -0.0019969940185546875, -0.0016522407531738281, -0.0013074874877929688, -0.0009627342224121094, -0.00061798095703125, -0.0002732276916503906, 7.152557373046875e-05, 0.0004162788391113281, 0.0007610321044921875, 0.0011057853698730469, 0.0014505386352539062, 0.0017952919006347656, 0.002140045166015625, 0.0024847984313964844, 0.0028295516967773438, 0.003174304962158203, 0.0035190582275390625, 0.003863811492919922, 0.004208564758300781, 0.004553318023681641, 0.0048980712890625, 0.005242824554443359, 0.005587577819824219, 0.005932331085205078, 0.0062770843505859375, 0.006621837615966797, 0.006966590881347656, 0.007311344146728516, 0.007656097412109375, 0.008000850677490234, 0.008345603942871094, 0.008690357208251953, 0.009035110473632812, 0.009379863739013672, 0.009724617004394531, 0.01006937026977539, 0.01041412353515625]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 4.0, 3.0, 2.0, 4.0, 5.0, 15.0, 25.0, 35.0, 50.0, 89.0, 107.0, 155.0, 142.0, 133.0, 83.0, 54.0, 34.0, 18.0, 21.0, 10.0, 9.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47072476148605347, -0.451171338558197, -0.43161794543266296, -0.4120645225048065, -0.39251112937927246, -0.372957706451416, -0.35340428352355957, -0.3338508605957031, -0.31429746747016907, -0.2947440445423126, -0.27519065141677856, -0.2556372284889221, -0.23608382046222687, -0.21653041243553162, -0.19697698950767517, -0.17742358148097992, -0.15787017345428467, -0.13831676542758942, -0.11876334995031357, -0.09920993447303772, -0.07965652644634247, -0.06010311841964722, -0.04054970294237137, -0.02099628746509552, -0.0014428794384002686, 0.01811053231358528, 0.03766394406557083, 0.05721735581755638, 0.07677076756954193, 0.09632417559623718, 0.11587759107351303, 0.13543100655078888, 0.15498441457748413, 0.17453782260417938, 0.19409123063087463, 0.21364465355873108, 0.23319806158542633, 0.2527514696121216, 0.272304892539978, 0.2918583154678345, 0.31141170859336853, 0.330965131521225, 0.35051852464675903, 0.3700719475746155, 0.3896253705024719, 0.409178763628006, 0.4287321865558624, 0.4482855796813965, 0.46783900260925293, 0.4873924255371094, 0.5069458484649658, 0.5264992117881775, 0.5460526347160339, 0.5656060576438904, 0.5851594805717468, 0.6047129034996033, 0.6242662668228149, 0.6438196897506714, 0.6633731126785278, 0.6829264760017395, 0.702479898929596, 0.7220333218574524, 0.7415867447853088, 0.7611401677131653, 0.7806935906410217]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 7.0, 5.0, 1.0, 8.0, 15.0, 15.0, 14.0, 12.0, 22.0, 28.0, 44.0, 33.0, 34.0, 39.0, 44.0, 56.0, 59.0, 60.0, 53.0, 68.0, 58.0, 55.0, 43.0, 43.0, 36.0, 31.0, 21.0, 26.0, 25.0, 18.0, 11.0, 8.0, 8.0, 7.0, 4.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.3167051374912262, -0.30682605504989624, -0.2969469428062439, -0.28706786036491394, -0.2771887481212616, -0.26730966567993164, -0.2574305534362793, -0.24755147099494934, -0.2376723736524582, -0.22779327630996704, -0.2179141789674759, -0.20803508162498474, -0.19815599918365479, -0.18827688694000244, -0.17839780449867249, -0.16851870715618134, -0.15863960981369019, -0.14876051247119904, -0.13888141512870789, -0.12900231778621674, -0.11912322789430618, -0.10924413055181503, -0.09936504065990448, -0.08948594331741333, -0.07960684597492218, -0.06972774863243103, -0.05984865501523018, -0.04996956139802933, -0.04009046405553818, -0.030211366713047028, -0.020332273095846176, -0.010453179478645325, -0.0005740523338317871, 0.009305043146014214, 0.019184138625860214, 0.029063234105706215, 0.038942329585552216, 0.048821426928043365, 0.05870052054524422, 0.06857961416244507, 0.07845871150493622, 0.08833780884742737, 0.09821690618991852, 0.10809599608182907, 0.11797509342432022, 0.12785419821739197, 0.13773328065872192, 0.14761237800121307, 0.15749147534370422, 0.16737057268619537, 0.17724967002868652, 0.18712876737117767, 0.19700786471366882, 0.20688694715499878, 0.21676604449748993, 0.22664514183998108, 0.23652423918247223, 0.24640333652496338, 0.25628241896629333, 0.2661615312099457, 0.27604061365127563, 0.285919725894928, 0.29579880833625793, 0.3056778907775879, 0.31555700302124023]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 5.0, 7.0, 7.0, 13.0, 16.0, 29.0, 44.0, 64.0, 153.0, 303.0, 589.0, 1120.0, 2428.0, 5775.0, 15069.0, 50161.0, 292596.0, 553929.0, 89504.0, 22276.0, 8082.0, 3431.0, 1477.0, 748.0, 313.0, 185.0, 111.0, 47.0, 29.0, 15.0, 5.0, 6.0, 6.0, 7.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59423828125, -0.5763320922851562, -0.5584259033203125, -0.5405197143554688, -0.522613525390625, -0.5047073364257812, -0.4868011474609375, -0.46889495849609375, -0.45098876953125, -0.43308258056640625, -0.4151763916015625, -0.39727020263671875, -0.379364013671875, -0.36145782470703125, -0.3435516357421875, -0.32564544677734375, -0.3077392578125, -0.28983306884765625, -0.2719268798828125, -0.25402069091796875, -0.236114501953125, -0.21820831298828125, -0.2003021240234375, -0.18239593505859375, -0.16448974609375, -0.14658355712890625, -0.1286773681640625, -0.11077117919921875, -0.092864990234375, -0.07495880126953125, -0.0570526123046875, -0.03914642333984375, -0.021240234375, -0.00333404541015625, 0.0145721435546875, 0.03247833251953125, 0.050384521484375, 0.06829071044921875, 0.0861968994140625, 0.10410308837890625, 0.12200927734375, 0.13991546630859375, 0.1578216552734375, 0.17572784423828125, 0.193634033203125, 0.21154022216796875, 0.2294464111328125, 0.24735260009765625, 0.2652587890625, 0.28316497802734375, 0.3010711669921875, 0.31897735595703125, 0.336883544921875, 0.35478973388671875, 0.3726959228515625, 0.39060211181640625, 0.40850830078125, 0.42641448974609375, 0.4443206787109375, 0.46222686767578125, 0.480133056640625, 0.49803924560546875, 0.5159454345703125, 0.5338516235351562, 0.5517578125]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 3.0, 6.0, 10.0, 9.0, 10.0, 13.0, 18.0, 29.0, 20.0, 34.0, 24.0, 40.0, 40.0, 35.0, 54.0, 57.0, 46.0, 54.0, 52.0, 62.0, 58.0, 63.0, 40.0, 45.0, 33.0, 34.0, 20.0, 16.0, 26.0, 11.0, 11.0, 8.0, 5.0, 4.0, 7.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.434326171875, -0.4165840148925781, -0.39884185791015625, -0.3810997009277344, -0.3633575439453125, -0.3456153869628906, -0.32787322998046875, -0.3101310729980469, -0.292388916015625, -0.2746467590332031, -0.25690460205078125, -0.23916244506835938, -0.2214202880859375, -0.20367813110351562, -0.18593597412109375, -0.16819381713867188, -0.15045166015625, -0.13270950317382812, -0.11496734619140625, -0.09722518920898438, -0.0794830322265625, -0.061740875244140625, -0.04399871826171875, -0.026256561279296875, -0.008514404296875, 0.009227752685546875, 0.02696990966796875, 0.044712066650390625, 0.0624542236328125, 0.08019638061523438, 0.09793853759765625, 0.11568069458007812, 0.1334228515625, 0.15116500854492188, 0.16890716552734375, 0.18664932250976562, 0.2043914794921875, 0.22213363647460938, 0.23987579345703125, 0.2576179504394531, 0.275360107421875, 0.2931022644042969, 0.31084442138671875, 0.3285865783691406, 0.3463287353515625, 0.3640708923339844, 0.38181304931640625, 0.3995552062988281, 0.41729736328125, 0.4350395202636719, 0.45278167724609375, 0.4705238342285156, 0.4882659912109375, 0.5060081481933594, 0.5237503051757812, 0.5414924621582031, 0.559234619140625, 0.5769767761230469, 0.5947189331054688, 0.6124610900878906, 0.6302032470703125, 0.6479454040527344, 0.6656875610351562, 0.6834297180175781, 0.701171875]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 2.0, 6.0, 2.0, 7.0, 3.0, 4.0, 11.0, 8.0, 12.0, 7.0, 16.0, 16.0, 22.0, 25.0, 25.0, 34.0, 28.0, 50.0, 81.0, 160.0, 286.0, 796.0, 5247.0, 113610.0, 903148.0, 21905.0, 1961.0, 438.0, 172.0, 102.0, 67.0, 55.0, 50.0, 35.0, 21.0, 23.0, 17.0, 22.0, 12.0, 17.0, 17.0, 10.0, 5.0, 6.0, 6.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.41015625, -1.3650665283203125, -1.319976806640625, -1.2748870849609375, -1.22979736328125, -1.1847076416015625, -1.139617919921875, -1.0945281982421875, -1.0494384765625, -1.0043487548828125, -0.959259033203125, -0.9141693115234375, -0.86907958984375, -0.8239898681640625, -0.778900146484375, -0.7338104248046875, -0.688720703125, -0.6436309814453125, -0.598541259765625, -0.5534515380859375, -0.50836181640625, -0.4632720947265625, -0.418182373046875, -0.3730926513671875, -0.3280029296875, -0.2829132080078125, -0.237823486328125, -0.1927337646484375, -0.14764404296875, -0.1025543212890625, -0.057464599609375, -0.0123748779296875, 0.03271484375, 0.0778045654296875, 0.122894287109375, 0.1679840087890625, 0.21307373046875, 0.2581634521484375, 0.303253173828125, 0.3483428955078125, 0.3934326171875, 0.4385223388671875, 0.483612060546875, 0.5287017822265625, 0.57379150390625, 0.6188812255859375, 0.663970947265625, 0.7090606689453125, 0.754150390625, 0.7992401123046875, 0.844329833984375, 0.8894195556640625, 0.93450927734375, 0.9795989990234375, 1.024688720703125, 1.0697784423828125, 1.1148681640625, 1.1599578857421875, 1.205047607421875, 1.2501373291015625, 1.29522705078125, 1.3403167724609375, 1.385406494140625, 1.4304962158203125, 1.4755859375]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 4.0, 0.0, 2.0, 4.0, 1.0, 3.0, 5.0, 7.0, 4.0, 9.0, 6.0, 13.0, 13.0, 9.0, 12.0, 20.0, 18.0, 21.0, 25.0, 22.0, 29.0, 28.0, 22.0, 41.0, 42.0, 38.0, 36.0, 43.0, 34.0, 28.0, 40.0, 52.0, 37.0, 35.0, 41.0, 31.0, 38.0, 24.0, 21.0, 21.0, 17.0, 21.0, 23.0, 12.0, 11.0, 8.0, 8.0, 7.0, 4.0, 7.0, 10.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.474609375, -0.4599800109863281, -0.44535064697265625, -0.4307212829589844, -0.4160919189453125, -0.4014625549316406, -0.38683319091796875, -0.3722038269042969, -0.357574462890625, -0.3429450988769531, -0.32831573486328125, -0.3136863708496094, -0.2990570068359375, -0.2844276428222656, -0.26979827880859375, -0.2551689147949219, -0.24053955078125, -0.22591018676757812, -0.21128082275390625, -0.19665145874023438, -0.1820220947265625, -0.16739273071289062, -0.15276336669921875, -0.13813400268554688, -0.123504638671875, -0.10887527465820312, -0.09424591064453125, -0.07961654663085938, -0.0649871826171875, -0.050357818603515625, -0.03572845458984375, -0.021099090576171875, -0.0064697265625, 0.008159637451171875, 0.02278900146484375, 0.037418365478515625, 0.0520477294921875, 0.06667709350585938, 0.08130645751953125, 0.09593582153320312, 0.110565185546875, 0.12519454956054688, 0.13982391357421875, 0.15445327758789062, 0.1690826416015625, 0.18371200561523438, 0.19834136962890625, 0.21297073364257812, 0.22760009765625, 0.24222946166992188, 0.25685882568359375, 0.2714881896972656, 0.2861175537109375, 0.3007469177246094, 0.31537628173828125, 0.3300056457519531, 0.344635009765625, 0.3592643737792969, 0.37389373779296875, 0.3885231018066406, 0.4031524658203125, 0.4177818298339844, 0.43241119384765625, 0.4470405578613281, 0.461669921875]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 5.0, 3.0, 9.0, 12.0, 19.0, 23.0, 41.0, 76.0, 127.0, 240.0, 468.0, 1194.0, 3635.0, 16828.0, 145155.0, 772177.0, 91491.0, 12305.0, 2811.0, 988.0, 416.0, 215.0, 103.0, 67.0, 49.0, 26.0, 14.0, 10.0, 16.0, 10.0, 3.0, 3.0, 3.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.25048828125, -0.2436084747314453, -0.23672866821289062, -0.22984886169433594, -0.22296905517578125, -0.21608924865722656, -0.20920944213867188, -0.2023296356201172, -0.1954498291015625, -0.1885700225830078, -0.18169021606445312, -0.17481040954589844, -0.16793060302734375, -0.16105079650878906, -0.15417098999023438, -0.1472911834716797, -0.140411376953125, -0.1335315704345703, -0.12665176391601562, -0.11977195739746094, -0.11289215087890625, -0.10601234436035156, -0.09913253784179688, -0.09225273132324219, -0.0853729248046875, -0.07849311828613281, -0.07161331176757812, -0.06473350524902344, -0.05785369873046875, -0.05097389221191406, -0.044094085693359375, -0.03721427917480469, -0.03033447265625, -0.023454666137695312, -0.016574859619140625, -0.009695053100585938, -0.00281524658203125, 0.0040645599365234375, 0.010944366455078125, 0.017824172973632812, 0.0247039794921875, 0.03158378601074219, 0.038463592529296875, 0.04534339904785156, 0.05222320556640625, 0.05910301208496094, 0.06598281860351562, 0.07286262512207031, 0.079742431640625, 0.08662223815917969, 0.09350204467773438, 0.10038185119628906, 0.10726165771484375, 0.11414146423339844, 0.12102127075195312, 0.1279010772705078, 0.1347808837890625, 0.1416606903076172, 0.14854049682617188, 0.15542030334472656, 0.16230010986328125, 0.16917991638183594, 0.17605972290039062, 0.1829395294189453, 0.1898193359375]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 3.0, 5.0, 2.0, 5.0, 2.0, 8.0, 10.0, 15.0, 22.0, 17.0, 25.0, 36.0, 46.0, 71.0, 95.0, 147.0, 139.0, 94.0, 73.0, 47.0, 53.0, 20.0, 17.0, 13.0, 13.0, 7.0, 6.0, 5.0, 2.0, 6.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9802322387695312e-05, -2.8806738555431366e-05, -2.781115472316742e-05, -2.6815570890903473e-05, -2.5819987058639526e-05, -2.482440322637558e-05, -2.3828819394111633e-05, -2.2833235561847687e-05, -2.183765172958374e-05, -2.0842067897319794e-05, -1.9846484065055847e-05, -1.88509002327919e-05, -1.7855316400527954e-05, -1.6859732568264008e-05, -1.586414873600006e-05, -1.4868564903736115e-05, -1.3872981071472168e-05, -1.2877397239208221e-05, -1.1881813406944275e-05, -1.0886229574680328e-05, -9.890645742416382e-06, -8.895061910152435e-06, -7.899478077888489e-06, -6.903894245624542e-06, -5.908310413360596e-06, -4.912726581096649e-06, -3.917142748832703e-06, -2.921558916568756e-06, -1.9259750843048096e-06, -9.30391252040863e-07, 6.51925802230835e-08, 1.06077641248703e-06, 2.0563602447509766e-06, 3.051944077014923e-06, 4.04752790927887e-06, 5.043111741542816e-06, 6.038695573806763e-06, 7.034279406070709e-06, 8.029863238334656e-06, 9.025447070598602e-06, 1.0021030902862549e-05, 1.1016614735126495e-05, 1.2012198567390442e-05, 1.3007782399654388e-05, 1.4003366231918335e-05, 1.4998950064182281e-05, 1.5994533896446228e-05, 1.6990117728710175e-05, 1.798570156097412e-05, 1.8981285393238068e-05, 1.9976869225502014e-05, 2.097245305776596e-05, 2.1968036890029907e-05, 2.2963620722293854e-05, 2.39592045545578e-05, 2.4954788386821747e-05, 2.5950372219085693e-05, 2.694595605134964e-05, 2.7941539883613586e-05, 2.8937123715877533e-05, 2.993270754814148e-05, 3.0928291380405426e-05, 3.192387521266937e-05, 3.291945904493332e-05, 3.3915042877197266e-05]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 8.0, 9.0, 18.0, 20.0, 31.0, 65.0, 120.0, 228.0, 480.0, 1172.0, 3874.0, 20944.0, 248157.0, 709534.0, 53431.0, 7336.0, 1801.0, 641.0, 282.0, 156.0, 67.0, 64.0, 34.0, 27.0, 16.0, 10.0, 8.0, 10.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.3037109375, -0.2961578369140625, -0.288604736328125, -0.2810516357421875, -0.27349853515625, -0.2659454345703125, -0.258392333984375, -0.2508392333984375, -0.2432861328125, -0.2357330322265625, -0.228179931640625, -0.2206268310546875, -0.21307373046875, -0.2055206298828125, -0.197967529296875, -0.1904144287109375, -0.182861328125, -0.1753082275390625, -0.167755126953125, -0.1602020263671875, -0.15264892578125, -0.1450958251953125, -0.137542724609375, -0.1299896240234375, -0.1224365234375, -0.1148834228515625, -0.107330322265625, -0.0997772216796875, -0.09222412109375, -0.0846710205078125, -0.077117919921875, -0.0695648193359375, -0.06201171875, -0.0544586181640625, -0.046905517578125, -0.0393524169921875, -0.03179931640625, -0.0242462158203125, -0.016693115234375, -0.0091400146484375, -0.0015869140625, 0.0059661865234375, 0.013519287109375, 0.0210723876953125, 0.02862548828125, 0.0361785888671875, 0.043731689453125, 0.0512847900390625, 0.058837890625, 0.0663909912109375, 0.073944091796875, 0.0814971923828125, 0.08905029296875, 0.0966033935546875, 0.104156494140625, 0.1117095947265625, 0.1192626953125, 0.1268157958984375, 0.134368896484375, 0.1419219970703125, 0.14947509765625, 0.1570281982421875, 0.164581298828125, 0.1721343994140625, 0.1796875]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 5.0, 8.0, 5.0, 6.0, 13.0, 12.0, 21.0, 18.0, 37.0, 44.0, 41.0, 61.0, 87.0, 96.0, 108.0, 85.0, 63.0, 61.0, 56.0, 49.0, 37.0, 20.0, 19.0, 15.0, 8.0, 9.0, 6.0, 5.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.05999755859375, -0.05782318115234375, -0.0556488037109375, -0.05347442626953125, -0.051300048828125, -0.04912567138671875, -0.0469512939453125, -0.04477691650390625, -0.0426025390625, -0.04042816162109375, -0.0382537841796875, -0.03607940673828125, -0.033905029296875, -0.03173065185546875, -0.0295562744140625, -0.02738189697265625, -0.02520751953125, -0.02303314208984375, -0.0208587646484375, -0.01868438720703125, -0.016510009765625, -0.01433563232421875, -0.0121612548828125, -0.00998687744140625, -0.0078125, -0.00563812255859375, -0.0034637451171875, -0.00128936767578125, 0.000885009765625, 0.00305938720703125, 0.0052337646484375, 0.00740814208984375, 0.00958251953125, 0.01175689697265625, 0.0139312744140625, 0.01610565185546875, 0.018280029296875, 0.02045440673828125, 0.0226287841796875, 0.02480316162109375, 0.0269775390625, 0.02915191650390625, 0.0313262939453125, 0.03350067138671875, 0.035675048828125, 0.03784942626953125, 0.0400238037109375, 0.04219818115234375, 0.04437255859375, 0.04654693603515625, 0.0487213134765625, 0.05089569091796875, 0.053070068359375, 0.05524444580078125, 0.0574188232421875, 0.05959320068359375, 0.061767578125, 0.06394195556640625, 0.0661163330078125, 0.06829071044921875, 0.070465087890625, 0.07263946533203125, 0.0748138427734375, 0.07698822021484375, 0.07916259765625]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 62.0, 648.0, 275.0, 26.0, 3.0], "bins": [-15.009307861328125, -14.762321472167969, -14.515335083007812, -14.26834774017334, -14.021361351013184, -13.774374961853027, -13.527387619018555, -13.280401229858398, -13.033414840698242, -12.786428451538086, -12.53944206237793, -12.292454719543457, -12.0454683303833, -11.798481941223145, -11.551494598388672, -11.304508209228516, -11.05752182006836, -10.810535430908203, -10.563549041748047, -10.316561698913574, -10.069575309753418, -9.822588920593262, -9.575601577758789, -9.328615188598633, -9.081628799438477, -8.83464241027832, -8.587656021118164, -8.340668678283691, -8.093682289123535, -7.846695899963379, -7.5997090339660645, -7.35272216796875, -7.1057353019714355, -6.858748435974121, -6.611762046813965, -6.364775657653809, -6.117788791656494, -5.87080192565918, -5.623815536499023, -5.376829147338867, -5.129842281341553, -4.882855415344238, -4.635869026184082, -4.388882637023926, -4.141895771026611, -3.894909143447876, -3.6479225158691406, -3.4009358882904053, -3.15394926071167, -2.9069626331329346, -2.659976005554199, -2.412989377975464, -2.1660027503967285, -1.9190161228179932, -1.6720294952392578, -1.4250428676605225, -1.1780563592910767, -0.9310697317123413, -0.684083104133606, -0.4370964765548706, -0.19010984897613525, 0.0568767786026001, 0.30386340618133545, 0.5508500337600708, 0.7978366613388062]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 7.0, 7.0, 11.0, 12.0, 15.0, 11.0, 20.0, 12.0, 26.0, 25.0, 26.0, 30.0, 28.0, 38.0, 34.0, 34.0, 50.0, 44.0, 38.0, 36.0, 47.0, 46.0, 41.0, 36.0, 46.0, 39.0, 38.0, 31.0, 30.0, 24.0, 26.0, 14.0, 15.0, 13.0, 10.0, 9.0, 4.0, 7.0, 4.0, 4.0, 5.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8316761255264282, -0.8047030568122864, -0.7777299880981445, -0.7507569193840027, -0.7237838506698608, -0.6968108415603638, -0.6698377132415771, -0.6428647041320801, -0.6158916354179382, -0.5889185667037964, -0.5619454979896545, -0.5349724292755127, -0.5079993605613708, -0.4810263216495514, -0.45405325293540955, -0.4270802140235901, -0.40010711550712585, -0.373134046792984, -0.34616097807884216, -0.3191879391670227, -0.29221487045288086, -0.265241801738739, -0.23826873302459717, -0.21129567921161652, -0.18432261049747467, -0.15734954178333282, -0.13037648797035217, -0.10340341925621033, -0.07643035799264908, -0.04945729672908783, -0.022484228014945984, 0.004488825798034668, 0.031461894512176514, 0.05843495577573776, 0.08540801703929901, 0.11238108575344086, 0.1393541395664215, 0.16632720828056335, 0.1933002769947052, 0.22027333080768585, 0.2472463995218277, 0.27421945333480835, 0.3011925220489502, 0.32816559076309204, 0.3551386594772339, 0.38211172819137573, 0.4090847969055176, 0.43605783581733704, 0.4630309045314789, 0.4900039732456207, 0.5169770121574402, 0.543950080871582, 0.5709231495857239, 0.5978962182998657, 0.6248692870140076, 0.6518423557281494, 0.6788154244422913, 0.7057884931564331, 0.732761561870575, 0.7597346305847168, 0.7867076992988586, 0.8136807680130005, 0.8406537771224976, 0.8676268458366394, 0.8945999145507812]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 7.0, 2.0, 17.0, 14.0, 21.0, 44.0, 41.0, 89.0, 141.0, 228.0, 408.0, 809.0, 1823.0, 5311.0, 23220.0, 345800.0, 3379263.0, 403344.0, 24337.0, 5541.0, 1904.0, 863.0, 405.0, 268.0, 149.0, 88.0, 45.0, 30.0, 21.0, 20.0, 10.0, 7.0, 8.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.92431640625, -0.894989013671875, -0.86566162109375, -0.836334228515625, -0.8070068359375, -0.777679443359375, -0.74835205078125, -0.719024658203125, -0.689697265625, -0.660369873046875, -0.63104248046875, -0.601715087890625, -0.5723876953125, -0.543060302734375, -0.51373291015625, -0.484405517578125, -0.455078125, -0.425750732421875, -0.39642333984375, -0.367095947265625, -0.3377685546875, -0.308441162109375, -0.27911376953125, -0.249786376953125, -0.220458984375, -0.191131591796875, -0.16180419921875, -0.132476806640625, -0.1031494140625, -0.073822021484375, -0.04449462890625, -0.015167236328125, 0.01416015625, 0.043487548828125, 0.07281494140625, 0.102142333984375, 0.1314697265625, 0.160797119140625, 0.19012451171875, 0.219451904296875, 0.248779296875, 0.278106689453125, 0.30743408203125, 0.336761474609375, 0.3660888671875, 0.395416259765625, 0.42474365234375, 0.454071044921875, 0.4833984375, 0.512725830078125, 0.54205322265625, 0.571380615234375, 0.6007080078125, 0.630035400390625, 0.65936279296875, 0.688690185546875, 0.718017578125, 0.747344970703125, 0.77667236328125, 0.805999755859375, 0.8353271484375, 0.864654541015625, 0.89398193359375, 0.923309326171875, 0.95263671875]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 7.0, 1.0, 5.0, 3.0, 4.0, 4.0, 6.0, 11.0, 9.0, 7.0, 21.0, 7.0, 23.0, 9.0, 18.0, 27.0, 25.0, 44.0, 19.0, 25.0, 25.0, 29.0, 26.0, 46.0, 25.0, 44.0, 34.0, 39.0, 47.0, 29.0, 28.0, 32.0, 38.0, 43.0, 39.0, 23.0, 28.0, 19.0, 21.0, 21.0, 16.0, 16.0, 15.0, 12.0, 8.0, 6.0, 2.0, 8.0, 3.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.281982421875, -0.2727813720703125, -0.263580322265625, -0.2543792724609375, -0.24517822265625, -0.2359771728515625, -0.226776123046875, -0.2175750732421875, -0.2083740234375, -0.1991729736328125, -0.189971923828125, -0.1807708740234375, -0.17156982421875, -0.1623687744140625, -0.153167724609375, -0.1439666748046875, -0.134765625, -0.1255645751953125, -0.116363525390625, -0.1071624755859375, -0.09796142578125, -0.0887603759765625, -0.079559326171875, -0.0703582763671875, -0.0611572265625, -0.0519561767578125, -0.042755126953125, -0.0335540771484375, -0.02435302734375, -0.0151519775390625, -0.005950927734375, 0.0032501220703125, 0.012451171875, 0.0216522216796875, 0.030853271484375, 0.0400543212890625, 0.04925537109375, 0.0584564208984375, 0.067657470703125, 0.0768585205078125, 0.0860595703125, 0.0952606201171875, 0.104461669921875, 0.1136627197265625, 0.12286376953125, 0.1320648193359375, 0.141265869140625, 0.1504669189453125, 0.15966796875, 0.1688690185546875, 0.178070068359375, 0.1872711181640625, 0.19647216796875, 0.2056732177734375, 0.214874267578125, 0.2240753173828125, 0.2332763671875, 0.2424774169921875, 0.251678466796875, 0.2608795166015625, 0.27008056640625, 0.2792816162109375, 0.288482666015625, 0.2976837158203125, 0.306884765625]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 4.0, 8.0, 7.0, 13.0, 6.0, 15.0, 18.0, 19.0, 32.0, 38.0, 53.0, 90.0, 135.0, 306.0, 820.0, 3401.0, 43035.0, 4021819.0, 117151.0, 5327.0, 1080.0, 361.0, 173.0, 105.0, 72.0, 42.0, 37.0, 22.0, 19.0, 7.0, 12.0, 11.0, 10.0, 9.0, 6.0, 2.0, 4.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5537109375, -1.501251220703125, -1.44879150390625, -1.396331787109375, -1.3438720703125, -1.291412353515625, -1.23895263671875, -1.186492919921875, -1.134033203125, -1.081573486328125, -1.02911376953125, -0.976654052734375, -0.9241943359375, -0.871734619140625, -0.81927490234375, -0.766815185546875, -0.71435546875, -0.661895751953125, -0.60943603515625, -0.556976318359375, -0.5045166015625, -0.452056884765625, -0.39959716796875, -0.347137451171875, -0.294677734375, -0.242218017578125, -0.18975830078125, -0.137298583984375, -0.0848388671875, -0.032379150390625, 0.02008056640625, 0.072540283203125, 0.125, 0.177459716796875, 0.22991943359375, 0.282379150390625, 0.3348388671875, 0.387298583984375, 0.43975830078125, 0.492218017578125, 0.544677734375, 0.597137451171875, 0.64959716796875, 0.702056884765625, 0.7545166015625, 0.806976318359375, 0.85943603515625, 0.911895751953125, 0.96435546875, 1.016815185546875, 1.06927490234375, 1.121734619140625, 1.1741943359375, 1.226654052734375, 1.27911376953125, 1.331573486328125, 1.384033203125, 1.436492919921875, 1.48895263671875, 1.541412353515625, 1.5938720703125, 1.646331787109375, 1.69879150390625, 1.751251220703125, 1.8037109375]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 3.0, 3.0, 9.0, 6.0, 8.0, 17.0, 43.0, 49.0, 80.0, 138.0, 287.0, 494.0, 932.0, 930.0, 501.0, 231.0, 139.0, 82.0, 30.0, 29.0, 16.0, 15.0, 10.0, 11.0, 4.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.323974609375, -0.3156585693359375, -0.307342529296875, -0.2990264892578125, -0.29071044921875, -0.2823944091796875, -0.274078369140625, -0.2657623291015625, -0.2574462890625, -0.2491302490234375, -0.240814208984375, -0.2324981689453125, -0.22418212890625, -0.2158660888671875, -0.207550048828125, -0.1992340087890625, -0.19091796875, -0.1826019287109375, -0.174285888671875, -0.1659698486328125, -0.15765380859375, -0.1493377685546875, -0.141021728515625, -0.1327056884765625, -0.1243896484375, -0.1160736083984375, -0.107757568359375, -0.0994415283203125, -0.09112548828125, -0.0828094482421875, -0.074493408203125, -0.0661773681640625, -0.057861328125, -0.0495452880859375, -0.041229248046875, -0.0329132080078125, -0.02459716796875, -0.0162811279296875, -0.007965087890625, 0.0003509521484375, 0.0086669921875, 0.0169830322265625, 0.025299072265625, 0.0336151123046875, 0.04193115234375, 0.0502471923828125, 0.058563232421875, 0.0668792724609375, 0.0751953125, 0.0835113525390625, 0.091827392578125, 0.1001434326171875, 0.10845947265625, 0.1167755126953125, 0.125091552734375, 0.1334075927734375, 0.1417236328125, 0.1500396728515625, 0.158355712890625, 0.1666717529296875, 0.17498779296875, 0.1833038330078125, 0.191619873046875, 0.1999359130859375, 0.208251953125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 4.0, 2.0, 6.0, 12.0, 17.0, 16.0, 23.0, 35.0, 46.0, 54.0, 76.0, 81.0, 100.0, 89.0, 85.0, 84.0, 65.0, 57.0, 35.0, 36.0, 19.0, 20.0, 11.0, 13.0, 5.0, 4.0, 3.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.571103572845459, -0.5502992272377014, -0.5294948816299438, -0.5086905360221863, -0.4878861606121063, -0.46708181500434875, -0.4462774693965912, -0.42547309398651123, -0.40466874837875366, -0.3838644027709961, -0.3630600571632385, -0.34225571155548096, -0.321451336145401, -0.30064699053764343, -0.27984264492988586, -0.2590382695198059, -0.23823395371437073, -0.21742960810661316, -0.1966252475976944, -0.17582090198993683, -0.15501654148101807, -0.1342121958732605, -0.11340785026550293, -0.09260348975658417, -0.0717991441488266, -0.050994791090488434, -0.030190441757440567, -0.0093860924243927, 0.011418260633945465, 0.03222261369228363, 0.0530269593000412, 0.07383131980895996, 0.09463566541671753, 0.1154400184750557, 0.13624437153339386, 0.15704871714115143, 0.1778530776500702, 0.19865742325782776, 0.21946176886558533, 0.2402661293745041, 0.26107048988342285, 0.2818748354911804, 0.302679181098938, 0.32348352670669556, 0.3442879021167755, 0.3650922477245331, 0.38589659333229065, 0.4067009687423706, 0.4275052845478058, 0.44830963015556335, 0.4691139757633209, 0.4899183511734009, 0.5107226967811584, 0.531527042388916, 0.5523313879966736, 0.5731357336044312, 0.5939400792121887, 0.6147444248199463, 0.6355487704277039, 0.6563531160354614, 0.677157461643219, 0.6979618072509766, 0.7187662124633789, 0.7395705580711365, 0.760374903678894]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 6.0, 3.0, 6.0, 3.0, 2.0, 7.0, 7.0, 11.0, 8.0, 6.0, 12.0, 20.0, 23.0, 21.0, 21.0, 35.0, 28.0, 30.0, 35.0, 46.0, 35.0, 33.0, 39.0, 45.0, 48.0, 42.0, 45.0, 27.0, 33.0, 30.0, 36.0, 33.0, 29.0, 38.0, 19.0, 32.0, 25.0, 18.0, 15.0, 12.0, 7.0, 14.0, 6.0, 3.0, 8.0, 4.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32858216762542725, -0.31640568375587463, -0.304229199886322, -0.2920527458190918, -0.2798762619495392, -0.2676997780799866, -0.25552329421043396, -0.24334681034088135, -0.23117034137248993, -0.21899385750293732, -0.2068173885345459, -0.1946409046649933, -0.18246442079544067, -0.17028795182704926, -0.15811146795749664, -0.14593499898910522, -0.1337585151195526, -0.1215820387005806, -0.10940556228160858, -0.09722907841205597, -0.08505260199308395, -0.07287612557411194, -0.060699641704559326, -0.04852316528558731, -0.036346688866615295, -0.02417021058499813, -0.011993732303380966, 0.00018274784088134766, 0.012359224259853363, 0.02453570067882538, 0.03671218454837799, 0.048888660967350006, 0.061065107583999634, 0.07324158400297165, 0.08541806042194366, 0.09759454429149628, 0.10977102071046829, 0.12194749712944031, 0.13412398099899292, 0.14630046486854553, 0.15847693383693695, 0.17065341770648956, 0.18282988667488098, 0.1950063705444336, 0.2071828544139862, 0.21935932338237762, 0.23153580725193024, 0.24371227622032166, 0.25588876008987427, 0.2680652439594269, 0.2802417278289795, 0.2924181818962097, 0.30459466576576233, 0.31677114963531494, 0.32894763350486755, 0.34112411737442017, 0.3533005714416504, 0.365477055311203, 0.3776535391807556, 0.38982999324798584, 0.40200647711753845, 0.41418296098709106, 0.4263594448566437, 0.4385359287261963, 0.4507124125957489]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 6.0, 5.0, 7.0, 17.0, 21.0, 29.0, 45.0, 79.0, 88.0, 158.0, 283.0, 467.0, 834.0, 1704.0, 3653.0, 8698.0, 23171.0, 70863.0, 229989.0, 417614.0, 195996.0, 60235.0, 20295.0, 7792.0, 3141.0, 1513.0, 791.0, 396.0, 253.0, 131.0, 92.0, 59.0, 44.0, 25.0, 22.0, 17.0, 10.0, 6.0, 9.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0789794921875, -0.07629585266113281, -0.07361221313476562, -0.07092857360839844, -0.06824493408203125, -0.06556129455566406, -0.06287765502929688, -0.06019401550292969, -0.0575103759765625, -0.05482673645019531, -0.052143096923828125, -0.04945945739746094, -0.04677581787109375, -0.04409217834472656, -0.041408538818359375, -0.03872489929199219, -0.036041259765625, -0.03335762023925781, -0.030673980712890625, -0.027990341186523438, -0.02530670166015625, -0.022623062133789062, -0.019939422607421875, -0.017255783081054688, -0.0145721435546875, -0.011888504028320312, -0.009204864501953125, -0.0065212249755859375, -0.00383758544921875, -0.0011539459228515625, 0.001529693603515625, 0.0042133331298828125, 0.00689697265625, 0.009580612182617188, 0.012264251708984375, 0.014947891235351562, 0.01763153076171875, 0.020315170288085938, 0.022998809814453125, 0.025682449340820312, 0.0283660888671875, 0.031049728393554688, 0.033733367919921875, 0.03641700744628906, 0.03910064697265625, 0.04178428649902344, 0.044467926025390625, 0.04715156555175781, 0.049835205078125, 0.05251884460449219, 0.055202484130859375, 0.05788612365722656, 0.06056976318359375, 0.06325340270996094, 0.06593704223632812, 0.06862068176269531, 0.0713043212890625, 0.07398796081542969, 0.07667160034179688, 0.07935523986816406, 0.08203887939453125, 0.08472251892089844, 0.08740615844726562, 0.09008979797363281, 0.0927734375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 6.0, 4.0, 7.0, 7.0, 14.0, 10.0, 10.0, 16.0, 9.0, 34.0, 32.0, 33.0, 28.0, 42.0, 49.0, 54.0, 43.0, 51.0, 58.0, 55.0, 61.0, 33.0, 43.0, 36.0, 41.0, 38.0, 27.0, 36.0, 28.0, 23.0, 18.0, 16.0, 11.0, 9.0, 10.0, 3.0, 3.0, 2.0, 7.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.263427734375, -0.253692626953125, -0.24395751953125, -0.234222412109375, -0.2244873046875, -0.214752197265625, -0.20501708984375, -0.195281982421875, -0.185546875, -0.175811767578125, -0.16607666015625, -0.156341552734375, -0.1466064453125, -0.136871337890625, -0.12713623046875, -0.117401123046875, -0.107666015625, -0.097930908203125, -0.08819580078125, -0.078460693359375, -0.0687255859375, -0.058990478515625, -0.04925537109375, -0.039520263671875, -0.02978515625, -0.020050048828125, -0.01031494140625, -0.000579833984375, 0.0091552734375, 0.018890380859375, 0.02862548828125, 0.038360595703125, 0.048095703125, 0.057830810546875, 0.06756591796875, 0.077301025390625, 0.0870361328125, 0.096771240234375, 0.10650634765625, 0.116241455078125, 0.1259765625, 0.135711669921875, 0.14544677734375, 0.155181884765625, 0.1649169921875, 0.174652099609375, 0.18438720703125, 0.194122314453125, 0.203857421875, 0.213592529296875, 0.22332763671875, 0.233062744140625, 0.2427978515625, 0.252532958984375, 0.26226806640625, 0.272003173828125, 0.28173828125, 0.291473388671875, 0.30120849609375, 0.310943603515625, 0.3206787109375, 0.330413818359375, 0.34014892578125, 0.349884033203125, 0.359619140625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 3.0, 5.0, 4.0, 8.0, 17.0, 14.0, 36.0, 38.0, 56.0, 82.0, 142.0, 199.0, 343.0, 616.0, 1133.0, 2317.0, 5167.0, 12620.0, 35839.0, 113749.0, 325108.0, 352513.0, 131236.0, 41650.0, 14397.0, 5711.0, 2622.0, 1250.0, 651.0, 354.0, 239.0, 143.0, 107.0, 50.0, 41.0, 29.0, 22.0, 10.0, 14.0, 5.0, 6.0, 4.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0614013671875, -0.058951377868652344, -0.05650138854980469, -0.05405139923095703, -0.051601409912109375, -0.04915142059326172, -0.04670143127441406, -0.044251441955566406, -0.04180145263671875, -0.039351463317871094, -0.03690147399902344, -0.03445148468017578, -0.032001495361328125, -0.02955150604248047, -0.027101516723632812, -0.024651527404785156, -0.0222015380859375, -0.019751548767089844, -0.017301559448242188, -0.014851570129394531, -0.012401580810546875, -0.009951591491699219, -0.0075016021728515625, -0.005051612854003906, -0.00260162353515625, -0.00015163421630859375, 0.0022983551025390625, 0.004748344421386719, 0.007198333740234375, 0.009648323059082031, 0.012098312377929688, 0.014548301696777344, 0.016998291015625, 0.019448280334472656, 0.021898269653320312, 0.02434825897216797, 0.026798248291015625, 0.02924823760986328, 0.03169822692871094, 0.034148216247558594, 0.03659820556640625, 0.039048194885253906, 0.04149818420410156, 0.04394817352294922, 0.046398162841796875, 0.04884815216064453, 0.05129814147949219, 0.053748130798339844, 0.0561981201171875, 0.058648109436035156, 0.06109809875488281, 0.06354808807373047, 0.06599807739257812, 0.06844806671142578, 0.07089805603027344, 0.0733480453491211, 0.07579803466796875, 0.0782480239868164, 0.08069801330566406, 0.08314800262451172, 0.08559799194335938, 0.08804798126220703, 0.09049797058105469, 0.09294795989990234, 0.09539794921875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 1.0, 5.0, 9.0, 9.0, 8.0, 20.0, 18.0, 23.0, 18.0, 21.0, 35.0, 33.0, 33.0, 55.0, 39.0, 56.0, 63.0, 47.0, 56.0, 41.0, 36.0, 50.0, 43.0, 35.0, 38.0, 32.0, 29.0, 27.0, 30.0, 16.0, 12.0, 11.0, 13.0, 11.0, 6.0, 6.0, 5.0, 2.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6015625, -0.583526611328125, -0.56549072265625, -0.547454833984375, -0.5294189453125, -0.511383056640625, -0.49334716796875, -0.475311279296875, -0.457275390625, -0.439239501953125, -0.42120361328125, -0.403167724609375, -0.3851318359375, -0.367095947265625, -0.34906005859375, -0.331024169921875, -0.31298828125, -0.294952392578125, -0.27691650390625, -0.258880615234375, -0.2408447265625, -0.222808837890625, -0.20477294921875, -0.186737060546875, -0.168701171875, -0.150665283203125, -0.13262939453125, -0.114593505859375, -0.0965576171875, -0.078521728515625, -0.06048583984375, -0.042449951171875, -0.0244140625, -0.006378173828125, 0.01165771484375, 0.029693603515625, 0.0477294921875, 0.065765380859375, 0.08380126953125, 0.101837158203125, 0.119873046875, 0.137908935546875, 0.15594482421875, 0.173980712890625, 0.1920166015625, 0.210052490234375, 0.22808837890625, 0.246124267578125, 0.26416015625, 0.282196044921875, 0.30023193359375, 0.318267822265625, 0.3363037109375, 0.354339599609375, 0.37237548828125, 0.390411376953125, 0.408447265625, 0.426483154296875, 0.44451904296875, 0.462554931640625, 0.4805908203125, 0.498626708984375, 0.51666259765625, 0.534698486328125, 0.552734375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 3.0, 7.0, 12.0, 16.0, 22.0, 38.0, 53.0, 105.0, 167.0, 326.0, 544.0, 1195.0, 2619.0, 6243.0, 18732.0, 77187.0, 395437.0, 427598.0, 86024.0, 20185.0, 6732.0, 2677.0, 1178.0, 628.0, 336.0, 186.0, 107.0, 66.0, 39.0, 33.0, 15.0, 17.0, 10.0, 7.0, 5.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.040771484375, -0.039726972579956055, -0.03868246078491211, -0.037637948989868164, -0.03659343719482422, -0.03554892539978027, -0.03450441360473633, -0.03345990180969238, -0.03241539001464844, -0.03137087821960449, -0.030326366424560547, -0.0292818546295166, -0.028237342834472656, -0.02719283103942871, -0.026148319244384766, -0.02510380744934082, -0.024059295654296875, -0.02301478385925293, -0.021970272064208984, -0.02092576026916504, -0.019881248474121094, -0.01883673667907715, -0.017792224884033203, -0.016747713088989258, -0.015703201293945312, -0.014658689498901367, -0.013614177703857422, -0.012569665908813477, -0.011525154113769531, -0.010480642318725586, -0.00943613052368164, -0.008391618728637695, -0.00734710693359375, -0.006302595138549805, -0.005258083343505859, -0.004213571548461914, -0.0031690597534179688, -0.0021245479583740234, -0.0010800361633300781, -3.552436828613281e-05, 0.0010089874267578125, 0.002053499221801758, 0.003098011016845703, 0.0041425228118896484, 0.005187034606933594, 0.006231546401977539, 0.007276058197021484, 0.00832056999206543, 0.009365081787109375, 0.01040959358215332, 0.011454105377197266, 0.012498617172241211, 0.013543128967285156, 0.014587640762329102, 0.015632152557373047, 0.016676664352416992, 0.017721176147460938, 0.018765687942504883, 0.019810199737548828, 0.020854711532592773, 0.02189922332763672, 0.022943735122680664, 0.02398824691772461, 0.025032758712768555, 0.0260772705078125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 6.0, 8.0, 4.0, 6.0, 6.0, 4.0, 13.0, 12.0, 19.0, 32.0, 32.0, 58.0, 56.0, 78.0, 81.0, 104.0, 93.0, 101.0, 82.0, 54.0, 45.0, 36.0, 34.0, 13.0, 4.0, 4.0, 6.0, 7.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.806020736694336e-05, -1.7437152564525604e-05, -1.681409776210785e-05, -1.6191042959690094e-05, -1.556798815727234e-05, -1.4944933354854584e-05, -1.4321878552436829e-05, -1.3698823750019073e-05, -1.3075768947601318e-05, -1.2452714145183563e-05, -1.1829659342765808e-05, -1.1206604540348053e-05, -1.0583549737930298e-05, -9.960494935512543e-06, -9.337440133094788e-06, -8.714385330677032e-06, -8.091330528259277e-06, -7.468275725841522e-06, -6.845220923423767e-06, -6.222166121006012e-06, -5.599111318588257e-06, -4.976056516170502e-06, -4.353001713752747e-06, -3.7299469113349915e-06, -3.1068921089172363e-06, -2.483837306499481e-06, -1.860782504081726e-06, -1.237727701663971e-06, -6.146728992462158e-07, 8.381903171539307e-09, 6.314367055892944e-07, 1.2544915080070496e-06, 1.8775463104248047e-06, 2.50060111284256e-06, 3.123655915260315e-06, 3.74671071767807e-06, 4.369765520095825e-06, 4.99282032251358e-06, 5.6158751249313354e-06, 6.2389299273490906e-06, 6.861984729766846e-06, 7.485039532184601e-06, 8.108094334602356e-06, 8.731149137020111e-06, 9.354203939437866e-06, 9.977258741855621e-06, 1.0600313544273376e-05, 1.1223368346691132e-05, 1.1846423149108887e-05, 1.2469477951526642e-05, 1.3092532753944397e-05, 1.3715587556362152e-05, 1.4338642358779907e-05, 1.4961697161197662e-05, 1.5584751963615417e-05, 1.6207806766033173e-05, 1.6830861568450928e-05, 1.7453916370868683e-05, 1.8076971173286438e-05, 1.8700025975704193e-05, 1.9323080778121948e-05, 1.9946135580539703e-05, 2.056919038295746e-05, 2.1192245185375214e-05, 2.181529998779297e-05]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 3.0, 7.0, 10.0, 11.0, 12.0, 17.0, 32.0, 61.0, 102.0, 142.0, 234.0, 462.0, 829.0, 1798.0, 4314.0, 11887.0, 38347.0, 161437.0, 489571.0, 254919.0, 57533.0, 16368.0, 5694.0, 2386.0, 1096.0, 596.0, 273.0, 164.0, 95.0, 50.0, 31.0, 16.0, 21.0, 14.0, 11.0, 7.0, 5.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0297088623046875, -0.02877020835876465, -0.027831554412841797, -0.026892900466918945, -0.025954246520996094, -0.025015592575073242, -0.02407693862915039, -0.02313828468322754, -0.022199630737304688, -0.021260976791381836, -0.020322322845458984, -0.019383668899536133, -0.01844501495361328, -0.01750636100769043, -0.016567707061767578, -0.015629053115844727, -0.014690399169921875, -0.013751745223999023, -0.012813091278076172, -0.01187443733215332, -0.010935783386230469, -0.009997129440307617, -0.009058475494384766, -0.008119821548461914, -0.0071811676025390625, -0.006242513656616211, -0.005303859710693359, -0.004365205764770508, -0.0034265518188476562, -0.0024878978729248047, -0.0015492439270019531, -0.0006105899810791016, 0.00032806396484375, 0.0012667179107666016, 0.002205371856689453, 0.0031440258026123047, 0.004082679748535156, 0.005021333694458008, 0.005959987640380859, 0.006898641586303711, 0.007837295532226562, 0.008775949478149414, 0.009714603424072266, 0.010653257369995117, 0.011591911315917969, 0.01253056526184082, 0.013469219207763672, 0.014407873153686523, 0.015346527099609375, 0.016285181045532227, 0.017223834991455078, 0.01816248893737793, 0.01910114288330078, 0.020039796829223633, 0.020978450775146484, 0.021917104721069336, 0.022855758666992188, 0.02379441261291504, 0.02473306655883789, 0.025671720504760742, 0.026610374450683594, 0.027549028396606445, 0.028487682342529297, 0.02942633628845215, 0.030364990234375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 2.0, 3.0, 9.0, 6.0, 4.0, 5.0, 9.0, 13.0, 14.0, 16.0, 27.0, 44.0, 44.0, 47.0, 72.0, 93.0, 85.0, 84.0, 91.0, 59.0, 67.0, 54.0, 38.0, 33.0, 18.0, 23.0, 12.0, 11.0, 5.0, 2.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0082244873046875, -0.007966399192810059, -0.007708311080932617, -0.007450222969055176, -0.007192134857177734, -0.006934046745300293, -0.0066759586334228516, -0.00641787052154541, -0.006159782409667969, -0.005901694297790527, -0.005643606185913086, -0.0053855180740356445, -0.005127429962158203, -0.004869341850280762, -0.00461125373840332, -0.004353165626525879, -0.0040950775146484375, -0.003836989402770996, -0.0035789012908935547, -0.0033208131790161133, -0.003062725067138672, -0.0028046369552612305, -0.002546548843383789, -0.0022884607315063477, -0.0020303726196289062, -0.0017722845077514648, -0.0015141963958740234, -0.001256108283996582, -0.0009980201721191406, -0.0007399320602416992, -0.0004818439483642578, -0.0002237558364868164, 3.4332275390625e-05, 0.0002924203872680664, 0.0005505084991455078, 0.0008085966110229492, 0.0010666847229003906, 0.001324772834777832, 0.0015828609466552734, 0.0018409490585327148, 0.0020990371704101562, 0.0023571252822875977, 0.002615213394165039, 0.0028733015060424805, 0.003131389617919922, 0.0033894777297973633, 0.0036475658416748047, 0.003905653953552246, 0.0041637420654296875, 0.004421830177307129, 0.00467991828918457, 0.004938006401062012, 0.005196094512939453, 0.0054541826248168945, 0.005712270736694336, 0.005970358848571777, 0.006228446960449219, 0.00648653507232666, 0.0067446231842041016, 0.007002711296081543, 0.007260799407958984, 0.007518887519836426, 0.007776975631713867, 0.008035063743591309, 0.00829315185546875]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 8.0, 10.0, 18.0, 25.0, 58.0, 84.0, 154.0, 203.0, 165.0, 129.0, 62.0, 52.0, 17.0, 11.0, 3.0, 4.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5143777132034302, -0.489646315574646, -0.4649149477481842, -0.4401835501194, -0.41545215249061584, -0.39072078466415405, -0.3659893870353699, -0.3412579894065857, -0.3165265917778015, -0.29179519414901733, -0.26706382632255554, -0.24233242869377136, -0.21760103106498718, -0.1928696483373642, -0.1681382656097412, -0.14340686798095703, -0.11867550015449524, -0.09394410997629166, -0.06921271979808807, -0.04448133707046509, -0.019749946892261505, 0.004981443285942078, 0.029712826013565063, 0.05444422364234924, 0.07917560636997223, 0.10390699654817581, 0.1286383867263794, 0.15336976945400238, 0.17810115218162537, 0.20283254981040955, 0.22756393253803253, 0.2522953152656555, 0.2770267128944397, 0.3017581105232239, 0.32648947834968567, 0.35122087597846985, 0.37595227360725403, 0.4006836414337158, 0.4254150390625, 0.4501464366912842, 0.47487783432006836, 0.49960923194885254, 0.5243406295776367, 0.5490720272064209, 0.5738033652305603, 0.5985347628593445, 0.6232661604881287, 0.6479975581169128, 0.6727288961410522, 0.6974602937698364, 0.7221916913986206, 0.7469230890274048, 0.7716544270515442, 0.7963858246803284, 0.8211172223091125, 0.8458486199378967, 0.8705800175666809, 0.8953114151954651, 0.9200428128242493, 0.9447741508483887, 0.9695055484771729, 0.994236946105957, 1.0189683437347412, 1.0436997413635254, 1.0684311389923096]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 3.0, 4.0, 2.0, 3.0, 7.0, 5.0, 6.0, 6.0, 12.0, 10.0, 14.0, 19.0, 25.0, 25.0, 30.0, 33.0, 41.0, 32.0, 47.0, 46.0, 38.0, 54.0, 57.0, 53.0, 46.0, 39.0, 27.0, 33.0, 37.0, 51.0, 35.0, 32.0, 22.0, 23.0, 24.0, 16.0, 10.0, 8.0, 14.0, 8.0, 3.0, 6.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.23610919713974, -0.22735466063022614, -0.21860012412071228, -0.20984557271003723, -0.20109103620052338, -0.19233649969100952, -0.18358194828033447, -0.17482741177082062, -0.16607287526130676, -0.1573183387517929, -0.14856380224227905, -0.139809250831604, -0.13105471432209015, -0.1223001778125763, -0.11354563385248184, -0.10479108989238739, -0.09603655338287354, -0.08728201687335968, -0.07852747291326523, -0.06977292895317078, -0.06101839244365692, -0.05226385220885277, -0.043509311974048615, -0.03475477173924446, -0.026000231504440308, -0.017245691269636154, -0.008491151034832, 0.0002633891999721527, 0.009017929434776306, 0.01777246966958046, 0.026527009904384613, 0.035281550139188766, 0.04403609037399292, 0.05279063060879707, 0.06154517084360123, 0.07029971480369568, 0.07905425131320953, 0.08780878782272339, 0.09656333178281784, 0.10531787574291229, 0.11407241225242615, 0.12282694876194, 0.13158148527145386, 0.1403360366821289, 0.14909057319164276, 0.15784510970115662, 0.16659966111183167, 0.17535419762134552, 0.18410873413085938, 0.19286327064037323, 0.20161780714988708, 0.21037235856056213, 0.219126895070076, 0.22788143157958984, 0.2366359829902649, 0.24539051949977875, 0.2541450560092926, 0.26289960741996765, 0.2716541290283203, 0.28040868043899536, 0.2891632318496704, 0.29791775345802307, 0.3066723048686981, 0.3154268264770508, 0.32418137788772583]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 6.0, 12.0, 7.0, 18.0, 53.0, 110.0, 412.0, 1786.0, 11144.0, 132611.0, 821456.0, 71883.0, 7301.0, 1256.0, 321.0, 87.0, 39.0, 18.0, 10.0, 4.0, 6.0, 5.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.97607421875, -0.94769287109375, -0.9193115234375, -0.89093017578125, -0.862548828125, -0.83416748046875, -0.8057861328125, -0.77740478515625, -0.7490234375, -0.72064208984375, -0.6922607421875, -0.66387939453125, -0.635498046875, -0.60711669921875, -0.5787353515625, -0.55035400390625, -0.52197265625, -0.49359130859375, -0.4652099609375, -0.43682861328125, -0.408447265625, -0.38006591796875, -0.3516845703125, -0.32330322265625, -0.294921875, -0.26654052734375, -0.2381591796875, -0.20977783203125, -0.181396484375, -0.15301513671875, -0.1246337890625, -0.09625244140625, -0.06787109375, -0.03948974609375, -0.0111083984375, 0.01727294921875, 0.045654296875, 0.07403564453125, 0.1024169921875, 0.13079833984375, 0.1591796875, 0.18756103515625, 0.2159423828125, 0.24432373046875, 0.272705078125, 0.30108642578125, 0.3294677734375, 0.35784912109375, 0.38623046875, 0.41461181640625, 0.4429931640625, 0.47137451171875, 0.499755859375, 0.52813720703125, 0.5565185546875, 0.58489990234375, 0.61328125, 0.64166259765625, 0.6700439453125, 0.69842529296875, 0.726806640625, 0.75518798828125, 0.7835693359375, 0.81195068359375, 0.84033203125]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 3.0, 5.0, 4.0, 9.0, 12.0, 13.0, 20.0, 27.0, 33.0, 29.0, 43.0, 48.0, 50.0, 53.0, 58.0, 62.0, 90.0, 58.0, 58.0, 45.0, 52.0, 47.0, 41.0, 39.0, 22.0, 23.0, 15.0, 15.0, 10.0, 8.0, 3.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.484130859375, -0.4623908996582031, -0.44065093994140625, -0.4189109802246094, -0.3971710205078125, -0.3754310607910156, -0.35369110107421875, -0.3319511413574219, -0.310211181640625, -0.2884712219238281, -0.26673126220703125, -0.24499130249023438, -0.2232513427734375, -0.20151138305664062, -0.17977142333984375, -0.15803146362304688, -0.13629150390625, -0.11455154418945312, -0.09281158447265625, -0.07107162475585938, -0.0493316650390625, -0.027591705322265625, -0.00585174560546875, 0.015888214111328125, 0.037628173828125, 0.059368133544921875, 0.08110809326171875, 0.10284805297851562, 0.1245880126953125, 0.14632797241210938, 0.16806793212890625, 0.18980789184570312, 0.2115478515625, 0.23328781127929688, 0.25502777099609375, 0.2767677307128906, 0.2985076904296875, 0.3202476501464844, 0.34198760986328125, 0.3637275695800781, 0.385467529296875, 0.4072074890136719, 0.42894744873046875, 0.4506874084472656, 0.4724273681640625, 0.4941673278808594, 0.5159072875976562, 0.5376472473144531, 0.55938720703125, 0.5811271667480469, 0.6028671264648438, 0.6246070861816406, 0.6463470458984375, 0.6680870056152344, 0.6898269653320312, 0.7115669250488281, 0.733306884765625, 0.7550468444824219, 0.7767868041992188, 0.7985267639160156, 0.8202667236328125, 0.8420066833496094, 0.8637466430664062, 0.8854866027832031, 0.9072265625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 5.0, 3.0, 7.0, 9.0, 4.0, 11.0, 20.0, 22.0, 22.0, 37.0, 38.0, 38.0, 37.0, 70.0, 72.0, 110.0, 133.0, 183.0, 337.0, 794.0, 3641.0, 31193.0, 648320.0, 339592.0, 19575.0, 2576.0, 593.0, 290.0, 198.0, 133.0, 106.0, 80.0, 55.0, 46.0, 51.0, 35.0, 24.0, 22.0, 17.0, 12.0, 11.0, 5.0, 4.0, 11.0, 4.0, 5.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.8916015625, -0.866058349609375, -0.84051513671875, -0.814971923828125, -0.7894287109375, -0.763885498046875, -0.73834228515625, -0.712799072265625, -0.687255859375, -0.661712646484375, -0.63616943359375, -0.610626220703125, -0.5850830078125, -0.559539794921875, -0.53399658203125, -0.508453369140625, -0.48291015625, -0.457366943359375, -0.43182373046875, -0.406280517578125, -0.3807373046875, -0.355194091796875, -0.32965087890625, -0.304107666015625, -0.278564453125, -0.253021240234375, -0.22747802734375, -0.201934814453125, -0.1763916015625, -0.150848388671875, -0.12530517578125, -0.099761962890625, -0.07421875, -0.048675537109375, -0.02313232421875, 0.002410888671875, 0.0279541015625, 0.053497314453125, 0.07904052734375, 0.104583740234375, 0.130126953125, 0.155670166015625, 0.18121337890625, 0.206756591796875, 0.2322998046875, 0.257843017578125, 0.28338623046875, 0.308929443359375, 0.33447265625, 0.360015869140625, 0.38555908203125, 0.411102294921875, 0.4366455078125, 0.462188720703125, 0.48773193359375, 0.513275146484375, 0.538818359375, 0.564361572265625, 0.58990478515625, 0.615447998046875, 0.6409912109375, 0.666534423828125, 0.69207763671875, 0.717620849609375, 0.7431640625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 4.0, 7.0, 2.0, 8.0, 13.0, 12.0, 9.0, 14.0, 15.0, 22.0, 28.0, 18.0, 26.0, 26.0, 37.0, 33.0, 30.0, 30.0, 40.0, 44.0, 45.0, 40.0, 42.0, 54.0, 46.0, 42.0, 37.0, 36.0, 34.0, 40.0, 30.0, 16.0, 20.0, 19.0, 9.0, 10.0, 17.0, 11.0, 13.0, 6.0, 6.0, 4.0, 3.0, 1.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.53857421875, -0.5217132568359375, -0.504852294921875, -0.4879913330078125, -0.47113037109375, -0.4542694091796875, -0.437408447265625, -0.4205474853515625, -0.4036865234375, -0.3868255615234375, -0.369964599609375, -0.3531036376953125, -0.33624267578125, -0.3193817138671875, -0.302520751953125, -0.2856597900390625, -0.268798828125, -0.2519378662109375, -0.235076904296875, -0.2182159423828125, -0.20135498046875, -0.1844940185546875, -0.167633056640625, -0.1507720947265625, -0.1339111328125, -0.1170501708984375, -0.100189208984375, -0.0833282470703125, -0.06646728515625, -0.0496063232421875, -0.032745361328125, -0.0158843994140625, 0.0009765625, 0.0178375244140625, 0.034698486328125, 0.0515594482421875, 0.06842041015625, 0.0852813720703125, 0.102142333984375, 0.1190032958984375, 0.1358642578125, 0.1527252197265625, 0.169586181640625, 0.1864471435546875, 0.20330810546875, 0.2201690673828125, 0.237030029296875, 0.2538909912109375, 0.270751953125, 0.2876129150390625, 0.304473876953125, 0.3213348388671875, 0.33819580078125, 0.3550567626953125, 0.371917724609375, 0.3887786865234375, 0.4056396484375, 0.4225006103515625, 0.439361572265625, 0.4562225341796875, 0.47308349609375, 0.4899444580078125, 0.506805419921875, 0.5236663818359375, 0.54052734375]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 6.0, 2.0, 4.0, 6.0, 7.0, 18.0, 22.0, 40.0, 73.0, 162.0, 485.0, 1612.0, 8321.0, 120923.0, 860966.0, 49255.0, 4874.0, 1142.0, 342.0, 136.0, 59.0, 31.0, 20.0, 14.0, 6.0, 4.0, 10.0, 5.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.267333984375, -0.2579078674316406, -0.24848175048828125, -0.23905563354492188, -0.2296295166015625, -0.22020339965820312, -0.21077728271484375, -0.20135116577148438, -0.191925048828125, -0.18249893188476562, -0.17307281494140625, -0.16364669799804688, -0.1542205810546875, -0.14479446411132812, -0.13536834716796875, -0.12594223022460938, -0.11651611328125, -0.10708999633789062, -0.09766387939453125, -0.08823776245117188, -0.0788116455078125, -0.06938552856445312, -0.05995941162109375, -0.050533294677734375, -0.041107177734375, -0.031681060791015625, -0.02225494384765625, -0.012828826904296875, -0.0034027099609375, 0.006023406982421875, 0.01544952392578125, 0.024875640869140625, 0.0343017578125, 0.043727874755859375, 0.05315399169921875, 0.06258010864257812, 0.0720062255859375, 0.08143234252929688, 0.09085845947265625, 0.10028457641601562, 0.109710693359375, 0.11913681030273438, 0.12856292724609375, 0.13798904418945312, 0.1474151611328125, 0.15684127807617188, 0.16626739501953125, 0.17569351196289062, 0.18511962890625, 0.19454574584960938, 0.20397186279296875, 0.21339797973632812, 0.2228240966796875, 0.23225021362304688, 0.24167633056640625, 0.2511024475097656, 0.260528564453125, 0.2699546813964844, 0.27938079833984375, 0.2888069152832031, 0.2982330322265625, 0.3076591491699219, 0.31708526611328125, 0.3265113830566406, 0.3359375]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 3.0, 4.0, 8.0, 12.0, 20.0, 30.0, 51.0, 65.0, 116.0, 182.0, 191.0, 112.0, 71.0, 43.0, 29.0, 21.0, 17.0, 5.0, 5.0, 7.0, 2.0, 1.0, 3.0, 4.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7206878662109375e-05, -4.590023308992386e-05, -4.459358751773834e-05, -4.3286941945552826e-05, -4.198029637336731e-05, -4.067365080118179e-05, -3.936700522899628e-05, -3.806035965681076e-05, -3.6753714084625244e-05, -3.544706851243973e-05, -3.414042294025421e-05, -3.2833777368068695e-05, -3.152713179588318e-05, -3.0220486223697662e-05, -2.8913840651512146e-05, -2.760719507932663e-05, -2.6300549507141113e-05, -2.4993903934955597e-05, -2.368725836277008e-05, -2.2380612790584564e-05, -2.1073967218399048e-05, -1.976732164621353e-05, -1.8460676074028015e-05, -1.71540305018425e-05, -1.5847384929656982e-05, -1.4540739357471466e-05, -1.323409378528595e-05, -1.1927448213100433e-05, -1.0620802640914917e-05, -9.3141570687294e-06, -8.007511496543884e-06, -6.700865924358368e-06, -5.3942203521728516e-06, -4.087574779987335e-06, -2.780929207801819e-06, -1.4742836356163025e-06, -1.6763806343078613e-07, 1.1390075087547302e-06, 2.4456530809402466e-06, 3.752298653125763e-06, 5.058944225311279e-06, 6.365589797496796e-06, 7.672235369682312e-06, 8.978880941867828e-06, 1.0285526514053345e-05, 1.1592172086238861e-05, 1.2898817658424377e-05, 1.4205463230609894e-05, 1.551210880279541e-05, 1.6818754374980927e-05, 1.8125399947166443e-05, 1.943204551935196e-05, 2.0738691091537476e-05, 2.2045336663722992e-05, 2.3351982235908508e-05, 2.4658627808094025e-05, 2.596527338027954e-05, 2.7271918952465057e-05, 2.8578564524650574e-05, 2.988521009683609e-05, 3.1191855669021606e-05, 3.249850124120712e-05, 3.380514681339264e-05, 3.5111792385578156e-05, 3.641843795776367e-05]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 4.0, 0.0, 6.0, 1.0, 10.0, 9.0, 17.0, 17.0, 36.0, 80.0, 158.0, 493.0, 1764.0, 10846.0, 290272.0, 721933.0, 19331.0, 2544.0, 613.0, 204.0, 86.0, 47.0, 36.0, 11.0, 9.0, 13.0, 5.0, 1.0, 6.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.37548828125, -0.3637962341308594, -0.35210418701171875, -0.3404121398925781, -0.3287200927734375, -0.3170280456542969, -0.30533599853515625, -0.2936439514160156, -0.281951904296875, -0.2702598571777344, -0.25856781005859375, -0.24687576293945312, -0.2351837158203125, -0.22349166870117188, -0.21179962158203125, -0.20010757446289062, -0.18841552734375, -0.17672348022460938, -0.16503143310546875, -0.15333938598632812, -0.1416473388671875, -0.12995529174804688, -0.11826324462890625, -0.10657119750976562, -0.094879150390625, -0.08318710327148438, -0.07149505615234375, -0.059803009033203125, -0.0481109619140625, -0.036418914794921875, -0.02472686767578125, -0.013034820556640625, -0.0013427734375, 0.010349273681640625, 0.02204132080078125, 0.033733367919921875, 0.0454254150390625, 0.057117462158203125, 0.06880950927734375, 0.08050155639648438, 0.092193603515625, 0.10388565063476562, 0.11557769775390625, 0.12726974487304688, 0.1389617919921875, 0.15065383911132812, 0.16234588623046875, 0.17403793334960938, 0.18572998046875, 0.19742202758789062, 0.20911407470703125, 0.22080612182617188, 0.2324981689453125, 0.24419021606445312, 0.25588226318359375, 0.2675743103027344, 0.279266357421875, 0.2909584045410156, 0.30265045166015625, 0.3143424987792969, 0.3260345458984375, 0.3377265930175781, 0.34941864013671875, 0.3611106872558594, 0.372802734375]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 6.0, 9.0, 11.0, 7.0, 23.0, 28.0, 39.0, 67.0, 113.0, 164.0, 156.0, 125.0, 90.0, 41.0, 37.0, 25.0, 17.0, 15.0, 8.0, 7.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1031494140625, -0.10021686553955078, -0.09728431701660156, -0.09435176849365234, -0.09141921997070312, -0.0884866714477539, -0.08555412292480469, -0.08262157440185547, -0.07968902587890625, -0.07675647735595703, -0.07382392883300781, -0.0708913803100586, -0.06795883178710938, -0.06502628326416016, -0.06209373474121094, -0.05916118621826172, -0.0562286376953125, -0.05329608917236328, -0.05036354064941406, -0.047430992126464844, -0.044498443603515625, -0.041565895080566406, -0.03863334655761719, -0.03570079803466797, -0.03276824951171875, -0.02983570098876953, -0.026903152465820312, -0.023970603942871094, -0.021038055419921875, -0.018105506896972656, -0.015172958374023438, -0.012240409851074219, -0.009307861328125, -0.006375312805175781, -0.0034427642822265625, -0.0005102157592773438, 0.002422332763671875, 0.005354881286621094, 0.008287429809570312, 0.011219978332519531, 0.01415252685546875, 0.01708507537841797, 0.020017623901367188, 0.022950172424316406, 0.025882720947265625, 0.028815269470214844, 0.03174781799316406, 0.03468036651611328, 0.0376129150390625, 0.04054546356201172, 0.04347801208496094, 0.046410560607910156, 0.049343109130859375, 0.052275657653808594, 0.05520820617675781, 0.05814075469970703, 0.06107330322265625, 0.06400585174560547, 0.06693840026855469, 0.0698709487915039, 0.07280349731445312, 0.07573604583740234, 0.07866859436035156, 0.08160114288330078, 0.08453369140625]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 3.0, 7.0, 8.0, 11.0, 20.0, 25.0, 40.0, 65.0, 90.0, 108.0, 141.0, 133.0, 107.0, 91.0, 59.0, 31.0, 24.0, 11.0, 9.0, 6.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8961554765701294, -0.8628050684928894, -0.8294546008110046, -0.7961041927337646, -0.7627537250518799, -0.7294033169746399, -0.6960529088973999, -0.6627024412155151, -0.6293519735336304, -0.5960015654563904, -0.5626510977745056, -0.5293006896972656, -0.49595022201538086, -0.46259981393814087, -0.4292493760585785, -0.3958989381790161, -0.3625485301017761, -0.32919809222221375, -0.29584765434265137, -0.2624972462654114, -0.2291467934846878, -0.19579635560512543, -0.16244593262672424, -0.12909549474716187, -0.09574505686759949, -0.06239462271332741, -0.02904418855905533, 0.004306241869926453, 0.03765667974948883, 0.07100711762905121, 0.10435754060745239, 0.13770797848701477, 0.17105841636657715, 0.20440885424613953, 0.2377592921257019, 0.2711097002029419, 0.30446016788482666, 0.33781057596206665, 0.37116101384162903, 0.4045114517211914, 0.4378618896007538, 0.47121232748031616, 0.5045627355575562, 0.5379132032394409, 0.5712636113166809, 0.6046140789985657, 0.6379644870758057, 0.6713149547576904, 0.7046653628349304, 0.7380157709121704, 0.7713662385940552, 0.8047166466712952, 0.8380671143531799, 0.8714175224304199, 0.9047679901123047, 0.9381183981895447, 0.9714688062667847, 1.0048192739486694, 1.0381696224212646, 1.0715200901031494, 1.1048705577850342, 1.138221025466919, 1.1715713739395142, 1.204921841621399, 1.2382723093032837]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 14.0, 8.0, 12.0, 9.0, 21.0, 15.0, 25.0, 31.0, 37.0, 49.0, 29.0, 45.0, 55.0, 52.0, 56.0, 54.0, 56.0, 56.0, 57.0, 48.0, 50.0, 42.0, 31.0, 40.0, 28.0, 22.0, 19.0, 20.0, 7.0, 7.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9736251831054688, -0.9356900453567505, -0.8977549076080322, -0.8598197102546692, -0.8218845725059509, -0.7839494347572327, -0.7460142374038696, -0.7080790996551514, -0.6701439619064331, -0.6322088241577148, -0.5942736864089966, -0.5563384890556335, -0.5184033513069153, -0.480468213558197, -0.44253304600715637, -0.4045978784561157, -0.36666274070739746, -0.3287276029586792, -0.29079243540763855, -0.2528572678565979, -0.21492213010787964, -0.17698697745800018, -0.13905182480812073, -0.10111665725708008, -0.06318151950836182, -0.02524636685848236, 0.012688785791397095, 0.05062393844127655, 0.088559091091156, 0.12649424374103546, 0.16442939639091492, 0.20236456394195557, 0.24029982089996338, 0.27823495864868164, 0.3161701261997223, 0.35410529375076294, 0.3920404314994812, 0.42997556924819946, 0.4679107367992401, 0.5058459043502808, 0.543781042098999, 0.5817161798477173, 0.6196513175964355, 0.6575865149497986, 0.6955216526985168, 0.7334567904472351, 0.7713919878005981, 0.8093271255493164, 0.8472622632980347, 0.8851974010467529, 0.9231325387954712, 0.9610677361488342, 0.9990028738975525, 1.0369380712509155, 1.0748732089996338, 1.112808346748352, 1.1507434844970703, 1.1886786222457886, 1.2266137599945068, 1.264548897743225, 1.3024840354919434, 1.3404192924499512, 1.3783544301986694, 1.4162895679473877, 1.454224705696106]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 2.0, 8.0, 6.0, 10.0, 10.0, 15.0, 20.0, 43.0, 57.0, 110.0, 269.0, 613.0, 1869.0, 7164.0, 52445.0, 1978350.0, 2083160.0, 59274.0, 7524.0, 2011.0, 680.0, 276.0, 130.0, 78.0, 39.0, 35.0, 15.0, 15.0, 11.0, 10.0, 4.0, 3.0, 5.0, 7.0, 4.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8857421875, -0.8552093505859375, -0.824676513671875, -0.7941436767578125, -0.76361083984375, -0.7330780029296875, -0.702545166015625, -0.6720123291015625, -0.6414794921875, -0.6109466552734375, -0.580413818359375, -0.5498809814453125, -0.51934814453125, -0.4888153076171875, -0.458282470703125, -0.4277496337890625, -0.397216796875, -0.3666839599609375, -0.336151123046875, -0.3056182861328125, -0.27508544921875, -0.2445526123046875, -0.214019775390625, -0.1834869384765625, -0.1529541015625, -0.1224212646484375, -0.091888427734375, -0.0613555908203125, -0.03082275390625, -0.0002899169921875, 0.030242919921875, 0.0607757568359375, 0.09130859375, 0.1218414306640625, 0.152374267578125, 0.1829071044921875, 0.21343994140625, 0.2439727783203125, 0.274505615234375, 0.3050384521484375, 0.3355712890625, 0.3661041259765625, 0.396636962890625, 0.4271697998046875, 0.45770263671875, 0.4882354736328125, 0.518768310546875, 0.5493011474609375, 0.579833984375, 0.6103668212890625, 0.640899658203125, 0.6714324951171875, 0.70196533203125, 0.7324981689453125, 0.763031005859375, 0.7935638427734375, 0.8240966796875, 0.8546295166015625, 0.885162353515625, 0.9156951904296875, 0.94622802734375, 0.9767608642578125, 1.007293701171875, 1.0378265380859375, 1.068359375]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 6.0, 3.0, 4.0, 5.0, 7.0, 12.0, 11.0, 20.0, 21.0, 18.0, 23.0, 39.0, 27.0, 48.0, 40.0, 45.0, 54.0, 40.0, 51.0, 58.0, 45.0, 46.0, 49.0, 41.0, 42.0, 48.0, 29.0, 28.0, 29.0, 28.0, 20.0, 13.0, 15.0, 10.0, 7.0, 7.0, 6.0, 2.0, 2.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33984375, -0.3273773193359375, -0.314910888671875, -0.3024444580078125, -0.28997802734375, -0.2775115966796875, -0.265045166015625, -0.2525787353515625, -0.2401123046875, -0.2276458740234375, -0.215179443359375, -0.2027130126953125, -0.19024658203125, -0.1777801513671875, -0.165313720703125, -0.1528472900390625, -0.140380859375, -0.1279144287109375, -0.115447998046875, -0.1029815673828125, -0.09051513671875, -0.0780487060546875, -0.065582275390625, -0.0531158447265625, -0.0406494140625, -0.0281829833984375, -0.015716552734375, -0.0032501220703125, 0.00921630859375, 0.0216827392578125, 0.034149169921875, 0.0466156005859375, 0.05908203125, 0.0715484619140625, 0.084014892578125, 0.0964813232421875, 0.10894775390625, 0.1214141845703125, 0.133880615234375, 0.1463470458984375, 0.1588134765625, 0.1712799072265625, 0.183746337890625, 0.1962127685546875, 0.20867919921875, 0.2211456298828125, 0.233612060546875, 0.2460784912109375, 0.258544921875, 0.2710113525390625, 0.283477783203125, 0.2959442138671875, 0.30841064453125, 0.3208770751953125, 0.333343505859375, 0.3458099365234375, 0.3582763671875, 0.3707427978515625, 0.383209228515625, 0.3956756591796875, 0.40814208984375, 0.4206085205078125, 0.433074951171875, 0.4455413818359375, 0.4580078125]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 6.0, 4.0, 12.0, 10.0, 21.0, 38.0, 64.0, 82.0, 191.0, 452.0, 1500.0, 6838.0, 98440.0, 3946702.0, 129280.0, 8024.0, 1651.0, 511.0, 221.0, 81.0, 46.0, 31.0, 21.0, 23.0, 12.0, 9.0, 7.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3203125, -1.2831573486328125, -1.246002197265625, -1.2088470458984375, -1.17169189453125, -1.1345367431640625, -1.097381591796875, -1.0602264404296875, -1.0230712890625, -0.9859161376953125, -0.948760986328125, -0.9116058349609375, -0.87445068359375, -0.8372955322265625, -0.800140380859375, -0.7629852294921875, -0.725830078125, -0.6886749267578125, -0.651519775390625, -0.6143646240234375, -0.57720947265625, -0.5400543212890625, -0.502899169921875, -0.4657440185546875, -0.4285888671875, -0.3914337158203125, -0.354278564453125, -0.3171234130859375, -0.27996826171875, -0.2428131103515625, -0.205657958984375, -0.1685028076171875, -0.13134765625, -0.0941925048828125, -0.057037353515625, -0.0198822021484375, 0.01727294921875, 0.0544281005859375, 0.091583251953125, 0.1287384033203125, 0.1658935546875, 0.2030487060546875, 0.240203857421875, 0.2773590087890625, 0.31451416015625, 0.3516693115234375, 0.388824462890625, 0.4259796142578125, 0.463134765625, 0.5002899169921875, 0.537445068359375, 0.5746002197265625, 0.61175537109375, 0.6489105224609375, 0.686065673828125, 0.7232208251953125, 0.7603759765625, 0.7975311279296875, 0.834686279296875, 0.8718414306640625, 0.90899658203125, 0.9461517333984375, 0.983306884765625, 1.0204620361328125, 1.0576171875]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 3.0, 4.0, 11.0, 15.0, 21.0, 25.0, 27.0, 41.0, 74.0, 101.0, 163.0, 280.0, 462.0, 671.0, 724.0, 527.0, 331.0, 192.0, 121.0, 82.0, 48.0, 46.0, 28.0, 21.0, 16.0, 13.0, 9.0, 5.0, 7.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1602783203125, -0.1548004150390625, -0.149322509765625, -0.1438446044921875, -0.13836669921875, -0.1328887939453125, -0.127410888671875, -0.1219329833984375, -0.116455078125, -0.1109771728515625, -0.105499267578125, -0.1000213623046875, -0.09454345703125, -0.0890655517578125, -0.083587646484375, -0.0781097412109375, -0.0726318359375, -0.0671539306640625, -0.061676025390625, -0.0561981201171875, -0.05072021484375, -0.0452423095703125, -0.039764404296875, -0.0342864990234375, -0.02880859375, -0.0233306884765625, -0.017852783203125, -0.0123748779296875, -0.00689697265625, -0.0014190673828125, 0.004058837890625, 0.0095367431640625, 0.0150146484375, 0.0204925537109375, 0.025970458984375, 0.0314483642578125, 0.03692626953125, 0.0424041748046875, 0.047882080078125, 0.0533599853515625, 0.058837890625, 0.0643157958984375, 0.069793701171875, 0.0752716064453125, 0.08074951171875, 0.0862274169921875, 0.091705322265625, 0.0971832275390625, 0.1026611328125, 0.1081390380859375, 0.113616943359375, 0.1190948486328125, 0.12457275390625, 0.1300506591796875, 0.135528564453125, 0.1410064697265625, 0.146484375, 0.1519622802734375, 0.157440185546875, 0.1629180908203125, 0.16839599609375, 0.1738739013671875, 0.179351806640625, 0.1848297119140625, 0.1903076171875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 7.0, 6.0, 11.0, 16.0, 27.0, 30.0, 44.0, 60.0, 90.0, 123.0, 149.0, 122.0, 96.0, 68.0, 65.0, 37.0, 15.0, 11.0, 9.0, 9.0, 2.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6566445231437683, -0.6300395727157593, -0.6034346222877502, -0.5768296718597412, -0.5502246618270874, -0.5236197113990784, -0.49701476097106934, -0.4704098105430603, -0.4438048303127289, -0.41719987988471985, -0.3905948996543884, -0.3639899492263794, -0.33738499879837036, -0.31078001856803894, -0.2841750681400299, -0.2575700879096985, -0.23096513748168945, -0.20436017215251923, -0.177755206823349, -0.15115025639533997, -0.12454529106616974, -0.09794032573699951, -0.07133537530899048, -0.04473040997982025, -0.018125444650650024, 0.008479516953229904, 0.03508447855710983, 0.06168943643569946, 0.08829440176486969, 0.11489936709403992, 0.14150431752204895, 0.16810928285121918, 0.19471430778503418, 0.2213192731142044, 0.24792423844337463, 0.27452918887138367, 0.3011341691017151, 0.3277391195297241, 0.35434406995773315, 0.3809490203857422, 0.4075540006160736, 0.43415895104408264, 0.46076393127441406, 0.4873688817024231, 0.5139738321304321, 0.5405788421630859, 0.5671837329864502, 0.593788743019104, 0.620393693447113, 0.6469986438751221, 0.6736035943031311, 0.7002085447311401, 0.726813554763794, 0.753418505191803, 0.780023455619812, 0.806628406047821, 0.8332333564758301, 0.8598383069038391, 0.8864432573318481, 0.913048267364502, 0.939653217792511, 0.96625816822052, 0.992863118648529, 1.019468069076538, 1.046073079109192]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 4.0, 7.0, 4.0, 7.0, 16.0, 10.0, 15.0, 21.0, 18.0, 26.0, 18.0, 32.0, 41.0, 35.0, 50.0, 55.0, 44.0, 48.0, 52.0, 48.0, 52.0, 46.0, 49.0, 37.0, 47.0, 41.0, 32.0, 30.0, 14.0, 25.0, 17.0, 18.0, 9.0, 11.0, 8.0, 5.0, 6.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3984873294830322, -0.38455063104629517, -0.3706139326095581, -0.35667726397514343, -0.34274056553840637, -0.3288038671016693, -0.31486716866493225, -0.3009305000305176, -0.2869938015937805, -0.27305710315704346, -0.2591204047203064, -0.24518372118473053, -0.23124703764915466, -0.2173103392124176, -0.20337364077568054, -0.18943695724010468, -0.17550025880336761, -0.16156356036663055, -0.1476268768310547, -0.13369017839431763, -0.11975349485874176, -0.1058167964220047, -0.09188010543584824, -0.07794341444969177, -0.06400672346353531, -0.050070032477378845, -0.03613334149122238, -0.02219664677977562, -0.008259955793619156, 0.005676738917827606, 0.01961342990398407, 0.03355012089014053, 0.047486811876297, 0.06142350286245346, 0.07536019384860992, 0.08929689228534698, 0.10323357582092285, 0.11717027425765991, 0.13110697269439697, 0.14504365622997284, 0.1589803397655487, 0.17291703820228577, 0.18685372173786163, 0.2007904201745987, 0.21472710371017456, 0.22866380214691162, 0.24260050058364868, 0.25653719902038574, 0.2704738974571228, 0.28441059589385986, 0.2983472943305969, 0.3122839629650116, 0.32622066140174866, 0.3401573598384857, 0.3540940582752228, 0.36803072690963745, 0.3819674253463745, 0.3959041237831116, 0.40984082221984863, 0.4237774908542633, 0.43771418929100037, 0.4516508877277374, 0.4655875861644745, 0.47952425479888916, 0.4934609532356262]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 5.0, 2.0, 6.0, 6.0, 10.0, 24.0, 43.0, 59.0, 179.0, 483.0, 1293.0, 4013.0, 16190.0, 130349.0, 727663.0, 144451.0, 17293.0, 4378.0, 1327.0, 424.0, 185.0, 84.0, 29.0, 18.0, 14.0, 5.0, 3.0, 4.0, 2.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.179931640625, -0.17403602600097656, -0.16814041137695312, -0.1622447967529297, -0.15634918212890625, -0.1504535675048828, -0.14455795288085938, -0.13866233825683594, -0.1327667236328125, -0.12687110900878906, -0.12097549438476562, -0.11507987976074219, -0.10918426513671875, -0.10328865051269531, -0.09739303588867188, -0.09149742126464844, -0.085601806640625, -0.07970619201660156, -0.07381057739257812, -0.06791496276855469, -0.06201934814453125, -0.05612373352050781, -0.050228118896484375, -0.04433250427246094, -0.0384368896484375, -0.03254127502441406, -0.026645660400390625, -0.020750045776367188, -0.01485443115234375, -0.008958816528320312, -0.003063201904296875, 0.0028324127197265625, 0.00872802734375, 0.014623641967773438, 0.020519256591796875, 0.026414871215820312, 0.03231048583984375, 0.03820610046386719, 0.044101715087890625, 0.04999732971191406, 0.0558929443359375, 0.06178855895996094, 0.06768417358398438, 0.07357978820800781, 0.07947540283203125, 0.08537101745605469, 0.09126663208007812, 0.09716224670410156, 0.103057861328125, 0.10895347595214844, 0.11484909057617188, 0.12074470520019531, 0.12664031982421875, 0.1325359344482422, 0.13843154907226562, 0.14432716369628906, 0.1502227783203125, 0.15611839294433594, 0.16201400756835938, 0.1679096221923828, 0.17380523681640625, 0.1797008514404297, 0.18559646606445312, 0.19149208068847656, 0.1973876953125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 7.0, 15.0, 9.0, 18.0, 23.0, 19.0, 21.0, 34.0, 48.0, 47.0, 54.0, 65.0, 67.0, 62.0, 68.0, 61.0, 63.0, 65.0, 56.0, 44.0, 35.0, 30.0, 18.0, 27.0, 6.0, 15.0, 6.0, 4.0, 4.0, 0.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.366943359375, -0.35467529296875, -0.3424072265625, -0.33013916015625, -0.31787109375, -0.30560302734375, -0.2933349609375, -0.28106689453125, -0.268798828125, -0.25653076171875, -0.2442626953125, -0.23199462890625, -0.2197265625, -0.20745849609375, -0.1951904296875, -0.18292236328125, -0.170654296875, -0.15838623046875, -0.1461181640625, -0.13385009765625, -0.12158203125, -0.10931396484375, -0.0970458984375, -0.08477783203125, -0.072509765625, -0.06024169921875, -0.0479736328125, -0.03570556640625, -0.0234375, -0.01116943359375, 0.0010986328125, 0.01336669921875, 0.025634765625, 0.03790283203125, 0.0501708984375, 0.06243896484375, 0.07470703125, 0.08697509765625, 0.0992431640625, 0.11151123046875, 0.123779296875, 0.13604736328125, 0.1483154296875, 0.16058349609375, 0.1728515625, 0.18511962890625, 0.1973876953125, 0.20965576171875, 0.221923828125, 0.23419189453125, 0.2464599609375, 0.25872802734375, 0.27099609375, 0.28326416015625, 0.2955322265625, 0.30780029296875, 0.320068359375, 0.33233642578125, 0.3446044921875, 0.35687255859375, 0.369140625, 0.38140869140625, 0.3936767578125, 0.40594482421875, 0.418212890625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 6.0, 7.0, 8.0, 7.0, 21.0, 32.0, 57.0, 71.0, 113.0, 194.0, 402.0, 699.0, 1436.0, 3401.0, 9050.0, 26981.0, 104612.0, 395855.0, 371244.0, 94409.0, 25174.0, 8455.0, 3240.0, 1415.0, 670.0, 382.0, 213.0, 127.0, 98.0, 51.0, 33.0, 27.0, 19.0, 6.0, 10.0, 13.0, 5.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.09930419921875, -0.09629154205322266, -0.09327888488769531, -0.09026622772216797, -0.08725357055664062, -0.08424091339111328, -0.08122825622558594, -0.0782155990600586, -0.07520294189453125, -0.0721902847290039, -0.06917762756347656, -0.06616497039794922, -0.06315231323242188, -0.06013965606689453, -0.05712699890136719, -0.054114341735839844, -0.0511016845703125, -0.048089027404785156, -0.04507637023925781, -0.04206371307373047, -0.039051055908203125, -0.03603839874267578, -0.03302574157714844, -0.030013084411621094, -0.02700042724609375, -0.023987770080566406, -0.020975112915039062, -0.01796245574951172, -0.014949798583984375, -0.011937141418457031, -0.008924484252929688, -0.005911827087402344, -0.002899169921875, 0.00011348724365234375, 0.0031261444091796875, 0.006138801574707031, 0.009151458740234375, 0.012164115905761719, 0.015176773071289062, 0.018189430236816406, 0.02120208740234375, 0.024214744567871094, 0.027227401733398438, 0.03024005889892578, 0.033252716064453125, 0.03626537322998047, 0.03927803039550781, 0.042290687561035156, 0.0453033447265625, 0.048316001892089844, 0.05132865905761719, 0.05434131622314453, 0.057353973388671875, 0.06036663055419922, 0.06337928771972656, 0.0663919448852539, 0.06940460205078125, 0.0724172592163086, 0.07542991638183594, 0.07844257354736328, 0.08145523071289062, 0.08446788787841797, 0.08748054504394531, 0.09049320220947266, 0.093505859375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 7.0, 3.0, 8.0, 11.0, 15.0, 18.0, 19.0, 14.0, 30.0, 33.0, 45.0, 34.0, 48.0, 49.0, 53.0, 75.0, 52.0, 45.0, 61.0, 55.0, 42.0, 47.0, 47.0, 36.0, 32.0, 27.0, 20.0, 17.0, 17.0, 10.0, 2.0, 10.0, 8.0, 6.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.61279296875, -0.5912322998046875, -0.569671630859375, -0.5481109619140625, -0.52655029296875, -0.5049896240234375, -0.483428955078125, -0.4618682861328125, -0.4403076171875, -0.4187469482421875, -0.397186279296875, -0.3756256103515625, -0.35406494140625, -0.3325042724609375, -0.310943603515625, -0.2893829345703125, -0.267822265625, -0.2462615966796875, -0.224700927734375, -0.2031402587890625, -0.18157958984375, -0.1600189208984375, -0.138458251953125, -0.1168975830078125, -0.0953369140625, -0.0737762451171875, -0.052215576171875, -0.0306549072265625, -0.00909423828125, 0.0124664306640625, 0.034027099609375, 0.0555877685546875, 0.0771484375, 0.0987091064453125, 0.120269775390625, 0.1418304443359375, 0.16339111328125, 0.1849517822265625, 0.206512451171875, 0.2280731201171875, 0.2496337890625, 0.2711944580078125, 0.292755126953125, 0.3143157958984375, 0.33587646484375, 0.3574371337890625, 0.378997802734375, 0.4005584716796875, 0.422119140625, 0.4436798095703125, 0.465240478515625, 0.4868011474609375, 0.50836181640625, 0.5299224853515625, 0.551483154296875, 0.5730438232421875, 0.5946044921875, 0.6161651611328125, 0.637725830078125, 0.6592864990234375, 0.68084716796875, 0.7024078369140625, 0.723968505859375, 0.7455291748046875, 0.76708984375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 5.0, 4.0, 7.0, 23.0, 22.0, 27.0, 28.0, 46.0, 86.0, 135.0, 241.0, 443.0, 823.0, 1642.0, 3768.0, 9746.0, 32138.0, 141307.0, 505474.0, 271021.0, 56006.0, 15437.0, 5525.0, 2236.0, 1051.0, 527.0, 317.0, 193.0, 89.0, 66.0, 36.0, 27.0, 23.0, 12.0, 7.0, 6.0, 5.0, 3.0, 2.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.039337158203125, -0.03829383850097656, -0.037250518798828125, -0.03620719909667969, -0.03516387939453125, -0.03412055969238281, -0.033077239990234375, -0.03203392028808594, -0.0309906005859375, -0.029947280883789062, -0.028903961181640625, -0.027860641479492188, -0.02681732177734375, -0.025774002075195312, -0.024730682373046875, -0.023687362670898438, -0.02264404296875, -0.021600723266601562, -0.020557403564453125, -0.019514083862304688, -0.01847076416015625, -0.017427444458007812, -0.016384124755859375, -0.015340805053710938, -0.0142974853515625, -0.013254165649414062, -0.012210845947265625, -0.011167526245117188, -0.01012420654296875, -0.009080886840820312, -0.008037567138671875, -0.0069942474365234375, -0.005950927734375, -0.0049076080322265625, -0.003864288330078125, -0.0028209686279296875, -0.00177764892578125, -0.0007343292236328125, 0.000308990478515625, 0.0013523101806640625, 0.0023956298828125, 0.0034389495849609375, 0.004482269287109375, 0.0055255889892578125, 0.00656890869140625, 0.0076122283935546875, 0.008655548095703125, 0.009698867797851562, 0.0107421875, 0.011785507202148438, 0.012828826904296875, 0.013872146606445312, 0.01491546630859375, 0.015958786010742188, 0.017002105712890625, 0.018045425415039062, 0.0190887451171875, 0.020132064819335938, 0.021175384521484375, 0.022218704223632812, 0.02326202392578125, 0.024305343627929688, 0.025348663330078125, 0.026391983032226562, 0.027435302734375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 2.0, 5.0, 6.0, 6.0, 15.0, 10.0, 20.0, 19.0, 22.0, 31.0, 55.0, 52.0, 59.0, 74.0, 105.0, 74.0, 70.0, 74.0, 56.0, 53.0, 32.0, 39.0, 26.0, 17.0, 24.0, 10.0, 5.0, 7.0, 8.0, 6.0, 3.0, 7.0, 5.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.6510486602783203e-05, -1.6016885638237e-05, -1.5523284673690796e-05, -1.5029683709144592e-05, -1.4536082744598389e-05, -1.4042481780052185e-05, -1.3548880815505981e-05, -1.3055279850959778e-05, -1.2561678886413574e-05, -1.206807792186737e-05, -1.1574476957321167e-05, -1.1080875992774963e-05, -1.058727502822876e-05, -1.0093674063682556e-05, -9.600073099136353e-06, -9.106472134590149e-06, -8.612871170043945e-06, -8.119270205497742e-06, -7.625669240951538e-06, -7.1320682764053345e-06, -6.638467311859131e-06, -6.144866347312927e-06, -5.651265382766724e-06, -5.15766441822052e-06, -4.664063453674316e-06, -4.170462489128113e-06, -3.676861524581909e-06, -3.1832605600357056e-06, -2.689659595489502e-06, -2.1960586309432983e-06, -1.7024576663970947e-06, -1.2088567018508911e-06, -7.152557373046875e-07, -2.2165477275848389e-07, 2.7194619178771973e-07, 7.655471563339233e-07, 1.259148120880127e-06, 1.7527490854263306e-06, 2.246350049972534e-06, 2.739951014518738e-06, 3.2335519790649414e-06, 3.727152943611145e-06, 4.220753908157349e-06, 4.714354872703552e-06, 5.207955837249756e-06, 5.7015568017959595e-06, 6.195157766342163e-06, 6.688758730888367e-06, 7.18235969543457e-06, 7.675960659980774e-06, 8.169561624526978e-06, 8.663162589073181e-06, 9.156763553619385e-06, 9.650364518165588e-06, 1.0143965482711792e-05, 1.0637566447257996e-05, 1.11311674118042e-05, 1.1624768376350403e-05, 1.2118369340896606e-05, 1.261197030544281e-05, 1.3105571269989014e-05, 1.3599172234535217e-05, 1.4092773199081421e-05, 1.4586374163627625e-05, 1.5079975128173828e-05]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 10.0, 7.0, 11.0, 18.0, 26.0, 43.0, 66.0, 108.0, 175.0, 296.0, 474.0, 867.0, 1953.0, 4927.0, 14199.0, 53378.0, 254597.0, 505310.0, 159826.0, 35076.0, 10225.0, 3634.0, 1547.0, 708.0, 406.0, 240.0, 149.0, 97.0, 63.0, 40.0, 24.0, 15.0, 17.0, 10.0, 3.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.032470703125, -0.03143501281738281, -0.030399322509765625, -0.029363632202148438, -0.02832794189453125, -0.027292251586914062, -0.026256561279296875, -0.025220870971679688, -0.0241851806640625, -0.023149490356445312, -0.022113800048828125, -0.021078109741210938, -0.02004241943359375, -0.019006729125976562, -0.017971038818359375, -0.016935348510742188, -0.015899658203125, -0.014863967895507812, -0.013828277587890625, -0.012792587280273438, -0.01175689697265625, -0.010721206665039062, -0.009685516357421875, -0.008649826049804688, -0.0076141357421875, -0.0065784454345703125, -0.005542755126953125, -0.0045070648193359375, -0.00347137451171875, -0.0024356842041015625, -0.001399993896484375, -0.0003643035888671875, 0.00067138671875, 0.0017070770263671875, 0.002742767333984375, 0.0037784576416015625, 0.00481414794921875, 0.0058498382568359375, 0.006885528564453125, 0.007921218872070312, 0.0089569091796875, 0.009992599487304688, 0.011028289794921875, 0.012063980102539062, 0.01309967041015625, 0.014135360717773438, 0.015171051025390625, 0.016206741333007812, 0.017242431640625, 0.018278121948242188, 0.019313812255859375, 0.020349502563476562, 0.02138519287109375, 0.022420883178710938, 0.023456573486328125, 0.024492263793945312, 0.0255279541015625, 0.026563644409179688, 0.027599334716796875, 0.028635025024414062, 0.02967071533203125, 0.030706405639648438, 0.031742095947265625, 0.03277778625488281, 0.0338134765625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 4.0, 5.0, 5.0, 5.0, 8.0, 4.0, 9.0, 19.0, 12.0, 19.0, 35.0, 28.0, 25.0, 26.0, 51.0, 58.0, 56.0, 72.0, 56.0, 64.0, 52.0, 65.0, 49.0, 45.0, 34.0, 31.0, 26.0, 29.0, 18.0, 17.0, 17.0, 8.0, 13.0, 6.0, 5.0, 5.0, 4.0, 5.0, 3.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.005687713623046875, -0.005492985248565674, -0.005298256874084473, -0.0051035284996032715, -0.00490880012512207, -0.004714071750640869, -0.004519343376159668, -0.004324615001678467, -0.004129886627197266, -0.0039351582527160645, -0.0037404298782348633, -0.003545701503753662, -0.003350973129272461, -0.0031562447547912598, -0.0029615163803100586, -0.0027667880058288574, -0.0025720596313476562, -0.002377331256866455, -0.002182602882385254, -0.0019878745079040527, -0.0017931461334228516, -0.0015984177589416504, -0.0014036893844604492, -0.001208961009979248, -0.0010142326354980469, -0.0008195042610168457, -0.0006247758865356445, -0.00043004751205444336, -0.0002353191375732422, -4.0590763092041016e-05, 0.00015413761138916016, 0.00034886598587036133, 0.0005435943603515625, 0.0007383227348327637, 0.0009330511093139648, 0.001127779483795166, 0.0013225078582763672, 0.0015172362327575684, 0.0017119646072387695, 0.0019066929817199707, 0.002101421356201172, 0.002296149730682373, 0.0024908781051635742, 0.0026856064796447754, 0.0028803348541259766, 0.0030750632286071777, 0.003269791603088379, 0.00346451997756958, 0.0036592483520507812, 0.0038539767265319824, 0.004048705101013184, 0.004243433475494385, 0.004438161849975586, 0.004632890224456787, 0.004827618598937988, 0.0050223469734191895, 0.005217075347900391, 0.005411803722381592, 0.005606532096862793, 0.005801260471343994, 0.005995988845825195, 0.0061907172203063965, 0.006385445594787598, 0.006580173969268799, 0.00677490234375]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 11.0, 20.0, 36.0, 61.0, 93.0, 209.0, 224.0, 156.0, 96.0, 45.0, 23.0, 13.0, 5.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5888968706130981, -0.5613466501235962, -0.5337964296340942, -0.5062462091445923, -0.47869595885276794, -0.451145738363266, -0.42359548807144165, -0.3960452675819397, -0.36849504709243774, -0.3409448266029358, -0.31339460611343384, -0.2858443558216095, -0.25829413533210754, -0.2307439148426056, -0.20319367945194244, -0.1756434440612793, -0.14809322357177734, -0.1205429956316948, -0.09299276769161224, -0.0654425397515297, -0.037892311811447144, -0.01034209132194519, 0.017208144068717957, 0.044758379459381104, 0.07230859994888306, 0.0998588278889656, 0.12740905582904816, 0.1549592912197113, 0.18250951170921326, 0.2100597321987152, 0.23760996758937836, 0.2651602029800415, 0.29271042346954346, 0.3202606439590454, 0.34781086444854736, 0.3753611147403717, 0.40291133522987366, 0.4304615557193756, 0.45801180601119995, 0.4855620265007019, 0.5131122469902039, 0.5406624674797058, 0.5682126879692078, 0.5957629084587097, 0.6233131885528564, 0.6508634090423584, 0.6784136295318604, 0.7059638500213623, 0.7335140705108643, 0.7610642910003662, 0.7886145114898682, 0.8161647319793701, 0.8437149524688721, 0.871265172958374, 0.8988154530525208, 0.9263656735420227, 0.9539158940315247, 0.9814661145210266, 1.0090163946151733, 1.0365666151046753, 1.0641168355941772, 1.0916670560836792, 1.1192172765731812, 1.146767497062683, 1.174317717552185]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 6.0, 4.0, 2.0, 9.0, 13.0, 9.0, 20.0, 16.0, 25.0, 25.0, 31.0, 47.0, 49.0, 47.0, 52.0, 62.0, 59.0, 58.0, 55.0, 62.0, 58.0, 51.0, 51.0, 40.0, 41.0, 18.0, 17.0, 25.0, 9.0, 15.0, 9.0, 8.0, 3.0, 3.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.27519190311431885, -0.2643825113773346, -0.25357311964035034, -0.2427637279033661, -0.23195433616638184, -0.22114494442939758, -0.21033555269241333, -0.19952616095542908, -0.18871676921844482, -0.17790737748146057, -0.16709798574447632, -0.15628859400749207, -0.1454792022705078, -0.13466981053352356, -0.1238604187965393, -0.11305102705955505, -0.1022416353225708, -0.09143224358558655, -0.0806228518486023, -0.06981346011161804, -0.05900406837463379, -0.048194676637649536, -0.03738528490066528, -0.02657589316368103, -0.015766501426696777, -0.004957109689712524, 0.0058522820472717285, 0.01666167378425598, 0.027471065521240234, 0.03828045725822449, 0.04908984899520874, 0.05989924073219299, 0.07070866227149963, 0.08151805400848389, 0.09232744574546814, 0.10313683748245239, 0.11394622921943665, 0.1247556209564209, 0.13556501269340515, 0.1463744044303894, 0.15718379616737366, 0.1679931879043579, 0.17880257964134216, 0.18961197137832642, 0.20042136311531067, 0.21123075485229492, 0.22204014658927917, 0.23284953832626343, 0.24365893006324768, 0.25446832180023193, 0.2652777135372162, 0.27608710527420044, 0.2868964970111847, 0.29770588874816895, 0.3085152804851532, 0.31932467222213745, 0.3301340639591217, 0.34094345569610596, 0.3517528474330902, 0.36256223917007446, 0.3733716309070587, 0.38418102264404297, 0.3949904143810272, 0.4057998061180115, 0.4166091978549957]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 5.0, 4.0, 6.0, 3.0, 7.0, 3.0, 12.0, 18.0, 35.0, 111.0, 369.0, 2133.0, 22338.0, 864903.0, 151378.0, 6036.0, 849.0, 199.0, 65.0, 27.0, 11.0, 10.0, 2.0, 4.0, 5.0, 0.0, 1.0, 7.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.263671875, -1.223876953125, -1.18408203125, -1.144287109375, -1.1044921875, -1.064697265625, -1.02490234375, -0.985107421875, -0.9453125, -0.905517578125, -0.86572265625, -0.825927734375, -0.7861328125, -0.746337890625, -0.70654296875, -0.666748046875, -0.626953125, -0.587158203125, -0.54736328125, -0.507568359375, -0.4677734375, -0.427978515625, -0.38818359375, -0.348388671875, -0.30859375, -0.268798828125, -0.22900390625, -0.189208984375, -0.1494140625, -0.109619140625, -0.06982421875, -0.030029296875, 0.009765625, 0.049560546875, 0.08935546875, 0.129150390625, 0.1689453125, 0.208740234375, 0.24853515625, 0.288330078125, 0.328125, 0.367919921875, 0.40771484375, 0.447509765625, 0.4873046875, 0.527099609375, 0.56689453125, 0.606689453125, 0.646484375, 0.686279296875, 0.72607421875, 0.765869140625, 0.8056640625, 0.845458984375, 0.88525390625, 0.925048828125, 0.96484375, 1.004638671875, 1.04443359375, 1.084228515625, 1.1240234375, 1.163818359375, 1.20361328125, 1.243408203125, 1.283203125]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 6.0, 6.0, 15.0, 16.0, 29.0, 42.0, 71.0, 98.0, 112.0, 114.0, 114.0, 114.0, 103.0, 69.0, 42.0, 29.0, 20.0, 3.0, 7.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58154296875, -0.5399551391601562, -0.4983673095703125, -0.45677947998046875, -0.415191650390625, -0.37360382080078125, -0.3320159912109375, -0.29042816162109375, -0.24884033203125, -0.20725250244140625, -0.1656646728515625, -0.12407684326171875, -0.082489013671875, -0.04090118408203125, 0.0006866455078125, 0.04227447509765625, 0.0838623046875, 0.12545013427734375, 0.1670379638671875, 0.20862579345703125, 0.250213623046875, 0.29180145263671875, 0.3333892822265625, 0.37497711181640625, 0.41656494140625, 0.45815277099609375, 0.4997406005859375, 0.5413284301757812, 0.582916259765625, 0.6245040893554688, 0.6660919189453125, 0.7076797485351562, 0.749267578125, 0.7908554077148438, 0.8324432373046875, 0.8740310668945312, 0.915618896484375, 0.9572067260742188, 0.9987945556640625, 1.0403823852539062, 1.08197021484375, 1.1235580444335938, 1.1651458740234375, 1.2067337036132812, 1.248321533203125, 1.2899093627929688, 1.3314971923828125, 1.3730850219726562, 1.4146728515625, 1.4562606811523438, 1.4978485107421875, 1.5394363403320312, 1.581024169921875, 1.6226119995117188, 1.6641998291015625, 1.7057876586914062, 1.74737548828125, 1.7889633178710938, 1.8305511474609375, 1.8721389770507812, 1.913726806640625, 1.9553146362304688, 1.9969024658203125, 2.0384902954101562, 2.080078125]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 2.0, 12.0, 10.0, 11.0, 14.0, 32.0, 25.0, 43.0, 96.0, 144.0, 269.0, 685.0, 2066.0, 11721.0, 199846.0, 796426.0, 31122.0, 4167.0, 964.0, 383.0, 193.0, 114.0, 74.0, 37.0, 27.0, 20.0, 19.0, 11.0, 6.0, 2.0, 2.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.0732421875, -1.0465545654296875, -1.019866943359375, -0.9931793212890625, -0.96649169921875, -0.9398040771484375, -0.913116455078125, -0.8864288330078125, -0.8597412109375, -0.8330535888671875, -0.806365966796875, -0.7796783447265625, -0.75299072265625, -0.7263031005859375, -0.699615478515625, -0.6729278564453125, -0.646240234375, -0.6195526123046875, -0.592864990234375, -0.5661773681640625, -0.53948974609375, -0.5128021240234375, -0.486114501953125, -0.4594268798828125, -0.4327392578125, -0.4060516357421875, -0.379364013671875, -0.3526763916015625, -0.32598876953125, -0.2993011474609375, -0.272613525390625, -0.2459259033203125, -0.21923828125, -0.1925506591796875, -0.165863037109375, -0.1391754150390625, -0.11248779296875, -0.0858001708984375, -0.059112548828125, -0.0324249267578125, -0.0057373046875, 0.0209503173828125, 0.047637939453125, 0.0743255615234375, 0.10101318359375, 0.1277008056640625, 0.154388427734375, 0.1810760498046875, 0.207763671875, 0.2344512939453125, 0.261138916015625, 0.2878265380859375, 0.31451416015625, 0.3412017822265625, 0.367889404296875, 0.3945770263671875, 0.4212646484375, 0.4479522705078125, 0.474639892578125, 0.5013275146484375, 0.52801513671875, 0.5547027587890625, 0.581390380859375, 0.6080780029296875, 0.634765625]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 4.0, 4.0, 8.0, 5.0, 7.0, 6.0, 5.0, 7.0, 14.0, 21.0, 22.0, 16.0, 28.0, 31.0, 26.0, 22.0, 34.0, 40.0, 31.0, 38.0, 27.0, 42.0, 36.0, 38.0, 43.0, 51.0, 43.0, 41.0, 34.0, 31.0, 31.0, 24.0, 23.0, 26.0, 22.0, 12.0, 15.0, 19.0, 8.0, 8.0, 15.0, 6.0, 7.0, 6.0, 8.0, 6.0, 4.0, 3.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.5078125, -0.4907989501953125, -0.473785400390625, -0.4567718505859375, -0.43975830078125, -0.4227447509765625, -0.405731201171875, -0.3887176513671875, -0.3717041015625, -0.3546905517578125, -0.337677001953125, -0.3206634521484375, -0.30364990234375, -0.2866363525390625, -0.269622802734375, -0.2526092529296875, -0.235595703125, -0.2185821533203125, -0.201568603515625, -0.1845550537109375, -0.16754150390625, -0.1505279541015625, -0.133514404296875, -0.1165008544921875, -0.0994873046875, -0.0824737548828125, -0.065460205078125, -0.0484466552734375, -0.03143310546875, -0.0144195556640625, 0.002593994140625, 0.0196075439453125, 0.03662109375, 0.0536346435546875, 0.070648193359375, 0.0876617431640625, 0.10467529296875, 0.1216888427734375, 0.138702392578125, 0.1557159423828125, 0.1727294921875, 0.1897430419921875, 0.206756591796875, 0.2237701416015625, 0.24078369140625, 0.2577972412109375, 0.274810791015625, 0.2918243408203125, 0.308837890625, 0.3258514404296875, 0.342864990234375, 0.3598785400390625, 0.37689208984375, 0.3939056396484375, 0.410919189453125, 0.4279327392578125, 0.4449462890625, 0.4619598388671875, 0.478973388671875, 0.4959869384765625, 0.51300048828125, 0.5300140380859375, 0.547027587890625, 0.5640411376953125, 0.5810546875]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 12.0, 8.0, 16.0, 13.0, 43.0, 87.0, 150.0, 328.0, 759.0, 2249.0, 8951.0, 77434.0, 840400.0, 103267.0, 10794.0, 2486.0, 866.0, 347.0, 155.0, 71.0, 49.0, 25.0, 11.0, 8.0, 10.0, 10.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2744140625, -0.26598358154296875, -0.2575531005859375, -0.24912261962890625, -0.240692138671875, -0.23226165771484375, -0.2238311767578125, -0.21540069580078125, -0.20697021484375, -0.19853973388671875, -0.1901092529296875, -0.18167877197265625, -0.173248291015625, -0.16481781005859375, -0.1563873291015625, -0.14795684814453125, -0.1395263671875, -0.13109588623046875, -0.1226654052734375, -0.11423492431640625, -0.105804443359375, -0.09737396240234375, -0.0889434814453125, -0.08051300048828125, -0.07208251953125, -0.06365203857421875, -0.0552215576171875, -0.04679107666015625, -0.038360595703125, -0.02993011474609375, -0.0214996337890625, -0.01306915283203125, -0.004638671875, 0.00379180908203125, 0.0122222900390625, 0.02065277099609375, 0.029083251953125, 0.03751373291015625, 0.0459442138671875, 0.05437469482421875, 0.06280517578125, 0.07123565673828125, 0.0796661376953125, 0.08809661865234375, 0.096527099609375, 0.10495758056640625, 0.1133880615234375, 0.12181854248046875, 0.1302490234375, 0.13867950439453125, 0.1471099853515625, 0.15554046630859375, 0.163970947265625, 0.17240142822265625, 0.1808319091796875, 0.18926239013671875, 0.19769287109375, 0.20612335205078125, 0.2145538330078125, 0.22298431396484375, 0.231414794921875, 0.23984527587890625, 0.2482757568359375, 0.25670623779296875, 0.26513671875]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 1.0, 7.0, 3.0, 8.0, 14.0, 10.0, 13.0, 30.0, 29.0, 51.0, 66.0, 92.0, 142.0, 156.0, 99.0, 81.0, 48.0, 43.0, 28.0, 24.0, 16.0, 10.0, 6.0, 4.0, 5.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.664327621459961e-05, -2.5787390768527985e-05, -2.493150532245636e-05, -2.4075619876384735e-05, -2.321973443031311e-05, -2.2363848984241486e-05, -2.150796353816986e-05, -2.0652078092098236e-05, -1.979619264602661e-05, -1.8940307199954987e-05, -1.8084421753883362e-05, -1.7228536307811737e-05, -1.6372650861740112e-05, -1.5516765415668488e-05, -1.4660879969596863e-05, -1.3804994523525238e-05, -1.2949109077453613e-05, -1.2093223631381989e-05, -1.1237338185310364e-05, -1.0381452739238739e-05, -9.525567293167114e-06, -8.66968184709549e-06, -7.813796401023865e-06, -6.95791095495224e-06, -6.102025508880615e-06, -5.2461400628089905e-06, -4.390254616737366e-06, -3.534369170665741e-06, -2.678483724594116e-06, -1.8225982785224915e-06, -9.667128324508667e-07, -1.1082738637924194e-07, 7.450580596923828e-07, 1.6009435057640076e-06, 2.4568289518356323e-06, 3.312714397907257e-06, 4.168599843978882e-06, 5.024485290050507e-06, 5.880370736122131e-06, 6.736256182193756e-06, 7.592141628265381e-06, 8.448027074337006e-06, 9.30391252040863e-06, 1.0159797966480255e-05, 1.101568341255188e-05, 1.1871568858623505e-05, 1.272745430469513e-05, 1.3583339750766754e-05, 1.4439225196838379e-05, 1.5295110642910004e-05, 1.615099608898163e-05, 1.7006881535053253e-05, 1.7862766981124878e-05, 1.8718652427196503e-05, 1.9574537873268127e-05, 2.0430423319339752e-05, 2.1286308765411377e-05, 2.2142194211483002e-05, 2.2998079657554626e-05, 2.385396510362625e-05, 2.4709850549697876e-05, 2.55657359957695e-05, 2.6421621441841125e-05, 2.727750688791275e-05, 2.8133392333984375e-05]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 6.0, 10.0, 22.0, 24.0, 43.0, 66.0, 146.0, 270.0, 770.0, 3167.0, 27198.0, 807551.0, 197419.0, 9367.0, 1567.0, 467.0, 202.0, 86.0, 63.0, 28.0, 24.0, 21.0, 10.0, 1.0, 7.0, 2.0, 4.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.35302734375, -0.3428802490234375, -0.332733154296875, -0.3225860595703125, -0.31243896484375, -0.3022918701171875, -0.292144775390625, -0.2819976806640625, -0.2718505859375, -0.2617034912109375, -0.251556396484375, -0.2414093017578125, -0.23126220703125, -0.2211151123046875, -0.210968017578125, -0.2008209228515625, -0.190673828125, -0.1805267333984375, -0.170379638671875, -0.1602325439453125, -0.15008544921875, -0.1399383544921875, -0.129791259765625, -0.1196441650390625, -0.1094970703125, -0.0993499755859375, -0.089202880859375, -0.0790557861328125, -0.06890869140625, -0.0587615966796875, -0.048614501953125, -0.0384674072265625, -0.0283203125, -0.0181732177734375, -0.008026123046875, 0.0021209716796875, 0.01226806640625, 0.0224151611328125, 0.032562255859375, 0.0427093505859375, 0.0528564453125, 0.0630035400390625, 0.073150634765625, 0.0832977294921875, 0.09344482421875, 0.1035919189453125, 0.113739013671875, 0.1238861083984375, 0.134033203125, 0.1441802978515625, 0.154327392578125, 0.1644744873046875, 0.17462158203125, 0.1847686767578125, 0.194915771484375, 0.2050628662109375, 0.2152099609375, 0.2253570556640625, 0.235504150390625, 0.2456512451171875, 0.25579833984375, 0.2659454345703125, 0.276092529296875, 0.2862396240234375, 0.29638671875]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 7.0, 2.0, 10.0, 8.0, 19.0, 23.0, 29.0, 29.0, 41.0, 64.0, 89.0, 113.0, 132.0, 120.0, 97.0, 65.0, 49.0, 38.0, 15.0, 20.0, 12.0, 12.0, 7.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0772705078125, -0.07463932037353516, -0.07200813293457031, -0.06937694549560547, -0.06674575805664062, -0.06411457061767578, -0.06148338317871094, -0.058852195739746094, -0.05622100830078125, -0.053589820861816406, -0.05095863342285156, -0.04832744598388672, -0.045696258544921875, -0.04306507110595703, -0.04043388366699219, -0.037802696228027344, -0.0351715087890625, -0.032540321350097656, -0.029909133911132812, -0.02727794647216797, -0.024646759033203125, -0.02201557159423828, -0.019384384155273438, -0.016753196716308594, -0.01412200927734375, -0.011490821838378906, -0.008859634399414062, -0.006228446960449219, -0.003597259521484375, -0.0009660720825195312, 0.0016651153564453125, 0.004296302795410156, 0.006927490234375, 0.009558677673339844, 0.012189865112304688, 0.014821052551269531, 0.017452239990234375, 0.02008342742919922, 0.022714614868164062, 0.025345802307128906, 0.02797698974609375, 0.030608177185058594, 0.03323936462402344, 0.03587055206298828, 0.038501739501953125, 0.04113292694091797, 0.04376411437988281, 0.046395301818847656, 0.0490264892578125, 0.051657676696777344, 0.05428886413574219, 0.05692005157470703, 0.059551239013671875, 0.06218242645263672, 0.06481361389160156, 0.0674448013305664, 0.07007598876953125, 0.0727071762084961, 0.07533836364746094, 0.07796955108642578, 0.08060073852539062, 0.08323192596435547, 0.08586311340332031, 0.08849430084228516, 0.09112548828125]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 10.0, 11.0, 22.0, 45.0, 74.0, 142.0, 240.0, 196.0, 156.0, 53.0, 24.0, 14.0, 12.0, 6.0, 1.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.669635534286499, -1.611814022064209, -1.5539923906326294, -1.4961708784103394, -1.4383493661880493, -1.3805277347564697, -1.3227062225341797, -1.2648847103118896, -1.20706307888031, -1.14924156665802, -1.0914199352264404, -1.0335984230041504, -0.9757768511772156, -0.9179552793502808, -0.8601337671279907, -0.8023121953010559, -0.7444906830787659, -0.686669111251831, -0.628847599029541, -0.5710260272026062, -0.5132044553756714, -0.45538291335105896, -0.39756137132644653, -0.3397397994995117, -0.2819182574748993, -0.22409670054912567, -0.16627514362335205, -0.10845360159873962, -0.050632044672966, 0.007189512252807617, 0.06501105427742004, 0.12283262610435486, 0.18065416812896729, 0.2384757250547409, 0.2962972819805145, 0.35411882400512695, 0.41194039583206177, 0.4697619378566742, 0.5275834798812866, 0.5854050517082214, 0.6432266235351562, 0.7010481953620911, 0.7588697075843811, 0.8166912794113159, 0.8745128512382507, 0.9323344230651855, 0.9901559352874756, 1.0479774475097656, 1.1057989597320557, 1.1636204719543457, 1.2214421033859253, 1.2792636156082153, 1.3370851278305054, 1.394906759262085, 1.452728271484375, 1.510549783706665, 1.5683714151382446, 1.6261929273605347, 1.6840145587921143, 1.7418360710144043, 1.7996575832366943, 1.857479214668274, 1.915300726890564, 1.9731223583221436, 2.0309438705444336]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 5.0, 10.0, 12.0, 13.0, 23.0, 14.0, 40.0, 39.0, 38.0, 46.0, 44.0, 58.0, 50.0, 71.0, 49.0, 58.0, 54.0, 65.0, 55.0, 50.0, 47.0, 38.0, 37.0, 32.0, 18.0, 11.0, 10.0, 2.0, 8.0, 5.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9879714846611023, -0.9422454833984375, -0.8965195417404175, -0.8507936000823975, -0.8050675988197327, -0.7593415975570679, -0.7136156558990479, -0.6678897142410278, -0.622163712978363, -0.5764377117156982, -0.5307117700576782, -0.4849857985973358, -0.4392598271369934, -0.393533855676651, -0.3478078842163086, -0.3020819127559662, -0.2563559412956238, -0.21062996983528137, -0.16490399837493896, -0.11917802691459656, -0.07345205545425415, -0.027726083993911743, 0.017999887466430664, 0.06372585892677307, 0.10945183038711548, 0.15517780184745789, 0.2009037733078003, 0.2466297447681427, 0.2923557162284851, 0.3380816876888275, 0.3838076591491699, 0.42953363060951233, 0.47525954246520996, 0.52098548412323, 0.5667114853858948, 0.6124374866485596, 0.6581634283065796, 0.7038893699645996, 0.7496153712272644, 0.7953413724899292, 0.8410673141479492, 0.8867932558059692, 0.932519257068634, 0.9782452583312988, 1.0239711999893188, 1.0696971416473389, 1.1154232025146484, 1.1611491441726685, 1.2068750858306885, 1.2526010274887085, 1.2983269691467285, 1.344053030014038, 1.389778971672058, 1.4355049133300781, 1.4812309741973877, 1.5269569158554077, 1.5726828575134277, 1.6184087991714478, 1.6641347408294678, 1.7098608016967773, 1.7555867433547974, 1.8013126850128174, 1.847038745880127, 1.892764687538147, 1.938490629196167]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 4.0, 6.0, 5.0, 16.0, 19.0, 20.0, 22.0, 30.0, 39.0, 56.0, 117.0, 207.0, 457.0, 1264.0, 4583.0, 27887.0, 948619.0, 3136535.0, 63728.0, 7523.0, 1851.0, 641.0, 258.0, 122.0, 77.0, 47.0, 35.0, 24.0, 23.0, 16.0, 8.0, 12.0, 8.0, 4.0, 5.0, 3.0, 3.0, 2.0, 2.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2080078125, -1.1726531982421875, -1.137298583984375, -1.1019439697265625, -1.06658935546875, -1.0312347412109375, -0.995880126953125, -0.9605255126953125, -0.9251708984375, -0.8898162841796875, -0.854461669921875, -0.8191070556640625, -0.78375244140625, -0.7483978271484375, -0.713043212890625, -0.6776885986328125, -0.642333984375, -0.6069793701171875, -0.571624755859375, -0.5362701416015625, -0.50091552734375, -0.4655609130859375, -0.430206298828125, -0.3948516845703125, -0.3594970703125, -0.3241424560546875, -0.288787841796875, -0.2534332275390625, -0.21807861328125, -0.1827239990234375, -0.147369384765625, -0.1120147705078125, -0.07666015625, -0.0413055419921875, -0.005950927734375, 0.0294036865234375, 0.06475830078125, 0.1001129150390625, 0.135467529296875, 0.1708221435546875, 0.2061767578125, 0.2415313720703125, 0.276885986328125, 0.3122406005859375, 0.34759521484375, 0.3829498291015625, 0.418304443359375, 0.4536590576171875, 0.489013671875, 0.5243682861328125, 0.559722900390625, 0.5950775146484375, 0.63043212890625, 0.6657867431640625, 0.701141357421875, 0.7364959716796875, 0.7718505859375, 0.8072052001953125, 0.842559814453125, 0.8779144287109375, 0.91326904296875, 0.9486236572265625, 0.983978271484375, 1.0193328857421875, 1.0546875]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 4.0, 2.0, 4.0, 4.0, 7.0, 6.0, 20.0, 17.0, 27.0, 26.0, 33.0, 40.0, 53.0, 43.0, 38.0, 60.0, 59.0, 51.0, 64.0, 72.0, 67.0, 52.0, 44.0, 37.0, 38.0, 39.0, 28.0, 19.0, 10.0, 17.0, 9.0, 7.0, 5.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.428466796875, -0.4145774841308594, -0.40068817138671875, -0.3867988586425781, -0.3729095458984375, -0.3590202331542969, -0.34513092041015625, -0.3312416076660156, -0.317352294921875, -0.3034629821777344, -0.28957366943359375, -0.2756843566894531, -0.2617950439453125, -0.24790573120117188, -0.23401641845703125, -0.22012710571289062, -0.20623779296875, -0.19234848022460938, -0.17845916748046875, -0.16456985473632812, -0.1506805419921875, -0.13679122924804688, -0.12290191650390625, -0.10901260375976562, -0.095123291015625, -0.08123397827148438, -0.06734466552734375, -0.053455352783203125, -0.0395660400390625, -0.025676727294921875, -0.01178741455078125, 0.002101898193359375, 0.0159912109375, 0.029880523681640625, 0.04376983642578125, 0.057659149169921875, 0.0715484619140625, 0.08543777465820312, 0.09932708740234375, 0.11321640014648438, 0.127105712890625, 0.14099502563476562, 0.15488433837890625, 0.16877365112304688, 0.1826629638671875, 0.19655227661132812, 0.21044158935546875, 0.22433090209960938, 0.23822021484375, 0.2521095275878906, 0.26599884033203125, 0.2798881530761719, 0.2937774658203125, 0.3076667785644531, 0.32155609130859375, 0.3354454040527344, 0.349334716796875, 0.3632240295410156, 0.37711334228515625, 0.3910026550292969, 0.4048919677734375, 0.4187812805175781, 0.43267059326171875, 0.4465599060058594, 0.46044921875]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 4.0, 4.0, 3.0, 9.0, 12.0, 11.0, 16.0, 27.0, 44.0, 78.0, 111.0, 186.0, 365.0, 810.0, 2258.0, 7527.0, 41306.0, 857948.0, 3181389.0, 85328.0, 11896.0, 2933.0, 1009.0, 441.0, 230.0, 144.0, 69.0, 41.0, 17.0, 22.0, 9.0, 13.0, 9.0, 7.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.931640625, -0.9078521728515625, -0.884063720703125, -0.8602752685546875, -0.83648681640625, -0.8126983642578125, -0.788909912109375, -0.7651214599609375, -0.7413330078125, -0.7175445556640625, -0.693756103515625, -0.6699676513671875, -0.64617919921875, -0.6223907470703125, -0.598602294921875, -0.5748138427734375, -0.551025390625, -0.5272369384765625, -0.503448486328125, -0.4796600341796875, -0.45587158203125, -0.4320831298828125, -0.408294677734375, -0.3845062255859375, -0.3607177734375, -0.3369293212890625, -0.313140869140625, -0.2893524169921875, -0.26556396484375, -0.2417755126953125, -0.217987060546875, -0.1941986083984375, -0.17041015625, -0.1466217041015625, -0.122833251953125, -0.0990447998046875, -0.07525634765625, -0.0514678955078125, -0.027679443359375, -0.0038909912109375, 0.0198974609375, 0.0436859130859375, 0.067474365234375, 0.0912628173828125, 0.11505126953125, 0.1388397216796875, 0.162628173828125, 0.1864166259765625, 0.210205078125, 0.2339935302734375, 0.257781982421875, 0.2815704345703125, 0.30535888671875, 0.3291473388671875, 0.352935791015625, 0.3767242431640625, 0.4005126953125, 0.4243011474609375, 0.448089599609375, 0.4718780517578125, 0.49566650390625, 0.5194549560546875, 0.543243408203125, 0.5670318603515625, 0.5908203125]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 6.0, 6.0, 10.0, 9.0, 18.0, 15.0, 40.0, 50.0, 73.0, 129.0, 227.0, 436.0, 743.0, 861.0, 603.0, 329.0, 178.0, 111.0, 70.0, 53.0, 33.0, 21.0, 25.0, 5.0, 5.0, 8.0, 6.0, 5.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.136962890625, -0.13054275512695312, -0.12412261962890625, -0.11770248413085938, -0.1112823486328125, -0.10486221313476562, -0.09844207763671875, -0.09202194213867188, -0.085601806640625, -0.07918167114257812, -0.07276153564453125, -0.06634140014648438, -0.0599212646484375, -0.053501129150390625, -0.04708099365234375, -0.040660858154296875, -0.03424072265625, -0.027820587158203125, -0.02140045166015625, -0.014980316162109375, -0.0085601806640625, -0.002140045166015625, 0.00428009033203125, 0.010700225830078125, 0.017120361328125, 0.023540496826171875, 0.02996063232421875, 0.036380767822265625, 0.0428009033203125, 0.049221038818359375, 0.05564117431640625, 0.062061309814453125, 0.0684814453125, 0.07490158081054688, 0.08132171630859375, 0.08774185180664062, 0.0941619873046875, 0.10058212280273438, 0.10700225830078125, 0.11342239379882812, 0.119842529296875, 0.12626266479492188, 0.13268280029296875, 0.13910293579101562, 0.1455230712890625, 0.15194320678710938, 0.15836334228515625, 0.16478347778320312, 0.17120361328125, 0.17762374877929688, 0.18404388427734375, 0.19046401977539062, 0.1968841552734375, 0.20330429077148438, 0.20972442626953125, 0.21614456176757812, 0.222564697265625, 0.22898483276367188, 0.23540496826171875, 0.24182510375976562, 0.2482452392578125, 0.2546653747558594, 0.26108551025390625, 0.2675056457519531, 0.27392578125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 5.0, 4.0, 4.0, 6.0, 9.0, 8.0, 10.0, 18.0, 25.0, 47.0, 61.0, 83.0, 98.0, 99.0, 98.0, 94.0, 113.0, 77.0, 39.0, 31.0, 25.0, 21.0, 13.0, 7.0, 3.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42179274559020996, -0.39984646439552307, -0.3779001832008362, -0.3559538722038269, -0.3340076208114624, -0.3120613098144531, -0.29011502861976624, -0.26816874742507935, -0.24622246623039246, -0.22427618503570557, -0.20232990384101868, -0.1803836077451706, -0.1584373265504837, -0.13649104535579681, -0.11454474925994873, -0.09259846806526184, -0.07065218687057495, -0.04870590195059776, -0.026759617030620575, -0.004813328385353088, 0.0171329528093338, 0.03907923400402069, 0.061025530099868774, 0.08297181129455566, 0.10491809248924255, 0.12686437368392944, 0.14881065487861633, 0.17075695097446442, 0.1927032321691513, 0.2146495133638382, 0.23659580945968628, 0.25854209065437317, 0.2804883122444153, 0.3024345934391022, 0.32438087463378906, 0.34632718563079834, 0.36827343702316284, 0.3902197480201721, 0.412166029214859, 0.4341123104095459, 0.4560585916042328, 0.4780048727989197, 0.49995115399360657, 0.5218974351882935, 0.5438437461853027, 0.5657899975776672, 0.5877363085746765, 0.609682559967041, 0.6316288709640503, 0.6535751819610596, 0.6755214333534241, 0.6974677443504333, 0.7194139957427979, 0.7413603067398071, 0.7633066177368164, 0.7852528691291809, 0.8071991205215454, 0.8291454315185547, 0.8510916829109192, 0.8730379939079285, 0.894984245300293, 0.9169305562973022, 0.9388768672943115, 0.960823118686676, 0.9827694296836853]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 5.0, 7.0, 2.0, 4.0, 8.0, 13.0, 19.0, 18.0, 18.0, 22.0, 26.0, 33.0, 32.0, 39.0, 40.0, 44.0, 48.0, 36.0, 49.0, 51.0, 55.0, 48.0, 40.0, 49.0, 49.0, 40.0, 28.0, 22.0, 36.0, 23.0, 18.0, 18.0, 14.0, 12.0, 7.0, 5.0, 10.0, 4.0, 3.0, 4.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3696340024471283, -0.3574292063713074, -0.34522441029548645, -0.3330196142196655, -0.3208147883415222, -0.3086099922657013, -0.29640519618988037, -0.28420040011405945, -0.2719956040382385, -0.2597908079624176, -0.24758599698543549, -0.23538120090961456, -0.22317638993263245, -0.21097159385681152, -0.1987667977809906, -0.18656200170516968, -0.17435717582702637, -0.16215237975120544, -0.14994756877422333, -0.1377427726984024, -0.1255379617214203, -0.11333316564559937, -0.10112836956977844, -0.08892356604337692, -0.0767187625169754, -0.06451395899057388, -0.05230915918946266, -0.04010435938835144, -0.02789955586194992, -0.0156947523355484, -0.003489956259727478, 0.008714847266674042, 0.02091968059539795, 0.03312448412179947, 0.04532928392291069, 0.05753408372402191, 0.06973888725042343, 0.08194369077682495, 0.09414848685264587, 0.1063532903790474, 0.11855809390544891, 0.13076288998126984, 0.14296770095825195, 0.15517249703407288, 0.1673772931098938, 0.17958210408687592, 0.19178690016269684, 0.20399171113967896, 0.21619650721549988, 0.2284013032913208, 0.24060611426830292, 0.25281089544296265, 0.26501572132110596, 0.2772205173969269, 0.2894253134727478, 0.3016301095485687, 0.31383490562438965, 0.32603970170021057, 0.3382444977760315, 0.3504493236541748, 0.3626541197299957, 0.37485891580581665, 0.3870637118816376, 0.3992685079574585, 0.4114733338356018]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 2.0, 3.0, 3.0, 9.0, 10.0, 11.0, 20.0, 16.0, 33.0, 37.0, 44.0, 54.0, 108.0, 138.0, 260.0, 492.0, 1051.0, 2191.0, 5351.0, 14086.0, 40213.0, 119922.0, 306115.0, 336956.0, 144418.0, 48865.0, 16713.0, 6328.0, 2607.0, 1160.0, 523.0, 279.0, 195.0, 104.0, 59.0, 46.0, 37.0, 33.0, 24.0, 12.0, 6.0, 6.0, 7.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.06671142578125, -0.06486272811889648, -0.06301403045654297, -0.06116533279418945, -0.05931663513183594, -0.05746793746948242, -0.055619239807128906, -0.05377054214477539, -0.051921844482421875, -0.05007314682006836, -0.048224449157714844, -0.04637575149536133, -0.04452705383300781, -0.0426783561706543, -0.04082965850830078, -0.038980960845947266, -0.03713226318359375, -0.035283565521240234, -0.03343486785888672, -0.0315861701965332, -0.029737472534179688, -0.027888774871826172, -0.026040077209472656, -0.02419137954711914, -0.022342681884765625, -0.02049398422241211, -0.018645286560058594, -0.016796588897705078, -0.014947891235351562, -0.013099193572998047, -0.011250495910644531, -0.009401798248291016, -0.0075531005859375, -0.005704402923583984, -0.0038557052612304688, -0.002007007598876953, -0.0001583099365234375, 0.0016903877258300781, 0.0035390853881835938, 0.005387783050537109, 0.007236480712890625, 0.00908517837524414, 0.010933876037597656, 0.012782573699951172, 0.014631271362304688, 0.016479969024658203, 0.01832866668701172, 0.020177364349365234, 0.02202606201171875, 0.023874759674072266, 0.02572345733642578, 0.027572154998779297, 0.029420852661132812, 0.03126955032348633, 0.033118247985839844, 0.03496694564819336, 0.036815643310546875, 0.03866434097290039, 0.040513038635253906, 0.04236173629760742, 0.04421043395996094, 0.04605913162231445, 0.04790782928466797, 0.049756526947021484, 0.051605224609375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 6.0, 2.0, 14.0, 8.0, 4.0, 14.0, 24.0, 28.0, 31.0, 35.0, 39.0, 52.0, 65.0, 52.0, 55.0, 79.0, 67.0, 59.0, 76.0, 65.0, 41.0, 31.0, 36.0, 33.0, 19.0, 20.0, 20.0, 3.0, 8.0, 6.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26318359375, -0.252227783203125, -0.24127197265625, -0.230316162109375, -0.2193603515625, -0.208404541015625, -0.19744873046875, -0.186492919921875, -0.175537109375, -0.164581298828125, -0.15362548828125, -0.142669677734375, -0.1317138671875, -0.120758056640625, -0.10980224609375, -0.098846435546875, -0.087890625, -0.076934814453125, -0.06597900390625, -0.055023193359375, -0.0440673828125, -0.033111572265625, -0.02215576171875, -0.011199951171875, -0.000244140625, 0.010711669921875, 0.02166748046875, 0.032623291015625, 0.0435791015625, 0.054534912109375, 0.06549072265625, 0.076446533203125, 0.08740234375, 0.098358154296875, 0.10931396484375, 0.120269775390625, 0.1312255859375, 0.142181396484375, 0.15313720703125, 0.164093017578125, 0.175048828125, 0.186004638671875, 0.19696044921875, 0.207916259765625, 0.2188720703125, 0.229827880859375, 0.24078369140625, 0.251739501953125, 0.2626953125, 0.273651123046875, 0.28460693359375, 0.295562744140625, 0.3065185546875, 0.317474365234375, 0.32843017578125, 0.339385986328125, 0.350341796875, 0.361297607421875, 0.37225341796875, 0.383209228515625, 0.3941650390625, 0.405120849609375, 0.41607666015625, 0.427032470703125, 0.43798828125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 0.0, 4.0, 13.0, 8.0, 17.0, 19.0, 35.0, 48.0, 85.0, 121.0, 224.0, 314.0, 607.0, 1193.0, 2585.0, 6025.0, 15687.0, 47961.0, 158344.0, 389619.0, 287210.0, 92509.0, 28246.0, 9734.0, 3991.0, 1788.0, 887.0, 509.0, 307.0, 190.0, 104.0, 56.0, 29.0, 32.0, 21.0, 14.0, 7.0, 10.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.07427978515625, -0.07236433029174805, -0.0704488754272461, -0.06853342056274414, -0.06661796569824219, -0.06470251083374023, -0.06278705596923828, -0.06087160110473633, -0.058956146240234375, -0.05704069137573242, -0.05512523651123047, -0.053209781646728516, -0.05129432678222656, -0.04937887191772461, -0.047463417053222656, -0.0455479621887207, -0.04363250732421875, -0.0417170524597168, -0.039801597595214844, -0.03788614273071289, -0.03597068786621094, -0.034055233001708984, -0.03213977813720703, -0.030224323272705078, -0.028308868408203125, -0.026393413543701172, -0.02447795867919922, -0.022562503814697266, -0.020647048950195312, -0.01873159408569336, -0.016816139221191406, -0.014900684356689453, -0.0129852294921875, -0.011069774627685547, -0.009154319763183594, -0.007238864898681641, -0.0053234100341796875, -0.0034079551696777344, -0.0014925003051757812, 0.0004229545593261719, 0.002338409423828125, 0.004253864288330078, 0.006169319152832031, 0.008084774017333984, 0.010000228881835938, 0.01191568374633789, 0.013831138610839844, 0.015746593475341797, 0.01766204833984375, 0.019577503204345703, 0.021492958068847656, 0.02340841293334961, 0.025323867797851562, 0.027239322662353516, 0.02915477752685547, 0.031070232391357422, 0.032985687255859375, 0.03490114212036133, 0.03681659698486328, 0.038732051849365234, 0.04064750671386719, 0.04256296157836914, 0.044478416442871094, 0.04639387130737305, 0.048309326171875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 11.0, 8.0, 10.0, 9.0, 15.0, 11.0, 12.0, 18.0, 19.0, 25.0, 20.0, 35.0, 34.0, 32.0, 39.0, 36.0, 46.0, 39.0, 55.0, 41.0, 55.0, 41.0, 35.0, 49.0, 44.0, 34.0, 35.0, 32.0, 31.0, 21.0, 19.0, 12.0, 16.0, 12.0, 8.0, 9.0, 5.0, 7.0, 5.0, 3.0, 2.0, 6.0, 0.0, 3.0, 1.0, 3.0, 2.0], "bins": [-0.55615234375, -0.5408363342285156, -0.5255203247070312, -0.5102043151855469, -0.4948883056640625, -0.4795722961425781, -0.46425628662109375, -0.4489402770996094, -0.433624267578125, -0.4183082580566406, -0.40299224853515625, -0.3876762390136719, -0.3723602294921875, -0.3570442199707031, -0.34172821044921875, -0.3264122009277344, -0.31109619140625, -0.2957801818847656, -0.28046417236328125, -0.2651481628417969, -0.2498321533203125, -0.23451614379882812, -0.21920013427734375, -0.20388412475585938, -0.188568115234375, -0.17325210571289062, -0.15793609619140625, -0.14262008666992188, -0.1273040771484375, -0.11198806762695312, -0.09667205810546875, -0.08135604858398438, -0.0660400390625, -0.050724029541015625, -0.03540802001953125, -0.020092010498046875, -0.0047760009765625, 0.010540008544921875, 0.02585601806640625, 0.041172027587890625, 0.056488037109375, 0.07180404663085938, 0.08712005615234375, 0.10243606567382812, 0.1177520751953125, 0.13306808471679688, 0.14838409423828125, 0.16370010375976562, 0.17901611328125, 0.19433212280273438, 0.20964813232421875, 0.22496414184570312, 0.2402801513671875, 0.2555961608886719, 0.27091217041015625, 0.2862281799316406, 0.301544189453125, 0.3168601989746094, 0.33217620849609375, 0.3474922180175781, 0.3628082275390625, 0.3781242370605469, 0.39344024658203125, 0.4087562561035156, 0.424072265625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 2.0, 4.0, 3.0, 8.0, 11.0, 11.0, 21.0, 15.0, 26.0, 38.0, 53.0, 67.0, 103.0, 157.0, 246.0, 432.0, 764.0, 1341.0, 2692.0, 5752.0, 14690.0, 48505.0, 209496.0, 517549.0, 179473.0, 42993.0, 13226.0, 5206.0, 2491.0, 1322.0, 703.0, 417.0, 244.0, 175.0, 96.0, 77.0, 22.0, 42.0, 19.0, 10.0, 15.0, 11.0, 10.0, 6.0, 4.0, 4.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.020233154296875, -0.019568681716918945, -0.01890420913696289, -0.018239736557006836, -0.01757526397705078, -0.016910791397094727, -0.016246318817138672, -0.015581846237182617, -0.014917373657226562, -0.014252901077270508, -0.013588428497314453, -0.012923955917358398, -0.012259483337402344, -0.011595010757446289, -0.010930538177490234, -0.01026606559753418, -0.009601593017578125, -0.00893712043762207, -0.008272647857666016, -0.007608175277709961, -0.006943702697753906, -0.0062792301177978516, -0.005614757537841797, -0.004950284957885742, -0.0042858123779296875, -0.003621339797973633, -0.002956867218017578, -0.0022923946380615234, -0.0016279220581054688, -0.0009634494781494141, -0.0002989768981933594, 0.0003654956817626953, 0.00102996826171875, 0.0016944408416748047, 0.0023589134216308594, 0.003023386001586914, 0.0036878585815429688, 0.0043523311614990234, 0.005016803741455078, 0.005681276321411133, 0.0063457489013671875, 0.007010221481323242, 0.007674694061279297, 0.008339166641235352, 0.009003639221191406, 0.009668111801147461, 0.010332584381103516, 0.01099705696105957, 0.011661529541015625, 0.01232600212097168, 0.012990474700927734, 0.013654947280883789, 0.014319419860839844, 0.014983892440795898, 0.015648365020751953, 0.016312837600708008, 0.016977310180664062, 0.017641782760620117, 0.018306255340576172, 0.018970727920532227, 0.01963520050048828, 0.020299673080444336, 0.02096414566040039, 0.021628618240356445, 0.0222930908203125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 7.0, 4.0, 6.0, 3.0, 7.0, 24.0, 24.0, 30.0, 47.0, 51.0, 54.0, 87.0, 71.0, 110.0, 104.0, 77.0, 88.0, 63.0, 39.0, 30.0, 32.0, 14.0, 9.0, 4.0, 6.0, 4.0, 2.0, 2.0, 6.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4901161193847656e-05, -1.4456920325756073e-05, -1.401267945766449e-05, -1.3568438589572906e-05, -1.3124197721481323e-05, -1.267995685338974e-05, -1.2235715985298157e-05, -1.1791475117206573e-05, -1.134723424911499e-05, -1.0902993381023407e-05, -1.0458752512931824e-05, -1.001451164484024e-05, -9.570270776748657e-06, -9.126029908657074e-06, -8.68178904056549e-06, -8.237548172473907e-06, -7.793307304382324e-06, -7.349066436290741e-06, -6.904825568199158e-06, -6.4605847001075745e-06, -6.016343832015991e-06, -5.572102963924408e-06, -5.127862095832825e-06, -4.6836212277412415e-06, -4.239380359649658e-06, -3.795139491558075e-06, -3.3508986234664917e-06, -2.9066577553749084e-06, -2.462416887283325e-06, -2.018176019191742e-06, -1.5739351511001587e-06, -1.1296942830085754e-06, -6.854534149169922e-07, -2.4121254682540894e-07, 2.0302832126617432e-07, 6.472691893577576e-07, 1.0915100574493408e-06, 1.535750925540924e-06, 1.9799917936325073e-06, 2.4242326617240906e-06, 2.868473529815674e-06, 3.312714397907257e-06, 3.7569552659988403e-06, 4.201196134090424e-06, 4.645437002182007e-06, 5.08967787027359e-06, 5.533918738365173e-06, 5.978159606456757e-06, 6.42240047454834e-06, 6.866641342639923e-06, 7.310882210731506e-06, 7.75512307882309e-06, 8.199363946914673e-06, 8.643604815006256e-06, 9.08784568309784e-06, 9.532086551189423e-06, 9.976327419281006e-06, 1.0420568287372589e-05, 1.0864809155464172e-05, 1.1309050023555756e-05, 1.1753290891647339e-05, 1.2197531759738922e-05, 1.2641772627830505e-05, 1.3086013495922089e-05, 1.3530254364013672e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0, 6.0, 3.0, 9.0, 13.0, 17.0, 28.0, 35.0, 59.0, 74.0, 113.0, 124.0, 215.0, 379.0, 704.0, 1193.0, 2470.0, 5791.0, 14656.0, 41681.0, 126174.0, 318484.0, 330538.0, 134083.0, 44462.0, 15665.0, 6068.0, 2500.0, 1239.0, 610.0, 376.0, 236.0, 154.0, 109.0, 87.0, 49.0, 36.0, 34.0, 25.0, 13.0, 10.0, 10.0, 6.0, 6.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.0158538818359375, -0.015342950820922852, -0.014832019805908203, -0.014321088790893555, -0.013810157775878906, -0.013299226760864258, -0.01278829574584961, -0.012277364730834961, -0.011766433715820312, -0.011255502700805664, -0.010744571685791016, -0.010233640670776367, -0.009722709655761719, -0.00921177864074707, -0.008700847625732422, -0.008189916610717773, -0.007678985595703125, -0.0071680545806884766, -0.006657123565673828, -0.00614619255065918, -0.005635261535644531, -0.005124330520629883, -0.004613399505615234, -0.004102468490600586, -0.0035915374755859375, -0.003080606460571289, -0.0025696754455566406, -0.002058744430541992, -0.0015478134155273438, -0.0010368824005126953, -0.0005259513854980469, -1.5020370483398438e-05, 0.00049591064453125, 0.0010068416595458984, 0.0015177726745605469, 0.0020287036895751953, 0.0025396347045898438, 0.003050565719604492, 0.0035614967346191406, 0.004072427749633789, 0.0045833587646484375, 0.005094289779663086, 0.005605220794677734, 0.006116151809692383, 0.006627082824707031, 0.00713801383972168, 0.007648944854736328, 0.008159875869750977, 0.008670806884765625, 0.009181737899780273, 0.009692668914794922, 0.01020359992980957, 0.010714530944824219, 0.011225461959838867, 0.011736392974853516, 0.012247323989868164, 0.012758255004882812, 0.013269186019897461, 0.01378011703491211, 0.014291048049926758, 0.014801979064941406, 0.015312910079956055, 0.015823841094970703, 0.01633477210998535, 0.016845703125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 7.0, 6.0, 4.0, 7.0, 11.0, 11.0, 10.0, 12.0, 8.0, 19.0, 30.0, 25.0, 31.0, 29.0, 38.0, 62.0, 52.0, 49.0, 67.0, 57.0, 44.0, 52.0, 46.0, 50.0, 37.0, 32.0, 39.0, 31.0, 22.0, 27.0, 19.0, 16.0, 11.0, 9.0, 7.0, 8.0, 5.0, 6.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0048065185546875, -0.004659771919250488, -0.0045130252838134766, -0.004366278648376465, -0.004219532012939453, -0.004072785377502441, -0.00392603874206543, -0.003779292106628418, -0.0036325454711914062, -0.0034857988357543945, -0.003339052200317383, -0.003192305564880371, -0.0030455589294433594, -0.0028988122940063477, -0.002752065658569336, -0.0026053190231323242, -0.0024585723876953125, -0.0023118257522583008, -0.002165079116821289, -0.0020183324813842773, -0.0018715858459472656, -0.001724839210510254, -0.0015780925750732422, -0.0014313459396362305, -0.0012845993041992188, -0.001137852668762207, -0.0009911060333251953, -0.0008443593978881836, -0.0006976127624511719, -0.0005508661270141602, -0.00040411949157714844, -0.0002573728561401367, -0.000110626220703125, 3.612041473388672e-05, 0.00018286705017089844, 0.00032961368560791016, 0.0004763603210449219, 0.0006231069564819336, 0.0007698535919189453, 0.000916600227355957, 0.0010633468627929688, 0.0012100934982299805, 0.0013568401336669922, 0.001503586769104004, 0.0016503334045410156, 0.0017970800399780273, 0.001943826675415039, 0.0020905733108520508, 0.0022373199462890625, 0.0023840665817260742, 0.002530813217163086, 0.0026775598526000977, 0.0028243064880371094, 0.002971053123474121, 0.003117799758911133, 0.0032645463943481445, 0.0034112930297851562, 0.003558039665222168, 0.0037047863006591797, 0.0038515329360961914, 0.003998279571533203, 0.004145026206970215, 0.0042917728424072266, 0.004438519477844238, 0.00458526611328125]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 9.0, 17.0, 25.0, 52.0, 150.0, 210.0, 250.0, 166.0, 75.0, 28.0, 14.0, 8.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1758981943130493, -1.1465601921081543, -1.1172221899032593, -1.0878841876983643, -1.0585461854934692, -1.0292081832885742, -0.9998701810836792, -0.9705321788787842, -0.9411941766738892, -0.9118561744689941, -0.8825181722640991, -0.8531801700592041, -0.8238421678543091, -0.7945041656494141, -0.765166163444519, -0.735828161239624, -0.706490159034729, -0.677152156829834, -0.647814154624939, -0.618476152420044, -0.5891381502151489, -0.5598001480102539, -0.5304621458053589, -0.5011241436004639, -0.47178614139556885, -0.44244813919067383, -0.4131101369857788, -0.3837721347808838, -0.35443413257598877, -0.32509613037109375, -0.29575812816619873, -0.2664201259613037, -0.23708206415176392, -0.2077440619468689, -0.17840605974197388, -0.14906805753707886, -0.11973005533218384, -0.09039205312728882, -0.0610540509223938, -0.03171604871749878, -0.0023780465126037598, 0.02695995569229126, 0.05629795789718628, 0.0856359601020813, 0.11497396230697632, 0.14431196451187134, 0.17364996671676636, 0.20298796892166138, 0.2323259711265564, 0.2616639733314514, 0.29100197553634644, 0.32033997774124146, 0.3496779799461365, 0.3790159821510315, 0.4083539843559265, 0.43769198656082153, 0.46702998876571655, 0.4963679909706116, 0.5257059931755066, 0.5550439953804016, 0.5843819975852966, 0.6137199997901917, 0.6430580019950867, 0.6723960041999817, 0.7017340064048767]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 5.0, 4.0, 8.0, 9.0, 9.0, 17.0, 19.0, 22.0, 25.0, 39.0, 38.0, 33.0, 59.0, 54.0, 62.0, 50.0, 60.0, 70.0, 61.0, 58.0, 52.0, 45.0, 36.0, 35.0, 31.0, 21.0, 23.0, 14.0, 7.0, 11.0, 8.0, 5.0, 5.0, 5.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2743450701236725, -0.26477813720703125, -0.2552111744880676, -0.2456442266702652, -0.23607727885246277, -0.22651033103466034, -0.2169433832168579, -0.20737643539905548, -0.19780948758125305, -0.18824253976345062, -0.1786755919456482, -0.16910864412784576, -0.15954169631004333, -0.1499747484922409, -0.14040780067443848, -0.13084085285663605, -0.12127390503883362, -0.11170695722103119, -0.10214000940322876, -0.09257306158542633, -0.0830061137676239, -0.07343916594982147, -0.06387221813201904, -0.054305270314216614, -0.044738322496414185, -0.035171374678611755, -0.025604426860809326, -0.016037479043006897, -0.006470531225204468, 0.0030964165925979614, 0.01266336441040039, 0.02223031222820282, 0.03179726004600525, 0.04136420786380768, 0.05093115568161011, 0.06049810349941254, 0.07006505131721497, 0.0796319991350174, 0.08919894695281982, 0.09876589477062225, 0.10833284258842468, 0.11789979040622711, 0.12746673822402954, 0.13703368604183197, 0.1466006338596344, 0.15616758167743683, 0.16573452949523926, 0.1753014773130417, 0.18486842513084412, 0.19443537294864655, 0.20400232076644897, 0.2135692685842514, 0.22313621640205383, 0.23270316421985626, 0.2422701120376587, 0.2518370747566223, 0.26140400767326355, 0.2709709405899048, 0.2805379033088684, 0.29010486602783203, 0.29967179894447327, 0.3092387318611145, 0.3188056945800781, 0.32837265729904175, 0.337939590215683]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 7.0, 10.0, 15.0, 11.0, 24.0, 38.0, 51.0, 81.0, 124.0, 193.0, 291.0, 556.0, 933.0, 1680.0, 3223.0, 6451.0, 13813.0, 32101.0, 91108.0, 333532.0, 387404.0, 109035.0, 37242.0, 15515.0, 7074.0, 3539.0, 1894.0, 1030.0, 597.0, 366.0, 230.0, 132.0, 88.0, 48.0, 36.0, 30.0, 19.0, 11.0, 6.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.290771484375, -0.2822380065917969, -0.27370452880859375, -0.2651710510253906, -0.2566375732421875, -0.24810409545898438, -0.23957061767578125, -0.23103713989257812, -0.222503662109375, -0.21397018432617188, -0.20543670654296875, -0.19690322875976562, -0.1883697509765625, -0.17983627319335938, -0.17130279541015625, -0.16276931762695312, -0.15423583984375, -0.14570236206054688, -0.13716888427734375, -0.12863540649414062, -0.1201019287109375, -0.11156845092773438, -0.10303497314453125, -0.09450149536132812, -0.085968017578125, -0.07743453979492188, -0.06890106201171875, -0.060367584228515625, -0.0518341064453125, -0.043300628662109375, -0.03476715087890625, -0.026233673095703125, -0.0177001953125, -0.009166717529296875, -0.00063323974609375, 0.007900238037109375, 0.0164337158203125, 0.024967193603515625, 0.03350067138671875, 0.042034149169921875, 0.050567626953125, 0.059101104736328125, 0.06763458251953125, 0.07616806030273438, 0.0847015380859375, 0.09323501586914062, 0.10176849365234375, 0.11030197143554688, 0.11883544921875, 0.12736892700195312, 0.13590240478515625, 0.14443588256835938, 0.1529693603515625, 0.16150283813476562, 0.17003631591796875, 0.17856979370117188, 0.187103271484375, 0.19563674926757812, 0.20417022705078125, 0.21270370483398438, 0.2212371826171875, 0.22977066040039062, 0.23830413818359375, 0.24683761596679688, 0.25537109375]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 4.0, 8.0, 9.0, 16.0, 14.0, 12.0, 15.0, 30.0, 30.0, 36.0, 47.0, 45.0, 59.0, 42.0, 45.0, 67.0, 59.0, 71.0, 52.0, 58.0, 50.0, 44.0, 43.0, 29.0, 28.0, 16.0, 13.0, 15.0, 13.0, 6.0, 8.0, 2.0, 3.0, 1.0, 6.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47705078125, -0.4587249755859375, -0.440399169921875, -0.4220733642578125, -0.40374755859375, -0.3854217529296875, -0.367095947265625, -0.3487701416015625, -0.3304443359375, -0.3121185302734375, -0.293792724609375, -0.2754669189453125, -0.25714111328125, -0.2388153076171875, -0.220489501953125, -0.2021636962890625, -0.183837890625, -0.1655120849609375, -0.147186279296875, -0.1288604736328125, -0.11053466796875, -0.0922088623046875, -0.073883056640625, -0.0555572509765625, -0.0372314453125, -0.0189056396484375, -0.000579833984375, 0.0177459716796875, 0.03607177734375, 0.0543975830078125, 0.072723388671875, 0.0910491943359375, 0.109375, 0.1277008056640625, 0.146026611328125, 0.1643524169921875, 0.18267822265625, 0.2010040283203125, 0.219329833984375, 0.2376556396484375, 0.2559814453125, 0.2743072509765625, 0.292633056640625, 0.3109588623046875, 0.32928466796875, 0.3476104736328125, 0.365936279296875, 0.3842620849609375, 0.402587890625, 0.4209136962890625, 0.439239501953125, 0.4575653076171875, 0.47589111328125, 0.4942169189453125, 0.512542724609375, 0.5308685302734375, 0.5491943359375, 0.5675201416015625, 0.585845947265625, 0.6041717529296875, 0.62249755859375, 0.6408233642578125, 0.659149169921875, 0.6774749755859375, 0.69580078125]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 3.0, 3.0, 7.0, 11.0, 5.0, 9.0, 7.0, 9.0, 19.0, 27.0, 36.0, 53.0, 76.0, 125.0, 252.0, 655.0, 2635.0, 14666.0, 194610.0, 781092.0, 46200.0, 5882.0, 1252.0, 425.0, 162.0, 101.0, 71.0, 32.0, 37.0, 18.0, 18.0, 11.0, 11.0, 8.0, 7.0, 6.0, 7.0, 1.0, 2.0, 4.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.56201171875, -0.5421218872070312, -0.5222320556640625, -0.5023422241210938, -0.482452392578125, -0.46256256103515625, -0.4426727294921875, -0.42278289794921875, -0.40289306640625, -0.38300323486328125, -0.3631134033203125, -0.34322357177734375, -0.323333740234375, -0.30344390869140625, -0.2835540771484375, -0.26366424560546875, -0.2437744140625, -0.22388458251953125, -0.2039947509765625, -0.18410491943359375, -0.164215087890625, -0.14432525634765625, -0.1244354248046875, -0.10454559326171875, -0.08465576171875, -0.06476593017578125, -0.0448760986328125, -0.02498626708984375, -0.005096435546875, 0.01479339599609375, 0.0346832275390625, 0.05457305908203125, 0.074462890625, 0.09435272216796875, 0.1142425537109375, 0.13413238525390625, 0.154022216796875, 0.17391204833984375, 0.1938018798828125, 0.21369171142578125, 0.23358154296875, 0.25347137451171875, 0.2733612060546875, 0.29325103759765625, 0.313140869140625, 0.33303070068359375, 0.3529205322265625, 0.37281036376953125, 0.3927001953125, 0.41259002685546875, 0.4324798583984375, 0.45236968994140625, 0.472259521484375, 0.49214935302734375, 0.5120391845703125, 0.5319290161132812, 0.55181884765625, 0.5717086791992188, 0.5915985107421875, 0.6114883422851562, 0.631378173828125, 0.6512680053710938, 0.6711578369140625, 0.6910476684570312, 0.7109375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 10.0, 10.0, 4.0, 10.0, 11.0, 13.0, 16.0, 7.0, 22.0, 35.0, 26.0, 28.0, 27.0, 36.0, 30.0, 42.0, 48.0, 57.0, 61.0, 52.0, 30.0, 39.0, 44.0, 48.0, 37.0, 28.0, 46.0, 36.0, 31.0, 28.0, 22.0, 9.0, 16.0, 13.0, 13.0, 2.0, 4.0, 5.0, 5.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.49755859375, -0.480010986328125, -0.46246337890625, -0.444915771484375, -0.4273681640625, -0.409820556640625, -0.39227294921875, -0.374725341796875, -0.357177734375, -0.339630126953125, -0.32208251953125, -0.304534912109375, -0.2869873046875, -0.269439697265625, -0.25189208984375, -0.234344482421875, -0.216796875, -0.199249267578125, -0.18170166015625, -0.164154052734375, -0.1466064453125, -0.129058837890625, -0.11151123046875, -0.093963623046875, -0.076416015625, -0.058868408203125, -0.04132080078125, -0.023773193359375, -0.0062255859375, 0.011322021484375, 0.02886962890625, 0.046417236328125, 0.06396484375, 0.081512451171875, 0.09906005859375, 0.116607666015625, 0.1341552734375, 0.151702880859375, 0.16925048828125, 0.186798095703125, 0.204345703125, 0.221893310546875, 0.23944091796875, 0.256988525390625, 0.2745361328125, 0.292083740234375, 0.30963134765625, 0.327178955078125, 0.3447265625, 0.362274169921875, 0.37982177734375, 0.397369384765625, 0.4149169921875, 0.432464599609375, 0.45001220703125, 0.467559814453125, 0.485107421875, 0.502655029296875, 0.52020263671875, 0.537750244140625, 0.5552978515625, 0.572845458984375, 0.59039306640625, 0.607940673828125, 0.62548828125]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 1.0, 6.0, 7.0, 5.0, 14.0, 30.0, 40.0, 67.0, 124.0, 227.0, 408.0, 841.0, 1775.0, 4500.0, 18337.0, 298281.0, 681067.0, 32402.0, 5999.0, 2313.0, 1038.0, 476.0, 255.0, 129.0, 81.0, 57.0, 28.0, 12.0, 16.0, 3.0, 4.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.252197265625, -0.24354171752929688, -0.23488616943359375, -0.22623062133789062, -0.2175750732421875, -0.20891952514648438, -0.20026397705078125, -0.19160842895507812, -0.182952880859375, -0.17429733276367188, -0.16564178466796875, -0.15698623657226562, -0.1483306884765625, -0.13967514038085938, -0.13101959228515625, -0.12236404418945312, -0.11370849609375, -0.10505294799804688, -0.09639739990234375, -0.08774185180664062, -0.0790863037109375, -0.07043075561523438, -0.06177520751953125, -0.053119659423828125, -0.044464111328125, -0.035808563232421875, -0.02715301513671875, -0.018497467041015625, -0.0098419189453125, -0.001186370849609375, 0.00746917724609375, 0.016124725341796875, 0.0247802734375, 0.033435821533203125, 0.04209136962890625, 0.050746917724609375, 0.0594024658203125, 0.06805801391601562, 0.07671356201171875, 0.08536911010742188, 0.094024658203125, 0.10268020629882812, 0.11133575439453125, 0.11999130249023438, 0.1286468505859375, 0.13730239868164062, 0.14595794677734375, 0.15461349487304688, 0.16326904296875, 0.17192459106445312, 0.18058013916015625, 0.18923568725585938, 0.1978912353515625, 0.20654678344726562, 0.21520233154296875, 0.22385787963867188, 0.232513427734375, 0.24116897583007812, 0.24982452392578125, 0.2584800720214844, 0.2671356201171875, 0.2757911682128906, 0.28444671630859375, 0.2931022644042969, 0.3017578125]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 5.0, 16.0, 22.0, 49.0, 70.0, 132.0, 196.0, 206.0, 140.0, 59.0, 34.0, 24.0, 22.0, 5.0, 10.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.725290298461914e-05, -3.576651215553284e-05, -3.428012132644653e-05, -3.279373049736023e-05, -3.1307339668273926e-05, -2.9820948839187622e-05, -2.833455801010132e-05, -2.6848167181015015e-05, -2.536177635192871e-05, -2.3875385522842407e-05, -2.2388994693756104e-05, -2.09026038646698e-05, -1.9416213035583496e-05, -1.7929822206497192e-05, -1.644343137741089e-05, -1.4957040548324585e-05, -1.3470649719238281e-05, -1.1984258890151978e-05, -1.0497868061065674e-05, -9.01147723197937e-06, -7.525086402893066e-06, -6.038695573806763e-06, -4.552304744720459e-06, -3.0659139156341553e-06, -1.5795230865478516e-06, -9.313225746154785e-08, 1.3932585716247559e-06, 2.8796494007110596e-06, 4.366040229797363e-06, 5.852431058883667e-06, 7.338821887969971e-06, 8.825212717056274e-06, 1.0311603546142578e-05, 1.1797994375228882e-05, 1.3284385204315186e-05, 1.477077603340149e-05, 1.6257166862487793e-05, 1.7743557691574097e-05, 1.92299485206604e-05, 2.0716339349746704e-05, 2.2202730178833008e-05, 2.368912100791931e-05, 2.5175511837005615e-05, 2.666190266609192e-05, 2.8148293495178223e-05, 2.9634684324264526e-05, 3.112107515335083e-05, 3.2607465982437134e-05, 3.409385681152344e-05, 3.558024764060974e-05, 3.7066638469696045e-05, 3.855302929878235e-05, 4.003942012786865e-05, 4.1525810956954956e-05, 4.301220178604126e-05, 4.4498592615127563e-05, 4.598498344421387e-05, 4.747137427330017e-05, 4.8957765102386475e-05, 5.044415593147278e-05, 5.193054676055908e-05, 5.3416937589645386e-05, 5.490332841873169e-05, 5.638971924781799e-05, 5.78761100769043e-05]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 0.0, 5.0, 2.0, 1.0, 1.0, 2.0, 6.0, 3.0, 1.0, 6.0, 10.0, 20.0, 30.0, 41.0, 64.0, 167.0, 456.0, 1443.0, 5423.0, 50558.0, 927910.0, 54436.0, 5712.0, 1406.0, 460.0, 185.0, 81.0, 43.0, 30.0, 15.0, 7.0, 6.0, 6.0, 5.0, 2.0, 1.0, 2.0, 6.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.388427734375, -0.3764801025390625, -0.364532470703125, -0.3525848388671875, -0.34063720703125, -0.3286895751953125, -0.316741943359375, -0.3047943115234375, -0.2928466796875, -0.2808990478515625, -0.268951416015625, -0.2570037841796875, -0.24505615234375, -0.2331085205078125, -0.221160888671875, -0.2092132568359375, -0.197265625, -0.1853179931640625, -0.173370361328125, -0.1614227294921875, -0.14947509765625, -0.1375274658203125, -0.125579833984375, -0.1136322021484375, -0.1016845703125, -0.0897369384765625, -0.077789306640625, -0.0658416748046875, -0.05389404296875, -0.0419464111328125, -0.029998779296875, -0.0180511474609375, -0.006103515625, 0.0058441162109375, 0.017791748046875, 0.0297393798828125, 0.04168701171875, 0.0536346435546875, 0.065582275390625, 0.0775299072265625, 0.0894775390625, 0.1014251708984375, 0.113372802734375, 0.1253204345703125, 0.13726806640625, 0.1492156982421875, 0.161163330078125, 0.1731109619140625, 0.18505859375, 0.1970062255859375, 0.208953857421875, 0.2209014892578125, 0.23284912109375, 0.2447967529296875, 0.256744384765625, 0.2686920166015625, 0.2806396484375, 0.2925872802734375, 0.304534912109375, 0.3164825439453125, 0.32843017578125, 0.3403778076171875, 0.352325439453125, 0.3642730712890625, 0.376220703125]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 5.0, 3.0, 12.0, 6.0, 16.0, 24.0, 28.0, 45.0, 51.0, 104.0, 130.0, 161.0, 113.0, 107.0, 68.0, 30.0, 33.0, 16.0, 16.0, 10.0, 5.0, 7.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0799560546875, -0.0770425796508789, -0.07412910461425781, -0.07121562957763672, -0.06830215454101562, -0.06538867950439453, -0.06247520446777344, -0.059561729431152344, -0.05664825439453125, -0.053734779357910156, -0.05082130432128906, -0.04790782928466797, -0.044994354248046875, -0.04208087921142578, -0.03916740417480469, -0.036253929138183594, -0.0333404541015625, -0.030426979064941406, -0.027513504028320312, -0.02460002899169922, -0.021686553955078125, -0.01877307891845703, -0.015859603881835938, -0.012946128845214844, -0.01003265380859375, -0.007119178771972656, -0.0042057037353515625, -0.0012922286987304688, 0.001621246337890625, 0.004534721374511719, 0.0074481964111328125, 0.010361671447753906, 0.013275146484375, 0.016188621520996094, 0.019102096557617188, 0.02201557159423828, 0.024929046630859375, 0.02784252166748047, 0.030755996704101562, 0.033669471740722656, 0.03658294677734375, 0.039496421813964844, 0.04240989685058594, 0.04532337188720703, 0.048236846923828125, 0.05115032196044922, 0.05406379699707031, 0.056977272033691406, 0.0598907470703125, 0.0628042221069336, 0.06571769714355469, 0.06863117218017578, 0.07154464721679688, 0.07445812225341797, 0.07737159729003906, 0.08028507232666016, 0.08319854736328125, 0.08611202239990234, 0.08902549743652344, 0.09193897247314453, 0.09485244750976562, 0.09776592254638672, 0.10067939758300781, 0.1035928726196289, 0.10650634765625]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 8.0, 5.0, 19.0, 29.0, 46.0, 113.0, 148.0, 223.0, 180.0, 116.0, 56.0, 35.0, 18.0, 5.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5302221775054932, -0.48031696677207947, -0.43041178584098816, -0.38050657510757446, -0.33060139417648315, -0.28069618344306946, -0.23079097270965576, -0.18088579177856445, -0.13098058104515076, -0.08107538521289825, -0.031170181930065155, 0.018735021352767944, 0.06864021718502045, 0.11854541301727295, 0.16845062375068665, 0.21835580468177795, 0.26826101541519165, 0.31816622614860535, 0.36807140707969666, 0.41797661781311035, 0.46788179874420166, 0.517786979675293, 0.567692220211029, 0.6175974011421204, 0.6675026416778564, 0.7174078226089478, 0.7673130631446838, 0.8172182440757751, 0.8671234250068665, 0.9170286655426025, 0.9669338464736938, 1.0168390274047852, 1.0667442083358765, 1.1166493892669678, 1.166554570198059, 1.2164597511291504, 1.2663650512695312, 1.3162702322006226, 1.3661754131317139, 1.4160805940628052, 1.4659857749938965, 1.5158909559249878, 1.565796136856079, 1.61570143699646, 1.6656066179275513, 1.7155117988586426, 1.7654169797897339, 1.8153221607208252, 1.865227460861206, 1.9151326417922974, 1.9650378227233887, 2.0149431228637695, 2.0648481845855713, 2.114753484725952, 2.164658546447754, 2.2145638465881348, 2.2644689083099365, 2.3143742084503174, 2.364279270172119, 2.4141845703125, 2.4640896320343018, 2.5139949321746826, 2.5638999938964844, 2.6138052940368652, 2.663710594177246]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 3.0, 3.0, 0.0, 4.0, 6.0, 5.0, 6.0, 11.0, 10.0, 14.0, 9.0, 9.0, 23.0, 18.0, 19.0, 21.0, 19.0, 20.0, 24.0, 24.0, 28.0, 23.0, 34.0, 28.0, 36.0, 35.0, 33.0, 43.0, 35.0, 34.0, 44.0, 34.0, 24.0, 32.0, 41.0, 29.0, 30.0, 21.0, 20.0, 22.0, 24.0, 14.0, 19.0, 9.0, 14.0, 10.0, 2.0, 11.0, 8.0, 5.0, 4.0, 4.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0], "bins": [-0.7506343722343445, -0.7271214127540588, -0.7036084532737732, -0.6800954937934875, -0.6565825939178467, -0.633069634437561, -0.6095566749572754, -0.5860437154769897, -0.5625307559967041, -0.5390177965164185, -0.5155048370361328, -0.49199190735816956, -0.4684789478778839, -0.44496598839759827, -0.421453058719635, -0.39794009923934937, -0.3744271397590637, -0.3509141802787781, -0.32740122079849243, -0.3038882911205292, -0.28037533164024353, -0.2568623721599579, -0.23334942758083344, -0.20983648300170898, -0.18632352352142334, -0.1628105640411377, -0.13929761946201324, -0.1157846674323082, -0.09227171540260315, -0.0687587633728981, -0.045245811343193054, -0.021732866764068604, 0.001780092716217041, 0.02529304474592209, 0.048805996775627136, 0.07231894880533218, 0.09583190083503723, 0.11934485286474228, 0.14285780489444733, 0.16637074947357178, 0.18988370895385742, 0.21339666843414307, 0.23690961301326752, 0.26042255759239197, 0.2839355170726776, 0.30744847655296326, 0.3309614062309265, 0.35447436571121216, 0.3779873251914978, 0.40150028467178345, 0.4250132441520691, 0.44852617383003235, 0.472039133310318, 0.49555209279060364, 0.5190650224685669, 0.5425779819488525, 0.5660909414291382, 0.5896039009094238, 0.6131168603897095, 0.6366298198699951, 0.6601427793502808, 0.6836556792259216, 0.7071686387062073, 0.7306815981864929, 0.7541945576667786]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 5.0, 4.0, 9.0, 9.0, 10.0, 24.0, 46.0, 99.0, 217.0, 536.0, 1611.0, 7012.0, 98068.0, 3906889.0, 169328.0, 7977.0, 1532.0, 487.0, 174.0, 92.0, 53.0, 24.0, 19.0, 16.0, 15.0, 7.0, 8.0, 4.0, 4.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9287109375, -0.887542724609375, -0.84637451171875, -0.805206298828125, -0.7640380859375, -0.722869873046875, -0.68170166015625, -0.640533447265625, -0.599365234375, -0.558197021484375, -0.51702880859375, -0.475860595703125, -0.4346923828125, -0.393524169921875, -0.35235595703125, -0.311187744140625, -0.27001953125, -0.228851318359375, -0.18768310546875, -0.146514892578125, -0.1053466796875, -0.064178466796875, -0.02301025390625, 0.018157958984375, 0.059326171875, 0.100494384765625, 0.14166259765625, 0.182830810546875, 0.2239990234375, 0.265167236328125, 0.30633544921875, 0.347503662109375, 0.388671875, 0.429840087890625, 0.47100830078125, 0.512176513671875, 0.5533447265625, 0.594512939453125, 0.63568115234375, 0.676849365234375, 0.718017578125, 0.759185791015625, 0.80035400390625, 0.841522216796875, 0.8826904296875, 0.923858642578125, 0.96502685546875, 1.006195068359375, 1.04736328125, 1.088531494140625, 1.12969970703125, 1.170867919921875, 1.2120361328125, 1.253204345703125, 1.29437255859375, 1.335540771484375, 1.376708984375, 1.417877197265625, 1.45904541015625, 1.500213623046875, 1.5413818359375, 1.582550048828125, 1.62371826171875, 1.664886474609375, 1.7060546875]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 8.0, 8.0, 8.0, 18.0, 16.0, 25.0, 44.0, 30.0, 61.0, 58.0, 76.0, 77.0, 83.0, 105.0, 81.0, 72.0, 65.0, 43.0, 40.0, 27.0, 16.0, 18.0, 12.0, 7.0, 8.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36767578125, -0.3507843017578125, -0.333892822265625, -0.3170013427734375, -0.30010986328125, -0.2832183837890625, -0.266326904296875, -0.2494354248046875, -0.2325439453125, -0.2156524658203125, -0.198760986328125, -0.1818695068359375, -0.16497802734375, -0.1480865478515625, -0.131195068359375, -0.1143035888671875, -0.097412109375, -0.0805206298828125, -0.063629150390625, -0.0467376708984375, -0.02984619140625, -0.0129547119140625, 0.003936767578125, 0.0208282470703125, 0.0377197265625, 0.0546112060546875, 0.071502685546875, 0.0883941650390625, 0.10528564453125, 0.1221771240234375, 0.139068603515625, 0.1559600830078125, 0.1728515625, 0.1897430419921875, 0.206634521484375, 0.2235260009765625, 0.24041748046875, 0.2573089599609375, 0.274200439453125, 0.2910919189453125, 0.3079833984375, 0.3248748779296875, 0.341766357421875, 0.3586578369140625, 0.37554931640625, 0.3924407958984375, 0.409332275390625, 0.4262237548828125, 0.443115234375, 0.4600067138671875, 0.476898193359375, 0.4937896728515625, 0.51068115234375, 0.5275726318359375, 0.544464111328125, 0.5613555908203125, 0.5782470703125, 0.5951385498046875, 0.612030029296875, 0.6289215087890625, 0.64581298828125, 0.6627044677734375, 0.679595947265625, 0.6964874267578125, 0.71337890625]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 11.0, 13.0, 20.0, 35.0, 43.0, 68.0, 150.0, 305.0, 745.0, 2057.0, 7603.0, 58638.0, 3135952.0, 949897.0, 30979.0, 4959.0, 1526.0, 655.0, 290.0, 134.0, 76.0, 45.0, 28.0, 10.0, 10.0, 10.0, 4.0, 6.0, 1.0, 6.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75146484375, -0.7245025634765625, -0.697540283203125, -0.6705780029296875, -0.64361572265625, -0.6166534423828125, -0.589691162109375, -0.5627288818359375, -0.5357666015625, -0.5088043212890625, -0.481842041015625, -0.4548797607421875, -0.42791748046875, -0.4009552001953125, -0.373992919921875, -0.3470306396484375, -0.320068359375, -0.2931060791015625, -0.266143798828125, -0.2391815185546875, -0.21221923828125, -0.1852569580078125, -0.158294677734375, -0.1313323974609375, -0.1043701171875, -0.0774078369140625, -0.050445556640625, -0.0234832763671875, 0.00347900390625, 0.0304412841796875, 0.057403564453125, 0.0843658447265625, 0.111328125, 0.1382904052734375, 0.165252685546875, 0.1922149658203125, 0.21917724609375, 0.2461395263671875, 0.273101806640625, 0.3000640869140625, 0.3270263671875, 0.3539886474609375, 0.380950927734375, 0.4079132080078125, 0.43487548828125, 0.4618377685546875, 0.488800048828125, 0.5157623291015625, 0.542724609375, 0.5696868896484375, 0.596649169921875, 0.6236114501953125, 0.65057373046875, 0.6775360107421875, 0.704498291015625, 0.7314605712890625, 0.7584228515625, 0.7853851318359375, 0.812347412109375, 0.8393096923828125, 0.86627197265625, 0.8932342529296875, 0.920196533203125, 0.9471588134765625, 0.97412109375]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 1.0, 7.0, 6.0, 8.0, 11.0, 15.0, 21.0, 33.0, 42.0, 67.0, 107.0, 174.0, 274.0, 458.0, 679.0, 791.0, 499.0, 334.0, 182.0, 107.0, 72.0, 60.0, 36.0, 30.0, 15.0, 7.0, 8.0, 8.0, 7.0, 4.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1920166015625, -0.18670654296875, -0.181396484375, -0.17608642578125, -0.1707763671875, -0.16546630859375, -0.16015625, -0.15484619140625, -0.1495361328125, -0.14422607421875, -0.138916015625, -0.13360595703125, -0.1282958984375, -0.12298583984375, -0.11767578125, -0.11236572265625, -0.1070556640625, -0.10174560546875, -0.096435546875, -0.09112548828125, -0.0858154296875, -0.08050537109375, -0.0751953125, -0.06988525390625, -0.0645751953125, -0.05926513671875, -0.053955078125, -0.04864501953125, -0.0433349609375, -0.03802490234375, -0.03271484375, -0.02740478515625, -0.0220947265625, -0.01678466796875, -0.011474609375, -0.00616455078125, -0.0008544921875, 0.00445556640625, 0.009765625, 0.01507568359375, 0.0203857421875, 0.02569580078125, 0.031005859375, 0.03631591796875, 0.0416259765625, 0.04693603515625, 0.05224609375, 0.05755615234375, 0.0628662109375, 0.06817626953125, 0.073486328125, 0.07879638671875, 0.0841064453125, 0.08941650390625, 0.0947265625, 0.10003662109375, 0.1053466796875, 0.11065673828125, 0.115966796875, 0.12127685546875, 0.1265869140625, 0.13189697265625, 0.13720703125, 0.14251708984375, 0.1478271484375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 0.0, 6.0, 4.0, 12.0, 15.0, 17.0, 17.0, 48.0, 94.0, 87.0, 120.0, 116.0, 123.0, 96.0, 88.0, 62.0, 38.0, 23.0, 14.0, 9.0, 8.0, 7.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6215534806251526, -0.5973003506660461, -0.5730472207069397, -0.548794150352478, -0.5245410203933716, -0.5002878904342651, -0.4760347604751587, -0.45178163051605225, -0.4275285303592682, -0.40327540040016174, -0.3790223002433777, -0.35476917028427124, -0.3305160403251648, -0.30626294016838074, -0.2820098102092743, -0.25775671005249023, -0.2335035800933838, -0.20925046503543854, -0.1849973499774933, -0.16074422001838684, -0.1364911049604416, -0.11223798990249634, -0.08798485994338989, -0.06373174488544464, -0.03947862982749939, -0.01522551104426384, 0.00902760773897171, 0.03328073024749756, 0.05753384530544281, 0.08178696036338806, 0.1060400903224945, 0.13029320538043976, 0.154546320438385, 0.17879943549633026, 0.2030525505542755, 0.22730568051338196, 0.251558780670166, 0.27581191062927246, 0.3000650405883789, 0.32431817054748535, 0.3485712707042694, 0.37282440066337585, 0.3970775008201599, 0.42133063077926636, 0.4455837607383728, 0.46983686089515686, 0.4940899908542633, 0.5183430910110474, 0.5425962209701538, 0.5668493509292603, 0.5911024808883667, 0.6153556108474731, 0.6396086812019348, 0.6638618111610413, 0.6881149411201477, 0.7123680710792542, 0.7366211414337158, 0.7608742713928223, 0.7851274013519287, 0.8093805313110352, 0.8336336016654968, 0.8578867316246033, 0.8821398615837097, 0.9063929915428162, 0.9306461215019226]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 4.0, 4.0, 5.0, 11.0, 5.0, 11.0, 15.0, 17.0, 12.0, 16.0, 17.0, 20.0, 32.0, 31.0, 35.0, 22.0, 32.0, 41.0, 28.0, 35.0, 44.0, 44.0, 41.0, 42.0, 32.0, 49.0, 39.0, 44.0, 34.0, 27.0, 28.0, 18.0, 28.0, 19.0, 19.0, 18.0, 13.0, 12.0, 11.0, 9.0, 11.0, 7.0, 1.0, 5.0, 2.0, 4.0, 2.0, 4.0, 1.0, 1.0, 2.0, 3.0], "bins": [-0.3360586166381836, -0.3264901638031006, -0.3169217109680176, -0.30735328793525696, -0.29778483510017395, -0.28821638226509094, -0.27864792943000793, -0.2690794765949249, -0.2595110535621643, -0.2499426007270813, -0.24037416279315948, -0.23080570995807648, -0.22123727202415466, -0.21166881918907166, -0.20210036635398865, -0.19253191351890564, -0.18296346068382263, -0.17339500784873962, -0.1638265699148178, -0.1542581170797348, -0.144689679145813, -0.13512122631072998, -0.12555277347564697, -0.11598432809114456, -0.10641588270664215, -0.09684743732213974, -0.08727899193763733, -0.07771053910255432, -0.06814209371805191, -0.0585736483335495, -0.04900519922375679, -0.03943675011396408, -0.02986830472946167, -0.02029985748231411, -0.01073141023516655, -0.0011629629880189896, 0.00840548425912857, 0.01797392964363098, 0.02754237875342369, 0.0371108278632164, 0.04667927324771881, 0.05624771863222122, 0.06581616401672363, 0.07538461685180664, 0.08495306223630905, 0.09452150762081146, 0.10408996045589447, 0.11365840584039688, 0.12322685122489929, 0.1327953040599823, 0.1423637419939041, 0.15193219482898712, 0.16150063276290894, 0.17106908559799194, 0.18063753843307495, 0.19020599126815796, 0.19977442920207977, 0.20934288203716278, 0.2189113199710846, 0.2284797728061676, 0.2380482256412506, 0.24761666357517242, 0.25718510150909424, 0.26675355434417725, 0.27632200717926025]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 0.0, 3.0, 7.0, 9.0, 13.0, 21.0, 34.0, 23.0, 42.0, 66.0, 110.0, 158.0, 291.0, 608.0, 1482.0, 3967.0, 12130.0, 41339.0, 160637.0, 441022.0, 281229.0, 74517.0, 20375.0, 6348.0, 2282.0, 859.0, 402.0, 210.0, 97.0, 68.0, 56.0, 30.0, 25.0, 20.0, 14.0, 18.0, 8.0, 9.0, 6.0, 5.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0694580078125, -0.06703948974609375, -0.0646209716796875, -0.06220245361328125, -0.059783935546875, -0.05736541748046875, -0.0549468994140625, -0.05252838134765625, -0.05010986328125, -0.04769134521484375, -0.0452728271484375, -0.04285430908203125, -0.040435791015625, -0.03801727294921875, -0.0355987548828125, -0.03318023681640625, -0.03076171875, -0.02834320068359375, -0.0259246826171875, -0.02350616455078125, -0.021087646484375, -0.01866912841796875, -0.0162506103515625, -0.01383209228515625, -0.01141357421875, -0.00899505615234375, -0.0065765380859375, -0.00415802001953125, -0.001739501953125, 0.00067901611328125, 0.0030975341796875, 0.00551605224609375, 0.0079345703125, 0.01035308837890625, 0.0127716064453125, 0.01519012451171875, 0.017608642578125, 0.02002716064453125, 0.0224456787109375, 0.02486419677734375, 0.02728271484375, 0.02970123291015625, 0.0321197509765625, 0.03453826904296875, 0.036956787109375, 0.03937530517578125, 0.0417938232421875, 0.04421234130859375, 0.046630859375, 0.04904937744140625, 0.0514678955078125, 0.05388641357421875, 0.056304931640625, 0.05872344970703125, 0.0611419677734375, 0.06356048583984375, 0.06597900390625, 0.06839752197265625, 0.0708160400390625, 0.07323455810546875, 0.075653076171875, 0.07807159423828125, 0.0804901123046875, 0.08290863037109375, 0.0853271484375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 4.0, 8.0, 8.0, 11.0, 14.0, 27.0, 33.0, 32.0, 42.0, 67.0, 58.0, 68.0, 85.0, 82.0, 90.0, 70.0, 60.0, 49.0, 51.0, 39.0, 32.0, 19.0, 24.0, 7.0, 8.0, 8.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.426513671875, -0.41339874267578125, -0.4002838134765625, -0.38716888427734375, -0.374053955078125, -0.36093902587890625, -0.3478240966796875, -0.33470916748046875, -0.32159423828125, -0.30847930908203125, -0.2953643798828125, -0.28224945068359375, -0.269134521484375, -0.25601959228515625, -0.2429046630859375, -0.22978973388671875, -0.2166748046875, -0.20355987548828125, -0.1904449462890625, -0.17733001708984375, -0.164215087890625, -0.15110015869140625, -0.1379852294921875, -0.12487030029296875, -0.11175537109375, -0.09864044189453125, -0.0855255126953125, -0.07241058349609375, -0.059295654296875, -0.04618072509765625, -0.0330657958984375, -0.01995086669921875, -0.0068359375, 0.00627899169921875, 0.0193939208984375, 0.03250885009765625, 0.045623779296875, 0.05873870849609375, 0.0718536376953125, 0.08496856689453125, 0.09808349609375, 0.11119842529296875, 0.1243133544921875, 0.13742828369140625, 0.150543212890625, 0.16365814208984375, 0.1767730712890625, 0.18988800048828125, 0.2030029296875, 0.21611785888671875, 0.2292327880859375, 0.24234771728515625, 0.255462646484375, 0.26857757568359375, 0.2816925048828125, 0.29480743408203125, 0.30792236328125, 0.32103729248046875, 0.3341522216796875, 0.34726715087890625, 0.360382080078125, 0.37349700927734375, 0.3866119384765625, 0.39972686767578125, 0.412841796875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 4.0, 5.0, 7.0, 13.0, 10.0, 29.0, 29.0, 41.0, 78.0, 107.0, 151.0, 247.0, 452.0, 826.0, 1691.0, 3410.0, 7459.0, 17551.0, 45987.0, 126785.0, 293994.0, 315727.0, 145012.0, 52643.0, 20143.0, 8303.0, 3757.0, 1831.0, 924.0, 510.0, 295.0, 163.0, 124.0, 70.0, 45.0, 35.0, 28.0, 14.0, 17.0, 13.0, 16.0, 8.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.040252685546875, -0.03858041763305664, -0.03690814971923828, -0.03523588180541992, -0.03356361389160156, -0.0318913459777832, -0.030219078063964844, -0.028546810150146484, -0.026874542236328125, -0.025202274322509766, -0.023530006408691406, -0.021857738494873047, -0.020185470581054688, -0.018513202667236328, -0.01684093475341797, -0.01516866683959961, -0.01349639892578125, -0.01182413101196289, -0.010151863098144531, -0.008479595184326172, -0.0068073272705078125, -0.005135059356689453, -0.0034627914428710938, -0.0017905235290527344, -0.000118255615234375, 0.0015540122985839844, 0.0032262802124023438, 0.004898548126220703, 0.0065708160400390625, 0.008243083953857422, 0.009915351867675781, 0.01158761978149414, 0.0132598876953125, 0.01493215560913086, 0.01660442352294922, 0.018276691436767578, 0.019948959350585938, 0.021621227264404297, 0.023293495178222656, 0.024965763092041016, 0.026638031005859375, 0.028310298919677734, 0.029982566833496094, 0.03165483474731445, 0.03332710266113281, 0.03499937057495117, 0.03667163848876953, 0.03834390640258789, 0.04001617431640625, 0.04168844223022461, 0.04336071014404297, 0.04503297805786133, 0.04670524597167969, 0.04837751388549805, 0.050049781799316406, 0.051722049713134766, 0.053394317626953125, 0.055066585540771484, 0.056738853454589844, 0.0584111213684082, 0.06008338928222656, 0.06175565719604492, 0.06342792510986328, 0.06510019302368164, 0.0667724609375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 6.0, 4.0, 5.0, 7.0, 11.0, 20.0, 18.0, 21.0, 9.0, 23.0, 20.0, 28.0, 23.0, 27.0, 22.0, 28.0, 28.0, 38.0, 36.0, 43.0, 42.0, 37.0, 36.0, 48.0, 39.0, 42.0, 30.0, 28.0, 42.0, 34.0, 23.0, 25.0, 30.0, 21.0, 14.0, 14.0, 19.0, 13.0, 6.0, 7.0, 5.0, 8.0, 4.0, 8.0, 6.0, 4.0, 1.0, 3.0, 3.0, 0.0, 2.0], "bins": [-0.453369140625, -0.4403266906738281, -0.42728424072265625, -0.4142417907714844, -0.4011993408203125, -0.3881568908691406, -0.37511444091796875, -0.3620719909667969, -0.349029541015625, -0.3359870910644531, -0.32294464111328125, -0.3099021911621094, -0.2968597412109375, -0.2838172912597656, -0.27077484130859375, -0.2577323913574219, -0.24468994140625, -0.23164749145507812, -0.21860504150390625, -0.20556259155273438, -0.1925201416015625, -0.17947769165039062, -0.16643524169921875, -0.15339279174804688, -0.140350341796875, -0.12730789184570312, -0.11426544189453125, -0.10122299194335938, -0.0881805419921875, -0.07513809204101562, -0.06209564208984375, -0.049053192138671875, -0.0360107421875, -0.022968292236328125, -0.00992584228515625, 0.003116607666015625, 0.0161590576171875, 0.029201507568359375, 0.04224395751953125, 0.055286407470703125, 0.068328857421875, 0.08137130737304688, 0.09441375732421875, 0.10745620727539062, 0.1204986572265625, 0.13354110717773438, 0.14658355712890625, 0.15962600708007812, 0.17266845703125, 0.18571090698242188, 0.19875335693359375, 0.21179580688476562, 0.2248382568359375, 0.23788070678710938, 0.25092315673828125, 0.2639656066894531, 0.277008056640625, 0.2900505065917969, 0.30309295654296875, 0.3161354064941406, 0.3291778564453125, 0.3422203063964844, 0.35526275634765625, 0.3683052062988281, 0.38134765625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 4.0, 6.0, 9.0, 5.0, 9.0, 22.0, 15.0, 18.0, 33.0, 47.0, 111.0, 173.0, 287.0, 483.0, 858.0, 1803.0, 3996.0, 10684.0, 35453.0, 156670.0, 484103.0, 268392.0, 58833.0, 15783.0, 5573.0, 2418.0, 1203.0, 633.0, 343.0, 203.0, 131.0, 89.0, 46.0, 45.0, 27.0, 23.0, 7.0, 7.0, 7.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.02655029296875, -0.025826454162597656, -0.025102615356445312, -0.02437877655029297, -0.023654937744140625, -0.02293109893798828, -0.022207260131835938, -0.021483421325683594, -0.02075958251953125, -0.020035743713378906, -0.019311904907226562, -0.01858806610107422, -0.017864227294921875, -0.01714038848876953, -0.016416549682617188, -0.015692710876464844, -0.0149688720703125, -0.014245033264160156, -0.013521194458007812, -0.012797355651855469, -0.012073516845703125, -0.011349678039550781, -0.010625839233398438, -0.009902000427246094, -0.00917816162109375, -0.008454322814941406, -0.0077304840087890625, -0.007006645202636719, -0.006282806396484375, -0.005558967590332031, -0.0048351287841796875, -0.004111289978027344, -0.003387451171875, -0.0026636123657226562, -0.0019397735595703125, -0.0012159347534179688, -0.000492095947265625, 0.00023174285888671875, 0.0009555816650390625, 0.0016794204711914062, 0.00240325927734375, 0.0031270980834960938, 0.0038509368896484375, 0.004574775695800781, 0.005298614501953125, 0.006022453308105469, 0.0067462921142578125, 0.007470130920410156, 0.0081939697265625, 0.008917808532714844, 0.009641647338867188, 0.010365486145019531, 0.011089324951171875, 0.011813163757324219, 0.012537002563476562, 0.013260841369628906, 0.01398468017578125, 0.014708518981933594, 0.015432357788085938, 0.01615619659423828, 0.016880035400390625, 0.01760387420654297, 0.018327713012695312, 0.019051551818847656, 0.019775390625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 5.0, 8.0, 19.0, 15.0, 28.0, 37.0, 48.0, 51.0, 86.0, 80.0, 104.0, 107.0, 81.0, 88.0, 62.0, 41.0, 45.0, 23.0, 22.0, 16.0, 3.0, 15.0, 6.0, 5.0, 1.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4066696166992188e-05, -1.3568438589572906e-05, -1.3070181012153625e-05, -1.2571923434734344e-05, -1.2073665857315063e-05, -1.1575408279895782e-05, -1.1077150702476501e-05, -1.057889312505722e-05, -1.008063554763794e-05, -9.582377970218658e-06, -9.084120392799377e-06, -8.585862815380096e-06, -8.087605237960815e-06, -7.5893476605415344e-06, -7.091090083122253e-06, -6.592832505702972e-06, -6.094574928283691e-06, -5.59631735086441e-06, -5.098059773445129e-06, -4.599802196025848e-06, -4.101544618606567e-06, -3.6032870411872864e-06, -3.1050294637680054e-06, -2.6067718863487244e-06, -2.1085143089294434e-06, -1.6102567315101624e-06, -1.1119991540908813e-06, -6.137415766716003e-07, -1.1548399925231934e-07, 3.8277357816696167e-07, 8.810311555862427e-07, 1.3792887330055237e-06, 1.8775463104248047e-06, 2.3758038878440857e-06, 2.8740614652633667e-06, 3.3723190426826477e-06, 3.870576620101929e-06, 4.36883419752121e-06, 4.867091774940491e-06, 5.365349352359772e-06, 5.863606929779053e-06, 6.361864507198334e-06, 6.860122084617615e-06, 7.358379662036896e-06, 7.856637239456177e-06, 8.354894816875458e-06, 8.853152394294739e-06, 9.35140997171402e-06, 9.8496675491333e-06, 1.0347925126552582e-05, 1.0846182703971863e-05, 1.1344440281391144e-05, 1.1842697858810425e-05, 1.2340955436229706e-05, 1.2839213013648987e-05, 1.3337470591068268e-05, 1.3835728168487549e-05, 1.433398574590683e-05, 1.483224332332611e-05, 1.5330500900745392e-05, 1.5828758478164673e-05, 1.6327016055583954e-05, 1.6825273633003235e-05, 1.7323531210422516e-05, 1.7821788787841797e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 4.0, 5.0, 7.0, 7.0, 7.0, 12.0, 19.0, 20.0, 29.0, 45.0, 67.0, 132.0, 185.0, 345.0, 722.0, 1556.0, 4466.0, 15375.0, 69882.0, 326642.0, 463226.0, 128542.0, 26243.0, 6783.0, 2200.0, 896.0, 465.0, 237.0, 163.0, 86.0, 55.0, 42.0, 27.0, 17.0, 17.0, 13.0, 4.0, 5.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02264404296875, -0.021868228912353516, -0.02109241485595703, -0.020316600799560547, -0.019540786743164062, -0.018764972686767578, -0.017989158630371094, -0.01721334457397461, -0.016437530517578125, -0.01566171646118164, -0.014885902404785156, -0.014110088348388672, -0.013334274291992188, -0.012558460235595703, -0.011782646179199219, -0.011006832122802734, -0.01023101806640625, -0.009455204010009766, -0.008679389953613281, -0.007903575897216797, -0.0071277618408203125, -0.006351947784423828, -0.005576133728027344, -0.004800319671630859, -0.004024505615234375, -0.0032486915588378906, -0.0024728775024414062, -0.0016970634460449219, -0.0009212493896484375, -0.00014543533325195312, 0.0006303787231445312, 0.0014061927795410156, 0.0021820068359375, 0.0029578208923339844, 0.0037336349487304688, 0.004509449005126953, 0.0052852630615234375, 0.006061077117919922, 0.006836891174316406, 0.007612705230712891, 0.008388519287109375, 0.00916433334350586, 0.009940147399902344, 0.010715961456298828, 0.011491775512695312, 0.012267589569091797, 0.013043403625488281, 0.013819217681884766, 0.01459503173828125, 0.015370845794677734, 0.01614665985107422, 0.016922473907470703, 0.017698287963867188, 0.018474102020263672, 0.019249916076660156, 0.02002573013305664, 0.020801544189453125, 0.02157735824584961, 0.022353172302246094, 0.023128986358642578, 0.023904800415039062, 0.024680614471435547, 0.02545642852783203, 0.026232242584228516, 0.027008056640625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 2.0, 3.0, 8.0, 6.0, 10.0, 17.0, 21.0, 22.0, 39.0, 55.0, 56.0, 70.0, 73.0, 94.0, 92.0, 79.0, 91.0, 76.0, 42.0, 54.0, 26.0, 19.0, 12.0, 15.0, 10.0, 6.0, 3.0, 1.0, 1.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0092620849609375, -0.00902026891708374, -0.00877845287322998, -0.00853663682937622, -0.008294820785522461, -0.008053004741668701, -0.007811188697814941, -0.007569372653961182, -0.007327556610107422, -0.007085740566253662, -0.006843924522399902, -0.006602108478546143, -0.006360292434692383, -0.006118476390838623, -0.005876660346984863, -0.0056348443031311035, -0.005393028259277344, -0.005151212215423584, -0.004909396171569824, -0.0046675801277160645, -0.004425764083862305, -0.004183948040008545, -0.003942131996154785, -0.0037003159523010254, -0.0034584999084472656, -0.003216683864593506, -0.002974867820739746, -0.0027330517768859863, -0.0024912357330322266, -0.002249419689178467, -0.002007603645324707, -0.0017657876014709473, -0.0015239715576171875, -0.0012821555137634277, -0.001040339469909668, -0.0007985234260559082, -0.0005567073822021484, -0.00031489133834838867, -7.30752944946289e-05, 0.00016874074935913086, 0.0004105567932128906, 0.0006523728370666504, 0.0008941888809204102, 0.00113600492477417, 0.0013778209686279297, 0.0016196370124816895, 0.0018614530563354492, 0.002103269100189209, 0.0023450851440429688, 0.0025869011878967285, 0.0028287172317504883, 0.003070533275604248, 0.003312349319458008, 0.0035541653633117676, 0.0037959814071655273, 0.004037797451019287, 0.004279613494873047, 0.004521429538726807, 0.004763245582580566, 0.005005061626434326, 0.005246877670288086, 0.005488693714141846, 0.0057305097579956055, 0.005972325801849365, 0.006214141845703125]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 8.0, 29.0, 40.0, 115.0, 229.0, 241.0, 200.0, 81.0, 33.0, 20.0, 7.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7753782272338867, -0.7435557842254639, -0.7117332816123962, -0.6799108386039734, -0.6480883359909058, -0.6162658929824829, -0.5844434499740601, -0.5526210069656372, -0.5207985043525696, -0.48897603154182434, -0.4571535587310791, -0.42533111572265625, -0.393508642911911, -0.36168617010116577, -0.3298637270927429, -0.2980412542819977, -0.26621878147125244, -0.2343963086605072, -0.20257385075092316, -0.1707513928413391, -0.13892892003059387, -0.10710644721984863, -0.07528398931026459, -0.04346153140068054, -0.011639058589935303, 0.02018340677022934, 0.05200587213039398, 0.08382833749055862, 0.11565080285072327, 0.1474732756614685, 0.17929573357105255, 0.2111181914806366, 0.24294066429138184, 0.2747631371021271, 0.3065856099128723, 0.33840805292129517, 0.3702305257320404, 0.40205299854278564, 0.4338754415512085, 0.46569791436195374, 0.497520387172699, 0.5293428301811218, 0.5611653327941895, 0.5929877758026123, 0.6248102188110352, 0.6566327214241028, 0.6884551644325256, 0.7202776670455933, 0.7521001100540161, 0.783922553062439, 0.8157450556755066, 0.8475674986839294, 0.8793900012969971, 0.9112124443054199, 0.9430348873138428, 0.9748573303222656, 1.0066797733306885, 1.0385022163391113, 1.0703246593475342, 1.1021472215652466, 1.1339696645736694, 1.1657921075820923, 1.1976145505905151, 1.229436993598938, 1.2612595558166504]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 2.0, 7.0, 5.0, 2.0, 5.0, 5.0, 9.0, 8.0, 22.0, 15.0, 17.0, 21.0, 21.0, 25.0, 45.0, 24.0, 34.0, 33.0, 44.0, 40.0, 48.0, 44.0, 44.0, 46.0, 45.0, 45.0, 45.0, 51.0, 34.0, 25.0, 29.0, 22.0, 24.0, 24.0, 21.0, 13.0, 13.0, 6.0, 9.0, 9.0, 6.0, 1.0, 3.0, 2.0, 2.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.2497846633195877, -0.2425040602684021, -0.2352234423160553, -0.2279428392648697, -0.2206622213125229, -0.21338161826133728, -0.20610100030899048, -0.19882039725780487, -0.19153979420661926, -0.18425919115543365, -0.17697857320308685, -0.16969797015190125, -0.16241735219955444, -0.15513674914836884, -0.14785614609718323, -0.14057552814483643, -0.13329491019248962, -0.12601430714130402, -0.11873368918895721, -0.1114530861377716, -0.1041724681854248, -0.0968918651342392, -0.08961125463247299, -0.08233064413070679, -0.07505003362894058, -0.06776942312717438, -0.06048881262540817, -0.053208205848932266, -0.04592759534716606, -0.03864698484539986, -0.03136637806892395, -0.024085767567157745, -0.016805142164230347, -0.009524532593786716, -0.0022439230233430862, 0.005036685615777969, 0.012317296117544174, 0.01959790661931038, 0.026878513395786285, 0.03415912389755249, 0.041439734399318695, 0.0487203449010849, 0.056000955402851105, 0.06328156590461731, 0.07056216895580292, 0.07784278690814972, 0.08512338995933533, 0.09240400046110153, 0.09968461096286774, 0.10696522146463394, 0.11424583196640015, 0.12152643501758575, 0.12880705296993256, 0.13608765602111816, 0.14336827397346497, 0.15064887702465057, 0.15792948007583618, 0.1652100831270218, 0.1724907010793686, 0.1797713041305542, 0.187051922082901, 0.1943325251340866, 0.20161312818527222, 0.20889374613761902, 0.21617436408996582]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 2.0, 5.0, 9.0, 13.0, 16.0, 16.0, 28.0, 39.0, 75.0, 92.0, 134.0, 242.0, 362.0, 577.0, 1018.0, 1968.0, 3805.0, 9002.0, 30185.0, 224484.0, 679510.0, 70076.0, 15213.0, 5574.0, 2665.0, 1366.0, 830.0, 449.0, 283.0, 163.0, 101.0, 72.0, 61.0, 29.0, 32.0, 22.0, 12.0, 8.0, 6.0, 5.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.363525390625, -0.35065460205078125, -0.3377838134765625, -0.32491302490234375, -0.312042236328125, -0.29917144775390625, -0.2863006591796875, -0.27342987060546875, -0.26055908203125, -0.24768829345703125, -0.2348175048828125, -0.22194671630859375, -0.209075927734375, -0.19620513916015625, -0.1833343505859375, -0.17046356201171875, -0.1575927734375, -0.14472198486328125, -0.1318511962890625, -0.11898040771484375, -0.106109619140625, -0.09323883056640625, -0.0803680419921875, -0.06749725341796875, -0.05462646484375, -0.04175567626953125, -0.0288848876953125, -0.01601409912109375, -0.003143310546875, 0.00972747802734375, 0.0225982666015625, 0.03546905517578125, 0.04833984375, 0.06121063232421875, 0.0740814208984375, 0.08695220947265625, 0.099822998046875, 0.11269378662109375, 0.1255645751953125, 0.13843536376953125, 0.15130615234375, 0.16417694091796875, 0.1770477294921875, 0.18991851806640625, 0.202789306640625, 0.21566009521484375, 0.2285308837890625, 0.24140167236328125, 0.2542724609375, 0.26714324951171875, 0.2800140380859375, 0.29288482666015625, 0.305755615234375, 0.31862640380859375, 0.3314971923828125, 0.34436798095703125, 0.35723876953125, 0.37010955810546875, 0.3829803466796875, 0.39585113525390625, 0.408721923828125, 0.42159271240234375, 0.4344635009765625, 0.44733428955078125, 0.460205078125]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 3.0, 1.0, 2.0, 1.0, 3.0, 6.0, 4.0, 4.0, 9.0, 10.0, 12.0, 10.0, 19.0, 15.0, 17.0, 21.0, 34.0, 27.0, 36.0, 40.0, 51.0, 39.0, 42.0, 37.0, 43.0, 48.0, 57.0, 41.0, 40.0, 51.0, 39.0, 48.0, 27.0, 13.0, 31.0, 25.0, 22.0, 19.0, 12.0, 14.0, 6.0, 8.0, 3.0, 3.0, 3.0, 3.0, 3.0, 3.0, 1.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42333984375, -0.40883636474609375, -0.3943328857421875, -0.37982940673828125, -0.365325927734375, -0.35082244873046875, -0.3363189697265625, -0.32181549072265625, -0.30731201171875, -0.29280853271484375, -0.2783050537109375, -0.26380157470703125, -0.249298095703125, -0.23479461669921875, -0.2202911376953125, -0.20578765869140625, -0.1912841796875, -0.17678070068359375, -0.1622772216796875, -0.14777374267578125, -0.133270263671875, -0.11876678466796875, -0.1042633056640625, -0.08975982666015625, -0.07525634765625, -0.06075286865234375, -0.0462493896484375, -0.03174591064453125, -0.017242431640625, -0.00273895263671875, 0.0117645263671875, 0.02626800537109375, 0.040771484375, 0.05527496337890625, 0.0697784423828125, 0.08428192138671875, 0.098785400390625, 0.11328887939453125, 0.1277923583984375, 0.14229583740234375, 0.15679931640625, 0.17130279541015625, 0.1858062744140625, 0.20030975341796875, 0.214813232421875, 0.22931671142578125, 0.2438201904296875, 0.25832366943359375, 0.2728271484375, 0.28733062744140625, 0.3018341064453125, 0.31633758544921875, 0.330841064453125, 0.34534454345703125, 0.3598480224609375, 0.37435150146484375, 0.38885498046875, 0.40335845947265625, 0.4178619384765625, 0.43236541748046875, 0.446868896484375, 0.46137237548828125, 0.4758758544921875, 0.49037933349609375, 0.5048828125]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 5.0, 1.0, 8.0, 6.0, 10.0, 20.0, 30.0, 36.0, 78.0, 115.0, 277.0, 739.0, 2146.0, 9324.0, 193624.0, 818968.0, 18261.0, 3216.0, 963.0, 368.0, 144.0, 84.0, 51.0, 24.0, 16.0, 9.0, 5.0, 4.0, 7.0, 2.0, 1.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.65771484375, -0.635162353515625, -0.61260986328125, -0.590057373046875, -0.5675048828125, -0.544952392578125, -0.52239990234375, -0.499847412109375, -0.477294921875, -0.454742431640625, -0.43218994140625, -0.409637451171875, -0.3870849609375, -0.364532470703125, -0.34197998046875, -0.319427490234375, -0.296875, -0.274322509765625, -0.25177001953125, -0.229217529296875, -0.2066650390625, -0.184112548828125, -0.16156005859375, -0.139007568359375, -0.116455078125, -0.093902587890625, -0.07135009765625, -0.048797607421875, -0.0262451171875, -0.003692626953125, 0.01885986328125, 0.041412353515625, 0.06396484375, 0.086517333984375, 0.10906982421875, 0.131622314453125, 0.1541748046875, 0.176727294921875, 0.19927978515625, 0.221832275390625, 0.244384765625, 0.266937255859375, 0.28948974609375, 0.312042236328125, 0.3345947265625, 0.357147216796875, 0.37969970703125, 0.402252197265625, 0.4248046875, 0.447357177734375, 0.46990966796875, 0.492462158203125, 0.5150146484375, 0.537567138671875, 0.56011962890625, 0.582672119140625, 0.605224609375, 0.627777099609375, 0.65032958984375, 0.672882080078125, 0.6954345703125, 0.717987060546875, 0.74053955078125, 0.763092041015625, 0.78564453125]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 1.0, 2.0, 3.0, 2.0, 7.0, 5.0, 9.0, 9.0, 9.0, 12.0, 9.0, 13.0, 25.0, 31.0, 21.0, 23.0, 28.0, 41.0, 40.0, 36.0, 41.0, 49.0, 51.0, 43.0, 51.0, 54.0, 50.0, 44.0, 43.0, 32.0, 30.0, 35.0, 37.0, 19.0, 20.0, 11.0, 15.0, 14.0, 13.0, 8.0, 8.0, 5.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5341796875, -0.5160980224609375, -0.498016357421875, -0.4799346923828125, -0.46185302734375, -0.4437713623046875, -0.425689697265625, -0.4076080322265625, -0.3895263671875, -0.3714447021484375, -0.353363037109375, -0.3352813720703125, -0.31719970703125, -0.2991180419921875, -0.281036376953125, -0.2629547119140625, -0.244873046875, -0.2267913818359375, -0.208709716796875, -0.1906280517578125, -0.17254638671875, -0.1544647216796875, -0.136383056640625, -0.1183013916015625, -0.1002197265625, -0.0821380615234375, -0.064056396484375, -0.0459747314453125, -0.02789306640625, -0.0098114013671875, 0.008270263671875, 0.0263519287109375, 0.04443359375, 0.0625152587890625, 0.080596923828125, 0.0986785888671875, 0.11676025390625, 0.1348419189453125, 0.152923583984375, 0.1710052490234375, 0.1890869140625, 0.2071685791015625, 0.225250244140625, 0.2433319091796875, 0.26141357421875, 0.2794952392578125, 0.297576904296875, 0.3156585693359375, 0.333740234375, 0.3518218994140625, 0.369903564453125, 0.3879852294921875, 0.40606689453125, 0.4241485595703125, 0.442230224609375, 0.4603118896484375, 0.4783935546875, 0.4964752197265625, 0.514556884765625, 0.5326385498046875, 0.55072021484375, 0.5688018798828125, 0.586883544921875, 0.6049652099609375, 0.623046875]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 3.0, 2.0, 1.0, 2.0, 4.0, 1.0, 5.0, 11.0, 15.0, 39.0, 62.0, 178.0, 572.0, 2915.0, 51029.0, 971190.0, 20024.0, 1833.0, 388.0, 149.0, 58.0, 31.0, 15.0, 5.0, 5.0, 5.0, 3.0, 5.0, 1.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.352294921875, -0.3384132385253906, -0.32453155517578125, -0.3106498718261719, -0.2967681884765625, -0.2828865051269531, -0.26900482177734375, -0.2551231384277344, -0.241241455078125, -0.22735977172851562, -0.21347808837890625, -0.19959640502929688, -0.1857147216796875, -0.17183303833007812, -0.15795135498046875, -0.14406967163085938, -0.13018798828125, -0.11630630493164062, -0.10242462158203125, -0.08854293823242188, -0.0746612548828125, -0.060779571533203125, -0.04689788818359375, -0.033016204833984375, -0.019134521484375, -0.005252838134765625, 0.00862884521484375, 0.022510528564453125, 0.0363922119140625, 0.050273895263671875, 0.06415557861328125, 0.07803726196289062, 0.0919189453125, 0.10580062866210938, 0.11968231201171875, 0.13356399536132812, 0.1474456787109375, 0.16132736206054688, 0.17520904541015625, 0.18909072875976562, 0.202972412109375, 0.21685409545898438, 0.23073577880859375, 0.24461746215820312, 0.2584991455078125, 0.2723808288574219, 0.28626251220703125, 0.3001441955566406, 0.31402587890625, 0.3279075622558594, 0.34178924560546875, 0.3556709289550781, 0.3695526123046875, 0.3834342956542969, 0.39731597900390625, 0.4111976623535156, 0.425079345703125, 0.4389610290527344, 0.45284271240234375, 0.4667243957519531, 0.4806060791015625, 0.4944877624511719, 0.5083694458007812, 0.5222511291503906, 0.5361328125]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 4.0, 5.0, 5.0, 15.0, 9.0, 23.0, 20.0, 47.0, 57.0, 87.0, 154.0, 180.0, 142.0, 82.0, 59.0, 49.0, 17.0, 13.0, 12.0, 7.0, 6.0, 1.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.910064697265625e-05, -3.810971975326538e-05, -3.711879253387451e-05, -3.612786531448364e-05, -3.5136938095092773e-05, -3.4146010875701904e-05, -3.3155083656311035e-05, -3.2164156436920166e-05, -3.11732292175293e-05, -3.0182301998138428e-05, -2.919137477874756e-05, -2.820044755935669e-05, -2.720952033996582e-05, -2.621859312057495e-05, -2.5227665901184082e-05, -2.4236738681793213e-05, -2.3245811462402344e-05, -2.2254884243011475e-05, -2.1263957023620605e-05, -2.0273029804229736e-05, -1.9282102584838867e-05, -1.8291175365447998e-05, -1.730024814605713e-05, -1.630932092666626e-05, -1.531839370727539e-05, -1.4327466487884521e-05, -1.3336539268493652e-05, -1.2345612049102783e-05, -1.1354684829711914e-05, -1.0363757610321045e-05, -9.372830390930176e-06, -8.381903171539307e-06, -7.3909759521484375e-06, -6.400048732757568e-06, -5.409121513366699e-06, -4.41819429397583e-06, -3.427267074584961e-06, -2.436339855194092e-06, -1.4454126358032227e-06, -4.544854164123535e-07, 5.364418029785156e-07, 1.5273690223693848e-06, 2.518296241760254e-06, 3.509223461151123e-06, 4.500150680541992e-06, 5.491077899932861e-06, 6.4820051193237305e-06, 7.4729323387146e-06, 8.463859558105469e-06, 9.454786777496338e-06, 1.0445713996887207e-05, 1.1436641216278076e-05, 1.2427568435668945e-05, 1.3418495655059814e-05, 1.4409422874450684e-05, 1.5400350093841553e-05, 1.6391277313232422e-05, 1.738220453262329e-05, 1.837313175201416e-05, 1.936405897140503e-05, 2.03549861907959e-05, 2.1345913410186768e-05, 2.2336840629577637e-05, 2.3327767848968506e-05, 2.4318695068359375e-05]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 1.0, 3.0, 5.0, 3.0, 15.0, 14.0, 26.0, 43.0, 96.0, 205.0, 469.0, 1301.0, 4921.0, 61194.0, 943611.0, 31176.0, 3633.0, 1057.0, 402.0, 154.0, 81.0, 47.0, 25.0, 16.0, 10.0, 13.0, 10.0, 6.0, 2.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.52001953125, -0.5071487426757812, -0.4942779541015625, -0.48140716552734375, -0.468536376953125, -0.45566558837890625, -0.4427947998046875, -0.42992401123046875, -0.41705322265625, -0.40418243408203125, -0.3913116455078125, -0.37844085693359375, -0.365570068359375, -0.35269927978515625, -0.3398284912109375, -0.32695770263671875, -0.3140869140625, -0.30121612548828125, -0.2883453369140625, -0.27547454833984375, -0.262603759765625, -0.24973297119140625, -0.2368621826171875, -0.22399139404296875, -0.21112060546875, -0.19824981689453125, -0.1853790283203125, -0.17250823974609375, -0.159637451171875, -0.14676666259765625, -0.1338958740234375, -0.12102508544921875, -0.108154296875, -0.09528350830078125, -0.0824127197265625, -0.06954193115234375, -0.056671142578125, -0.04380035400390625, -0.0309295654296875, -0.01805877685546875, -0.00518798828125, 0.00768280029296875, 0.0205535888671875, 0.03342437744140625, 0.046295166015625, 0.05916595458984375, 0.0720367431640625, 0.08490753173828125, 0.0977783203125, 0.11064910888671875, 0.1235198974609375, 0.13639068603515625, 0.149261474609375, 0.16213226318359375, 0.1750030517578125, 0.18787384033203125, 0.20074462890625, 0.21361541748046875, 0.2264862060546875, 0.23935699462890625, 0.252227783203125, 0.26509857177734375, 0.2779693603515625, 0.29084014892578125, 0.3037109375]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 3.0, 2.0, 6.0, 10.0, 16.0, 13.0, 27.0, 19.0, 38.0, 62.0, 100.0, 232.0, 201.0, 93.0, 49.0, 37.0, 27.0, 24.0, 12.0, 9.0, 5.0, 3.0, 8.0, 2.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.080322265625, -0.07695960998535156, -0.07359695434570312, -0.07023429870605469, -0.06687164306640625, -0.06350898742675781, -0.060146331787109375, -0.05678367614746094, -0.0534210205078125, -0.05005836486816406, -0.046695709228515625, -0.04333305358886719, -0.03997039794921875, -0.03660774230957031, -0.033245086669921875, -0.029882431030273438, -0.026519775390625, -0.023157119750976562, -0.019794464111328125, -0.016431808471679688, -0.01306915283203125, -0.009706497192382812, -0.006343841552734375, -0.0029811859130859375, 0.0003814697265625, 0.0037441253662109375, 0.007106781005859375, 0.010469436645507812, 0.01383209228515625, 0.017194747924804688, 0.020557403564453125, 0.023920059204101562, 0.02728271484375, 0.030645370483398438, 0.034008026123046875, 0.03737068176269531, 0.04073333740234375, 0.04409599304199219, 0.047458648681640625, 0.05082130432128906, 0.0541839599609375, 0.05754661560058594, 0.060909271240234375, 0.06427192687988281, 0.06763458251953125, 0.07099723815917969, 0.07435989379882812, 0.07772254943847656, 0.081085205078125, 0.08444786071777344, 0.08781051635742188, 0.09117317199707031, 0.09453582763671875, 0.09789848327636719, 0.10126113891601562, 0.10462379455566406, 0.1079864501953125, 0.11134910583496094, 0.11471176147460938, 0.11807441711425781, 0.12143707275390625, 0.12479972839355469, 0.12816238403320312, 0.13152503967285156, 0.1348876953125]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 11.0, 29.0, 51.0, 165.0, 292.0, 253.0, 121.0, 38.0, 25.0, 13.0, 6.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.731217861175537, -1.661611795425415, -1.592005729675293, -1.522399663925171, -1.4527935981750488, -1.3831875324249268, -1.3135814666748047, -1.2439754009246826, -1.1743693351745605, -1.1047632694244385, -1.0351572036743164, -0.9655511379241943, -0.8959450721740723, -0.8263390064239502, -0.7567330002784729, -0.6871269345283508, -0.6175209283828735, -0.5479148626327515, -0.4783087968826294, -0.4087027609348297, -0.33909669518470764, -0.26949062943458557, -0.1998845934867859, -0.13027852773666382, -0.06067246198654175, 0.008933596312999725, 0.0785396546125412, 0.14814570546150208, 0.21775177121162415, 0.2873578369617462, 0.3569638729095459, 0.42656993865966797, 0.49617600440979004, 0.5657820701599121, 0.6353881359100342, 0.7049942016601562, 0.7746002674102783, 0.8442063331604004, 0.9138123393058777, 0.9834184050559998, 1.0530245304107666, 1.1226305961608887, 1.1922366619110107, 1.2618427276611328, 1.3314487934112549, 1.401054859161377, 1.470660924911499, 1.540266990661621, 1.6098729372024536, 1.6794790029525757, 1.7490850687026978, 1.8186911344528198, 1.888297200202942, 1.957903265953064, 2.0275092124938965, 2.0971152782440186, 2.1667213439941406, 2.2363274097442627, 2.3059334754943848, 2.375539541244507, 2.445145606994629, 2.514751672744751, 2.584357738494873, 2.653963804244995, 2.723569869995117]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 1.0, 3.0, 7.0, 3.0, 3.0, 6.0, 8.0, 9.0, 10.0, 14.0, 16.0, 12.0, 18.0, 20.0, 17.0, 20.0, 34.0, 30.0, 32.0, 21.0, 50.0, 26.0, 22.0, 45.0, 44.0, 37.0, 40.0, 36.0, 38.0, 42.0, 37.0, 26.0, 35.0, 29.0, 30.0, 28.0, 15.0, 23.0, 22.0, 16.0, 13.0, 13.0, 12.0, 11.0, 7.0, 5.0, 4.0, 1.0, 9.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.8226771354675293, -0.7981719374656677, -0.7736666798591614, -0.7491614818572998, -0.7246562242507935, -0.7001510262489319, -0.6756458282470703, -0.651140570640564, -0.6266353726387024, -0.6021301746368408, -0.5776249170303345, -0.5531197190284729, -0.5286145210266113, -0.504109263420105, -0.4796040654182434, -0.45509883761405945, -0.4305936098098755, -0.40608838200569153, -0.38158315420150757, -0.357077956199646, -0.33257272839546204, -0.3080675005912781, -0.2835623025894165, -0.25905707478523254, -0.23455184698104858, -0.21004661917686462, -0.18554140627384186, -0.1610361933708191, -0.13653096556663513, -0.11202574521303177, -0.0875205248594284, -0.06301531195640564, -0.038510143756866455, -0.014004923403263092, 0.010500296950340271, 0.035005517303943634, 0.059510737657547, 0.08401595801115036, 0.10852117836475372, 0.1330263912677765, 0.15753161907196045, 0.1820368468761444, 0.20654205977916718, 0.23104727268218994, 0.2555525004863739, 0.28005772829055786, 0.30456292629241943, 0.3290681540966034, 0.35357338190078735, 0.3780786097049713, 0.4025838375091553, 0.42708903551101685, 0.4515942633152008, 0.47609949111938477, 0.5006046891212463, 0.5251098871231079, 0.5496151447296143, 0.5741203427314758, 0.5986256003379822, 0.6231307983398438, 0.6476360559463501, 0.6721412539482117, 0.6966464519500732, 0.7211517095565796, 0.7456569075584412]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 7.0, 9.0, 11.0, 18.0, 20.0, 53.0, 74.0, 177.0, 309.0, 835.0, 2211.0, 8258.0, 65724.0, 3036684.0, 1043191.0, 29026.0, 5113.0, 1485.0, 569.0, 227.0, 117.0, 59.0, 37.0, 17.0, 10.0, 13.0, 5.0, 6.0, 3.0, 0.0, 3.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.8955078125, -0.8664779663085938, -0.8374481201171875, -0.8084182739257812, -0.779388427734375, -0.7503585815429688, -0.7213287353515625, -0.6922988891601562, -0.66326904296875, -0.6342391967773438, -0.6052093505859375, -0.5761795043945312, -0.547149658203125, -0.5181198120117188, -0.4890899658203125, -0.46006011962890625, -0.4310302734375, -0.40200042724609375, -0.3729705810546875, -0.34394073486328125, -0.314910888671875, -0.28588104248046875, -0.2568511962890625, -0.22782135009765625, -0.19879150390625, -0.16976165771484375, -0.1407318115234375, -0.11170196533203125, -0.082672119140625, -0.05364227294921875, -0.0246124267578125, 0.00441741943359375, 0.033447265625, 0.06247711181640625, 0.0915069580078125, 0.12053680419921875, 0.149566650390625, 0.17859649658203125, 0.2076263427734375, 0.23665618896484375, 0.26568603515625, 0.29471588134765625, 0.3237457275390625, 0.35277557373046875, 0.381805419921875, 0.41083526611328125, 0.4398651123046875, 0.46889495849609375, 0.4979248046875, 0.5269546508789062, 0.5559844970703125, 0.5850143432617188, 0.614044189453125, 0.6430740356445312, 0.6721038818359375, 0.7011337280273438, 0.73016357421875, 0.7591934204101562, 0.7882232666015625, 0.8172531127929688, 0.846282958984375, 0.8753128051757812, 0.9043426513671875, 0.9333724975585938, 0.96240234375]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 7.0, 3.0, 3.0, 6.0, 5.0, 15.0, 12.0, 13.0, 20.0, 25.0, 23.0, 29.0, 30.0, 35.0, 30.0, 38.0, 41.0, 59.0, 53.0, 46.0, 45.0, 53.0, 43.0, 54.0, 41.0, 38.0, 41.0, 36.0, 29.0, 26.0, 25.0, 12.0, 15.0, 12.0, 7.0, 6.0, 5.0, 4.0, 5.0, 6.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.265869140625, -0.2570304870605469, -0.24819183349609375, -0.23935317993164062, -0.2305145263671875, -0.22167587280273438, -0.21283721923828125, -0.20399856567382812, -0.195159912109375, -0.18632125854492188, -0.17748260498046875, -0.16864395141601562, -0.1598052978515625, -0.15096664428710938, -0.14212799072265625, -0.13328933715820312, -0.12445068359375, -0.11561203002929688, -0.10677337646484375, -0.09793472290039062, -0.0890960693359375, -0.08025741577148438, -0.07141876220703125, -0.06258010864257812, -0.053741455078125, -0.044902801513671875, -0.03606414794921875, -0.027225494384765625, -0.0183868408203125, -0.009548187255859375, -0.00070953369140625, 0.008129119873046875, 0.0169677734375, 0.025806427001953125, 0.03464508056640625, 0.043483734130859375, 0.0523223876953125, 0.061161041259765625, 0.06999969482421875, 0.07883834838867188, 0.087677001953125, 0.09651565551757812, 0.10535430908203125, 0.11419296264648438, 0.1230316162109375, 0.13187026977539062, 0.14070892333984375, 0.14954757690429688, 0.15838623046875, 0.16722488403320312, 0.17606353759765625, 0.18490219116210938, 0.1937408447265625, 0.20257949829101562, 0.21141815185546875, 0.22025680541992188, 0.229095458984375, 0.23793411254882812, 0.24677276611328125, 0.2556114196777344, 0.2644500732421875, 0.2732887268066406, 0.28212738037109375, 0.2909660339355469, 0.2998046875]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 7.0, 4.0, 4.0, 5.0, 7.0, 6.0, 15.0, 15.0, 22.0, 34.0, 46.0, 51.0, 89.0, 125.0, 271.0, 390.0, 857.0, 2170.0, 6318.0, 28099.0, 278861.0, 3612183.0, 229796.0, 25331.0, 5907.0, 1929.0, 755.0, 423.0, 200.0, 120.0, 78.0, 47.0, 39.0, 19.0, 16.0, 18.0, 7.0, 7.0, 2.0, 3.0, 3.0, 5.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.71728515625, -0.6981430053710938, -0.6790008544921875, -0.6598587036132812, -0.640716552734375, -0.6215744018554688, -0.6024322509765625, -0.5832901000976562, -0.56414794921875, -0.5450057983398438, -0.5258636474609375, -0.5067214965820312, -0.487579345703125, -0.46843719482421875, -0.4492950439453125, -0.43015289306640625, -0.4110107421875, -0.39186859130859375, -0.3727264404296875, -0.35358428955078125, -0.334442138671875, -0.31529998779296875, -0.2961578369140625, -0.27701568603515625, -0.25787353515625, -0.23873138427734375, -0.2195892333984375, -0.20044708251953125, -0.181304931640625, -0.16216278076171875, -0.1430206298828125, -0.12387847900390625, -0.104736328125, -0.08559417724609375, -0.0664520263671875, -0.04730987548828125, -0.028167724609375, -0.00902557373046875, 0.0101165771484375, 0.02925872802734375, 0.04840087890625, 0.06754302978515625, 0.0866851806640625, 0.10582733154296875, 0.124969482421875, 0.14411163330078125, 0.1632537841796875, 0.18239593505859375, 0.2015380859375, 0.22068023681640625, 0.2398223876953125, 0.25896453857421875, 0.278106689453125, 0.29724884033203125, 0.3163909912109375, 0.33553314208984375, 0.35467529296875, 0.37381744384765625, 0.3929595947265625, 0.41210174560546875, 0.431243896484375, 0.45038604736328125, 0.4695281982421875, 0.48867034912109375, 0.5078125]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 9.0, 14.0, 14.0, 21.0, 35.0, 53.0, 73.0, 103.0, 207.0, 395.0, 661.0, 879.0, 663.0, 364.0, 203.0, 139.0, 67.0, 50.0, 31.0, 30.0, 13.0, 17.0, 6.0, 5.0, 9.0, 1.0, 3.0, 4.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17822265625, -0.1727313995361328, -0.16724014282226562, -0.16174888610839844, -0.15625762939453125, -0.15076637268066406, -0.14527511596679688, -0.1397838592529297, -0.1342926025390625, -0.1288013458251953, -0.12331008911132812, -0.11781883239746094, -0.11232757568359375, -0.10683631896972656, -0.10134506225585938, -0.09585380554199219, -0.090362548828125, -0.08487129211425781, -0.07938003540039062, -0.07388877868652344, -0.06839752197265625, -0.06290626525878906, -0.057415008544921875, -0.05192375183105469, -0.0464324951171875, -0.04094123840332031, -0.035449981689453125, -0.029958724975585938, -0.02446746826171875, -0.018976211547851562, -0.013484954833984375, -0.007993698120117188, -0.00250244140625, 0.0029888153076171875, 0.008480072021484375, 0.013971328735351562, 0.01946258544921875, 0.024953842163085938, 0.030445098876953125, 0.03593635559082031, 0.0414276123046875, 0.04691886901855469, 0.052410125732421875, 0.05790138244628906, 0.06339263916015625, 0.06888389587402344, 0.07437515258789062, 0.07986640930175781, 0.085357666015625, 0.09084892272949219, 0.09634017944335938, 0.10183143615722656, 0.10732269287109375, 0.11281394958496094, 0.11830520629882812, 0.12379646301269531, 0.1292877197265625, 0.1347789764404297, 0.14027023315429688, 0.14576148986816406, 0.15125274658203125, 0.15674400329589844, 0.16223526000976562, 0.1677265167236328, 0.1732177734375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 10.0, 11.0, 15.0, 16.0, 25.0, 37.0, 53.0, 81.0, 98.0, 99.0, 145.0, 105.0, 120.0, 57.0, 43.0, 32.0, 20.0, 14.0, 5.0, 6.0, 5.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5308326482772827, -0.5080342292785645, -0.4852357804775238, -0.46243736147880554, -0.4396389126777649, -0.41684049367904663, -0.39404207468032837, -0.3712436556816101, -0.34844520688056946, -0.3256467878818512, -0.30284833908081055, -0.2800499200820923, -0.257251501083374, -0.23445305228233337, -0.2116546332836151, -0.18885619938373566, -0.1660577654838562, -0.14325933158397675, -0.12046090513467789, -0.09766247868537903, -0.07486404478549957, -0.05206561088562012, -0.029267191886901855, -0.0064687579870224, 0.016329675912857056, 0.03912810608744621, 0.06192653626203537, 0.08472496271133423, 0.10752339661121368, 0.13032183051109314, 0.1531202495098114, 0.17591868340969086, 0.1987171173095703, 0.22151555120944977, 0.24431398510932922, 0.2671124041080475, 0.28991085290908813, 0.3127092719078064, 0.33550769090652466, 0.3583061099052429, 0.38110455870628357, 0.40390297770500183, 0.4267014265060425, 0.44949984550476074, 0.472298264503479, 0.49509671330451965, 0.5178951025009155, 0.5406935811042786, 0.5634920001029968, 0.5862904191017151, 0.6090888381004333, 0.6318873167037964, 0.6546857357025146, 0.6774841547012329, 0.7002825736999512, 0.7230809926986694, 0.7458794116973877, 0.768677830696106, 0.7914762496948242, 0.8142746686935425, 0.8370731472969055, 0.8598715662956238, 0.882669985294342, 0.9054684042930603, 0.9282668828964233]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 5.0, 4.0, 6.0, 4.0, 8.0, 7.0, 7.0, 12.0, 12.0, 13.0, 26.0, 23.0, 24.0, 33.0, 30.0, 46.0, 32.0, 38.0, 30.0, 30.0, 37.0, 37.0, 39.0, 46.0, 48.0, 41.0, 36.0, 42.0, 42.0, 34.0, 25.0, 26.0, 33.0, 23.0, 23.0, 20.0, 19.0, 10.0, 13.0, 10.0, 1.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.31847622990608215, -0.30862683057785034, -0.29877740144729614, -0.28892800211906433, -0.2790786027908325, -0.2692291736602783, -0.2593797743320465, -0.2495303601026535, -0.2396809458732605, -0.2298315316438675, -0.2199821174144745, -0.21013271808624268, -0.20028330385684967, -0.19043388962745667, -0.18058449029922485, -0.17073507606983185, -0.16088566184043884, -0.15103624761104584, -0.14118683338165283, -0.13133743405342102, -0.12148801982402802, -0.11163860559463501, -0.1017891988158226, -0.09193979203701019, -0.08209037780761719, -0.07224096357822418, -0.062391556799411774, -0.05254214629530907, -0.04269273579120636, -0.03284332528710365, -0.022993914783000946, -0.013144508004188538, -0.00329512357711792, 0.006554286926984787, 0.016403697431087494, 0.0262531079351902, 0.03610251843929291, 0.045951928943395615, 0.05580133944749832, 0.06565074622631073, 0.07550016045570374, 0.08534957468509674, 0.09519898146390915, 0.10504838824272156, 0.11489780247211456, 0.12474721670150757, 0.13459661602973938, 0.14444603025913239, 0.1542954444885254, 0.1641448587179184, 0.1739942729473114, 0.1838436722755432, 0.19369308650493622, 0.20354250073432922, 0.21339190006256104, 0.22324131429195404, 0.23309072852134705, 0.24294014275074005, 0.25278955698013306, 0.26263895630836487, 0.2724883556365967, 0.2823377847671509, 0.2921871840953827, 0.3020365834236145, 0.3118860125541687]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 4.0, 4.0, 3.0, 7.0, 0.0, 3.0, 10.0, 14.0, 31.0, 46.0, 138.0, 345.0, 923.0, 2830.0, 10380.0, 119000.0, 827631.0, 74976.0, 8535.0, 2364.0, 786.0, 275.0, 132.0, 51.0, 27.0, 17.0, 8.0, 5.0, 6.0, 4.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1671142578125, -0.16079139709472656, -0.15446853637695312, -0.1481456756591797, -0.14182281494140625, -0.1354999542236328, -0.12917709350585938, -0.12285423278808594, -0.1165313720703125, -0.11020851135253906, -0.10388565063476562, -0.09756278991699219, -0.09123992919921875, -0.08491706848144531, -0.07859420776367188, -0.07227134704589844, -0.065948486328125, -0.05962562561035156, -0.053302764892578125, -0.04697990417480469, -0.04065704345703125, -0.03433418273925781, -0.028011322021484375, -0.021688461303710938, -0.0153656005859375, -0.009042739868164062, -0.002719879150390625, 0.0036029815673828125, 0.00992584228515625, 0.016248703002929688, 0.022571563720703125, 0.028894424438476562, 0.03521728515625, 0.04154014587402344, 0.047863006591796875, 0.05418586730957031, 0.06050872802734375, 0.06683158874511719, 0.07315444946289062, 0.07947731018066406, 0.0858001708984375, 0.09212303161621094, 0.09844589233398438, 0.10476875305175781, 0.11109161376953125, 0.11741447448730469, 0.12373733520507812, 0.13006019592285156, 0.136383056640625, 0.14270591735839844, 0.14902877807617188, 0.1553516387939453, 0.16167449951171875, 0.1679973602294922, 0.17432022094726562, 0.18064308166503906, 0.1869659423828125, 0.19328880310058594, 0.19961166381835938, 0.2059345245361328, 0.21225738525390625, 0.2185802459716797, 0.22490310668945312, 0.23122596740722656, 0.237548828125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 6.0, 2.0, 7.0, 2.0, 7.0, 14.0, 15.0, 17.0, 23.0, 28.0, 39.0, 38.0, 35.0, 42.0, 54.0, 28.0, 49.0, 53.0, 43.0, 59.0, 52.0, 57.0, 48.0, 38.0, 36.0, 43.0, 23.0, 31.0, 21.0, 28.0, 20.0, 11.0, 12.0, 5.0, 3.0, 5.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0], "bins": [-0.291259765625, -0.2832679748535156, -0.27527618408203125, -0.2672843933105469, -0.2592926025390625, -0.2513008117675781, -0.24330902099609375, -0.23531723022460938, -0.227325439453125, -0.21933364868164062, -0.21134185791015625, -0.20335006713867188, -0.1953582763671875, -0.18736648559570312, -0.17937469482421875, -0.17138290405273438, -0.16339111328125, -0.15539932250976562, -0.14740753173828125, -0.13941574096679688, -0.1314239501953125, -0.12343215942382812, -0.11544036865234375, -0.10744857788085938, -0.099456787109375, -0.09146499633789062, -0.08347320556640625, -0.07548141479492188, -0.0674896240234375, -0.059497833251953125, -0.05150604248046875, -0.043514251708984375, -0.0355224609375, -0.027530670166015625, -0.01953887939453125, -0.011547088623046875, -0.0035552978515625, 0.004436492919921875, 0.01242828369140625, 0.020420074462890625, 0.028411865234375, 0.036403656005859375, 0.04439544677734375, 0.052387237548828125, 0.0603790283203125, 0.06837081909179688, 0.07636260986328125, 0.08435440063476562, 0.09234619140625, 0.10033798217773438, 0.10832977294921875, 0.11632156372070312, 0.1243133544921875, 0.13230514526367188, 0.14029693603515625, 0.14828872680664062, 0.156280517578125, 0.16427230834960938, 0.17226409912109375, 0.18025588989257812, 0.1882476806640625, 0.19623947143554688, 0.20423126220703125, 0.21222305297851562, 0.22021484375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 9.0, 12.0, 10.0, 16.0, 26.0, 43.0, 72.0, 133.0, 225.0, 441.0, 862.0, 1917.0, 4857.0, 15250.0, 74528.0, 496114.0, 380762.0, 53749.0, 12138.0, 3971.0, 1680.0, 762.0, 397.0, 218.0, 134.0, 93.0, 52.0, 26.0, 20.0, 15.0, 11.0, 8.0, 8.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.10565185546875, -0.10253620147705078, -0.09942054748535156, -0.09630489349365234, -0.09318923950195312, -0.0900735855102539, -0.08695793151855469, -0.08384227752685547, -0.08072662353515625, -0.07761096954345703, -0.07449531555175781, -0.0713796615600586, -0.06826400756835938, -0.06514835357666016, -0.06203269958496094, -0.05891704559326172, -0.0558013916015625, -0.05268573760986328, -0.04957008361816406, -0.046454429626464844, -0.043338775634765625, -0.040223121643066406, -0.03710746765136719, -0.03399181365966797, -0.03087615966796875, -0.02776050567626953, -0.024644851684570312, -0.021529197692871094, -0.018413543701171875, -0.015297889709472656, -0.012182235717773438, -0.009066581726074219, -0.005950927734375, -0.0028352737426757812, 0.0002803802490234375, 0.0033960342407226562, 0.006511688232421875, 0.009627342224121094, 0.012742996215820312, 0.01585865020751953, 0.01897430419921875, 0.02208995819091797, 0.025205612182617188, 0.028321266174316406, 0.031436920166015625, 0.034552574157714844, 0.03766822814941406, 0.04078388214111328, 0.0438995361328125, 0.04701519012451172, 0.05013084411621094, 0.053246498107910156, 0.056362152099609375, 0.059477806091308594, 0.06259346008300781, 0.06570911407470703, 0.06882476806640625, 0.07194042205810547, 0.07505607604980469, 0.0781717300415039, 0.08128738403320312, 0.08440303802490234, 0.08751869201660156, 0.09063434600830078, 0.09375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 7.0, 0.0, 3.0, 4.0, 3.0, 4.0, 3.0, 4.0, 3.0, 12.0, 10.0, 15.0, 18.0, 29.0, 32.0, 28.0, 38.0, 42.0, 42.0, 32.0, 60.0, 53.0, 58.0, 71.0, 58.0, 42.0, 49.0, 40.0, 34.0, 30.0, 27.0, 24.0, 28.0, 19.0, 25.0, 15.0, 13.0, 4.0, 10.0, 6.0, 4.0, 6.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.453125, -0.4381866455078125, -0.423248291015625, -0.4083099365234375, -0.39337158203125, -0.3784332275390625, -0.363494873046875, -0.3485565185546875, -0.3336181640625, -0.3186798095703125, -0.303741455078125, -0.2888031005859375, -0.27386474609375, -0.2589263916015625, -0.243988037109375, -0.2290496826171875, -0.214111328125, -0.1991729736328125, -0.184234619140625, -0.1692962646484375, -0.15435791015625, -0.1394195556640625, -0.124481201171875, -0.1095428466796875, -0.0946044921875, -0.0796661376953125, -0.064727783203125, -0.0497894287109375, -0.03485107421875, -0.0199127197265625, -0.004974365234375, 0.0099639892578125, 0.02490234375, 0.0398406982421875, 0.054779052734375, 0.0697174072265625, 0.08465576171875, 0.0995941162109375, 0.114532470703125, 0.1294708251953125, 0.1444091796875, 0.1593475341796875, 0.174285888671875, 0.1892242431640625, 0.20416259765625, 0.2191009521484375, 0.234039306640625, 0.2489776611328125, 0.263916015625, 0.2788543701171875, 0.293792724609375, 0.3087310791015625, 0.32366943359375, 0.3386077880859375, 0.353546142578125, 0.3684844970703125, 0.3834228515625, 0.3983612060546875, 0.413299560546875, 0.4282379150390625, 0.44317626953125, 0.4581146240234375, 0.473052978515625, 0.4879913330078125, 0.5029296875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 2.0, 3.0, 6.0, 14.0, 15.0, 24.0, 35.0, 48.0, 78.0, 105.0, 172.0, 252.0, 410.0, 748.0, 1427.0, 2772.0, 6212.0, 16022.0, 53096.0, 221021.0, 488824.0, 185438.0, 45874.0, 14584.0, 5701.0, 2522.0, 1355.0, 693.0, 416.0, 250.0, 128.0, 93.0, 66.0, 37.0, 30.0, 28.0, 18.0, 14.0, 8.0, 6.0, 4.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.022613525390625, -0.021956920623779297, -0.021300315856933594, -0.02064371109008789, -0.019987106323242188, -0.019330501556396484, -0.01867389678955078, -0.018017292022705078, -0.017360687255859375, -0.016704082489013672, -0.01604747772216797, -0.015390872955322266, -0.014734268188476562, -0.01407766342163086, -0.013421058654785156, -0.012764453887939453, -0.01210784912109375, -0.011451244354248047, -0.010794639587402344, -0.01013803482055664, -0.009481430053710938, -0.008824825286865234, -0.008168220520019531, -0.007511615753173828, -0.006855010986328125, -0.006198406219482422, -0.005541801452636719, -0.004885196685791016, -0.0042285919189453125, -0.0035719871520996094, -0.0029153823852539062, -0.002258777618408203, -0.0016021728515625, -0.0009455680847167969, -0.00028896331787109375, 0.0003676414489746094, 0.0010242462158203125, 0.0016808509826660156, 0.0023374557495117188, 0.002994060516357422, 0.003650665283203125, 0.004307270050048828, 0.004963874816894531, 0.005620479583740234, 0.0062770843505859375, 0.006933689117431641, 0.007590293884277344, 0.008246898651123047, 0.00890350341796875, 0.009560108184814453, 0.010216712951660156, 0.01087331771850586, 0.011529922485351562, 0.012186527252197266, 0.012843132019042969, 0.013499736785888672, 0.014156341552734375, 0.014812946319580078, 0.015469551086425781, 0.016126155853271484, 0.016782760620117188, 0.01743936538696289, 0.018095970153808594, 0.018752574920654297, 0.0194091796875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 6.0, 4.0, 9.0, 12.0, 14.0, 11.0, 23.0, 26.0, 27.0, 29.0, 37.0, 43.0, 64.0, 55.0, 60.0, 78.0, 67.0, 81.0, 57.0, 56.0, 45.0, 46.0, 23.0, 28.0, 23.0, 14.0, 9.0, 15.0, 4.0, 12.0, 3.0, 3.0, 4.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0788440704345703e-05, -1.0462477803230286e-05, -1.0136514902114868e-05, -9.81055200099945e-06, -9.484589099884033e-06, -9.158626198768616e-06, -8.832663297653198e-06, -8.50670039653778e-06, -8.180737495422363e-06, -7.854774594306946e-06, -7.528811693191528e-06, -7.202848792076111e-06, -6.876885890960693e-06, -6.550922989845276e-06, -6.224960088729858e-06, -5.898997187614441e-06, -5.5730342864990234e-06, -5.247071385383606e-06, -4.9211084842681885e-06, -4.595145583152771e-06, -4.2691826820373535e-06, -3.943219780921936e-06, -3.6172568798065186e-06, -3.291293978691101e-06, -2.9653310775756836e-06, -2.639368176460266e-06, -2.3134052753448486e-06, -1.987442374229431e-06, -1.6614794731140137e-06, -1.3355165719985962e-06, -1.0095536708831787e-06, -6.835907697677612e-07, -3.5762786865234375e-07, -3.166496753692627e-08, 2.942979335784912e-07, 6.202608346939087e-07, 9.462237358093262e-07, 1.2721866369247437e-06, 1.5981495380401611e-06, 1.9241124391555786e-06, 2.250075340270996e-06, 2.5760382413864136e-06, 2.902001142501831e-06, 3.2279640436172485e-06, 3.553926944732666e-06, 3.8798898458480835e-06, 4.205852746963501e-06, 4.5318156480789185e-06, 4.857778549194336e-06, 5.183741450309753e-06, 5.509704351425171e-06, 5.835667252540588e-06, 6.161630153656006e-06, 6.487593054771423e-06, 6.813555955886841e-06, 7.139518857002258e-06, 7.465481758117676e-06, 7.791444659233093e-06, 8.11740756034851e-06, 8.443370461463928e-06, 8.769333362579346e-06, 9.095296263694763e-06, 9.42125916481018e-06, 9.747222065925598e-06, 1.0073184967041016e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 5.0, 1.0, 5.0, 11.0, 13.0, 12.0, 27.0, 32.0, 57.0, 83.0, 126.0, 208.0, 355.0, 588.0, 1178.0, 2445.0, 6165.0, 17354.0, 59239.0, 222912.0, 442147.0, 211720.0, 56557.0, 16501.0, 5819.0, 2368.0, 1145.0, 576.0, 313.0, 219.0, 131.0, 78.0, 59.0, 24.0, 22.0, 13.0, 14.0, 5.0, 4.0, 10.0, 5.0, 7.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0175628662109375, -0.016899585723876953, -0.016236305236816406, -0.01557302474975586, -0.014909744262695312, -0.014246463775634766, -0.013583183288574219, -0.012919902801513672, -0.012256622314453125, -0.011593341827392578, -0.010930061340332031, -0.010266780853271484, -0.009603500366210938, -0.00894021987915039, -0.008276939392089844, -0.007613658905029297, -0.00695037841796875, -0.006287097930908203, -0.005623817443847656, -0.004960536956787109, -0.0042972564697265625, -0.0036339759826660156, -0.0029706954956054688, -0.002307415008544922, -0.001644134521484375, -0.0009808540344238281, -0.00031757354736328125, 0.0003457069396972656, 0.0010089874267578125, 0.0016722679138183594, 0.0023355484008789062, 0.002998828887939453, 0.003662109375, 0.004325389862060547, 0.004988670349121094, 0.005651950836181641, 0.0063152313232421875, 0.006978511810302734, 0.007641792297363281, 0.008305072784423828, 0.008968353271484375, 0.009631633758544922, 0.010294914245605469, 0.010958194732666016, 0.011621475219726562, 0.01228475570678711, 0.012948036193847656, 0.013611316680908203, 0.01427459716796875, 0.014937877655029297, 0.015601158142089844, 0.01626443862915039, 0.016927719116210938, 0.017590999603271484, 0.01825428009033203, 0.018917560577392578, 0.019580841064453125, 0.020244121551513672, 0.02090740203857422, 0.021570682525634766, 0.022233963012695312, 0.02289724349975586, 0.023560523986816406, 0.024223804473876953, 0.0248870849609375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 4.0, 6.0, 4.0, 4.0, 8.0, 8.0, 12.0, 15.0, 19.0, 19.0, 29.0, 31.0, 42.0, 48.0, 49.0, 65.0, 80.0, 70.0, 59.0, 59.0, 51.0, 58.0, 60.0, 34.0, 28.0, 28.0, 28.0, 13.0, 22.0, 5.0, 8.0, 6.0, 4.0, 7.0, 4.0, 3.0, 4.0, 4.0, 3.0, 2.0, 0.0, 3.0], "bins": [-0.007099151611328125, -0.006922602653503418, -0.006746053695678711, -0.006569504737854004, -0.006392955780029297, -0.00621640682220459, -0.006039857864379883, -0.005863308906555176, -0.005686759948730469, -0.005510210990905762, -0.005333662033081055, -0.005157113075256348, -0.004980564117431641, -0.004804015159606934, -0.0046274662017822266, -0.0044509172439575195, -0.0042743682861328125, -0.0040978193283081055, -0.0039212703704833984, -0.0037447214126586914, -0.0035681724548339844, -0.0033916234970092773, -0.0032150745391845703, -0.0030385255813598633, -0.0028619766235351562, -0.0026854276657104492, -0.002508878707885742, -0.002332329750061035, -0.002155780792236328, -0.001979231834411621, -0.001802682876586914, -0.001626133918762207, -0.0014495849609375, -0.001273036003112793, -0.001096487045288086, -0.0009199380874633789, -0.0007433891296386719, -0.0005668401718139648, -0.0003902912139892578, -0.00021374225616455078, -3.719329833984375e-05, 0.00013935565948486328, 0.0003159046173095703, 0.0004924535751342773, 0.0006690025329589844, 0.0008455514907836914, 0.0010221004486083984, 0.0011986494064331055, 0.0013751983642578125, 0.0015517473220825195, 0.0017282962799072266, 0.0019048452377319336, 0.0020813941955566406, 0.0022579431533813477, 0.0024344921112060547, 0.0026110410690307617, 0.0027875900268554688, 0.0029641389846801758, 0.003140687942504883, 0.00331723690032959, 0.003493785858154297, 0.003670334815979004, 0.003846883773803711, 0.004023432731628418, 0.004199981689453125]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 12.0, 27.0, 46.0, 105.0, 211.0, 270.0, 179.0, 91.0, 40.0, 10.0, 6.0, 7.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5026878714561462, -0.4737480580806732, -0.4448082447052002, -0.4158684015274048, -0.38692858815193176, -0.35798877477645874, -0.32904893159866333, -0.3001091182231903, -0.2711693048477173, -0.24222949147224426, -0.21328966319561005, -0.18434983491897583, -0.1554100215435028, -0.12647020816802979, -0.09753037989139557, -0.06859055161476135, -0.03965073823928833, -0.01071091741323471, 0.01822890341281891, 0.04716872423887253, 0.07610854506492615, 0.10504835844039917, 0.1339881867170334, 0.1629280149936676, 0.19186782836914062, 0.22080764174461365, 0.24974747002124786, 0.2786872982978821, 0.3076271116733551, 0.3365669250488281, 0.36550676822662354, 0.39444658160209656, 0.4233863353729248, 0.4523261487483978, 0.48126596212387085, 0.5102058053016663, 0.5391455888748169, 0.5680854320526123, 0.5970252752304077, 0.6259651184082031, 0.6549049019813538, 0.6838447451591492, 0.7127845287322998, 0.7417243719100952, 0.7706642150878906, 0.7996039986610413, 0.8285438418388367, 0.8574836254119873, 0.8864234685897827, 0.9153633117675781, 0.9443030953407288, 0.9732429385185242, 1.0021827220916748, 1.0311225652694702, 1.0600624084472656, 1.089002251625061, 1.1179420948028564, 1.1468819379806519, 1.1758217811584473, 1.2047615051269531, 1.2337013483047485, 1.262641191482544, 1.2915810346603394, 1.3205208778381348, 1.3494606018066406]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 2.0, 5.0, 8.0, 1.0, 16.0, 8.0, 15.0, 15.0, 25.0, 24.0, 42.0, 33.0, 56.0, 42.0, 44.0, 36.0, 54.0, 37.0, 57.0, 62.0, 63.0, 40.0, 55.0, 42.0, 36.0, 34.0, 32.0, 29.0, 28.0, 21.0, 14.0, 9.0, 6.0, 2.0, 5.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.29349470138549805, -0.28555718064308167, -0.2776196599006653, -0.2696821391582489, -0.2617446184158325, -0.25380709767341614, -0.24586959183216095, -0.23793207108974457, -0.22999455034732819, -0.2220570296049118, -0.21411950886249542, -0.20618198812007904, -0.19824448227882385, -0.19030696153640747, -0.1823694407939911, -0.1744319200515747, -0.16649439930915833, -0.15855687856674194, -0.15061935782432556, -0.14268183708190918, -0.1347443163394928, -0.12680679559707642, -0.11886928975582123, -0.11093176901340485, -0.10299424827098846, -0.09505672752857208, -0.0871192067861557, -0.07918169349431992, -0.07124417275190353, -0.06330665200948715, -0.05536913499236107, -0.047431617975234985, -0.039494067430496216, -0.031556546688079834, -0.02361902967095375, -0.015681510791182518, -0.007743991911411285, 0.00019352883100509644, 0.00813104584813118, 0.016068562865257263, 0.024006083607673645, 0.03194360435009003, 0.03988112136721611, 0.047818638384342194, 0.055756159126758575, 0.06369367986917496, 0.07163119316101074, 0.07956871390342712, 0.0875062346458435, 0.09544375538825989, 0.10338127613067627, 0.11131878942251205, 0.11925631016492844, 0.12719383835792542, 0.1351313441991806, 0.14306886494159698, 0.15100638568401337, 0.15894390642642975, 0.16688142716884613, 0.1748189479112625, 0.1827564537525177, 0.19069397449493408, 0.19863149523735046, 0.20656901597976685, 0.21450653672218323]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 5.0, 1.0, 4.0, 1.0, 4.0, 2.0, 5.0, 9.0, 8.0, 12.0, 16.0, 34.0, 46.0, 71.0, 118.0, 219.0, 419.0, 787.0, 1548.0, 3218.0, 7573.0, 19814.0, 61345.0, 723252.0, 172201.0, 35335.0, 12534.0, 5225.0, 2288.0, 1176.0, 535.0, 296.0, 176.0, 103.0, 58.0, 38.0, 14.0, 18.0, 12.0, 8.0, 7.0, 3.0, 10.0, 5.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.305908203125, -0.29596710205078125, -0.2860260009765625, -0.27608489990234375, -0.266143798828125, -0.25620269775390625, -0.2462615966796875, -0.23632049560546875, -0.22637939453125, -0.21643829345703125, -0.2064971923828125, -0.19655609130859375, -0.186614990234375, -0.17667388916015625, -0.1667327880859375, -0.15679168701171875, -0.1468505859375, -0.13690948486328125, -0.1269683837890625, -0.11702728271484375, -0.107086181640625, -0.09714508056640625, -0.0872039794921875, -0.07726287841796875, -0.06732177734375, -0.05738067626953125, -0.0474395751953125, -0.03749847412109375, -0.027557373046875, -0.01761627197265625, -0.0076751708984375, 0.00226593017578125, 0.01220703125, 0.02214813232421875, 0.0320892333984375, 0.04203033447265625, 0.051971435546875, 0.06191253662109375, 0.0718536376953125, 0.08179473876953125, 0.09173583984375, 0.10167694091796875, 0.1116180419921875, 0.12155914306640625, 0.131500244140625, 0.14144134521484375, 0.1513824462890625, 0.16132354736328125, 0.1712646484375, 0.18120574951171875, 0.1911468505859375, 0.20108795166015625, 0.211029052734375, 0.22097015380859375, 0.2309112548828125, 0.24085235595703125, 0.25079345703125, 0.26073455810546875, 0.2706756591796875, 0.28061676025390625, 0.290557861328125, 0.30049896240234375, 0.3104400634765625, 0.32038116455078125, 0.330322265625]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 5.0, 2.0, 11.0, 12.0, 14.0, 24.0, 29.0, 43.0, 41.0, 64.0, 59.0, 52.0, 72.0, 61.0, 113.0, 63.0, 60.0, 64.0, 52.0, 41.0, 39.0, 31.0, 21.0, 16.0, 7.0, 5.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6875, -0.6651153564453125, -0.642730712890625, -0.6203460693359375, -0.59796142578125, -0.5755767822265625, -0.553192138671875, -0.5308074951171875, -0.5084228515625, -0.4860382080078125, -0.463653564453125, -0.4412689208984375, -0.41888427734375, -0.3964996337890625, -0.374114990234375, -0.3517303466796875, -0.329345703125, -0.3069610595703125, -0.284576416015625, -0.2621917724609375, -0.23980712890625, -0.2174224853515625, -0.195037841796875, -0.1726531982421875, -0.1502685546875, -0.1278839111328125, -0.105499267578125, -0.0831146240234375, -0.06072998046875, -0.0383453369140625, -0.015960693359375, 0.0064239501953125, 0.02880859375, 0.0511932373046875, 0.073577880859375, 0.0959625244140625, 0.11834716796875, 0.1407318115234375, 0.163116455078125, 0.1855010986328125, 0.2078857421875, 0.2302703857421875, 0.252655029296875, 0.2750396728515625, 0.29742431640625, 0.3198089599609375, 0.342193603515625, 0.3645782470703125, 0.386962890625, 0.4093475341796875, 0.431732177734375, 0.4541168212890625, 0.47650146484375, 0.4988861083984375, 0.521270751953125, 0.5436553955078125, 0.5660400390625, 0.5884246826171875, 0.610809326171875, 0.6331939697265625, 0.65557861328125, 0.6779632568359375, 0.700347900390625, 0.7227325439453125, 0.7451171875]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 2.0, 2.0, 8.0, 16.0, 6.0, 15.0, 21.0, 21.0, 18.0, 27.0, 53.0, 47.0, 79.0, 94.0, 153.0, 418.0, 2624.0, 40775.0, 963344.0, 37367.0, 2453.0, 460.0, 137.0, 90.0, 83.0, 53.0, 41.0, 40.0, 28.0, 22.0, 9.0, 6.0, 12.0, 6.0, 11.0, 3.0, 4.0, 0.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.78125, -0.7556228637695312, -0.7299957275390625, -0.7043685913085938, -0.678741455078125, -0.6531143188476562, -0.6274871826171875, -0.6018600463867188, -0.57623291015625, -0.5506057739257812, -0.5249786376953125, -0.49935150146484375, -0.473724365234375, -0.44809722900390625, -0.4224700927734375, -0.39684295654296875, -0.3712158203125, -0.34558868408203125, -0.3199615478515625, -0.29433441162109375, -0.268707275390625, -0.24308013916015625, -0.2174530029296875, -0.19182586669921875, -0.16619873046875, -0.14057159423828125, -0.1149444580078125, -0.08931732177734375, -0.063690185546875, -0.03806304931640625, -0.0124359130859375, 0.01319122314453125, 0.038818359375, 0.06444549560546875, 0.0900726318359375, 0.11569976806640625, 0.141326904296875, 0.16695404052734375, 0.1925811767578125, 0.21820831298828125, 0.24383544921875, 0.26946258544921875, 0.2950897216796875, 0.32071685791015625, 0.346343994140625, 0.37197113037109375, 0.3975982666015625, 0.42322540283203125, 0.4488525390625, 0.47447967529296875, 0.5001068115234375, 0.5257339477539062, 0.551361083984375, 0.5769882202148438, 0.6026153564453125, 0.6282424926757812, 0.65386962890625, 0.6794967651367188, 0.7051239013671875, 0.7307510375976562, 0.756378173828125, 0.7820053100585938, 0.8076324462890625, 0.8332595825195312, 0.85888671875]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 1.0, 4.0, 3.0, 8.0, 7.0, 9.0, 16.0, 11.0, 20.0, 25.0, 28.0, 33.0, 26.0, 50.0, 45.0, 41.0, 59.0, 44.0, 36.0, 59.0, 59.0, 64.0, 53.0, 38.0, 40.0, 34.0, 29.0, 29.0, 24.0, 25.0, 19.0, 13.0, 16.0, 6.0, 8.0, 4.0, 4.0, 5.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.6376953125, -0.618560791015625, -0.59942626953125, -0.580291748046875, -0.5611572265625, -0.542022705078125, -0.52288818359375, -0.503753662109375, -0.484619140625, -0.465484619140625, -0.44635009765625, -0.427215576171875, -0.4080810546875, -0.388946533203125, -0.36981201171875, -0.350677490234375, -0.33154296875, -0.312408447265625, -0.29327392578125, -0.274139404296875, -0.2550048828125, -0.235870361328125, -0.21673583984375, -0.197601318359375, -0.178466796875, -0.159332275390625, -0.14019775390625, -0.121063232421875, -0.1019287109375, -0.082794189453125, -0.06365966796875, -0.044525146484375, -0.025390625, -0.006256103515625, 0.01287841796875, 0.032012939453125, 0.0511474609375, 0.070281982421875, 0.08941650390625, 0.108551025390625, 0.127685546875, 0.146820068359375, 0.16595458984375, 0.185089111328125, 0.2042236328125, 0.223358154296875, 0.24249267578125, 0.261627197265625, 0.28076171875, 0.299896240234375, 0.31903076171875, 0.338165283203125, 0.3572998046875, 0.376434326171875, 0.39556884765625, 0.414703369140625, 0.433837890625, 0.452972412109375, 0.47210693359375, 0.491241455078125, 0.5103759765625, 0.529510498046875, 0.54864501953125, 0.567779541015625, 0.5869140625]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 4.0, 7.0, 3.0, 11.0, 20.0, 14.0, 17.0, 26.0, 49.0, 90.0, 178.0, 325.0, 776.0, 2071.0, 7648.0, 83154.0, 915758.0, 31207.0, 4498.0, 1379.0, 650.0, 293.0, 142.0, 86.0, 50.0, 41.0, 15.0, 12.0, 14.0, 4.0, 4.0, 5.0, 7.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.355224609375, -0.3470268249511719, -0.33882904052734375, -0.3306312561035156, -0.3224334716796875, -0.3142356872558594, -0.30603790283203125, -0.2978401184082031, -0.289642333984375, -0.2814445495605469, -0.27324676513671875, -0.2650489807128906, -0.2568511962890625, -0.24865341186523438, -0.24045562744140625, -0.23225784301757812, -0.22406005859375, -0.21586227416992188, -0.20766448974609375, -0.19946670532226562, -0.1912689208984375, -0.18307113647460938, -0.17487335205078125, -0.16667556762695312, -0.158477783203125, -0.15027999877929688, -0.14208221435546875, -0.13388442993164062, -0.1256866455078125, -0.11748886108398438, -0.10929107666015625, -0.10109329223632812, -0.0928955078125, -0.08469772338867188, -0.07649993896484375, -0.06830215454101562, -0.0601043701171875, -0.051906585693359375, -0.04370880126953125, -0.035511016845703125, -0.027313232421875, -0.019115447998046875, -0.01091766357421875, -0.002719879150390625, 0.0054779052734375, 0.013675689697265625, 0.02187347412109375, 0.030071258544921875, 0.03826904296875, 0.046466827392578125, 0.05466461181640625, 0.06286239624023438, 0.0710601806640625, 0.07925796508789062, 0.08745574951171875, 0.09565353393554688, 0.103851318359375, 0.11204910278320312, 0.12024688720703125, 0.12844467163085938, 0.1366424560546875, 0.14484024047851562, 0.15303802490234375, 0.16123580932617188, 0.16943359375]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 13.0, 14.0, 20.0, 35.0, 48.0, 148.0, 517.0, 81.0, 48.0, 32.0, 16.0, 12.0, 8.0, 4.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.860494613647461e-05, -6.705615669488907e-05, -6.550736725330353e-05, -6.395857781171799e-05, -6.240978837013245e-05, -6.0860998928546906e-05, -5.9312209486961365e-05, -5.7763420045375824e-05, -5.621463060379028e-05, -5.466584116220474e-05, -5.31170517206192e-05, -5.156826227903366e-05, -5.001947283744812e-05, -4.847068339586258e-05, -4.692189395427704e-05, -4.53731045126915e-05, -4.382431507110596e-05, -4.2275525629520416e-05, -4.0726736187934875e-05, -3.9177946746349335e-05, -3.7629157304763794e-05, -3.608036786317825e-05, -3.453157842159271e-05, -3.298278898000717e-05, -3.143399953842163e-05, -2.988521009683609e-05, -2.833642065525055e-05, -2.678763121366501e-05, -2.5238841772079468e-05, -2.3690052330493927e-05, -2.2141262888908386e-05, -2.0592473447322845e-05, -1.9043684005737305e-05, -1.7494894564151764e-05, -1.5946105122566223e-05, -1.4397315680980682e-05, -1.2848526239395142e-05, -1.12997367978096e-05, -9.75094735622406e-06, -8.20215791463852e-06, -6.6533684730529785e-06, -5.104579031467438e-06, -3.555789589881897e-06, -2.007000148296356e-06, -4.5821070671081543e-07, 1.0905787348747253e-06, 2.639368176460266e-06, 4.188157618045807e-06, 5.736947059631348e-06, 7.2857365012168884e-06, 8.83452594280243e-06, 1.038331538438797e-05, 1.193210482597351e-05, 1.3480894267559052e-05, 1.5029683709144592e-05, 1.6578473150730133e-05, 1.8127262592315674e-05, 1.9676052033901215e-05, 2.1224841475486755e-05, 2.2773630917072296e-05, 2.4322420358657837e-05, 2.5871209800243378e-05, 2.741999924182892e-05, 2.896878868341446e-05, 3.0517578125e-05]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 10.0, 11.0, 18.0, 32.0, 93.0, 163.0, 265.0, 519.0, 1166.0, 4470.0, 90519.0, 932297.0, 15328.0, 2086.0, 763.0, 373.0, 201.0, 100.0, 57.0, 33.0, 20.0, 8.0, 4.0, 3.0, 7.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.322265625, -0.3104400634765625, -0.298614501953125, -0.2867889404296875, -0.27496337890625, -0.2631378173828125, -0.251312255859375, -0.2394866943359375, -0.2276611328125, -0.2158355712890625, -0.204010009765625, -0.1921844482421875, -0.18035888671875, -0.1685333251953125, -0.156707763671875, -0.1448822021484375, -0.133056640625, -0.1212310791015625, -0.109405517578125, -0.0975799560546875, -0.08575439453125, -0.0739288330078125, -0.062103271484375, -0.0502777099609375, -0.0384521484375, -0.0266265869140625, -0.014801025390625, -0.0029754638671875, 0.00885009765625, 0.0206756591796875, 0.032501220703125, 0.0443267822265625, 0.05615234375, 0.0679779052734375, 0.079803466796875, 0.0916290283203125, 0.10345458984375, 0.1152801513671875, 0.127105712890625, 0.1389312744140625, 0.1507568359375, 0.1625823974609375, 0.174407958984375, 0.1862335205078125, 0.19805908203125, 0.2098846435546875, 0.221710205078125, 0.2335357666015625, 0.245361328125, 0.2571868896484375, 0.269012451171875, 0.2808380126953125, 0.29266357421875, 0.3044891357421875, 0.316314697265625, 0.3281402587890625, 0.3399658203125, 0.3517913818359375, 0.363616943359375, 0.3754425048828125, 0.38726806640625, 0.3990936279296875, 0.410919189453125, 0.4227447509765625, 0.4345703125]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 9.0, 10.0, 16.0, 30.0, 52.0, 69.0, 361.0, 289.0, 65.0, 39.0, 24.0, 18.0, 14.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.15087890625, -0.14690303802490234, -0.1429271697998047, -0.13895130157470703, -0.13497543334960938, -0.13099956512451172, -0.12702369689941406, -0.1230478286743164, -0.11907196044921875, -0.1150960922241211, -0.11112022399902344, -0.10714435577392578, -0.10316848754882812, -0.09919261932373047, -0.09521675109863281, -0.09124088287353516, -0.0872650146484375, -0.08328914642333984, -0.07931327819824219, -0.07533740997314453, -0.07136154174804688, -0.06738567352294922, -0.06340980529785156, -0.059433937072753906, -0.05545806884765625, -0.051482200622558594, -0.04750633239746094, -0.04353046417236328, -0.039554595947265625, -0.03557872772216797, -0.03160285949707031, -0.027626991271972656, -0.023651123046875, -0.019675254821777344, -0.015699386596679688, -0.011723518371582031, -0.007747650146484375, -0.0037717819213867188, 0.0002040863037109375, 0.004179954528808594, 0.00815582275390625, 0.012131690979003906, 0.016107559204101562, 0.02008342742919922, 0.024059295654296875, 0.02803516387939453, 0.03201103210449219, 0.035986900329589844, 0.0399627685546875, 0.043938636779785156, 0.04791450500488281, 0.05189037322998047, 0.055866241455078125, 0.05984210968017578, 0.06381797790527344, 0.0677938461303711, 0.07176971435546875, 0.0757455825805664, 0.07972145080566406, 0.08369731903076172, 0.08767318725585938, 0.09164905548095703, 0.09562492370605469, 0.09960079193115234, 0.10357666015625]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 9.0, 23.0, 65.0, 188.0, 355.0, 262.0, 77.0, 23.0, 5.0, 6.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4813905656337738, -0.3963336944580078, -0.31127679347991943, -0.22621992230415344, -0.14116302132606506, -0.056106120347976685, 0.02895072102546692, 0.1140076220035553, 0.19906452298164368, 0.28412139415740967, 0.36917829513549805, 0.45423516631126404, 0.5392920970916748, 0.6243489980697632, 0.709405779838562, 0.7944626808166504, 0.8795195817947388, 0.9645764827728271, 1.0496333837509155, 1.134690284729004, 1.2197470664978027, 1.3048040866851807, 1.3898608684539795, 1.4749177694320679, 1.5599746704101562, 1.6450315713882446, 1.730088472366333, 1.8151452541351318, 1.9002022743225098, 1.9852590560913086, 2.0703158378601074, 2.1553728580474854, 2.2404298782348633, 2.325486660003662, 2.41054368019104, 2.495600461959839, 2.580657482147217, 2.6657142639160156, 2.7507710456848145, 2.8358280658721924, 2.9208850860595703, 3.005941867828369, 3.090998888015747, 3.176055669784546, 3.261112689971924, 3.3461694717407227, 3.4312262535095215, 3.5162832736968994, 3.6013400554656982, 3.686396837234497, 3.771453857421875, 3.856510639190674, 3.9415676593780518, 4.02662467956543, 4.1116814613342285, 4.196738243103027, 4.281795024871826, 4.366851806640625, 4.451908588409424, 4.536965847015381, 4.62202262878418, 4.7070794105529785, 4.792136192321777, 4.877193450927734, 4.962250232696533]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 4.0, 4.0, 8.0, 4.0, 2.0, 12.0, 16.0, 10.0, 10.0, 19.0, 11.0, 25.0, 20.0, 26.0, 23.0, 23.0, 35.0, 38.0, 42.0, 38.0, 47.0, 30.0, 51.0, 36.0, 40.0, 38.0, 45.0, 39.0, 38.0, 30.0, 47.0, 36.0, 26.0, 23.0, 18.0, 11.0, 19.0, 8.0, 14.0, 11.0, 10.0, 8.0, 2.0, 3.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.8738496899604797, -0.8473448157310486, -0.8208399415016174, -0.7943350672721863, -0.7678301930427551, -0.741325318813324, -0.7148204445838928, -0.6883155703544617, -0.6618106961250305, -0.6353058218955994, -0.6088009476661682, -0.5822960734367371, -0.5557911992073059, -0.5292863249778748, -0.5027814507484436, -0.47627657651901245, -0.4497717320919037, -0.42326685786247253, -0.3967619836330414, -0.37025710940361023, -0.3437522351741791, -0.3172473907470703, -0.29074251651763916, -0.264237642288208, -0.23773275315761566, -0.2112278789281845, -0.18472300469875336, -0.1582181453704834, -0.13171327114105225, -0.1052083969116211, -0.07870352268218994, -0.05219864845275879, -0.025693774223327637, 0.0008110981434583664, 0.02731597051024437, 0.05382084101438522, 0.08032571524381638, 0.10683058202266693, 0.13333545625209808, 0.15984033048152924, 0.1863452047109604, 0.21285007894039154, 0.2393549531698227, 0.26585981249809265, 0.2923646867275238, 0.31886956095695496, 0.3453744351863861, 0.37187930941581726, 0.3983841836452484, 0.42488905787467957, 0.4513939321041107, 0.47789880633354187, 0.5044036507606506, 0.5309085249900818, 0.5574133992195129, 0.5839182734489441, 0.6104231476783752, 0.6369280219078064, 0.6634328961372375, 0.6899377703666687, 0.7164426445960999, 0.742947518825531, 0.7694523930549622, 0.7959572672843933, 0.8224621415138245]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 7.0, 10.0, 17.0, 23.0, 23.0, 30.0, 50.0, 56.0, 146.0, 251.0, 452.0, 1401.0, 4552.0, 21710.0, 419023.0, 3617665.0, 112161.0, 12039.0, 2807.0, 978.0, 386.0, 178.0, 97.0, 71.0, 51.0, 24.0, 21.0, 18.0, 6.0, 6.0, 3.0, 5.0, 6.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.732421875, -0.7046051025390625, -0.676788330078125, -0.6489715576171875, -0.62115478515625, -0.5933380126953125, -0.565521240234375, -0.5377044677734375, -0.5098876953125, -0.4820709228515625, -0.454254150390625, -0.4264373779296875, -0.39862060546875, -0.3708038330078125, -0.342987060546875, -0.3151702880859375, -0.287353515625, -0.2595367431640625, -0.231719970703125, -0.2039031982421875, -0.17608642578125, -0.1482696533203125, -0.120452880859375, -0.0926361083984375, -0.0648193359375, -0.0370025634765625, -0.009185791015625, 0.0186309814453125, 0.04644775390625, 0.0742645263671875, 0.102081298828125, 0.1298980712890625, 0.15771484375, 0.1855316162109375, 0.213348388671875, 0.2411651611328125, 0.26898193359375, 0.2967987060546875, 0.324615478515625, 0.3524322509765625, 0.3802490234375, 0.4080657958984375, 0.435882568359375, 0.4636993408203125, 0.49151611328125, 0.5193328857421875, 0.547149658203125, 0.5749664306640625, 0.602783203125, 0.6305999755859375, 0.658416748046875, 0.6862335205078125, 0.71405029296875, 0.7418670654296875, 0.769683837890625, 0.7975006103515625, 0.8253173828125, 0.8531341552734375, 0.880950927734375, 0.9087677001953125, 0.93658447265625, 0.9644012451171875, 0.992218017578125, 1.0200347900390625, 1.0478515625]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 9.0, 5.0, 7.0, 7.0, 21.0, 15.0, 12.0, 21.0, 19.0, 36.0, 25.0, 44.0, 39.0, 47.0, 48.0, 40.0, 51.0, 60.0, 59.0, 57.0, 51.0, 50.0, 36.0, 37.0, 41.0, 33.0, 29.0, 23.0, 9.0, 20.0, 12.0, 11.0, 9.0, 5.0, 1.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.3046875, -0.2958564758300781, -0.28702545166015625, -0.2781944274902344, -0.2693634033203125, -0.2605323791503906, -0.25170135498046875, -0.24287033081054688, -0.234039306640625, -0.22520828247070312, -0.21637725830078125, -0.20754623413085938, -0.1987152099609375, -0.18988418579101562, -0.18105316162109375, -0.17222213745117188, -0.16339111328125, -0.15456008911132812, -0.14572906494140625, -0.13689804077148438, -0.1280670166015625, -0.11923599243164062, -0.11040496826171875, -0.10157394409179688, -0.092742919921875, -0.08391189575195312, -0.07508087158203125, -0.06624984741210938, -0.0574188232421875, -0.048587799072265625, -0.03975677490234375, -0.030925750732421875, -0.0220947265625, -0.013263702392578125, -0.00443267822265625, 0.004398345947265625, 0.0132293701171875, 0.022060394287109375, 0.03089141845703125, 0.039722442626953125, 0.048553466796875, 0.057384490966796875, 0.06621551513671875, 0.07504653930664062, 0.0838775634765625, 0.09270858764648438, 0.10153961181640625, 0.11037063598632812, 0.11920166015625, 0.12803268432617188, 0.13686370849609375, 0.14569473266601562, 0.1545257568359375, 0.16335678100585938, 0.17218780517578125, 0.18101882934570312, 0.189849853515625, 0.19868087768554688, 0.20751190185546875, 0.21634292602539062, 0.2251739501953125, 0.23400497436523438, 0.24283599853515625, 0.2516670227050781, 0.260498046875]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 2.0, 6.0, 11.0, 23.0, 31.0, 50.0, 133.0, 313.0, 871.0, 3555.0, 42983.0, 3934223.0, 202189.0, 7672.0, 1428.0, 445.0, 167.0, 76.0, 51.0, 15.0, 16.0, 8.0, 3.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2099609375, -1.1705322265625, -1.131103515625, -1.0916748046875, -1.05224609375, -1.0128173828125, -0.973388671875, -0.9339599609375, -0.89453125, -0.8551025390625, -0.815673828125, -0.7762451171875, -0.73681640625, -0.6973876953125, -0.657958984375, -0.6185302734375, -0.5791015625, -0.5396728515625, -0.500244140625, -0.4608154296875, -0.42138671875, -0.3819580078125, -0.342529296875, -0.3031005859375, -0.263671875, -0.2242431640625, -0.184814453125, -0.1453857421875, -0.10595703125, -0.0665283203125, -0.027099609375, 0.0123291015625, 0.0517578125, 0.0911865234375, 0.130615234375, 0.1700439453125, 0.20947265625, 0.2489013671875, 0.288330078125, 0.3277587890625, 0.3671875, 0.4066162109375, 0.446044921875, 0.4854736328125, 0.52490234375, 0.5643310546875, 0.603759765625, 0.6431884765625, 0.6826171875, 0.7220458984375, 0.761474609375, 0.8009033203125, 0.84033203125, 0.8797607421875, 0.919189453125, 0.9586181640625, 0.998046875, 1.0374755859375, 1.076904296875, 1.1163330078125, 1.15576171875, 1.1951904296875, 1.234619140625, 1.2740478515625, 1.3134765625]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 6.0, 6.0, 12.0, 14.0, 41.0, 53.0, 94.0, 173.0, 363.0, 841.0, 1210.0, 676.0, 274.0, 139.0, 63.0, 45.0, 26.0, 14.0, 11.0, 5.0, 6.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.334228515625, -0.32614707946777344, -0.3180656433105469, -0.3099842071533203, -0.30190277099609375, -0.2938213348388672, -0.2857398986816406, -0.27765846252441406, -0.2695770263671875, -0.26149559020996094, -0.2534141540527344, -0.2453327178955078, -0.23725128173828125, -0.2291698455810547, -0.22108840942382812, -0.21300697326660156, -0.204925537109375, -0.19684410095214844, -0.18876266479492188, -0.1806812286376953, -0.17259979248046875, -0.1645183563232422, -0.15643692016601562, -0.14835548400878906, -0.1402740478515625, -0.13219261169433594, -0.12411117553710938, -0.11602973937988281, -0.10794830322265625, -0.09986686706542969, -0.09178543090820312, -0.08370399475097656, -0.07562255859375, -0.06754112243652344, -0.059459686279296875, -0.05137825012207031, -0.04329681396484375, -0.03521537780761719, -0.027133941650390625, -0.019052505493164062, -0.0109710693359375, -0.0028896331787109375, 0.005191802978515625, 0.013273239135742188, 0.02135467529296875, 0.029436111450195312, 0.037517547607421875, 0.04559898376464844, 0.053680419921875, 0.06176185607910156, 0.06984329223632812, 0.07792472839355469, 0.08600616455078125, 0.09408760070800781, 0.10216903686523438, 0.11025047302246094, 0.1183319091796875, 0.12641334533691406, 0.13449478149414062, 0.1425762176513672, 0.15065765380859375, 0.1587390899658203, 0.16682052612304688, 0.17490196228027344, 0.1829833984375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 7.0, 7.0, 20.0, 16.0, 39.0, 43.0, 74.0, 80.0, 100.0, 121.0, 128.0, 107.0, 96.0, 54.0, 38.0, 30.0, 11.0, 16.0, 11.0, 5.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.7881006598472595, -0.7657932639122009, -0.7434858679771423, -0.7211785316467285, -0.6988711357116699, -0.6765637397766113, -0.6542563438415527, -0.6319489479064941, -0.6096415519714355, -0.587334156036377, -0.5650267601013184, -0.5427193641662598, -0.520412027835846, -0.49810463190078735, -0.47579723596572876, -0.45348984003067017, -0.43118247389793396, -0.40887507796287537, -0.38656771183013916, -0.36426031589508057, -0.341952919960022, -0.3196455240249634, -0.2973381578922272, -0.2750307619571686, -0.2527233958244324, -0.23041601479053497, -0.20810861885547638, -0.18580123782157898, -0.16349384188652039, -0.14118646085262299, -0.11887907981872559, -0.09657168388366699, -0.0742642879486084, -0.0519568994641304, -0.029649514704942703, -0.007342129945755005, 0.014965258538722992, 0.03727264702320099, 0.05958002805709839, 0.08188742399215698, 0.10419480502605438, 0.12650218605995178, 0.14880958199501038, 0.17111696302890778, 0.19342434406280518, 0.21573173999786377, 0.23803912103176117, 0.26034653186798096, 0.28265389800071716, 0.30496129393577576, 0.32726866006851196, 0.34957605600357056, 0.37188345193862915, 0.39419084787368774, 0.41649821400642395, 0.43880560994148254, 0.46111297607421875, 0.48342037200927734, 0.5057277679443359, 0.5280351638793945, 0.5503425002098083, 0.5726498961448669, 0.5949572920799255, 0.6172646880149841, 0.6395720839500427]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 6.0, 7.0, 8.0, 12.0, 9.0, 13.0, 16.0, 15.0, 14.0, 20.0, 17.0, 20.0, 27.0, 32.0, 46.0, 27.0, 31.0, 48.0, 39.0, 57.0, 47.0, 38.0, 39.0, 44.0, 43.0, 26.0, 33.0, 29.0, 29.0, 31.0, 26.0, 21.0, 22.0, 20.0, 9.0, 19.0, 17.0, 8.0, 9.0, 5.0, 9.0, 7.0, 3.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32736608386039734, -0.3176831007003784, -0.3080001473426819, -0.29831716418266296, -0.28863418102264404, -0.2789512276649475, -0.2692682445049286, -0.25958526134490967, -0.24990229308605194, -0.2402193248271942, -0.2305363416671753, -0.22085337340831757, -0.21117040514945984, -0.20148742198944092, -0.1918044537305832, -0.18212148547172546, -0.17243850231170654, -0.16275553405284882, -0.1530725508928299, -0.14338958263397217, -0.13370659947395325, -0.12402363121509552, -0.11434066295623779, -0.10465768724679947, -0.09497471153736115, -0.08529173582792282, -0.0756087601184845, -0.06592579185962677, -0.056242816150188446, -0.04655984044075012, -0.0368768684566021, -0.02719389647245407, -0.017510920763015747, -0.007827946916222572, 0.0018550269305706024, 0.011538000777363777, 0.021220974624156952, 0.030903950333595276, 0.0405869223177433, 0.05026989430189133, 0.05995287001132965, 0.06963584572076797, 0.0793188214302063, 0.08900178968906403, 0.09868476539850235, 0.10836774110794067, 0.1180507093667984, 0.12773367762565613, 0.13741666078567505, 0.14709962904453278, 0.1567826122045517, 0.16646558046340942, 0.17614856362342834, 0.18583153188228607, 0.1955145001411438, 0.20519748330116272, 0.21488045156002045, 0.22456341981887817, 0.2342464029788971, 0.24392937123775482, 0.25361233949661255, 0.26329532265663147, 0.2729783058166504, 0.2826612591743469, 0.29234424233436584]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 9.0, 5.0, 11.0, 8.0, 18.0, 20.0, 40.0, 63.0, 101.0, 258.0, 455.0, 932.0, 2073.0, 4916.0, 12592.0, 48545.0, 530922.0, 391153.0, 37620.0, 10989.0, 4365.0, 1812.0, 829.0, 369.0, 202.0, 102.0, 49.0, 29.0, 18.0, 17.0, 6.0, 6.0, 6.0, 7.0, 1.0, 5.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1983642578125, -0.19173622131347656, -0.18510818481445312, -0.1784801483154297, -0.17185211181640625, -0.1652240753173828, -0.15859603881835938, -0.15196800231933594, -0.1453399658203125, -0.13871192932128906, -0.13208389282226562, -0.1254558563232422, -0.11882781982421875, -0.11219978332519531, -0.10557174682617188, -0.09894371032714844, -0.092315673828125, -0.08568763732910156, -0.07905960083007812, -0.07243156433105469, -0.06580352783203125, -0.05917549133300781, -0.052547454833984375, -0.04591941833496094, -0.0392913818359375, -0.03266334533691406, -0.026035308837890625, -0.019407272338867188, -0.01277923583984375, -0.0061511993408203125, 0.000476837158203125, 0.0071048736572265625, 0.01373291015625, 0.020360946655273438, 0.026988983154296875, 0.03361701965332031, 0.04024505615234375, 0.04687309265136719, 0.053501129150390625, 0.06012916564941406, 0.0667572021484375, 0.07338523864746094, 0.08001327514648438, 0.08664131164550781, 0.09326934814453125, 0.09989738464355469, 0.10652542114257812, 0.11315345764160156, 0.119781494140625, 0.12640953063964844, 0.13303756713867188, 0.1396656036376953, 0.14629364013671875, 0.1529216766357422, 0.15954971313476562, 0.16617774963378906, 0.1728057861328125, 0.17943382263183594, 0.18606185913085938, 0.1926898956298828, 0.19931793212890625, 0.2059459686279297, 0.21257400512695312, 0.21920204162597656, 0.225830078125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 5.0, 3.0, 4.0, 14.0, 13.0, 17.0, 20.0, 21.0, 25.0, 25.0, 42.0, 42.0, 56.0, 36.0, 66.0, 63.0, 58.0, 55.0, 56.0, 52.0, 44.0, 50.0, 47.0, 35.0, 32.0, 25.0, 24.0, 19.0, 20.0, 8.0, 9.0, 9.0, 7.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.284423828125, -0.2749481201171875, -0.265472412109375, -0.2559967041015625, -0.24652099609375, -0.2370452880859375, -0.227569580078125, -0.2180938720703125, -0.2086181640625, -0.1991424560546875, -0.189666748046875, -0.1801910400390625, -0.17071533203125, -0.1612396240234375, -0.151763916015625, -0.1422882080078125, -0.1328125, -0.1233367919921875, -0.113861083984375, -0.1043853759765625, -0.09490966796875, -0.0854339599609375, -0.075958251953125, -0.0664825439453125, -0.0570068359375, -0.0475311279296875, -0.038055419921875, -0.0285797119140625, -0.01910400390625, -0.0096282958984375, -0.000152587890625, 0.0093231201171875, 0.018798828125, 0.0282745361328125, 0.037750244140625, 0.0472259521484375, 0.05670166015625, 0.0661773681640625, 0.075653076171875, 0.0851287841796875, 0.0946044921875, 0.1040802001953125, 0.113555908203125, 0.1230316162109375, 0.13250732421875, 0.1419830322265625, 0.151458740234375, 0.1609344482421875, 0.17041015625, 0.1798858642578125, 0.189361572265625, 0.1988372802734375, 0.20831298828125, 0.2177886962890625, 0.227264404296875, 0.2367401123046875, 0.2462158203125, 0.2556915283203125, 0.265167236328125, 0.2746429443359375, 0.28411865234375, 0.2935943603515625, 0.303070068359375, 0.3125457763671875, 0.322021484375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 5.0, 7.0, 13.0, 17.0, 18.0, 29.0, 42.0, 40.0, 81.0, 122.0, 138.0, 219.0, 339.0, 578.0, 951.0, 1671.0, 3203.0, 6877.0, 15393.0, 41863.0, 148197.0, 448736.0, 268096.0, 69813.0, 22853.0, 9428.0, 4385.0, 2244.0, 1237.0, 687.0, 418.0, 256.0, 167.0, 123.0, 91.0, 55.0, 35.0, 39.0, 31.0, 21.0, 18.0, 6.0, 6.0, 6.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.0916748046875, -0.08895587921142578, -0.08623695373535156, -0.08351802825927734, -0.08079910278320312, -0.0780801773071289, -0.07536125183105469, -0.07264232635498047, -0.06992340087890625, -0.06720447540283203, -0.06448554992675781, -0.061766624450683594, -0.059047698974609375, -0.056328773498535156, -0.05360984802246094, -0.05089092254638672, -0.0481719970703125, -0.04545307159423828, -0.04273414611816406, -0.040015220642089844, -0.037296295166015625, -0.034577369689941406, -0.03185844421386719, -0.02913951873779297, -0.02642059326171875, -0.02370166778564453, -0.020982742309570312, -0.018263816833496094, -0.015544891357421875, -0.012825965881347656, -0.010107040405273438, -0.007388114929199219, -0.004669189453125, -0.0019502639770507812, 0.0007686614990234375, 0.0034875869750976562, 0.006206512451171875, 0.008925437927246094, 0.011644363403320312, 0.014363288879394531, 0.01708221435546875, 0.01980113983154297, 0.022520065307617188, 0.025238990783691406, 0.027957916259765625, 0.030676841735839844, 0.03339576721191406, 0.03611469268798828, 0.0388336181640625, 0.04155254364013672, 0.04427146911621094, 0.046990394592285156, 0.049709320068359375, 0.052428245544433594, 0.05514717102050781, 0.05786609649658203, 0.06058502197265625, 0.06330394744873047, 0.06602287292480469, 0.0687417984008789, 0.07146072387695312, 0.07417964935302734, 0.07689857482910156, 0.07961750030517578, 0.08233642578125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 3.0, 11.0, 4.0, 6.0, 16.0, 14.0, 18.0, 11.0, 14.0, 17.0, 18.0, 26.0, 32.0, 24.0, 40.0, 35.0, 57.0, 48.0, 56.0, 50.0, 41.0, 45.0, 56.0, 35.0, 44.0, 39.0, 41.0, 34.0, 43.0, 21.0, 18.0, 10.0, 12.0, 13.0, 10.0, 10.0, 9.0, 2.0, 5.0, 7.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.50634765625, -0.49017333984375, -0.4739990234375, -0.45782470703125, -0.441650390625, -0.42547607421875, -0.4093017578125, -0.39312744140625, -0.376953125, -0.36077880859375, -0.3446044921875, -0.32843017578125, -0.312255859375, -0.29608154296875, -0.2799072265625, -0.26373291015625, -0.24755859375, -0.23138427734375, -0.2152099609375, -0.19903564453125, -0.182861328125, -0.16668701171875, -0.1505126953125, -0.13433837890625, -0.1181640625, -0.10198974609375, -0.0858154296875, -0.06964111328125, -0.053466796875, -0.03729248046875, -0.0211181640625, -0.00494384765625, 0.01123046875, 0.02740478515625, 0.0435791015625, 0.05975341796875, 0.075927734375, 0.09210205078125, 0.1082763671875, 0.12445068359375, 0.140625, 0.15679931640625, 0.1729736328125, 0.18914794921875, 0.205322265625, 0.22149658203125, 0.2376708984375, 0.25384521484375, 0.27001953125, 0.28619384765625, 0.3023681640625, 0.31854248046875, 0.334716796875, 0.35089111328125, 0.3670654296875, 0.38323974609375, 0.3994140625, 0.41558837890625, 0.4317626953125, 0.44793701171875, 0.464111328125, 0.48028564453125, 0.4964599609375, 0.51263427734375, 0.52880859375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 7.0, 10.0, 7.0, 19.0, 17.0, 37.0, 54.0, 93.0, 150.0, 320.0, 611.0, 1228.0, 3025.0, 9222.0, 44813.0, 379836.0, 523678.0, 66679.0, 12088.0, 3629.0, 1476.0, 699.0, 361.0, 191.0, 109.0, 59.0, 47.0, 26.0, 22.0, 14.0, 8.0, 2.0, 4.0, 3.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.041656494140625, -0.04046964645385742, -0.039282798767089844, -0.038095951080322266, -0.03690910339355469, -0.03572225570678711, -0.03453540802001953, -0.03334856033325195, -0.032161712646484375, -0.030974864959716797, -0.02978801727294922, -0.02860116958618164, -0.027414321899414062, -0.026227474212646484, -0.025040626525878906, -0.023853778839111328, -0.02266693115234375, -0.021480083465576172, -0.020293235778808594, -0.019106388092041016, -0.017919540405273438, -0.01673269271850586, -0.015545845031738281, -0.014358997344970703, -0.013172149658203125, -0.011985301971435547, -0.010798454284667969, -0.00961160659790039, -0.008424758911132812, -0.007237911224365234, -0.006051063537597656, -0.004864215850830078, -0.0036773681640625, -0.002490520477294922, -0.0013036727905273438, -0.00011682510375976562, 0.0010700225830078125, 0.0022568702697753906, 0.0034437179565429688, 0.004630565643310547, 0.005817413330078125, 0.007004261016845703, 0.008191108703613281, 0.00937795639038086, 0.010564804077148438, 0.011751651763916016, 0.012938499450683594, 0.014125347137451172, 0.01531219482421875, 0.016499042510986328, 0.017685890197753906, 0.018872737884521484, 0.020059585571289062, 0.02124643325805664, 0.02243328094482422, 0.023620128631591797, 0.024806976318359375, 0.025993824005126953, 0.02718067169189453, 0.02836751937866211, 0.029554367065429688, 0.030741214752197266, 0.031928062438964844, 0.03311491012573242, 0.0343017578125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 7.0, 15.0, 8.0, 16.0, 34.0, 56.0, 87.0, 124.0, 138.0, 140.0, 133.0, 93.0, 52.0, 35.0, 24.0, 13.0, 6.0, 8.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.384185791015625e-05, -2.299528568983078e-05, -2.214871346950531e-05, -2.130214124917984e-05, -2.045556902885437e-05, -1.96089968085289e-05, -1.876242458820343e-05, -1.791585236787796e-05, -1.706928014755249e-05, -1.622270792722702e-05, -1.537613570690155e-05, -1.452956348657608e-05, -1.368299126625061e-05, -1.283641904592514e-05, -1.198984682559967e-05, -1.11432746052742e-05, -1.029670238494873e-05, -9.45013016462326e-06, -8.60355794429779e-06, -7.75698572397232e-06, -6.910413503646851e-06, -6.063841283321381e-06, -5.217269062995911e-06, -4.370696842670441e-06, -3.5241246223449707e-06, -2.6775524020195007e-06, -1.8309801816940308e-06, -9.844079613685608e-07, -1.3783574104309082e-07, 7.087364792823792e-07, 1.5553086996078491e-06, 2.401880919933319e-06, 3.248453140258789e-06, 4.095025360584259e-06, 4.941597580909729e-06, 5.788169801235199e-06, 6.634742021560669e-06, 7.481314241886139e-06, 8.327886462211609e-06, 9.174458682537079e-06, 1.0021030902862549e-05, 1.0867603123188019e-05, 1.1714175343513489e-05, 1.2560747563838959e-05, 1.3407319784164429e-05, 1.4253892004489899e-05, 1.5100464224815369e-05, 1.594703644514084e-05, 1.679360866546631e-05, 1.764018088579178e-05, 1.848675310611725e-05, 1.933332532644272e-05, 2.017989754676819e-05, 2.102646976709366e-05, 2.187304198741913e-05, 2.27196142077446e-05, 2.356618642807007e-05, 2.441275864839554e-05, 2.5259330868721008e-05, 2.6105903089046478e-05, 2.6952475309371948e-05, 2.7799047529697418e-05, 2.8645619750022888e-05, 2.9492191970348358e-05, 3.0338764190673828e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 4.0, 11.0, 13.0, 18.0, 22.0, 26.0, 44.0, 67.0, 146.0, 238.0, 431.0, 813.0, 1470.0, 3254.0, 8793.0, 33870.0, 169471.0, 545038.0, 223441.0, 43398.0, 10623.0, 3728.0, 1623.0, 815.0, 497.0, 280.0, 150.0, 94.0, 64.0, 36.0, 30.0, 17.0, 11.0, 8.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0], "bins": [-0.03485107421875, -0.033843278884887695, -0.03283548355102539, -0.031827688217163086, -0.03081989288330078, -0.029812097549438477, -0.028804302215576172, -0.027796506881713867, -0.026788711547851562, -0.025780916213989258, -0.024773120880126953, -0.02376532554626465, -0.022757530212402344, -0.02174973487854004, -0.020741939544677734, -0.01973414421081543, -0.018726348876953125, -0.01771855354309082, -0.016710758209228516, -0.01570296287536621, -0.014695167541503906, -0.013687372207641602, -0.012679576873779297, -0.011671781539916992, -0.010663986206054688, -0.009656190872192383, -0.008648395538330078, -0.0076406002044677734, -0.006632804870605469, -0.005625009536743164, -0.004617214202880859, -0.0036094188690185547, -0.00260162353515625, -0.0015938282012939453, -0.0005860328674316406, 0.00042176246643066406, 0.0014295578002929688, 0.0024373531341552734, 0.003445148468017578, 0.004452943801879883, 0.0054607391357421875, 0.006468534469604492, 0.007476329803466797, 0.008484125137329102, 0.009491920471191406, 0.010499715805053711, 0.011507511138916016, 0.01251530647277832, 0.013523101806640625, 0.01453089714050293, 0.015538692474365234, 0.01654648780822754, 0.017554283142089844, 0.01856207847595215, 0.019569873809814453, 0.020577669143676758, 0.021585464477539062, 0.022593259811401367, 0.023601055145263672, 0.024608850479125977, 0.02561664581298828, 0.026624441146850586, 0.02763223648071289, 0.028640031814575195, 0.0296478271484375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 12.0, 5.0, 8.0, 9.0, 11.0, 15.0, 19.0, 20.0, 35.0, 39.0, 56.0, 60.0, 100.0, 91.0, 76.0, 62.0, 72.0, 64.0, 60.0, 38.0, 34.0, 26.0, 25.0, 12.0, 13.0, 7.0, 9.0, 2.0, 4.0, 4.0, 5.0, 2.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0], "bins": [-0.01062774658203125, -0.01036381721496582, -0.01009988784790039, -0.009835958480834961, -0.009572029113769531, -0.009308099746704102, -0.009044170379638672, -0.008780241012573242, -0.008516311645507812, -0.008252382278442383, -0.007988452911376953, -0.0077245235443115234, -0.007460594177246094, -0.007196664810180664, -0.006932735443115234, -0.006668806076049805, -0.006404876708984375, -0.006140947341918945, -0.005877017974853516, -0.005613088607788086, -0.005349159240722656, -0.0050852298736572266, -0.004821300506591797, -0.004557371139526367, -0.0042934417724609375, -0.004029512405395508, -0.003765583038330078, -0.0035016536712646484, -0.0032377243041992188, -0.002973794937133789, -0.0027098655700683594, -0.0024459362030029297, -0.0021820068359375, -0.0019180774688720703, -0.0016541481018066406, -0.001390218734741211, -0.0011262893676757812, -0.0008623600006103516, -0.0005984306335449219, -0.0003345012664794922, -7.05718994140625e-05, 0.0001933574676513672, 0.0004572868347167969, 0.0007212162017822266, 0.0009851455688476562, 0.001249074935913086, 0.0015130043029785156, 0.0017769336700439453, 0.002040863037109375, 0.0023047924041748047, 0.0025687217712402344, 0.002832651138305664, 0.0030965805053710938, 0.0033605098724365234, 0.003624439239501953, 0.003888368606567383, 0.0041522979736328125, 0.004416227340698242, 0.004680156707763672, 0.0049440860748291016, 0.005208015441894531, 0.005471944808959961, 0.005735874176025391, 0.00599980354309082, 0.00626373291015625]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 7.0, 21.0, 25.0, 62.0, 73.0, 132.0, 177.0, 167.0, 149.0, 73.0, 64.0, 34.0, 11.0, 9.0, 6.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31661269068717957, -0.2956339716911316, -0.2746552526950836, -0.25367653369903564, -0.23269784450531006, -0.21171912550926208, -0.1907404065132141, -0.16976170241832733, -0.14878298342227936, -0.12780426442623138, -0.1068255603313446, -0.08584684133529663, -0.06486812978982925, -0.04388941824436188, -0.022910699248313904, -0.001931995153427124, 0.01904672384262085, 0.040025435388088226, 0.0610041506588459, 0.08198286592960358, 0.10296157747507095, 0.12394028902053833, 0.1449190080165863, 0.16589771211147308, 0.18687643110752106, 0.20785515010356903, 0.2288338541984558, 0.24981257319450378, 0.27079129219055176, 0.29176998138427734, 0.3127487301826477, 0.3337274193763733, 0.3547061085700989, 0.37568482756614685, 0.3966635465621948, 0.4176422357559204, 0.4386209547519684, 0.45959967374801636, 0.48057839274406433, 0.5015571117401123, 0.5225358009338379, 0.5435144901275635, 0.5644932389259338, 0.5854719281196594, 0.6064506769180298, 0.6274293661117554, 0.648408055305481, 0.6693868041038513, 0.6903655529022217, 0.7113442420959473, 0.7323229908943176, 0.7533016800880432, 0.7742804288864136, 0.7952591180801392, 0.8162378072738647, 0.8372165560722351, 0.8581952452659607, 0.8791739344596863, 0.9001526832580566, 0.9211313724517822, 0.9421101212501526, 0.9630888104438782, 0.9840675592422485, 1.0050462484359741, 1.0260249376296997]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 5.0, 1.0, 8.0, 11.0, 14.0, 15.0, 22.0, 17.0, 19.0, 22.0, 32.0, 30.0, 41.0, 46.0, 57.0, 58.0, 52.0, 59.0, 53.0, 54.0, 58.0, 42.0, 40.0, 39.0, 38.0, 29.0, 29.0, 20.0, 24.0, 18.0, 10.0, 14.0, 8.0, 7.0, 4.0, 6.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25978797674179077, -0.25141122937202454, -0.2430344671010971, -0.23465770483016968, -0.22628095746040344, -0.2179042100906372, -0.20952744781970978, -0.20115068554878235, -0.1927739381790161, -0.18439719080924988, -0.17602042853832245, -0.16764366626739502, -0.15926691889762878, -0.15089017152786255, -0.14251340925693512, -0.1341366469860077, -0.12575989961624146, -0.11738314479589462, -0.10900638997554779, -0.10062963515520096, -0.09225288033485413, -0.0838761255145073, -0.07549937069416046, -0.06712261587381363, -0.0587458610534668, -0.050369106233119965, -0.04199235141277313, -0.0336155965924263, -0.025238841772079468, -0.016862086951732635, -0.008485332131385803, -0.00010857731103897095, 0.008268177509307861, 0.016644932329654694, 0.025021687150001526, 0.03339844197034836, 0.04177519679069519, 0.05015195161104202, 0.058528706431388855, 0.06690546125173569, 0.07528221607208252, 0.08365897089242935, 0.09203572571277618, 0.10041248053312302, 0.10878923535346985, 0.11716599017381668, 0.1255427449941635, 0.13391950726509094, 0.14229625463485718, 0.1506730020046234, 0.15904976427555084, 0.16742652654647827, 0.1758032739162445, 0.18418002128601074, 0.19255678355693817, 0.2009335458278656, 0.20931029319763184, 0.21768704056739807, 0.2260638028383255, 0.23444056510925293, 0.24281731247901917, 0.2511940598487854, 0.259570837020874, 0.26794758439064026, 0.2763243317604065]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 5.0, 4.0, 5.0, 10.0, 12.0, 7.0, 29.0, 22.0, 40.0, 72.0, 107.0, 171.0, 274.0, 537.0, 1031.0, 2020.0, 4444.0, 10585.0, 29835.0, 117059.0, 681518.0, 144236.0, 34883.0, 11996.0, 4858.0, 2253.0, 1192.0, 601.0, 313.0, 159.0, 98.0, 62.0, 40.0, 28.0, 11.0, 14.0, 10.0, 8.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.33642578125, -0.323760986328125, -0.31109619140625, -0.298431396484375, -0.2857666015625, -0.273101806640625, -0.26043701171875, -0.247772216796875, -0.235107421875, -0.222442626953125, -0.20977783203125, -0.197113037109375, -0.1844482421875, -0.171783447265625, -0.15911865234375, -0.146453857421875, -0.1337890625, -0.121124267578125, -0.10845947265625, -0.095794677734375, -0.0831298828125, -0.070465087890625, -0.05780029296875, -0.045135498046875, -0.032470703125, -0.019805908203125, -0.00714111328125, 0.005523681640625, 0.0181884765625, 0.030853271484375, 0.04351806640625, 0.056182861328125, 0.06884765625, 0.081512451171875, 0.09417724609375, 0.106842041015625, 0.1195068359375, 0.132171630859375, 0.14483642578125, 0.157501220703125, 0.170166015625, 0.182830810546875, 0.19549560546875, 0.208160400390625, 0.2208251953125, 0.233489990234375, 0.24615478515625, 0.258819580078125, 0.271484375, 0.284149169921875, 0.29681396484375, 0.309478759765625, 0.3221435546875, 0.334808349609375, 0.34747314453125, 0.360137939453125, 0.372802734375, 0.385467529296875, 0.39813232421875, 0.410797119140625, 0.4234619140625, 0.436126708984375, 0.44879150390625, 0.461456298828125, 0.47412109375]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 6.0, 4.0, 3.0, 11.0, 15.0, 26.0, 34.0, 36.0, 47.0, 56.0, 86.0, 93.0, 82.0, 82.0, 105.0, 68.0, 55.0, 56.0, 43.0, 31.0, 30.0, 14.0, 15.0, 5.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50341796875, -0.47954559326171875, -0.4556732177734375, -0.43180084228515625, -0.407928466796875, -0.38405609130859375, -0.3601837158203125, -0.33631134033203125, -0.31243896484375, -0.28856658935546875, -0.2646942138671875, -0.24082183837890625, -0.216949462890625, -0.19307708740234375, -0.1692047119140625, -0.14533233642578125, -0.1214599609375, -0.09758758544921875, -0.0737152099609375, -0.04984283447265625, -0.025970458984375, -0.00209808349609375, 0.0217742919921875, 0.04564666748046875, 0.06951904296875, 0.09339141845703125, 0.1172637939453125, 0.14113616943359375, 0.165008544921875, 0.18888092041015625, 0.2127532958984375, 0.23662567138671875, 0.260498046875, 0.28437042236328125, 0.3082427978515625, 0.33211517333984375, 0.355987548828125, 0.37985992431640625, 0.4037322998046875, 0.42760467529296875, 0.45147705078125, 0.47534942626953125, 0.4992218017578125, 0.5230941772460938, 0.546966552734375, 0.5708389282226562, 0.5947113037109375, 0.6185836791992188, 0.6424560546875, 0.6663284301757812, 0.6902008056640625, 0.7140731811523438, 0.737945556640625, 0.7618179321289062, 0.7856903076171875, 0.8095626831054688, 0.83343505859375, 0.8573074340820312, 0.8811798095703125, 0.9050521850585938, 0.928924560546875, 0.9527969360351562, 0.9766693115234375, 1.0005416870117188, 1.0244140625]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 10.0, 3.0, 13.0, 10.0, 13.0, 17.0, 17.0, 25.0, 39.0, 40.0, 63.0, 93.0, 136.0, 251.0, 555.0, 1896.0, 11908.0, 184246.0, 818668.0, 25520.0, 3351.0, 826.0, 304.0, 145.0, 112.0, 74.0, 38.0, 42.0, 31.0, 28.0, 14.0, 20.0, 4.0, 10.0, 9.0, 4.0, 7.0, 3.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.78955078125, -0.762481689453125, -0.73541259765625, -0.708343505859375, -0.6812744140625, -0.654205322265625, -0.62713623046875, -0.600067138671875, -0.572998046875, -0.545928955078125, -0.51885986328125, -0.491790771484375, -0.4647216796875, -0.437652587890625, -0.41058349609375, -0.383514404296875, -0.3564453125, -0.329376220703125, -0.30230712890625, -0.275238037109375, -0.2481689453125, -0.221099853515625, -0.19403076171875, -0.166961669921875, -0.139892578125, -0.112823486328125, -0.08575439453125, -0.058685302734375, -0.0316162109375, -0.004547119140625, 0.02252197265625, 0.049591064453125, 0.07666015625, 0.103729248046875, 0.13079833984375, 0.157867431640625, 0.1849365234375, 0.212005615234375, 0.23907470703125, 0.266143798828125, 0.293212890625, 0.320281982421875, 0.34735107421875, 0.374420166015625, 0.4014892578125, 0.428558349609375, 0.45562744140625, 0.482696533203125, 0.509765625, 0.536834716796875, 0.56390380859375, 0.590972900390625, 0.6180419921875, 0.645111083984375, 0.67218017578125, 0.699249267578125, 0.726318359375, 0.753387451171875, 0.78045654296875, 0.807525634765625, 0.8345947265625, 0.861663818359375, 0.88873291015625, 0.915802001953125, 0.94287109375]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 6.0, 10.0, 5.0, 7.0, 12.0, 10.0, 14.0, 19.0, 21.0, 23.0, 29.0, 36.0, 31.0, 43.0, 58.0, 47.0, 43.0, 46.0, 53.0, 50.0, 52.0, 39.0, 46.0, 47.0, 41.0, 38.0, 23.0, 26.0, 19.0, 18.0, 19.0, 13.0, 12.0, 12.0, 5.0, 7.0, 4.0, 5.0, 1.0, 8.0, 4.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52783203125, -0.51116943359375, -0.4945068359375, -0.47784423828125, -0.461181640625, -0.44451904296875, -0.4278564453125, -0.41119384765625, -0.39453125, -0.37786865234375, -0.3612060546875, -0.34454345703125, -0.327880859375, -0.31121826171875, -0.2945556640625, -0.27789306640625, -0.26123046875, -0.24456787109375, -0.2279052734375, -0.21124267578125, -0.194580078125, -0.17791748046875, -0.1612548828125, -0.14459228515625, -0.1279296875, -0.11126708984375, -0.0946044921875, -0.07794189453125, -0.061279296875, -0.04461669921875, -0.0279541015625, -0.01129150390625, 0.00537109375, 0.02203369140625, 0.0386962890625, 0.05535888671875, 0.072021484375, 0.08868408203125, 0.1053466796875, 0.12200927734375, 0.138671875, 0.15533447265625, 0.1719970703125, 0.18865966796875, 0.205322265625, 0.22198486328125, 0.2386474609375, 0.25531005859375, 0.27197265625, 0.28863525390625, 0.3052978515625, 0.32196044921875, 0.338623046875, 0.35528564453125, 0.3719482421875, 0.38861083984375, 0.4052734375, 0.42193603515625, 0.4385986328125, 0.45526123046875, 0.471923828125, 0.48858642578125, 0.5052490234375, 0.52191162109375, 0.53857421875]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 1.0, 5.0, 6.0, 27.0, 29.0, 40.0, 110.0, 185.0, 367.0, 1112.0, 4477.0, 34412.0, 875485.0, 119417.0, 9939.0, 1885.0, 528.0, 237.0, 123.0, 49.0, 42.0, 27.0, 13.0, 8.0, 8.0, 7.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2010498046875, -0.1929149627685547, -0.18478012084960938, -0.17664527893066406, -0.16851043701171875, -0.16037559509277344, -0.15224075317382812, -0.1441059112548828, -0.1359710693359375, -0.1278362274169922, -0.11970138549804688, -0.11156654357910156, -0.10343170166015625, -0.09529685974121094, -0.08716201782226562, -0.07902717590332031, -0.070892333984375, -0.06275749206542969, -0.054622650146484375, -0.04648780822753906, -0.03835296630859375, -0.030218124389648438, -0.022083282470703125, -0.013948440551757812, -0.0058135986328125, 0.0023212432861328125, 0.010456085205078125, 0.018590927124023438, 0.02672576904296875, 0.03486061096191406, 0.042995452880859375, 0.05113029479980469, 0.05926513671875, 0.06739997863769531, 0.07553482055664062, 0.08366966247558594, 0.09180450439453125, 0.09993934631347656, 0.10807418823242188, 0.11620903015136719, 0.1243438720703125, 0.1324787139892578, 0.14061355590820312, 0.14874839782714844, 0.15688323974609375, 0.16501808166503906, 0.17315292358398438, 0.1812877655029297, 0.189422607421875, 0.1975574493408203, 0.20569229125976562, 0.21382713317871094, 0.22196197509765625, 0.23009681701660156, 0.23823165893554688, 0.2463665008544922, 0.2545013427734375, 0.2626361846923828, 0.2707710266113281, 0.27890586853027344, 0.28704071044921875, 0.29517555236816406, 0.3033103942871094, 0.3114452362060547, 0.319580078125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 6.0, 6.0, 7.0, 8.0, 7.0, 12.0, 25.0, 26.0, 45.0, 66.0, 140.0, 254.0, 167.0, 77.0, 42.0, 46.0, 25.0, 9.0, 7.0, 7.0, 4.0, 4.0, 4.0, 3.0, 3.0, 2.0, 0.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4557113647460938e-05, -2.3558735847473145e-05, -2.256035804748535e-05, -2.156198024749756e-05, -2.0563602447509766e-05, -1.9565224647521973e-05, -1.856684684753418e-05, -1.7568469047546387e-05, -1.6570091247558594e-05, -1.55717134475708e-05, -1.4573335647583008e-05, -1.3574957847595215e-05, -1.2576580047607422e-05, -1.1578202247619629e-05, -1.0579824447631836e-05, -9.581446647644043e-06, -8.58306884765625e-06, -7.584691047668457e-06, -6.586313247680664e-06, -5.587935447692871e-06, -4.589557647705078e-06, -3.591179847717285e-06, -2.592802047729492e-06, -1.5944242477416992e-06, -5.960464477539062e-07, 4.023313522338867e-07, 1.4007091522216797e-06, 2.3990869522094727e-06, 3.3974647521972656e-06, 4.395842552185059e-06, 5.3942203521728516e-06, 6.3925981521606445e-06, 7.3909759521484375e-06, 8.38935375213623e-06, 9.387731552124023e-06, 1.0386109352111816e-05, 1.138448715209961e-05, 1.2382864952087402e-05, 1.3381242752075195e-05, 1.4379620552062988e-05, 1.537799835205078e-05, 1.6376376152038574e-05, 1.7374753952026367e-05, 1.837313175201416e-05, 1.9371509552001953e-05, 2.0369887351989746e-05, 2.136826515197754e-05, 2.2366642951965332e-05, 2.3365020751953125e-05, 2.4363398551940918e-05, 2.536177635192871e-05, 2.6360154151916504e-05, 2.7358531951904297e-05, 2.835690975189209e-05, 2.9355287551879883e-05, 3.0353665351867676e-05, 3.135204315185547e-05, 3.235042095184326e-05, 3.3348798751831055e-05, 3.434717655181885e-05, 3.534555435180664e-05, 3.6343932151794434e-05, 3.7342309951782227e-05, 3.834068775177002e-05, 3.933906555175781e-05]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 3.0, 7.0, 10.0, 16.0, 23.0, 36.0, 73.0, 100.0, 194.0, 336.0, 721.0, 1865.0, 8157.0, 85213.0, 884771.0, 57695.0, 6366.0, 1583.0, 634.0, 304.0, 186.0, 95.0, 59.0, 42.0, 23.0, 10.0, 9.0, 2.0, 10.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.3154296875, -0.3074302673339844, -0.29943084716796875, -0.2914314270019531, -0.2834320068359375, -0.2754325866699219, -0.26743316650390625, -0.2594337463378906, -0.251434326171875, -0.24343490600585938, -0.23543548583984375, -0.22743606567382812, -0.2194366455078125, -0.21143722534179688, -0.20343780517578125, -0.19543838500976562, -0.18743896484375, -0.17943954467773438, -0.17144012451171875, -0.16344070434570312, -0.1554412841796875, -0.14744186401367188, -0.13944244384765625, -0.13144302368164062, -0.123443603515625, -0.11544418334960938, -0.10744476318359375, -0.09944534301757812, -0.0914459228515625, -0.08344650268554688, -0.07544708251953125, -0.06744766235351562, -0.0594482421875, -0.051448822021484375, -0.04344940185546875, -0.035449981689453125, -0.0274505615234375, -0.019451141357421875, -0.01145172119140625, -0.003452301025390625, 0.004547119140625, 0.012546539306640625, 0.02054595947265625, 0.028545379638671875, 0.0365447998046875, 0.044544219970703125, 0.05254364013671875, 0.060543060302734375, 0.06854248046875, 0.07654190063476562, 0.08454132080078125, 0.09254074096679688, 0.1005401611328125, 0.10853958129882812, 0.11653900146484375, 0.12453842163085938, 0.132537841796875, 0.14053726196289062, 0.14853668212890625, 0.15653610229492188, 0.1645355224609375, 0.17253494262695312, 0.18053436279296875, 0.18853378295898438, 0.196533203125]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 6.0, 3.0, 7.0, 2.0, 13.0, 13.0, 11.0, 9.0, 28.0, 18.0, 30.0, 35.0, 56.0, 71.0, 158.0, 193.0, 97.0, 55.0, 39.0, 27.0, 34.0, 24.0, 19.0, 14.0, 11.0, 9.0, 9.0, 2.0, 3.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.045318603515625, -0.04343843460083008, -0.041558265686035156, -0.039678096771240234, -0.03779792785644531, -0.03591775894165039, -0.03403759002685547, -0.03215742111206055, -0.030277252197265625, -0.028397083282470703, -0.02651691436767578, -0.02463674545288086, -0.022756576538085938, -0.020876407623291016, -0.018996238708496094, -0.017116069793701172, -0.01523590087890625, -0.013355731964111328, -0.011475563049316406, -0.009595394134521484, -0.0077152252197265625, -0.005835056304931641, -0.003954887390136719, -0.002074718475341797, -0.000194549560546875, 0.0016856193542480469, 0.0035657882690429688, 0.005445957183837891, 0.0073261260986328125, 0.009206295013427734, 0.011086463928222656, 0.012966632843017578, 0.0148468017578125, 0.016726970672607422, 0.018607139587402344, 0.020487308502197266, 0.022367477416992188, 0.02424764633178711, 0.02612781524658203, 0.028007984161376953, 0.029888153076171875, 0.0317683219909668, 0.03364849090576172, 0.03552865982055664, 0.03740882873535156, 0.039288997650146484, 0.041169166564941406, 0.04304933547973633, 0.04492950439453125, 0.04680967330932617, 0.048689842224121094, 0.050570011138916016, 0.05245018005371094, 0.05433034896850586, 0.05621051788330078, 0.0580906867980957, 0.059970855712890625, 0.06185102462768555, 0.06373119354248047, 0.06561136245727539, 0.06749153137207031, 0.06937170028686523, 0.07125186920166016, 0.07313203811645508, 0.07501220703125]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [10.0, 24.0, 52.0, 161.0, 318.0, 259.0, 132.0, 35.0, 19.0, 7.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35728853940963745, -0.2844151258468628, -0.21154168248176575, -0.1386682540178299, -0.06579482555389404, 0.007078588008880615, 0.07995203137397766, 0.1528254747390747, 0.22569888830184937, 0.298572301864624, 0.37144574522972107, 0.4443191885948181, 0.5171926021575928, 0.5900660157203674, 0.6629394292831421, 0.7358129024505615, 0.8086863160133362, 0.8815597295761108, 0.9544332027435303, 1.0273065567016602, 1.1001800298690796, 1.173053503036499, 1.245926856994629, 1.3188003301620483, 1.3916738033294678, 1.4645472764968872, 1.537420630455017, 1.6102941036224365, 1.6831674575805664, 1.7560409307479858, 1.8289144039154053, 1.9017877578735352, 1.9746613502502441, 2.047534704208374, 2.120408296585083, 2.193281650543213, 2.2661550045013428, 2.3390283584594727, 2.4119019508361816, 2.4847753047943115, 2.5576486587524414, 2.6305220127105713, 2.7033956050872803, 2.77626895904541, 2.84914231300354, 2.92201566696167, 2.994889259338379, 3.067762613296509, 3.1406362056732178, 3.2135095596313477, 3.2863831520080566, 3.3592565059661865, 3.4321298599243164, 3.5050034523010254, 3.5778768062591553, 3.650750160217285, 3.723623752593994, 3.796497106552124, 3.869370698928833, 3.942244052886963, 4.015117645263672, 4.087990760803223, 4.160864353179932, 4.233737945556641, 4.306611061096191]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 6.0, 4.0, 7.0, 6.0, 12.0, 9.0, 11.0, 26.0, 19.0, 20.0, 26.0, 27.0, 28.0, 34.0, 37.0, 41.0, 39.0, 50.0, 48.0, 42.0, 48.0, 55.0, 46.0, 49.0, 50.0, 33.0, 36.0, 25.0, 28.0, 35.0, 20.0, 21.0, 11.0, 13.0, 9.0, 13.0, 4.0, 6.0, 6.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7250390648841858, -0.6977466344833374, -0.6704542636871338, -0.6431618332862854, -0.615869402885437, -0.5885770320892334, -0.561284601688385, -0.5339921712875366, -0.506699800491333, -0.479407399892807, -0.452114999294281, -0.4248225688934326, -0.3975301682949066, -0.3702377676963806, -0.3429453372955322, -0.3156529366970062, -0.2883605360984802, -0.2610681354999542, -0.23377572000026703, -0.20648330450057983, -0.17919090390205383, -0.15189850330352783, -0.12460608780384064, -0.09731367230415344, -0.07002127170562744, -0.042728863656520844, -0.015436455607414246, 0.011855952441692352, 0.03914836049079895, 0.06644076108932495, 0.09373317658901215, 0.12102559208869934, 0.14831793308258057, 0.17561033368110657, 0.20290274918079376, 0.23019516468048096, 0.25748756527900696, 0.28477996587753296, 0.31207239627838135, 0.33936479687690735, 0.36665719747543335, 0.39394959807395935, 0.42124199867248535, 0.44853442907333374, 0.47582682967185974, 0.5031192302703857, 0.5304116606712341, 0.5577040910720825, 0.5849964618682861, 0.6122888922691345, 0.6395812630653381, 0.6668736934661865, 0.6941660642623901, 0.7214584946632385, 0.7487509250640869, 0.7760432958602905, 0.8033357262611389, 0.8306281566619873, 0.8579205274581909, 0.8852129578590393, 0.9125053882598877, 0.9397977590560913, 0.9670901894569397, 0.9943826198577881, 1.0216749906539917]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 6.0, 9.0, 12.0, 25.0, 36.0, 85.0, 139.0, 288.0, 584.0, 1489.0, 5168.0, 28102.0, 814403.0, 3238712.0, 90786.0, 10295.0, 2447.0, 921.0, 378.0, 193.0, 90.0, 50.0, 29.0, 15.0, 8.0, 5.0, 2.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.82763671875, -0.8034515380859375, -0.779266357421875, -0.7550811767578125, -0.73089599609375, -0.7067108154296875, -0.682525634765625, -0.6583404541015625, -0.6341552734375, -0.6099700927734375, -0.585784912109375, -0.5615997314453125, -0.53741455078125, -0.5132293701171875, -0.489044189453125, -0.4648590087890625, -0.440673828125, -0.4164886474609375, -0.392303466796875, -0.3681182861328125, -0.34393310546875, -0.3197479248046875, -0.295562744140625, -0.2713775634765625, -0.2471923828125, -0.2230072021484375, -0.198822021484375, -0.1746368408203125, -0.15045166015625, -0.1262664794921875, -0.102081298828125, -0.0778961181640625, -0.0537109375, -0.0295257568359375, -0.005340576171875, 0.0188446044921875, 0.04302978515625, 0.0672149658203125, 0.091400146484375, 0.1155853271484375, 0.1397705078125, 0.1639556884765625, 0.188140869140625, 0.2123260498046875, 0.23651123046875, 0.2606964111328125, 0.284881591796875, 0.3090667724609375, 0.333251953125, 0.3574371337890625, 0.381622314453125, 0.4058074951171875, 0.42999267578125, 0.4541778564453125, 0.478363037109375, 0.5025482177734375, 0.5267333984375, 0.5509185791015625, 0.575103759765625, 0.5992889404296875, 0.62347412109375, 0.6476593017578125, 0.671844482421875, 0.6960296630859375, 0.72021484375]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 4.0, 10.0, 9.0, 2.0, 11.0, 15.0, 14.0, 16.0, 15.0, 18.0, 26.0, 27.0, 24.0, 31.0, 44.0, 41.0, 46.0, 37.0, 50.0, 47.0, 42.0, 42.0, 41.0, 43.0, 52.0, 39.0, 30.0, 33.0, 30.0, 26.0, 25.0, 13.0, 19.0, 14.0, 16.0, 8.0, 10.0, 7.0, 5.0, 5.0, 6.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.252197265625, -0.24477386474609375, -0.2373504638671875, -0.22992706298828125, -0.222503662109375, -0.21508026123046875, -0.2076568603515625, -0.20023345947265625, -0.19281005859375, -0.18538665771484375, -0.1779632568359375, -0.17053985595703125, -0.163116455078125, -0.15569305419921875, -0.1482696533203125, -0.14084625244140625, -0.1334228515625, -0.12599945068359375, -0.1185760498046875, -0.11115264892578125, -0.103729248046875, -0.09630584716796875, -0.0888824462890625, -0.08145904541015625, -0.07403564453125, -0.06661224365234375, -0.0591888427734375, -0.05176544189453125, -0.044342041015625, -0.03691864013671875, -0.0294952392578125, -0.02207183837890625, -0.0146484375, -0.00722503662109375, 0.0001983642578125, 0.00762176513671875, 0.015045166015625, 0.02246856689453125, 0.0298919677734375, 0.03731536865234375, 0.04473876953125, 0.05216217041015625, 0.0595855712890625, 0.06700897216796875, 0.074432373046875, 0.08185577392578125, 0.0892791748046875, 0.09670257568359375, 0.1041259765625, 0.11154937744140625, 0.1189727783203125, 0.12639617919921875, 0.133819580078125, 0.14124298095703125, 0.1486663818359375, 0.15608978271484375, 0.16351318359375, 0.17093658447265625, 0.1783599853515625, 0.18578338623046875, 0.193206787109375, 0.20063018798828125, 0.2080535888671875, 0.21547698974609375, 0.222900390625]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 0.0, 5.0, 3.0, 11.0, 11.0, 9.0, 27.0, 44.0, 45.0, 75.0, 205.0, 503.0, 1676.0, 9685.0, 293513.0, 3848566.0, 34818.0, 3592.0, 872.0, 307.0, 153.0, 65.0, 36.0, 16.0, 14.0, 7.0, 7.0, 6.0, 6.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.26171875, -1.2237701416015625, -1.185821533203125, -1.1478729248046875, -1.10992431640625, -1.0719757080078125, -1.034027099609375, -0.9960784912109375, -0.9581298828125, -0.9201812744140625, -0.882232666015625, -0.8442840576171875, -0.80633544921875, -0.7683868408203125, -0.730438232421875, -0.6924896240234375, -0.654541015625, -0.6165924072265625, -0.578643798828125, -0.5406951904296875, -0.50274658203125, -0.4647979736328125, -0.426849365234375, -0.3889007568359375, -0.3509521484375, -0.3130035400390625, -0.275054931640625, -0.2371063232421875, -0.19915771484375, -0.1612091064453125, -0.123260498046875, -0.0853118896484375, -0.04736328125, -0.0094146728515625, 0.028533935546875, 0.0664825439453125, 0.10443115234375, 0.1423797607421875, 0.180328369140625, 0.2182769775390625, 0.2562255859375, 0.2941741943359375, 0.332122802734375, 0.3700714111328125, 0.40802001953125, 0.4459686279296875, 0.483917236328125, 0.5218658447265625, 0.559814453125, 0.5977630615234375, 0.635711669921875, 0.6736602783203125, 0.71160888671875, 0.7495574951171875, 0.787506103515625, 0.8254547119140625, 0.8634033203125, 0.9013519287109375, 0.939300537109375, 0.9772491455078125, 1.01519775390625, 1.0531463623046875, 1.091094970703125, 1.1290435791015625, 1.1669921875]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 11.0, 8.0, 11.0, 13.0, 15.0, 28.0, 27.0, 55.0, 90.0, 142.0, 264.0, 423.0, 595.0, 759.0, 619.0, 358.0, 231.0, 134.0, 89.0, 50.0, 33.0, 39.0, 14.0, 7.0, 10.0, 8.0, 10.0, 1.0, 3.0, 3.0, 2.0, 3.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.15185546875, -0.14686012268066406, -0.14186477661132812, -0.1368694305419922, -0.13187408447265625, -0.1268787384033203, -0.12188339233398438, -0.11688804626464844, -0.1118927001953125, -0.10689735412597656, -0.10190200805664062, -0.09690666198730469, -0.09191131591796875, -0.08691596984863281, -0.08192062377929688, -0.07692527770996094, -0.071929931640625, -0.06693458557128906, -0.061939239501953125, -0.05694389343261719, -0.05194854736328125, -0.04695320129394531, -0.041957855224609375, -0.03696250915527344, -0.0319671630859375, -0.026971817016601562, -0.021976470947265625, -0.016981124877929688, -0.01198577880859375, -0.0069904327392578125, -0.001995086669921875, 0.0030002593994140625, 0.00799560546875, 0.012990951538085938, 0.017986297607421875, 0.022981643676757812, 0.02797698974609375, 0.03297233581542969, 0.037967681884765625, 0.04296302795410156, 0.0479583740234375, 0.05295372009277344, 0.057949066162109375, 0.06294441223144531, 0.06793975830078125, 0.07293510437011719, 0.07793045043945312, 0.08292579650878906, 0.087921142578125, 0.09291648864746094, 0.09791183471679688, 0.10290718078613281, 0.10790252685546875, 0.11289787292480469, 0.11789321899414062, 0.12288856506347656, 0.1278839111328125, 0.13287925720214844, 0.13787460327148438, 0.1428699493408203, 0.14786529541015625, 0.1528606414794922, 0.15785598754882812, 0.16285133361816406, 0.1678466796875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 9.0, 6.0, 11.0, 3.0, 16.0, 12.0, 22.0, 24.0, 31.0, 34.0, 36.0, 44.0, 58.0, 75.0, 65.0, 75.0, 55.0, 75.0, 59.0, 68.0, 34.0, 38.0, 31.0, 28.0, 30.0, 20.0, 10.0, 14.0, 7.0, 6.0, 4.0, 5.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.5012553334236145, -0.48900681734085083, -0.47675830125808716, -0.4645098149776459, -0.4522612988948822, -0.44001278281211853, -0.42776426672935486, -0.4155157804489136, -0.4032672643661499, -0.39101874828338623, -0.37877023220062256, -0.3665217459201813, -0.3542732298374176, -0.34202471375465393, -0.32977619767189026, -0.317527711391449, -0.3052791953086853, -0.29303067922592163, -0.28078216314315796, -0.2685336768627167, -0.256285160779953, -0.24403664469718933, -0.23178812861442566, -0.21953962743282318, -0.20729109644889832, -0.19504258036613464, -0.18279407918453217, -0.1705455631017685, -0.15829706192016602, -0.14604854583740234, -0.13380002975463867, -0.1215515285730362, -0.10930302739143372, -0.09705451875925064, -0.08480601012706757, -0.0725574940443039, -0.06030898913741112, -0.04806048050522804, -0.03581196814775467, -0.023563459515571594, -0.01131495088338852, 0.0009335586801171303, 0.01318206824362278, 0.025430578738451004, 0.03767908737063408, 0.049927596002817154, 0.06217610836029053, 0.0744246169924736, 0.08667312562465668, 0.09892163425683975, 0.11117014288902283, 0.1234186589717865, 0.13566716015338898, 0.14791567623615265, 0.16016417741775513, 0.1724126935005188, 0.18466120958328247, 0.19690972566604614, 0.20915822684764862, 0.2214067429304123, 0.23365524411201477, 0.24590376019477844, 0.2581522762775421, 0.2704007625579834, 0.28264927864074707]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 2.0, 3.0, 3.0, 3.0, 4.0, 5.0, 7.0, 6.0, 6.0, 12.0, 12.0, 11.0, 17.0, 16.0, 16.0, 20.0, 28.0, 20.0, 20.0, 34.0, 41.0, 32.0, 36.0, 30.0, 39.0, 35.0, 45.0, 42.0, 40.0, 41.0, 40.0, 39.0, 28.0, 38.0, 26.0, 34.0, 26.0, 25.0, 18.0, 24.0, 14.0, 10.0, 10.0, 14.0, 7.0, 6.0, 7.0, 5.0, 4.0, 6.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.29343488812446594, -0.28508466482162476, -0.27673447132110596, -0.26838427782058716, -0.26003405451774597, -0.2516838312149048, -0.243333637714386, -0.234983429312706, -0.226633220911026, -0.218283012509346, -0.20993280410766602, -0.20158259570598602, -0.19323238730430603, -0.18488217890262604, -0.17653197050094604, -0.16818176209926605, -0.15983155369758606, -0.15148134529590607, -0.14313113689422607, -0.13478092849254608, -0.1264307200908661, -0.1180805116891861, -0.1097303032875061, -0.10138009488582611, -0.09302988648414612, -0.08467967808246613, -0.07632946968078613, -0.06797926127910614, -0.05962905287742615, -0.051278844475746155, -0.04292863607406616, -0.03457842767238617, -0.02622818946838379, -0.017877981066703796, -0.009527772665023804, -0.001177564263343811, 0.007172644138336182, 0.015522852540016174, 0.023873060941696167, 0.03222326934337616, 0.04057347774505615, 0.048923686146736145, 0.05727389454841614, 0.06562410295009613, 0.07397431135177612, 0.08232451975345612, 0.09067472815513611, 0.0990249365568161, 0.1073751449584961, 0.11572535336017609, 0.12407556176185608, 0.13242577016353607, 0.14077597856521606, 0.14912618696689606, 0.15747639536857605, 0.16582660377025604, 0.17417681217193604, 0.18252702057361603, 0.19087722897529602, 0.199227437376976, 0.207577645778656, 0.215927854180336, 0.224278062582016, 0.23262827098369598, 0.24097847938537598]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 2.0, 3.0, 6.0, 8.0, 10.0, 7.0, 22.0, 33.0, 59.0, 86.0, 113.0, 179.0, 271.0, 411.0, 664.0, 1044.0, 1578.0, 2627.0, 4698.0, 8145.0, 16173.0, 46722.0, 231198.0, 534816.0, 137593.0, 32196.0, 12892.0, 6733.0, 3944.0, 2360.0, 1484.0, 906.0, 571.0, 343.0, 218.0, 145.0, 79.0, 80.0, 54.0, 22.0, 14.0, 17.0, 12.0, 3.0, 5.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.12066650390625, -0.11704826354980469, -0.11343002319335938, -0.10981178283691406, -0.10619354248046875, -0.10257530212402344, -0.09895706176757812, -0.09533882141113281, -0.0917205810546875, -0.08810234069824219, -0.08448410034179688, -0.08086585998535156, -0.07724761962890625, -0.07362937927246094, -0.07001113891601562, -0.06639289855957031, -0.062774658203125, -0.05915641784667969, -0.055538177490234375, -0.05191993713378906, -0.04830169677734375, -0.04468345642089844, -0.041065216064453125, -0.03744697570800781, -0.0338287353515625, -0.030210494995117188, -0.026592254638671875, -0.022974014282226562, -0.01935577392578125, -0.015737533569335938, -0.012119293212890625, -0.008501052856445312, -0.0048828125, -0.0012645721435546875, 0.002353668212890625, 0.0059719085693359375, 0.00959014892578125, 0.013208389282226562, 0.016826629638671875, 0.020444869995117188, 0.0240631103515625, 0.027681350708007812, 0.031299591064453125, 0.03491783142089844, 0.03853607177734375, 0.04215431213378906, 0.045772552490234375, 0.04939079284667969, 0.053009033203125, 0.05662727355957031, 0.060245513916015625, 0.06386375427246094, 0.06748199462890625, 0.07110023498535156, 0.07471847534179688, 0.07833671569824219, 0.0819549560546875, 0.08557319641113281, 0.08919143676757812, 0.09280967712402344, 0.09642791748046875, 0.10004615783691406, 0.10366439819335938, 0.10728263854980469, 0.11090087890625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 2.0, 3.0, 7.0, 8.0, 3.0, 7.0, 9.0, 5.0, 7.0, 12.0, 14.0, 15.0, 13.0, 19.0, 30.0, 20.0, 38.0, 42.0, 32.0, 33.0, 33.0, 38.0, 53.0, 35.0, 42.0, 46.0, 38.0, 43.0, 50.0, 39.0, 39.0, 31.0, 35.0, 28.0, 18.0, 16.0, 17.0, 15.0, 15.0, 12.0, 7.0, 10.0, 8.0, 2.0, 4.0, 4.0, 6.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0], "bins": [-0.17919921875, -0.17395401000976562, -0.16870880126953125, -0.16346359252929688, -0.1582183837890625, -0.15297317504882812, -0.14772796630859375, -0.14248275756835938, -0.137237548828125, -0.13199234008789062, -0.12674713134765625, -0.12150192260742188, -0.1162567138671875, -0.11101150512695312, -0.10576629638671875, -0.10052108764648438, -0.09527587890625, -0.09003067016601562, -0.08478546142578125, -0.07954025268554688, -0.0742950439453125, -0.06904983520507812, -0.06380462646484375, -0.058559417724609375, -0.053314208984375, -0.048069000244140625, -0.04282379150390625, -0.037578582763671875, -0.0323333740234375, -0.027088165283203125, -0.02184295654296875, -0.016597747802734375, -0.0113525390625, -0.006107330322265625, -0.00086212158203125, 0.004383087158203125, 0.0096282958984375, 0.014873504638671875, 0.02011871337890625, 0.025363922119140625, 0.030609130859375, 0.035854339599609375, 0.04109954833984375, 0.046344757080078125, 0.0515899658203125, 0.056835174560546875, 0.06208038330078125, 0.06732559204101562, 0.07257080078125, 0.07781600952148438, 0.08306121826171875, 0.08830642700195312, 0.0935516357421875, 0.09879684448242188, 0.10404205322265625, 0.10928726196289062, 0.114532470703125, 0.11977767944335938, 0.12502288818359375, 0.13026809692382812, 0.1355133056640625, 0.14075851440429688, 0.14600372314453125, 0.15124893188476562, 0.156494140625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 0.0, 5.0, 4.0, 3.0, 3.0, 7.0, 1.0, 8.0, 7.0, 16.0, 35.0, 31.0, 51.0, 60.0, 113.0, 166.0, 309.0, 462.0, 793.0, 1533.0, 3271.0, 7348.0, 19212.0, 68785.0, 321895.0, 458665.0, 118339.0, 28540.0, 10060.0, 4314.0, 1988.0, 1082.0, 604.0, 310.0, 191.0, 137.0, 75.0, 40.0, 29.0, 24.0, 13.0, 10.0, 4.0, 6.0, 8.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08935546875, -0.08681488037109375, -0.0842742919921875, -0.08173370361328125, -0.079193115234375, -0.07665252685546875, -0.0741119384765625, -0.07157135009765625, -0.06903076171875, -0.06649017333984375, -0.0639495849609375, -0.06140899658203125, -0.058868408203125, -0.05632781982421875, -0.0537872314453125, -0.05124664306640625, -0.0487060546875, -0.04616546630859375, -0.0436248779296875, -0.04108428955078125, -0.038543701171875, -0.03600311279296875, -0.0334625244140625, -0.03092193603515625, -0.02838134765625, -0.02584075927734375, -0.0233001708984375, -0.02075958251953125, -0.018218994140625, -0.01567840576171875, -0.0131378173828125, -0.01059722900390625, -0.008056640625, -0.00551605224609375, -0.0029754638671875, -0.00043487548828125, 0.002105712890625, 0.00464630126953125, 0.0071868896484375, 0.00972747802734375, 0.01226806640625, 0.01480865478515625, 0.0173492431640625, 0.01988983154296875, 0.022430419921875, 0.02497100830078125, 0.0275115966796875, 0.03005218505859375, 0.0325927734375, 0.03513336181640625, 0.0376739501953125, 0.04021453857421875, 0.042755126953125, 0.04529571533203125, 0.0478363037109375, 0.05037689208984375, 0.05291748046875, 0.05545806884765625, 0.0579986572265625, 0.06053924560546875, 0.063079833984375, 0.06562042236328125, 0.0681610107421875, 0.07070159912109375, 0.0732421875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 3.0, 2.0, 6.0, 8.0, 15.0, 9.0, 16.0, 22.0, 17.0, 17.0, 19.0, 25.0, 21.0, 27.0, 28.0, 26.0, 40.0, 30.0, 33.0, 29.0, 41.0, 45.0, 40.0, 49.0, 40.0, 41.0, 39.0, 37.0, 35.0, 42.0, 28.0, 22.0, 21.0, 16.0, 14.0, 11.0, 12.0, 11.0, 16.0, 7.0, 11.0, 8.0, 4.0, 4.0, 4.0, 2.0, 6.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.305419921875, -0.2958984375, -0.286376953125, -0.27685546875, -0.267333984375, -0.2578125, -0.248291015625, -0.23876953125, -0.229248046875, -0.2197265625, -0.210205078125, -0.20068359375, -0.191162109375, -0.181640625, -0.172119140625, -0.16259765625, -0.153076171875, -0.1435546875, -0.134033203125, -0.12451171875, -0.114990234375, -0.10546875, -0.095947265625, -0.08642578125, -0.076904296875, -0.0673828125, -0.057861328125, -0.04833984375, -0.038818359375, -0.029296875, -0.019775390625, -0.01025390625, -0.000732421875, 0.0087890625, 0.018310546875, 0.02783203125, 0.037353515625, 0.046875, 0.056396484375, 0.06591796875, 0.075439453125, 0.0849609375, 0.094482421875, 0.10400390625, 0.113525390625, 0.123046875, 0.132568359375, 0.14208984375, 0.151611328125, 0.1611328125, 0.170654296875, 0.18017578125, 0.189697265625, 0.19921875, 0.208740234375, 0.21826171875, 0.227783203125, 0.2373046875, 0.246826171875, 0.25634765625, 0.265869140625, 0.275390625, 0.284912109375, 0.29443359375, 0.303955078125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 6.0, 2.0, 5.0, 6.0, 6.0, 11.0, 15.0, 37.0, 66.0, 107.0, 163.0, 293.0, 562.0, 1007.0, 2300.0, 5793.0, 16660.0, 61985.0, 278616.0, 490884.0, 140168.0, 32768.0, 10007.0, 3814.0, 1602.0, 762.0, 358.0, 202.0, 132.0, 82.0, 49.0, 27.0, 20.0, 15.0, 7.0, 8.0, 5.0, 6.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0234375, -0.022608518600463867, -0.021779537200927734, -0.0209505558013916, -0.02012157440185547, -0.019292593002319336, -0.018463611602783203, -0.01763463020324707, -0.016805648803710938, -0.015976667404174805, -0.015147686004638672, -0.014318704605102539, -0.013489723205566406, -0.012660741806030273, -0.01183176040649414, -0.011002779006958008, -0.010173797607421875, -0.009344816207885742, -0.00851583480834961, -0.0076868534088134766, -0.006857872009277344, -0.006028890609741211, -0.005199909210205078, -0.004370927810668945, -0.0035419464111328125, -0.0027129650115966797, -0.0018839836120605469, -0.001055002212524414, -0.00022602081298828125, 0.0006029605865478516, 0.0014319419860839844, 0.002260923385620117, 0.00308990478515625, 0.003918886184692383, 0.004747867584228516, 0.0055768489837646484, 0.006405830383300781, 0.007234811782836914, 0.008063793182373047, 0.00889277458190918, 0.009721755981445312, 0.010550737380981445, 0.011379718780517578, 0.012208700180053711, 0.013037681579589844, 0.013866662979125977, 0.01469564437866211, 0.015524625778198242, 0.016353607177734375, 0.017182588577270508, 0.01801156997680664, 0.018840551376342773, 0.019669532775878906, 0.02049851417541504, 0.021327495574951172, 0.022156476974487305, 0.022985458374023438, 0.02381443977355957, 0.024643421173095703, 0.025472402572631836, 0.02630138397216797, 0.0271303653717041, 0.027959346771240234, 0.028788328170776367, 0.0296173095703125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 5.0, 1.0, 1.0, 4.0, 4.0, 11.0, 2.0, 10.0, 6.0, 16.0, 24.0, 24.0, 29.0, 45.0, 55.0, 61.0, 81.0, 93.0, 71.0, 76.0, 72.0, 73.0, 62.0, 35.0, 32.0, 33.0, 18.0, 9.0, 15.0, 12.0, 6.0, 6.0, 1.0, 4.0, 2.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2516975402832031e-05, -1.2025237083435059e-05, -1.1533498764038086e-05, -1.1041760444641113e-05, -1.055002212524414e-05, -1.0058283805847168e-05, -9.566545486450195e-06, -9.074807167053223e-06, -8.58306884765625e-06, -8.091330528259277e-06, -7.599592208862305e-06, -7.107853889465332e-06, -6.616115570068359e-06, -6.124377250671387e-06, -5.632638931274414e-06, -5.140900611877441e-06, -4.649162292480469e-06, -4.157423973083496e-06, -3.6656856536865234e-06, -3.1739473342895508e-06, -2.682209014892578e-06, -2.1904706954956055e-06, -1.6987323760986328e-06, -1.2069940567016602e-06, -7.152557373046875e-07, -2.2351741790771484e-07, 2.682209014892578e-07, 7.599592208862305e-07, 1.2516975402832031e-06, 1.7434358596801758e-06, 2.2351741790771484e-06, 2.726912498474121e-06, 3.2186508178710938e-06, 3.7103891372680664e-06, 4.202127456665039e-06, 4.693865776062012e-06, 5.185604095458984e-06, 5.677342414855957e-06, 6.16908073425293e-06, 6.660819053649902e-06, 7.152557373046875e-06, 7.644295692443848e-06, 8.13603401184082e-06, 8.627772331237793e-06, 9.119510650634766e-06, 9.611248970031738e-06, 1.0102987289428711e-05, 1.0594725608825684e-05, 1.1086463928222656e-05, 1.1578202247619629e-05, 1.2069940567016602e-05, 1.2561678886413574e-05, 1.3053417205810547e-05, 1.354515552520752e-05, 1.4036893844604492e-05, 1.4528632164001465e-05, 1.5020370483398438e-05, 1.551210880279541e-05, 1.6003847122192383e-05, 1.6495585441589355e-05, 1.6987323760986328e-05, 1.74790620803833e-05, 1.7970800399780273e-05, 1.8462538719177246e-05, 1.895427703857422e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 6.0, 3.0, 11.0, 10.0, 12.0, 12.0, 29.0, 29.0, 52.0, 65.0, 95.0, 138.0, 209.0, 318.0, 564.0, 882.0, 1543.0, 2682.0, 4897.0, 9906.0, 21999.0, 51450.0, 131740.0, 299048.0, 298017.0, 130078.0, 51141.0, 21825.0, 9991.0, 5013.0, 2737.0, 1530.0, 951.0, 543.0, 322.0, 227.0, 146.0, 100.0, 66.0, 45.0, 29.0, 33.0, 18.0, 18.0, 9.0, 8.0, 3.0, 5.0, 6.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0214691162109375, -0.020818471908569336, -0.020167827606201172, -0.019517183303833008, -0.018866539001464844, -0.01821589469909668, -0.017565250396728516, -0.01691460609436035, -0.016263961791992188, -0.015613317489624023, -0.01496267318725586, -0.014312028884887695, -0.013661384582519531, -0.013010740280151367, -0.012360095977783203, -0.011709451675415039, -0.011058807373046875, -0.010408163070678711, -0.009757518768310547, -0.009106874465942383, -0.008456230163574219, -0.007805585861206055, -0.007154941558837891, -0.0065042972564697266, -0.0058536529541015625, -0.0052030086517333984, -0.004552364349365234, -0.0039017200469970703, -0.0032510757446289062, -0.002600431442260742, -0.0019497871398925781, -0.001299142837524414, -0.00064849853515625, 2.1457672119140625e-06, 0.0006527900695800781, 0.0013034343719482422, 0.0019540786743164062, 0.0026047229766845703, 0.0032553672790527344, 0.0039060115814208984, 0.0045566558837890625, 0.0052073001861572266, 0.005857944488525391, 0.006508588790893555, 0.007159233093261719, 0.007809877395629883, 0.008460521697998047, 0.009111166000366211, 0.009761810302734375, 0.010412454605102539, 0.011063098907470703, 0.011713743209838867, 0.012364387512207031, 0.013015031814575195, 0.01366567611694336, 0.014316320419311523, 0.014966964721679688, 0.015617609024047852, 0.016268253326416016, 0.01691889762878418, 0.017569541931152344, 0.018220186233520508, 0.018870830535888672, 0.019521474838256836, 0.020172119140625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 4.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 6.0, 1.0, 4.0, 6.0, 6.0, 9.0, 7.0, 14.0, 16.0, 13.0, 19.0, 32.0, 33.0, 35.0, 30.0, 43.0, 46.0, 69.0, 61.0, 58.0, 38.0, 55.0, 64.0, 57.0, 39.0, 29.0, 42.0, 27.0, 34.0, 20.0, 19.0, 8.0, 8.0, 4.0, 8.0, 5.0, 10.0, 3.0, 6.0, 3.0, 2.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.005176544189453125, -0.005019545555114746, -0.004862546920776367, -0.004705548286437988, -0.004548549652099609, -0.0043915510177612305, -0.0042345523834228516, -0.004077553749084473, -0.003920555114746094, -0.003763556480407715, -0.003606557846069336, -0.003449559211730957, -0.003292560577392578, -0.0031355619430541992, -0.0029785633087158203, -0.0028215646743774414, -0.0026645660400390625, -0.0025075674057006836, -0.0023505687713623047, -0.0021935701370239258, -0.002036571502685547, -0.001879572868347168, -0.001722574234008789, -0.0015655755996704102, -0.0014085769653320312, -0.0012515783309936523, -0.0010945796966552734, -0.0009375810623168945, -0.0007805824279785156, -0.0006235837936401367, -0.0004665851593017578, -0.0003095865249633789, -0.000152587890625, 4.410743713378906e-06, 0.0001614093780517578, 0.0003184080123901367, 0.0004754066467285156, 0.0006324052810668945, 0.0007894039154052734, 0.0009464025497436523, 0.0011034011840820312, 0.0012603998184204102, 0.001417398452758789, 0.001574397087097168, 0.0017313957214355469, 0.0018883943557739258, 0.0020453929901123047, 0.0022023916244506836, 0.0023593902587890625, 0.0025163888931274414, 0.0026733875274658203, 0.0028303861618041992, 0.002987384796142578, 0.003144383430480957, 0.003301382064819336, 0.003458380699157715, 0.0036153793334960938, 0.0037723779678344727, 0.0039293766021728516, 0.0040863752365112305, 0.004243373870849609, 0.004400372505187988, 0.004557371139526367, 0.004714369773864746, 0.004871368408203125]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 8.0, 3.0, 7.0, 10.0, 19.0, 23.0, 17.0, 45.0, 56.0, 53.0, 95.0, 85.0, 97.0, 91.0, 81.0, 75.0, 71.0, 56.0, 38.0, 39.0, 15.0, 12.0, 8.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3764435350894928, -0.36676907539367676, -0.3570946455001831, -0.34742018580436707, -0.3377457559108734, -0.3280712962150574, -0.3183968663215637, -0.3087224066257477, -0.29904794692993164, -0.2893734872341156, -0.27969905734062195, -0.2700245976448059, -0.26035016775131226, -0.2506757080554962, -0.24100126326084137, -0.23132681846618652, -0.22165237367153168, -0.21197792887687683, -0.20230348408222198, -0.19262903928756714, -0.1829545795917511, -0.17328013479709625, -0.1636056900024414, -0.15393123030662537, -0.1442568004131317, -0.13458235561847687, -0.12490790337324142, -0.11523345857858658, -0.10555900633335114, -0.09588456153869629, -0.08621011674404144, -0.076535664498806, -0.06686121225357056, -0.05718676373362541, -0.04751231521368027, -0.03783787041902542, -0.028163421899080276, -0.018488973379135132, -0.008814528584480286, 0.0008599236607551575, 0.010534368455410004, 0.02020881697535515, 0.029883263632655144, 0.03955771028995514, 0.049232158809900284, 0.05890660732984543, 0.06858105212450027, 0.07825550436973572, 0.08792994916439056, 0.09760439395904541, 0.10727884620428085, 0.1169532909989357, 0.12662774324417114, 0.136302188038826, 0.14597663283348083, 0.15565109252929688, 0.16532552242279053, 0.17499996721744537, 0.18467441201210022, 0.19434887170791626, 0.2040233165025711, 0.21369776129722595, 0.2233722060918808, 0.23304665088653564, 0.24272111058235168]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 2.0, 6.0, 4.0, 6.0, 8.0, 14.0, 10.0, 8.0, 14.0, 20.0, 22.0, 23.0, 21.0, 35.0, 21.0, 37.0, 54.0, 41.0, 41.0, 39.0, 50.0, 57.0, 60.0, 43.0, 49.0, 35.0, 46.0, 41.0, 34.0, 22.0, 29.0, 28.0, 14.0, 15.0, 14.0, 7.0, 11.0, 4.0, 8.0, 5.0, 3.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1717919558286667, -0.16606242954730988, -0.16033290326595306, -0.15460337698459625, -0.14887385070323944, -0.14314432442188263, -0.13741478323936462, -0.1316852569580078, -0.125955730676651, -0.12022620439529419, -0.11449667811393738, -0.10876715183258057, -0.10303762555122375, -0.09730809926986694, -0.09157856553792953, -0.08584903925657272, -0.08011952042579651, -0.0743899941444397, -0.06866046786308289, -0.06293094158172607, -0.057201411575078964, -0.05147188529372215, -0.04574235528707504, -0.04001282900571823, -0.03428330272436142, -0.028553776443004608, -0.022824248299002647, -0.017094720155000687, -0.011365193873643875, -0.005635667592287064, 9.386241436004639e-05, 0.005823388695716858, 0.01155291497707367, 0.01728244125843048, 0.02301196940243244, 0.028741497546434402, 0.034471023827791214, 0.040200550109148026, 0.045930080115795135, 0.05165960639715195, 0.05738913267850876, 0.06311865895986557, 0.06884818524122238, 0.07457771897315979, 0.0803072452545166, 0.08603677153587341, 0.09176629781723022, 0.09749582409858704, 0.10322535037994385, 0.10895487666130066, 0.11468440294265747, 0.12041392922401428, 0.1261434555053711, 0.1318729817867279, 0.13760250806808472, 0.14333203434944153, 0.14906156063079834, 0.15479108691215515, 0.16052061319351196, 0.16625013947486877, 0.17197966575622559, 0.1777091920375824, 0.1834387183189392, 0.18916824460029602, 0.19489778578281403]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 3.0, 11.0, 16.0, 14.0, 26.0, 34.0, 53.0, 74.0, 126.0, 162.0, 292.0, 451.0, 707.0, 1313.0, 2366.0, 4698.0, 9488.0, 20863.0, 51985.0, 175029.0, 494756.0, 188870.0, 54771.0, 21845.0, 9863.0, 4824.0, 2465.0, 1400.0, 792.0, 451.0, 266.0, 184.0, 112.0, 77.0, 54.0, 37.0, 31.0, 16.0, 10.0, 10.0, 3.0, 5.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.234375, -0.225860595703125, -0.21734619140625, -0.208831787109375, -0.2003173828125, -0.191802978515625, -0.18328857421875, -0.174774169921875, -0.166259765625, -0.157745361328125, -0.14923095703125, -0.140716552734375, -0.1322021484375, -0.123687744140625, -0.11517333984375, -0.106658935546875, -0.09814453125, -0.089630126953125, -0.08111572265625, -0.072601318359375, -0.0640869140625, -0.055572509765625, -0.04705810546875, -0.038543701171875, -0.030029296875, -0.021514892578125, -0.01300048828125, -0.004486083984375, 0.0040283203125, 0.012542724609375, 0.02105712890625, 0.029571533203125, 0.0380859375, 0.046600341796875, 0.05511474609375, 0.063629150390625, 0.0721435546875, 0.080657958984375, 0.08917236328125, 0.097686767578125, 0.106201171875, 0.114715576171875, 0.12322998046875, 0.131744384765625, 0.1402587890625, 0.148773193359375, 0.15728759765625, 0.165802001953125, 0.17431640625, 0.182830810546875, 0.19134521484375, 0.199859619140625, 0.2083740234375, 0.216888427734375, 0.22540283203125, 0.233917236328125, 0.242431640625, 0.250946044921875, 0.25946044921875, 0.267974853515625, 0.2764892578125, 0.285003662109375, 0.29351806640625, 0.302032470703125, 0.310546875]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 7.0, 5.0, 10.0, 7.0, 12.0, 17.0, 15.0, 17.0, 27.0, 27.0, 21.0, 25.0, 41.0, 47.0, 50.0, 63.0, 61.0, 65.0, 59.0, 53.0, 54.0, 58.0, 47.0, 41.0, 32.0, 30.0, 34.0, 16.0, 13.0, 15.0, 13.0, 7.0, 6.0, 7.0, 4.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.370361328125, -0.3564643859863281, -0.34256744384765625, -0.3286705017089844, -0.3147735595703125, -0.3008766174316406, -0.28697967529296875, -0.2730827331542969, -0.259185791015625, -0.24528884887695312, -0.23139190673828125, -0.21749496459960938, -0.2035980224609375, -0.18970108032226562, -0.17580413818359375, -0.16190719604492188, -0.14801025390625, -0.13411331176757812, -0.12021636962890625, -0.10631942749023438, -0.0924224853515625, -0.07852554321289062, -0.06462860107421875, -0.050731658935546875, -0.036834716796875, -0.022937774658203125, -0.00904083251953125, 0.004856109619140625, 0.0187530517578125, 0.032649993896484375, 0.04654693603515625, 0.060443878173828125, 0.0743408203125, 0.08823776245117188, 0.10213470458984375, 0.11603164672851562, 0.1299285888671875, 0.14382553100585938, 0.15772247314453125, 0.17161941528320312, 0.185516357421875, 0.19941329956054688, 0.21331024169921875, 0.22720718383789062, 0.2411041259765625, 0.2550010681152344, 0.26889801025390625, 0.2827949523925781, 0.29669189453125, 0.3105888366699219, 0.32448577880859375, 0.3383827209472656, 0.3522796630859375, 0.3661766052246094, 0.38007354736328125, 0.3939704895019531, 0.407867431640625, 0.4217643737792969, 0.43566131591796875, 0.4495582580566406, 0.4634552001953125, 0.4773521423339844, 0.49124908447265625, 0.5051460266113281, 0.51904296875]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 8.0, 12.0, 13.0, 20.0, 29.0, 34.0, 67.0, 117.0, 286.0, 777.0, 3118.0, 19574.0, 282712.0, 699936.0, 34872.0, 5211.0, 1061.0, 335.0, 143.0, 78.0, 51.0, 39.0, 12.0, 22.0, 10.0, 3.0, 3.0, 5.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.57470703125, -0.5527191162109375, -0.530731201171875, -0.5087432861328125, -0.48675537109375, -0.4647674560546875, -0.442779541015625, -0.4207916259765625, -0.3988037109375, -0.3768157958984375, -0.354827880859375, -0.3328399658203125, -0.31085205078125, -0.2888641357421875, -0.266876220703125, -0.2448883056640625, -0.222900390625, -0.2009124755859375, -0.178924560546875, -0.1569366455078125, -0.13494873046875, -0.1129608154296875, -0.090972900390625, -0.0689849853515625, -0.0469970703125, -0.0250091552734375, -0.003021240234375, 0.0189666748046875, 0.04095458984375, 0.0629425048828125, 0.084930419921875, 0.1069183349609375, 0.12890625, 0.1508941650390625, 0.172882080078125, 0.1948699951171875, 0.21685791015625, 0.2388458251953125, 0.260833740234375, 0.2828216552734375, 0.3048095703125, 0.3267974853515625, 0.348785400390625, 0.3707733154296875, 0.39276123046875, 0.4147491455078125, 0.436737060546875, 0.4587249755859375, 0.480712890625, 0.5027008056640625, 0.524688720703125, 0.5466766357421875, 0.56866455078125, 0.5906524658203125, 0.612640380859375, 0.6346282958984375, 0.6566162109375, 0.6786041259765625, 0.700592041015625, 0.7225799560546875, 0.74456787109375, 0.7665557861328125, 0.788543701171875, 0.8105316162109375, 0.83251953125]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 4.0, 5.0, 7.0, 6.0, 9.0, 9.0, 10.0, 12.0, 20.0, 26.0, 31.0, 35.0, 33.0, 58.0, 51.0, 50.0, 57.0, 64.0, 57.0, 59.0, 60.0, 61.0, 54.0, 40.0, 38.0, 30.0, 26.0, 19.0, 16.0, 18.0, 8.0, 13.0, 8.0, 4.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.62451171875, -0.6078262329101562, -0.5911407470703125, -0.5744552612304688, -0.557769775390625, -0.5410842895507812, -0.5243988037109375, -0.5077133178710938, -0.49102783203125, -0.47434234619140625, -0.4576568603515625, -0.44097137451171875, -0.424285888671875, -0.40760040283203125, -0.3909149169921875, -0.37422943115234375, -0.3575439453125, -0.34085845947265625, -0.3241729736328125, -0.30748748779296875, -0.290802001953125, -0.27411651611328125, -0.2574310302734375, -0.24074554443359375, -0.22406005859375, -0.20737457275390625, -0.1906890869140625, -0.17400360107421875, -0.157318115234375, -0.14063262939453125, -0.1239471435546875, -0.10726165771484375, -0.090576171875, -0.07389068603515625, -0.0572052001953125, -0.04051971435546875, -0.023834228515625, -0.00714874267578125, 0.0095367431640625, 0.02622222900390625, 0.04290771484375, 0.05959320068359375, 0.0762786865234375, 0.09296417236328125, 0.109649658203125, 0.12633514404296875, 0.1430206298828125, 0.15970611572265625, 0.1763916015625, 0.19307708740234375, 0.2097625732421875, 0.22644805908203125, 0.243133544921875, 0.25981903076171875, 0.2765045166015625, 0.29319000244140625, 0.30987548828125, 0.32656097412109375, 0.3432464599609375, 0.35993194580078125, 0.376617431640625, 0.39330291748046875, 0.4099884033203125, 0.42667388916015625, 0.443359375]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 6.0, 1.0, 13.0, 15.0, 15.0, 19.0, 39.0, 49.0, 119.0, 169.0, 335.0, 697.0, 1479.0, 3756.0, 13766.0, 82554.0, 664613.0, 239263.0, 30762.0, 6659.0, 2238.0, 918.0, 472.0, 262.0, 111.0, 86.0, 55.0, 27.0, 16.0, 10.0, 7.0, 8.0, 4.0, 5.0, 2.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.132080078125, -0.12838459014892578, -0.12468910217285156, -0.12099361419677734, -0.11729812622070312, -0.1136026382446289, -0.10990715026855469, -0.10621166229248047, -0.10251617431640625, -0.09882068634033203, -0.09512519836425781, -0.0914297103881836, -0.08773422241210938, -0.08403873443603516, -0.08034324645996094, -0.07664775848388672, -0.0729522705078125, -0.06925678253173828, -0.06556129455566406, -0.061865806579589844, -0.058170318603515625, -0.054474830627441406, -0.05077934265136719, -0.04708385467529297, -0.04338836669921875, -0.03969287872314453, -0.03599739074707031, -0.032301902770996094, -0.028606414794921875, -0.024910926818847656, -0.021215438842773438, -0.01751995086669922, -0.013824462890625, -0.010128974914550781, -0.0064334869384765625, -0.0027379989624023438, 0.000957489013671875, 0.004652976989746094, 0.008348464965820312, 0.012043952941894531, 0.01573944091796875, 0.01943492889404297, 0.023130416870117188, 0.026825904846191406, 0.030521392822265625, 0.034216880798339844, 0.03791236877441406, 0.04160785675048828, 0.0453033447265625, 0.04899883270263672, 0.05269432067871094, 0.056389808654785156, 0.060085296630859375, 0.0637807846069336, 0.06747627258300781, 0.07117176055908203, 0.07486724853515625, 0.07856273651123047, 0.08225822448730469, 0.0859537124633789, 0.08964920043945312, 0.09334468841552734, 0.09704017639160156, 0.10073566436767578, 0.10443115234375]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 7.0, 4.0, 7.0, 11.0, 6.0, 18.0, 12.0, 20.0, 23.0, 42.0, 33.0, 52.0, 63.0, 79.0, 91.0, 112.0, 87.0, 70.0, 58.0, 53.0, 38.0, 21.0, 15.0, 19.0, 11.0, 14.0, 7.0, 8.0, 5.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.519918441772461e-05, -1.4727935194969177e-05, -1.4256685972213745e-05, -1.3785436749458313e-05, -1.3314187526702881e-05, -1.2842938303947449e-05, -1.2371689081192017e-05, -1.1900439858436584e-05, -1.1429190635681152e-05, -1.095794141292572e-05, -1.0486692190170288e-05, -1.0015442967414856e-05, -9.544193744659424e-06, -9.072944521903992e-06, -8.60169529914856e-06, -8.130446076393127e-06, -7.659196853637695e-06, -7.187947630882263e-06, -6.716698408126831e-06, -6.245449185371399e-06, -5.774199962615967e-06, -5.302950739860535e-06, -4.8317015171051025e-06, -4.36045229434967e-06, -3.889203071594238e-06, -3.417953848838806e-06, -2.946704626083374e-06, -2.475455403327942e-06, -2.0042061805725098e-06, -1.5329569578170776e-06, -1.0617077350616455e-06, -5.904585123062134e-07, -1.1920928955078125e-07, 3.520399332046509e-07, 8.23289155960083e-07, 1.2945383787155151e-06, 1.7657876014709473e-06, 2.2370368242263794e-06, 2.7082860469818115e-06, 3.1795352697372437e-06, 3.6507844924926758e-06, 4.122033715248108e-06, 4.59328293800354e-06, 5.064532160758972e-06, 5.535781383514404e-06, 6.0070306062698364e-06, 6.4782798290252686e-06, 6.949529051780701e-06, 7.420778274536133e-06, 7.892027497291565e-06, 8.363276720046997e-06, 8.83452594280243e-06, 9.305775165557861e-06, 9.777024388313293e-06, 1.0248273611068726e-05, 1.0719522833824158e-05, 1.119077205657959e-05, 1.1662021279335022e-05, 1.2133270502090454e-05, 1.2604519724845886e-05, 1.3075768947601318e-05, 1.354701817035675e-05, 1.4018267393112183e-05, 1.4489516615867615e-05, 1.4960765838623047e-05]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 5.0, 4.0, 5.0, 8.0, 10.0, 23.0, 36.0, 65.0, 106.0, 212.0, 467.0, 1049.0, 2643.0, 9233.0, 65880.0, 723375.0, 217917.0, 20194.0, 4427.0, 1592.0, 669.0, 293.0, 173.0, 83.0, 32.0, 17.0, 15.0, 9.0, 5.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1702880859375, -0.16492080688476562, -0.15955352783203125, -0.15418624877929688, -0.1488189697265625, -0.14345169067382812, -0.13808441162109375, -0.13271713256835938, -0.127349853515625, -0.12198257446289062, -0.11661529541015625, -0.11124801635742188, -0.1058807373046875, -0.10051345825195312, -0.09514617919921875, -0.08977890014648438, -0.08441162109375, -0.07904434204101562, -0.07367706298828125, -0.06830978393554688, -0.0629425048828125, -0.057575225830078125, -0.05220794677734375, -0.046840667724609375, -0.041473388671875, -0.036106109619140625, -0.03073883056640625, -0.025371551513671875, -0.0200042724609375, -0.014636993408203125, -0.00926971435546875, -0.003902435302734375, 0.00146484375, 0.006832122802734375, 0.01219940185546875, 0.017566680908203125, 0.0229339599609375, 0.028301239013671875, 0.03366851806640625, 0.039035797119140625, 0.044403076171875, 0.049770355224609375, 0.05513763427734375, 0.060504913330078125, 0.0658721923828125, 0.07123947143554688, 0.07660675048828125, 0.08197402954101562, 0.08734130859375, 0.09270858764648438, 0.09807586669921875, 0.10344314575195312, 0.1088104248046875, 0.11417770385742188, 0.11954498291015625, 0.12491226196289062, 0.130279541015625, 0.13564682006835938, 0.14101409912109375, 0.14638137817382812, 0.1517486572265625, 0.15711593627929688, 0.16248321533203125, 0.16785049438476562, 0.1732177734375]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 3.0, 14.0, 16.0, 18.0, 21.0, 29.0, 60.0, 86.0, 136.0, 145.0, 148.0, 93.0, 68.0, 41.0, 40.0, 26.0, 16.0, 14.0, 3.0, 7.0, 2.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0670166015625, -0.06490612030029297, -0.06279563903808594, -0.060685157775878906, -0.058574676513671875, -0.056464195251464844, -0.05435371398925781, -0.05224323272705078, -0.05013275146484375, -0.04802227020263672, -0.04591178894042969, -0.043801307678222656, -0.041690826416015625, -0.039580345153808594, -0.03746986389160156, -0.03535938262939453, -0.0332489013671875, -0.03113842010498047, -0.029027938842773438, -0.026917457580566406, -0.024806976318359375, -0.022696495056152344, -0.020586013793945312, -0.01847553253173828, -0.01636505126953125, -0.014254570007324219, -0.012144088745117188, -0.010033607482910156, -0.007923126220703125, -0.005812644958496094, -0.0037021636962890625, -0.0015916824340820312, 0.000518798828125, 0.0026292800903320312, 0.0047397613525390625, 0.006850242614746094, 0.008960723876953125, 0.011071205139160156, 0.013181686401367188, 0.015292167663574219, 0.01740264892578125, 0.01951313018798828, 0.021623611450195312, 0.023734092712402344, 0.025844573974609375, 0.027955055236816406, 0.030065536499023438, 0.03217601776123047, 0.0342864990234375, 0.03639698028564453, 0.03850746154785156, 0.040617942810058594, 0.042728424072265625, 0.044838905334472656, 0.04694938659667969, 0.04905986785888672, 0.05117034912109375, 0.05328083038330078, 0.05539131164550781, 0.057501792907714844, 0.059612274169921875, 0.061722755432128906, 0.06383323669433594, 0.06594371795654297, 0.06805419921875]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 32.0, 87.0, 176.0, 280.0, 248.0, 116.0, 54.0, 11.0, 6.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8445942997932434, -0.7835565805435181, -0.7225189208984375, -0.6614812016487122, -0.6004435420036316, -0.5394058227539062, -0.4783681333065033, -0.41733044385910034, -0.3562927544116974, -0.29525506496429443, -0.23421737551689148, -0.17317967116832733, -0.11214198172092438, -0.05110427737236023, 0.009933412075042725, 0.07097110152244568, 0.13200879096984863, 0.1930464804172516, 0.25408416986465454, 0.3151218891143799, 0.37615954875946045, 0.4371972680091858, 0.49823495745658875, 0.5592726469039917, 0.6203103065490723, 0.6813480257987976, 0.7423856854438782, 0.8034234046936035, 0.8644610643386841, 0.9254987835884094, 0.9865365028381348, 1.0475741624832153, 1.1086119413375854, 1.169649600982666, 1.2306873798370361, 1.2917250394821167, 1.3527626991271973, 1.4138004779815674, 1.474838137626648, 1.5358757972717285, 1.596913456916809, 1.6579511165618896, 1.7189888954162598, 1.7800265550613403, 1.841064214706421, 1.902101993560791, 1.9631396532058716, 2.024177312850952, 2.0852150917053223, 2.1462528705596924, 2.2072904109954834, 2.2683281898498535, 2.3293659687042236, 2.3904035091400146, 2.4514412879943848, 2.512478828430176, 2.573516607284546, 2.634554386138916, 2.695591926574707, 2.756629705429077, 2.8176674842834473, 2.8787050247192383, 2.9397428035736084, 3.0007805824279785, 3.0618181228637695]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 4.0, 5.0, 6.0, 9.0, 19.0, 10.0, 13.0, 21.0, 24.0, 24.0, 23.0, 27.0, 31.0, 29.0, 42.0, 39.0, 37.0, 38.0, 42.0, 51.0, 51.0, 48.0, 55.0, 41.0, 38.0, 44.0, 43.0, 32.0, 19.0, 29.0, 17.0, 20.0, 11.0, 15.0, 12.0, 12.0, 6.0, 3.0, 10.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6871644258499146, -0.6649504899978638, -0.6427364945411682, -0.6205225586891174, -0.5983086228370667, -0.5760946869850159, -0.5538806915283203, -0.5316667556762695, -0.5094528198242188, -0.4872388541698456, -0.4650249183177948, -0.44281095266342163, -0.42059701681137085, -0.3983830511569977, -0.3761690855026245, -0.35395514965057373, -0.33174118399620056, -0.3095272183418274, -0.2873132824897766, -0.26509931683540344, -0.24288538098335266, -0.2206714153289795, -0.19845746457576752, -0.17624351382255554, -0.15402956306934357, -0.1318156123161316, -0.10960166156291962, -0.08738770335912704, -0.06517375260591507, -0.042959801852703094, -0.020745843648910522, 0.0014681071043014526, 0.023682057857513428, 0.0458960086107254, 0.06810995936393738, 0.09032391756772995, 0.11253786832094193, 0.1347518265247345, 0.15696577727794647, 0.17917972803115845, 0.20139367878437042, 0.2236076295375824, 0.24582158029079437, 0.26803553104400635, 0.2902494966983795, 0.3124634325504303, 0.33467739820480347, 0.35689133405685425, 0.3791052997112274, 0.4013192653656006, 0.42353320121765137, 0.44574716687202454, 0.4679611027240753, 0.4901750683784485, 0.5123890042304993, 0.5346029996871948, 0.5568169355392456, 0.5790308713912964, 0.6012448668479919, 0.6234588027000427, 0.6456727385520935, 0.6678866744041443, 0.6901006698608398, 0.7123146057128906, 0.7345285415649414]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 7.0, 4.0, 11.0, 10.0, 13.0, 12.0, 15.0, 19.0, 25.0, 40.0, 67.0, 105.0, 167.0, 346.0, 710.0, 1585.0, 3491.0, 9441.0, 34293.0, 377416.0, 3245929.0, 466798.0, 37175.0, 9898.0, 3630.0, 1558.0, 723.0, 342.0, 162.0, 98.0, 46.0, 42.0, 25.0, 21.0, 13.0, 12.0, 10.0, 8.0, 3.0, 4.0, 5.0, 1.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51953125, -0.5044822692871094, -0.48943328857421875, -0.4743843078613281, -0.4593353271484375, -0.4442863464355469, -0.42923736572265625, -0.4141883850097656, -0.399139404296875, -0.3840904235839844, -0.36904144287109375, -0.3539924621582031, -0.3389434814453125, -0.3238945007324219, -0.30884552001953125, -0.2937965393066406, -0.27874755859375, -0.2636985778808594, -0.24864959716796875, -0.23360061645507812, -0.2185516357421875, -0.20350265502929688, -0.18845367431640625, -0.17340469360351562, -0.158355712890625, -0.14330673217773438, -0.12825775146484375, -0.11320877075195312, -0.0981597900390625, -0.08311080932617188, -0.06806182861328125, -0.053012847900390625, -0.0379638671875, -0.022914886474609375, -0.00786590576171875, 0.007183074951171875, 0.0222320556640625, 0.037281036376953125, 0.05233001708984375, 0.06737899780273438, 0.082427978515625, 0.09747695922851562, 0.11252593994140625, 0.12757492065429688, 0.1426239013671875, 0.15767288208007812, 0.17272186279296875, 0.18777084350585938, 0.20281982421875, 0.21786880493164062, 0.23291778564453125, 0.24796676635742188, 0.2630157470703125, 0.2780647277832031, 0.29311370849609375, 0.3081626892089844, 0.323211669921875, 0.3382606506347656, 0.35330963134765625, 0.3683586120605469, 0.3834075927734375, 0.3984565734863281, 0.41350555419921875, 0.4285545349121094, 0.443603515625]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 8.0, 10.0, 11.0, 8.0, 16.0, 16.0, 10.0, 15.0, 21.0, 29.0, 25.0, 34.0, 32.0, 29.0, 27.0, 45.0, 40.0, 48.0, 37.0, 51.0, 41.0, 56.0, 50.0, 51.0, 41.0, 41.0, 44.0, 33.0, 22.0, 21.0, 13.0, 10.0, 13.0, 18.0, 9.0, 8.0, 2.0, 6.0, 3.0, 5.0, 6.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.222412109375, -0.21626853942871094, -0.21012496948242188, -0.2039813995361328, -0.19783782958984375, -0.1916942596435547, -0.18555068969726562, -0.17940711975097656, -0.1732635498046875, -0.16711997985839844, -0.16097640991210938, -0.1548328399658203, -0.14868927001953125, -0.1425457000732422, -0.13640213012695312, -0.13025856018066406, -0.124114990234375, -0.11797142028808594, -0.11182785034179688, -0.10568428039550781, -0.09954071044921875, -0.09339714050292969, -0.08725357055664062, -0.08111000061035156, -0.0749664306640625, -0.06882286071777344, -0.06267929077148438, -0.05653572082519531, -0.05039215087890625, -0.04424858093261719, -0.038105010986328125, -0.03196144104003906, -0.02581787109375, -0.019674301147460938, -0.013530731201171875, -0.0073871612548828125, -0.00124359130859375, 0.0048999786376953125, 0.011043548583984375, 0.017187118530273438, 0.0233306884765625, 0.029474258422851562, 0.035617828369140625, 0.04176139831542969, 0.04790496826171875, 0.05404853820800781, 0.060192108154296875, 0.06633567810058594, 0.072479248046875, 0.07862281799316406, 0.08476638793945312, 0.09090995788574219, 0.09705352783203125, 0.10319709777832031, 0.10934066772460938, 0.11548423767089844, 0.1216278076171875, 0.12777137756347656, 0.13391494750976562, 0.1400585174560547, 0.14620208740234375, 0.1523456573486328, 0.15848922729492188, 0.16463279724121094, 0.1707763671875]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 10.0, 12.0, 12.0, 19.0, 40.0, 70.0, 141.0, 317.0, 989.0, 5383.0, 119756.0, 4015424.0, 47472.0, 3407.0, 726.0, 244.0, 120.0, 64.0, 42.0, 16.0, 11.0, 6.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4150390625, -1.3781814575195312, -1.3413238525390625, -1.3044662475585938, -1.267608642578125, -1.2307510375976562, -1.1938934326171875, -1.1570358276367188, -1.12017822265625, -1.0833206176757812, -1.0464630126953125, -1.0096054077148438, -0.972747802734375, -0.9358901977539062, -0.8990325927734375, -0.8621749877929688, -0.8253173828125, -0.7884597778320312, -0.7516021728515625, -0.7147445678710938, -0.677886962890625, -0.6410293579101562, -0.6041717529296875, -0.5673141479492188, -0.53045654296875, -0.49359893798828125, -0.4567413330078125, -0.41988372802734375, -0.383026123046875, -0.34616851806640625, -0.3093109130859375, -0.27245330810546875, -0.235595703125, -0.19873809814453125, -0.1618804931640625, -0.12502288818359375, -0.088165283203125, -0.05130767822265625, -0.0144500732421875, 0.02240753173828125, 0.05926513671875, 0.09612274169921875, 0.1329803466796875, 0.16983795166015625, 0.206695556640625, 0.24355316162109375, 0.2804107666015625, 0.31726837158203125, 0.3541259765625, 0.39098358154296875, 0.4278411865234375, 0.46469879150390625, 0.501556396484375, 0.5384140014648438, 0.5752716064453125, 0.6121292114257812, 0.64898681640625, 0.6858444213867188, 0.7227020263671875, 0.7595596313476562, 0.796417236328125, 0.8332748413085938, 0.8701324462890625, 0.9069900512695312, 0.94384765625]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 9.0, 18.0, 19.0, 33.0, 67.0, 110.0, 251.0, 638.0, 1180.0, 930.0, 432.0, 170.0, 96.0, 46.0, 34.0, 19.0, 8.0, 8.0, 1.0, 4.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2130126953125, -0.20533180236816406, -0.19765090942382812, -0.1899700164794922, -0.18228912353515625, -0.1746082305908203, -0.16692733764648438, -0.15924644470214844, -0.1515655517578125, -0.14388465881347656, -0.13620376586914062, -0.1285228729248047, -0.12084197998046875, -0.11316108703613281, -0.10548019409179688, -0.09779930114746094, -0.090118408203125, -0.08243751525878906, -0.07475662231445312, -0.06707572937011719, -0.05939483642578125, -0.05171394348144531, -0.044033050537109375, -0.03635215759277344, -0.0286712646484375, -0.020990371704101562, -0.013309478759765625, -0.0056285858154296875, 0.00205230712890625, 0.009733200073242188, 0.017414093017578125, 0.025094985961914062, 0.03277587890625, 0.04045677185058594, 0.048137664794921875, 0.05581855773925781, 0.06349945068359375, 0.07118034362792969, 0.07886123657226562, 0.08654212951660156, 0.0942230224609375, 0.10190391540527344, 0.10958480834960938, 0.11726570129394531, 0.12494659423828125, 0.1326274871826172, 0.14030838012695312, 0.14798927307128906, 0.155670166015625, 0.16335105895996094, 0.17103195190429688, 0.1787128448486328, 0.18639373779296875, 0.1940746307373047, 0.20175552368164062, 0.20943641662597656, 0.2171173095703125, 0.22479820251464844, 0.23247909545898438, 0.2401599884033203, 0.24784088134765625, 0.2555217742919922, 0.2632026672363281, 0.27088356018066406, 0.278564453125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 7.0, 6.0, 6.0, 12.0, 13.0, 16.0, 21.0, 28.0, 36.0, 47.0, 55.0, 70.0, 56.0, 77.0, 69.0, 73.0, 71.0, 49.0, 56.0, 56.0, 42.0, 34.0, 28.0, 19.0, 21.0, 10.0, 7.0, 5.0, 8.0, 6.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.5387060642242432, -0.5260964632034302, -0.5134868621826172, -0.5008772611618042, -0.4882676601409912, -0.4756580591201782, -0.46304845809936523, -0.45043885707855225, -0.43782925605773926, -0.42521965503692627, -0.4126100540161133, -0.4000004529953003, -0.3873908519744873, -0.3747812509536743, -0.36217164993286133, -0.34956204891204834, -0.33695247769355774, -0.32434287667274475, -0.31173327565193176, -0.2991236746311188, -0.2865140736103058, -0.2739044725894928, -0.2612949013710022, -0.24868528544902802, -0.23607568442821503, -0.22346608340740204, -0.21085648238658905, -0.19824689626693726, -0.18563729524612427, -0.17302769422531128, -0.1604180932044983, -0.1478084921836853, -0.1351989209651947, -0.12258931994438171, -0.10997971892356873, -0.09737012535333633, -0.08476052433252335, -0.07215092331171036, -0.059541329741477966, -0.04693172872066498, -0.03432212769985199, -0.02171252854168415, -0.009102929383516312, 0.003506667912006378, 0.016116268932819366, 0.028725869953632355, 0.041335463523864746, 0.053945064544677734, 0.06655466556549072, 0.07916426658630371, 0.0917738676071167, 0.10438346117734909, 0.11699306219816208, 0.12960267066955566, 0.14221225678920746, 0.15482185781002045, 0.16743145883083344, 0.18004105985164642, 0.1926506608724594, 0.2052602469921112, 0.2178698480129242, 0.23047944903373718, 0.24308905005455017, 0.25569865107536316, 0.26830825209617615]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 3.0, 4.0, 2.0, 4.0, 4.0, 5.0, 10.0, 15.0, 9.0, 15.0, 14.0, 19.0, 18.0, 19.0, 33.0, 24.0, 43.0, 43.0, 42.0, 31.0, 40.0, 42.0, 55.0, 46.0, 37.0, 38.0, 29.0, 29.0, 46.0, 32.0, 35.0, 34.0, 28.0, 29.0, 19.0, 14.0, 14.0, 12.0, 12.0, 16.0, 9.0, 8.0, 5.0, 5.0, 5.0, 5.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.28750863671302795, -0.27930018305778503, -0.2710916996002197, -0.2628832459449768, -0.2546747624874115, -0.24646630883216858, -0.23825784027576447, -0.23004937171936035, -0.22184090316295624, -0.21363243460655212, -0.205423966050148, -0.1972154974937439, -0.18900704383850098, -0.18079856038093567, -0.17259010672569275, -0.16438163816928864, -0.15617316961288452, -0.1479647010564804, -0.1397562325000763, -0.13154776394367218, -0.12333930283784866, -0.11513083428144455, -0.10692237317562103, -0.09871390461921692, -0.0905054360628128, -0.08229696750640869, -0.07408849895000458, -0.06588003784418106, -0.05767156928777695, -0.04946310073137283, -0.04125463590025902, -0.0330461710691452, -0.02483770251274109, -0.016629235818982124, -0.00842076912522316, -0.00021230243146419525, 0.00799616426229477, 0.016204632818698883, 0.0244130976498127, 0.032621562480926514, 0.04083003103733063, 0.04903849959373474, 0.057246964424848557, 0.06545542925596237, 0.07366389781236649, 0.0818723663687706, 0.09008082747459412, 0.09828929603099823, 0.10649776458740234, 0.11470623314380646, 0.12291470170021057, 0.13112317025661469, 0.1393316388130188, 0.14754009246826172, 0.15574856102466583, 0.16395702958106995, 0.17216549813747406, 0.18037396669387817, 0.1885824352502823, 0.1967909038066864, 0.20499935746192932, 0.21320784091949463, 0.22141629457473755, 0.22962476313114166, 0.23783323168754578]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 5.0, 4.0, 9.0, 6.0, 15.0, 15.0, 25.0, 35.0, 43.0, 63.0, 78.0, 127.0, 169.0, 275.0, 446.0, 748.0, 1351.0, 2614.0, 4878.0, 9645.0, 22662.0, 80507.0, 429180.0, 384246.0, 71049.0, 20718.0, 9354.0, 4667.0, 2422.0, 1283.0, 695.0, 386.0, 250.0, 163.0, 126.0, 75.0, 50.0, 41.0, 28.0, 29.0, 13.0, 14.0, 14.0, 3.0, 8.0, 13.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0], "bins": [-0.10528564453125, -0.10218524932861328, -0.09908485412597656, -0.09598445892333984, -0.09288406372070312, -0.0897836685180664, -0.08668327331542969, -0.08358287811279297, -0.08048248291015625, -0.07738208770751953, -0.07428169250488281, -0.0711812973022461, -0.06808090209960938, -0.06498050689697266, -0.06188011169433594, -0.05877971649169922, -0.0556793212890625, -0.05257892608642578, -0.04947853088378906, -0.046378135681152344, -0.043277740478515625, -0.040177345275878906, -0.03707695007324219, -0.03397655487060547, -0.03087615966796875, -0.02777576446533203, -0.024675369262695312, -0.021574974060058594, -0.018474578857421875, -0.015374183654785156, -0.012273788452148438, -0.009173393249511719, -0.006072998046875, -0.0029726028442382812, 0.0001277923583984375, 0.0032281875610351562, 0.006328582763671875, 0.009428977966308594, 0.012529373168945312, 0.01562976837158203, 0.01873016357421875, 0.02183055877685547, 0.024930953979492188, 0.028031349182128906, 0.031131744384765625, 0.034232139587402344, 0.03733253479003906, 0.04043292999267578, 0.0435333251953125, 0.04663372039794922, 0.04973411560058594, 0.052834510803222656, 0.055934906005859375, 0.059035301208496094, 0.06213569641113281, 0.06523609161376953, 0.06833648681640625, 0.07143688201904297, 0.07453727722167969, 0.0776376724243164, 0.08073806762695312, 0.08383846282958984, 0.08693885803222656, 0.09003925323486328, 0.0931396484375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 3.0, 4.0, 1.0, 4.0, 10.0, 12.0, 12.0, 11.0, 14.0, 17.0, 23.0, 18.0, 26.0, 25.0, 37.0, 27.0, 54.0, 40.0, 35.0, 62.0, 50.0, 45.0, 47.0, 38.0, 41.0, 31.0, 42.0, 36.0, 25.0, 33.0, 27.0, 32.0, 16.0, 16.0, 19.0, 19.0, 9.0, 9.0, 8.0, 5.0, 4.0, 4.0, 3.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1671142578125, -0.16146469116210938, -0.15581512451171875, -0.15016555786132812, -0.1445159912109375, -0.13886642456054688, -0.13321685791015625, -0.12756729125976562, -0.121917724609375, -0.11626815795898438, -0.11061859130859375, -0.10496902465820312, -0.0993194580078125, -0.09366989135742188, -0.08802032470703125, -0.08237075805664062, -0.07672119140625, -0.07107162475585938, -0.06542205810546875, -0.059772491455078125, -0.0541229248046875, -0.048473358154296875, -0.04282379150390625, -0.037174224853515625, -0.031524658203125, -0.025875091552734375, -0.02022552490234375, -0.014575958251953125, -0.0089263916015625, -0.003276824951171875, 0.00237274169921875, 0.008022308349609375, 0.013671875, 0.019321441650390625, 0.02497100830078125, 0.030620574951171875, 0.0362701416015625, 0.041919708251953125, 0.04756927490234375, 0.053218841552734375, 0.058868408203125, 0.06451797485351562, 0.07016754150390625, 0.07581710815429688, 0.0814666748046875, 0.08711624145507812, 0.09276580810546875, 0.09841537475585938, 0.10406494140625, 0.10971450805664062, 0.11536407470703125, 0.12101364135742188, 0.1266632080078125, 0.13231277465820312, 0.13796234130859375, 0.14361190795898438, 0.149261474609375, 0.15491104125976562, 0.16056060791015625, 0.16621017456054688, 0.1718597412109375, 0.17750930786132812, 0.18315887451171875, 0.18880844116210938, 0.1944580078125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 5.0, 5.0, 7.0, 11.0, 9.0, 22.0, 23.0, 29.0, 43.0, 56.0, 100.0, 122.0, 188.0, 263.0, 446.0, 741.0, 1186.0, 2126.0, 4014.0, 8343.0, 19397.0, 54304.0, 191389.0, 441353.0, 219992.0, 62742.0, 22341.0, 9155.0, 4450.0, 2317.0, 1234.0, 766.0, 485.0, 309.0, 168.0, 122.0, 85.0, 49.0, 46.0, 33.0, 20.0, 21.0, 11.0, 9.0, 3.0, 6.0, 6.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0638427734375, -0.06194019317626953, -0.06003761291503906, -0.058135032653808594, -0.056232452392578125, -0.054329872131347656, -0.05242729187011719, -0.05052471160888672, -0.04862213134765625, -0.04671955108642578, -0.04481697082519531, -0.042914390563964844, -0.041011810302734375, -0.039109230041503906, -0.03720664978027344, -0.03530406951904297, -0.0334014892578125, -0.03149890899658203, -0.029596328735351562, -0.027693748474121094, -0.025791168212890625, -0.023888587951660156, -0.021986007690429688, -0.02008342742919922, -0.01818084716796875, -0.01627826690673828, -0.014375686645507812, -0.012473106384277344, -0.010570526123046875, -0.008667945861816406, -0.0067653656005859375, -0.004862785339355469, -0.002960205078125, -0.0010576248168945312, 0.0008449554443359375, 0.0027475357055664062, 0.004650115966796875, 0.006552696228027344, 0.008455276489257812, 0.010357856750488281, 0.01226043701171875, 0.014163017272949219, 0.016065597534179688, 0.017968177795410156, 0.019870758056640625, 0.021773338317871094, 0.023675918579101562, 0.02557849884033203, 0.0274810791015625, 0.02938365936279297, 0.03128623962402344, 0.033188819885253906, 0.035091400146484375, 0.036993980407714844, 0.03889656066894531, 0.04079914093017578, 0.04270172119140625, 0.04460430145263672, 0.04650688171386719, 0.048409461975097656, 0.050312042236328125, 0.052214622497558594, 0.05411720275878906, 0.05601978302001953, 0.05792236328125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 6.0, 4.0, 7.0, 12.0, 11.0, 12.0, 15.0, 19.0, 13.0, 23.0, 21.0, 22.0, 31.0, 28.0, 31.0, 41.0, 38.0, 51.0, 40.0, 34.0, 38.0, 30.0, 33.0, 41.0, 31.0, 29.0, 38.0, 32.0, 34.0, 33.0, 30.0, 29.0, 23.0, 23.0, 19.0, 13.0, 8.0, 16.0, 12.0, 6.0, 6.0, 6.0, 3.0, 3.0, 5.0, 0.0, 3.0, 0.0, 0.0, 2.0, 4.0], "bins": [-0.4091796875, -0.3971672058105469, -0.38515472412109375, -0.3731422424316406, -0.3611297607421875, -0.3491172790527344, -0.33710479736328125, -0.3250923156738281, -0.313079833984375, -0.3010673522949219, -0.28905487060546875, -0.2770423889160156, -0.2650299072265625, -0.2530174255371094, -0.24100494384765625, -0.22899246215820312, -0.21697998046875, -0.20496749877929688, -0.19295501708984375, -0.18094253540039062, -0.1689300537109375, -0.15691757202148438, -0.14490509033203125, -0.13289260864257812, -0.120880126953125, -0.10886764526367188, -0.09685516357421875, -0.08484268188476562, -0.0728302001953125, -0.060817718505859375, -0.04880523681640625, -0.036792755126953125, -0.0247802734375, -0.012767791748046875, -0.00075531005859375, 0.011257171630859375, 0.0232696533203125, 0.035282135009765625, 0.04729461669921875, 0.059307098388671875, 0.071319580078125, 0.08333206176757812, 0.09534454345703125, 0.10735702514648438, 0.1193695068359375, 0.13138198852539062, 0.14339447021484375, 0.15540695190429688, 0.16741943359375, 0.17943191528320312, 0.19144439697265625, 0.20345687866210938, 0.2154693603515625, 0.22748184204101562, 0.23949432373046875, 0.2515068054199219, 0.263519287109375, 0.2755317687988281, 0.28754425048828125, 0.2995567321777344, 0.3115692138671875, 0.3235816955566406, 0.33559417724609375, 0.3476066589355469, 0.359619140625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 11.0, 7.0, 12.0, 7.0, 20.0, 14.0, 19.0, 43.0, 76.0, 137.0, 191.0, 373.0, 867.0, 1689.0, 3908.0, 10736.0, 40895.0, 383763.0, 527420.0, 56922.0, 12972.0, 4544.0, 1959.0, 912.0, 463.0, 231.0, 152.0, 64.0, 44.0, 32.0, 21.0, 12.0, 14.0, 10.0, 8.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.047332763671875, -0.04598379135131836, -0.04463481903076172, -0.04328584671020508, -0.04193687438964844, -0.0405879020690918, -0.039238929748535156, -0.037889957427978516, -0.036540985107421875, -0.035192012786865234, -0.033843040466308594, -0.03249406814575195, -0.031145095825195312, -0.029796123504638672, -0.02844715118408203, -0.02709817886352539, -0.02574920654296875, -0.02440023422241211, -0.02305126190185547, -0.021702289581298828, -0.020353317260742188, -0.019004344940185547, -0.017655372619628906, -0.016306400299072266, -0.014957427978515625, -0.013608455657958984, -0.012259483337402344, -0.010910511016845703, -0.009561538696289062, -0.008212566375732422, -0.006863594055175781, -0.005514621734619141, -0.0041656494140625, -0.0028166770935058594, -0.0014677047729492188, -0.00011873245239257812, 0.0012302398681640625, 0.002579212188720703, 0.003928184509277344, 0.005277156829833984, 0.006626129150390625, 0.007975101470947266, 0.009324073791503906, 0.010673046112060547, 0.012022018432617188, 0.013370990753173828, 0.014719963073730469, 0.01606893539428711, 0.01741790771484375, 0.01876688003540039, 0.02011585235595703, 0.021464824676513672, 0.022813796997070312, 0.024162769317626953, 0.025511741638183594, 0.026860713958740234, 0.028209686279296875, 0.029558658599853516, 0.030907630920410156, 0.0322566032409668, 0.03360557556152344, 0.03495454788208008, 0.03630352020263672, 0.03765249252319336, 0.03900146484375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 3.0, 2.0, 7.0, 5.0, 7.0, 6.0, 13.0, 24.0, 51.0, 71.0, 149.0, 182.0, 183.0, 132.0, 65.0, 38.0, 19.0, 9.0, 9.0, 4.0, 4.0, 4.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.8133392333984375e-05, -2.7156434953212738e-05, -2.61794775724411e-05, -2.5202520191669464e-05, -2.4225562810897827e-05, -2.324860543012619e-05, -2.2271648049354553e-05, -2.1294690668582916e-05, -2.031773328781128e-05, -1.9340775907039642e-05, -1.8363818526268005e-05, -1.738686114549637e-05, -1.640990376472473e-05, -1.5432946383953094e-05, -1.4455989003181458e-05, -1.347903162240982e-05, -1.2502074241638184e-05, -1.1525116860866547e-05, -1.054815948009491e-05, -9.571202099323273e-06, -8.594244718551636e-06, -7.617287337779999e-06, -6.640329957008362e-06, -5.663372576236725e-06, -4.686415195465088e-06, -3.709457814693451e-06, -2.732500433921814e-06, -1.755543053150177e-06, -7.7858567237854e-07, 1.9837170839309692e-07, 1.1753290891647339e-06, 2.152286469936371e-06, 3.129243850708008e-06, 4.106201231479645e-06, 5.083158612251282e-06, 6.060115993022919e-06, 7.037073373794556e-06, 8.014030754566193e-06, 8.99098813533783e-06, 9.967945516109467e-06, 1.0944902896881104e-05, 1.192186027765274e-05, 1.2898817658424377e-05, 1.3875775039196014e-05, 1.4852732419967651e-05, 1.582968980073929e-05, 1.6806647181510925e-05, 1.7783604562282562e-05, 1.87605619430542e-05, 1.9737519323825836e-05, 2.0714476704597473e-05, 2.169143408536911e-05, 2.2668391466140747e-05, 2.3645348846912384e-05, 2.462230622768402e-05, 2.5599263608455658e-05, 2.6576220989227295e-05, 2.7553178369998932e-05, 2.853013575077057e-05, 2.9507093131542206e-05, 3.0484050512313843e-05, 3.146100789308548e-05, 3.243796527385712e-05, 3.3414922654628754e-05, 3.439188003540039e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 9.0, 6.0, 11.0, 19.0, 23.0, 39.0, 40.0, 79.0, 96.0, 189.0, 251.0, 417.0, 644.0, 1087.0, 1834.0, 3132.0, 6124.0, 12462.0, 30140.0, 93762.0, 303068.0, 381388.0, 138189.0, 42257.0, 16342.0, 7531.0, 4019.0, 2129.0, 1260.0, 694.0, 466.0, 284.0, 176.0, 126.0, 84.0, 63.0, 34.0, 23.0, 17.0, 13.0, 8.0, 15.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02618408203125, -0.02531576156616211, -0.02444744110107422, -0.023579120635986328, -0.022710800170898438, -0.021842479705810547, -0.020974159240722656, -0.020105838775634766, -0.019237518310546875, -0.018369197845458984, -0.017500877380371094, -0.016632556915283203, -0.015764236450195312, -0.014895915985107422, -0.014027595520019531, -0.01315927505493164, -0.01229095458984375, -0.01142263412475586, -0.010554313659667969, -0.009685993194580078, -0.008817672729492188, -0.007949352264404297, -0.007081031799316406, -0.006212711334228516, -0.005344390869140625, -0.004476070404052734, -0.0036077499389648438, -0.002739429473876953, -0.0018711090087890625, -0.0010027885437011719, -0.00013446807861328125, 0.0007338523864746094, 0.0016021728515625, 0.0024704933166503906, 0.0033388137817382812, 0.004207134246826172, 0.0050754547119140625, 0.005943775177001953, 0.006812095642089844, 0.007680416107177734, 0.008548736572265625, 0.009417057037353516, 0.010285377502441406, 0.011153697967529297, 0.012022018432617188, 0.012890338897705078, 0.013758659362792969, 0.01462697982788086, 0.01549530029296875, 0.01636362075805664, 0.01723194122314453, 0.018100261688232422, 0.018968582153320312, 0.019836902618408203, 0.020705223083496094, 0.021573543548583984, 0.022441864013671875, 0.023310184478759766, 0.024178504943847656, 0.025046825408935547, 0.025915145874023438, 0.026783466339111328, 0.02765178680419922, 0.02852010726928711, 0.029388427734375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 5.0, 3.0, 6.0, 13.0, 9.0, 16.0, 20.0, 17.0, 38.0, 48.0, 77.0, 90.0, 83.0, 107.0, 92.0, 76.0, 85.0, 50.0, 39.0, 28.0, 21.0, 11.0, 19.0, 9.0, 10.0, 5.0, 7.0, 4.0, 2.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01061248779296875, -0.0102766752243042, -0.009940862655639648, -0.009605050086975098, -0.009269237518310547, -0.008933424949645996, -0.008597612380981445, -0.008261799812316895, -0.007925987243652344, -0.007590174674987793, -0.007254362106323242, -0.006918549537658691, -0.006582736968994141, -0.00624692440032959, -0.005911111831665039, -0.005575299263000488, -0.0052394866943359375, -0.004903674125671387, -0.004567861557006836, -0.004232048988342285, -0.0038962364196777344, -0.0035604238510131836, -0.003224611282348633, -0.002888798713684082, -0.0025529861450195312, -0.0022171735763549805, -0.0018813610076904297, -0.001545548439025879, -0.0012097358703613281, -0.0008739233016967773, -0.0005381107330322266, -0.00020229816436767578, 0.000133514404296875, 0.0004693269729614258, 0.0008051395416259766, 0.0011409521102905273, 0.0014767646789550781, 0.001812577247619629, 0.0021483898162841797, 0.0024842023849487305, 0.0028200149536132812, 0.003155827522277832, 0.003491640090942383, 0.0038274526596069336, 0.004163265228271484, 0.004499077796936035, 0.004834890365600586, 0.005170702934265137, 0.0055065155029296875, 0.005842328071594238, 0.006178140640258789, 0.00651395320892334, 0.006849765777587891, 0.007185578346252441, 0.007521390914916992, 0.007857203483581543, 0.008193016052246094, 0.008528828620910645, 0.008864641189575195, 0.009200453758239746, 0.009536266326904297, 0.009872078895568848, 0.010207891464233398, 0.01054370403289795, 0.0108795166015625]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 8.0, 6.0, 13.0, 13.0, 9.0, 13.0, 13.0, 24.0, 19.0, 46.0, 57.0, 48.0, 47.0, 52.0, 62.0, 56.0, 61.0, 61.0, 52.0, 52.0, 48.0, 55.0, 40.0, 27.0, 26.0, 15.0, 23.0, 12.0, 11.0, 6.0, 10.0, 6.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.21121995151042938, -0.2046094834804535, -0.1979990005493164, -0.19138853251934052, -0.18477806448936462, -0.17816759645938873, -0.17155712842941284, -0.16494664549827576, -0.15833617746829987, -0.15172570943832397, -0.1451152265071869, -0.138504758477211, -0.1318942904472351, -0.12528382241725922, -0.11867334693670273, -0.11206287145614624, -0.10545240342617035, -0.09884193539619446, -0.09223145991563797, -0.08562098443508148, -0.07901051640510559, -0.0724000483751297, -0.06578957289457321, -0.05917910113930702, -0.05256862938404083, -0.04595815762877464, -0.03934768587350845, -0.032737214118242264, -0.026126742362976074, -0.019516270607709885, -0.012905798852443695, -0.0062953270971775055, 0.00031515955924987793, 0.0069256313145160675, 0.013536103069782257, 0.020146574825048447, 0.026757046580314636, 0.033367518335580826, 0.039977990090847015, 0.046588461846113205, 0.053198933601379395, 0.059809405356645584, 0.06641987711191177, 0.07303035259246826, 0.07964082062244415, 0.08625128865242004, 0.09286176413297653, 0.09947223961353302, 0.10608270764350891, 0.1126931756734848, 0.11930365115404129, 0.12591412663459778, 0.13252459466457367, 0.13913506269454956, 0.14574554562568665, 0.15235601365566254, 0.15896648168563843, 0.16557694971561432, 0.1721874177455902, 0.1787979006767273, 0.18540836870670319, 0.19201883673667908, 0.19862931966781616, 0.20523978769779205, 0.21185025572776794]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 2.0, 4.0, 2.0, 8.0, 4.0, 13.0, 17.0, 17.0, 13.0, 17.0, 21.0, 24.0, 23.0, 31.0, 44.0, 40.0, 46.0, 42.0, 40.0, 47.0, 46.0, 38.0, 43.0, 31.0, 43.0, 31.0, 32.0, 31.0, 32.0, 30.0, 36.0, 29.0, 16.0, 16.0, 15.0, 14.0, 10.0, 17.0, 9.0, 6.0, 4.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.18202324211597443, -0.17685925960540771, -0.1716952919960022, -0.16653130948543549, -0.16136732697486877, -0.15620335936546326, -0.15103937685489655, -0.14587539434432983, -0.14071142673492432, -0.1355474442243576, -0.1303834766149521, -0.12521949410438538, -0.12005551159381866, -0.11489153653383255, -0.10972756147384644, -0.10456357896327972, -0.09939959645271301, -0.0942356213927269, -0.08907163888216019, -0.08390766382217407, -0.07874368131160736, -0.07357970625162125, -0.06841573119163513, -0.06325174868106842, -0.058087773621082306, -0.05292379483580589, -0.04775981605052948, -0.042595840990543365, -0.03743186220526695, -0.03226788341999054, -0.027103906497359276, -0.021939929574728012, -0.016775965690612793, -0.011611987836658955, -0.006448009982705116, -0.001284032128751278, 0.0038799457252025604, 0.009043924510478973, 0.014207901433110237, 0.0193718783557415, 0.024535857141017914, 0.029699835926294327, 0.03486381471157074, 0.040027789771556854, 0.04519176855683327, 0.05035574734210968, 0.055519722402095795, 0.06068370118737221, 0.06584767997264862, 0.07101165503263474, 0.07617563754320145, 0.08133961260318756, 0.08650359511375427, 0.09166757017374039, 0.0968315452337265, 0.10199552774429321, 0.10715950280427933, 0.11232347786426544, 0.11748746037483215, 0.12265143543481827, 0.12781541049480438, 0.1329793930053711, 0.1381433755159378, 0.14330734312534332, 0.14847132563591003]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 7.0, 11.0, 7.0, 14.0, 16.0, 39.0, 47.0, 73.0, 125.0, 147.0, 255.0, 415.0, 691.0, 1233.0, 2344.0, 4395.0, 8518.0, 18313.0, 43889.0, 120770.0, 321582.0, 323463.0, 121380.0, 44037.0, 18364.0, 8592.0, 4276.0, 2375.0, 1272.0, 700.0, 420.0, 282.0, 170.0, 99.0, 70.0, 51.0, 41.0, 25.0, 12.0, 13.0, 8.0, 6.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.313232421875, -0.303741455078125, -0.29425048828125, -0.284759521484375, -0.2752685546875, -0.265777587890625, -0.25628662109375, -0.246795654296875, -0.2373046875, -0.227813720703125, -0.21832275390625, -0.208831787109375, -0.1993408203125, -0.189849853515625, -0.18035888671875, -0.170867919921875, -0.161376953125, -0.151885986328125, -0.14239501953125, -0.132904052734375, -0.1234130859375, -0.113922119140625, -0.10443115234375, -0.094940185546875, -0.08544921875, -0.075958251953125, -0.06646728515625, -0.056976318359375, -0.0474853515625, -0.037994384765625, -0.02850341796875, -0.019012451171875, -0.009521484375, -3.0517578125e-05, 0.00946044921875, 0.018951416015625, 0.0284423828125, 0.037933349609375, 0.04742431640625, 0.056915283203125, 0.06640625, 0.075897216796875, 0.08538818359375, 0.094879150390625, 0.1043701171875, 0.113861083984375, 0.12335205078125, 0.132843017578125, 0.142333984375, 0.151824951171875, 0.16131591796875, 0.170806884765625, 0.1802978515625, 0.189788818359375, 0.19927978515625, 0.208770751953125, 0.21826171875, 0.227752685546875, 0.23724365234375, 0.246734619140625, 0.2562255859375, 0.265716552734375, 0.27520751953125, 0.284698486328125, 0.294189453125]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 5.0, 3.0, 8.0, 9.0, 12.0, 18.0, 12.0, 14.0, 23.0, 33.0, 29.0, 28.0, 34.0, 54.0, 46.0, 44.0, 45.0, 58.0, 48.0, 45.0, 31.0, 43.0, 43.0, 43.0, 30.0, 41.0, 38.0, 20.0, 23.0, 24.0, 14.0, 16.0, 10.0, 13.0, 10.0, 9.0, 3.0, 5.0, 4.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0], "bins": [-0.320068359375, -0.310882568359375, -0.30169677734375, -0.292510986328125, -0.2833251953125, -0.274139404296875, -0.26495361328125, -0.255767822265625, -0.24658203125, -0.237396240234375, -0.22821044921875, -0.219024658203125, -0.2098388671875, -0.200653076171875, -0.19146728515625, -0.182281494140625, -0.173095703125, -0.163909912109375, -0.15472412109375, -0.145538330078125, -0.1363525390625, -0.127166748046875, -0.11798095703125, -0.108795166015625, -0.099609375, -0.090423583984375, -0.08123779296875, -0.072052001953125, -0.0628662109375, -0.053680419921875, -0.04449462890625, -0.035308837890625, -0.026123046875, -0.016937255859375, -0.00775146484375, 0.001434326171875, 0.0106201171875, 0.019805908203125, 0.02899169921875, 0.038177490234375, 0.04736328125, 0.056549072265625, 0.06573486328125, 0.074920654296875, 0.0841064453125, 0.093292236328125, 0.10247802734375, 0.111663818359375, 0.120849609375, 0.130035400390625, 0.13922119140625, 0.148406982421875, 0.1575927734375, 0.166778564453125, 0.17596435546875, 0.185150146484375, 0.1943359375, 0.203521728515625, 0.21270751953125, 0.221893310546875, 0.2310791015625, 0.240264892578125, 0.24945068359375, 0.258636474609375, 0.267822265625]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 2.0, 6.0, 6.0, 4.0, 12.0, 13.0, 19.0, 32.0, 53.0, 72.0, 143.0, 206.0, 345.0, 632.0, 1248.0, 2414.0, 5123.0, 12081.0, 32206.0, 103575.0, 352478.0, 369565.0, 110855.0, 33900.0, 12887.0, 5369.0, 2510.0, 1214.0, 662.0, 350.0, 205.0, 132.0, 72.0, 52.0, 38.0, 23.0, 9.0, 12.0, 12.0, 8.0, 4.0, 3.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34912109375, -0.3370933532714844, -0.32506561279296875, -0.3130378723144531, -0.3010101318359375, -0.2889823913574219, -0.27695465087890625, -0.2649269104003906, -0.252899169921875, -0.24087142944335938, -0.22884368896484375, -0.21681594848632812, -0.2047882080078125, -0.19276046752929688, -0.18073272705078125, -0.16870498657226562, -0.15667724609375, -0.14464950561523438, -0.13262176513671875, -0.12059402465820312, -0.1085662841796875, -0.09653854370117188, -0.08451080322265625, -0.07248306274414062, -0.060455322265625, -0.048427581787109375, -0.03639984130859375, -0.024372100830078125, -0.0123443603515625, -0.000316619873046875, 0.01171112060546875, 0.023738861083984375, 0.0357666015625, 0.047794342041015625, 0.05982208251953125, 0.07184982299804688, 0.0838775634765625, 0.09590530395507812, 0.10793304443359375, 0.11996078491210938, 0.131988525390625, 0.14401626586914062, 0.15604400634765625, 0.16807174682617188, 0.1800994873046875, 0.19212722778320312, 0.20415496826171875, 0.21618270874023438, 0.22821044921875, 0.24023818969726562, 0.25226593017578125, 0.2642936706542969, 0.2763214111328125, 0.2883491516113281, 0.30037689208984375, 0.3124046325683594, 0.324432373046875, 0.3364601135253906, 0.34848785400390625, 0.3605155944824219, 0.3725433349609375, 0.3845710754394531, 0.39659881591796875, 0.4086265563964844, 0.420654296875]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 2.0, 7.0, 11.0, 12.0, 8.0, 22.0, 24.0, 27.0, 28.0, 29.0, 40.0, 50.0, 44.0, 64.0, 69.0, 56.0, 55.0, 62.0, 58.0, 46.0, 48.0, 38.0, 44.0, 31.0, 23.0, 19.0, 21.0, 15.0, 14.0, 12.0, 10.0, 5.0, 3.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35400390625, -0.3403472900390625, -0.326690673828125, -0.3130340576171875, -0.29937744140625, -0.2857208251953125, -0.272064208984375, -0.2584075927734375, -0.2447509765625, -0.2310943603515625, -0.217437744140625, -0.2037811279296875, -0.19012451171875, -0.1764678955078125, -0.162811279296875, -0.1491546630859375, -0.135498046875, -0.1218414306640625, -0.108184814453125, -0.0945281982421875, -0.08087158203125, -0.0672149658203125, -0.053558349609375, -0.0399017333984375, -0.0262451171875, -0.0125885009765625, 0.001068115234375, 0.0147247314453125, 0.02838134765625, 0.0420379638671875, 0.055694580078125, 0.0693511962890625, 0.0830078125, 0.0966644287109375, 0.110321044921875, 0.1239776611328125, 0.13763427734375, 0.1512908935546875, 0.164947509765625, 0.1786041259765625, 0.1922607421875, 0.2059173583984375, 0.219573974609375, 0.2332305908203125, 0.24688720703125, 0.2605438232421875, 0.274200439453125, 0.2878570556640625, 0.301513671875, 0.3151702880859375, 0.328826904296875, 0.3424835205078125, 0.35614013671875, 0.3697967529296875, 0.383453369140625, 0.3971099853515625, 0.4107666015625, 0.4244232177734375, 0.438079833984375, 0.4517364501953125, 0.46539306640625, 0.4790496826171875, 0.492706298828125, 0.5063629150390625, 0.52001953125]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 8.0, 6.0, 10.0, 16.0, 22.0, 28.0, 50.0, 83.0, 149.0, 242.0, 368.0, 589.0, 950.0, 1699.0, 2945.0, 5148.0, 9861.0, 19688.0, 42038.0, 95770.0, 201597.0, 337507.0, 177032.0, 80781.0, 35898.0, 16738.0, 8540.0, 4492.0, 2576.0, 1409.0, 912.0, 531.0, 329.0, 194.0, 139.0, 76.0, 49.0, 28.0, 16.0, 22.0, 7.0, 7.0, 4.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04888916015625, -0.04737997055053711, -0.04587078094482422, -0.04436159133911133, -0.04285240173339844, -0.04134321212768555, -0.039834022521972656, -0.038324832916259766, -0.036815643310546875, -0.035306453704833984, -0.033797264099121094, -0.0322880744934082, -0.030778884887695312, -0.029269695281982422, -0.02776050567626953, -0.02625131607055664, -0.02474212646484375, -0.02323293685913086, -0.02172374725341797, -0.020214557647705078, -0.018705368041992188, -0.017196178436279297, -0.015686988830566406, -0.014177799224853516, -0.012668609619140625, -0.011159420013427734, -0.009650230407714844, -0.008141040802001953, -0.0066318511962890625, -0.005122661590576172, -0.0036134719848632812, -0.0021042823791503906, -0.0005950927734375, 0.0009140968322753906, 0.0024232864379882812, 0.003932476043701172, 0.0054416656494140625, 0.006950855255126953, 0.008460044860839844, 0.009969234466552734, 0.011478424072265625, 0.012987613677978516, 0.014496803283691406, 0.016005992889404297, 0.017515182495117188, 0.019024372100830078, 0.02053356170654297, 0.02204275131225586, 0.02355194091796875, 0.02506113052368164, 0.02657032012939453, 0.028079509735107422, 0.029588699340820312, 0.031097888946533203, 0.032607078552246094, 0.034116268157958984, 0.035625457763671875, 0.037134647369384766, 0.038643836975097656, 0.04015302658081055, 0.04166221618652344, 0.04317140579223633, 0.04468059539794922, 0.04618978500366211, 0.047698974609375]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 0.0, 1.0, 0.0, 3.0, 5.0, 5.0, 7.0, 10.0, 7.0, 9.0, 5.0, 18.0, 17.0, 17.0, 27.0, 32.0, 48.0, 54.0, 48.0, 79.0, 101.0, 106.0, 59.0, 63.0, 62.0, 46.0, 36.0, 21.0, 29.0, 11.0, 14.0, 15.0, 10.0, 11.0, 7.0, 4.0, 4.0, 4.0, 3.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3947486877441406e-05, -1.3538636267185211e-05, -1.3129785656929016e-05, -1.2720935046672821e-05, -1.2312084436416626e-05, -1.1903233826160431e-05, -1.1494383215904236e-05, -1.108553260564804e-05, -1.0676681995391846e-05, -1.026783138513565e-05, -9.858980774879456e-06, -9.45013016462326e-06, -9.041279554367065e-06, -8.63242894411087e-06, -8.223578333854675e-06, -7.81472772359848e-06, -7.405877113342285e-06, -6.99702650308609e-06, -6.588175892829895e-06, -6.1793252825737e-06, -5.770474672317505e-06, -5.36162406206131e-06, -4.952773451805115e-06, -4.54392284154892e-06, -4.135072231292725e-06, -3.7262216210365295e-06, -3.3173710107803345e-06, -2.9085204005241394e-06, -2.4996697902679443e-06, -2.0908191800117493e-06, -1.6819685697555542e-06, -1.2731179594993591e-06, -8.642673492431641e-07, -4.55416738986969e-07, -4.6566128730773926e-08, 3.6228448152542114e-07, 7.711350917816162e-07, 1.1799857020378113e-06, 1.5888363122940063e-06, 1.9976869225502014e-06, 2.4065375328063965e-06, 2.8153881430625916e-06, 3.2242387533187866e-06, 3.6330893635749817e-06, 4.041939973831177e-06, 4.450790584087372e-06, 4.859641194343567e-06, 5.268491804599762e-06, 5.677342414855957e-06, 6.086193025112152e-06, 6.495043635368347e-06, 6.903894245624542e-06, 7.312744855880737e-06, 7.721595466136932e-06, 8.130446076393127e-06, 8.539296686649323e-06, 8.948147296905518e-06, 9.356997907161713e-06, 9.765848517417908e-06, 1.0174699127674103e-05, 1.0583549737930298e-05, 1.0992400348186493e-05, 1.1401250958442688e-05, 1.1810101568698883e-05, 1.2218952178955078e-05]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 4.0, 4.0, 3.0, 14.0, 11.0, 18.0, 16.0, 25.0, 49.0, 55.0, 83.0, 99.0, 156.0, 245.0, 304.0, 402.0, 630.0, 977.0, 1780.0, 3246.0, 6305.0, 13750.0, 33486.0, 99604.0, 332824.0, 386416.0, 104243.0, 34855.0, 14110.0, 6433.0, 3367.0, 1786.0, 1089.0, 695.0, 483.0, 293.0, 171.0, 138.0, 99.0, 59.0, 50.0, 53.0, 31.0, 19.0, 17.0, 12.0, 14.0, 12.0, 6.0, 5.0, 10.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.083984375, -0.08127689361572266, -0.07856941223144531, -0.07586193084716797, -0.07315444946289062, -0.07044696807861328, -0.06773948669433594, -0.0650320053100586, -0.06232452392578125, -0.059617042541503906, -0.05690956115722656, -0.05420207977294922, -0.051494598388671875, -0.04878711700439453, -0.04607963562011719, -0.043372154235839844, -0.0406646728515625, -0.037957191467285156, -0.03524971008300781, -0.03254222869873047, -0.029834747314453125, -0.02712726593017578, -0.024419784545898438, -0.021712303161621094, -0.01900482177734375, -0.016297340393066406, -0.013589859008789062, -0.010882377624511719, -0.008174896240234375, -0.005467414855957031, -0.0027599334716796875, -5.245208740234375e-05, 0.002655029296875, 0.005362510681152344, 0.008069992065429688, 0.010777473449707031, 0.013484954833984375, 0.01619243621826172, 0.018899917602539062, 0.021607398986816406, 0.02431488037109375, 0.027022361755371094, 0.029729843139648438, 0.03243732452392578, 0.035144805908203125, 0.03785228729248047, 0.04055976867675781, 0.043267250061035156, 0.0459747314453125, 0.048682212829589844, 0.05138969421386719, 0.05409717559814453, 0.056804656982421875, 0.05951213836669922, 0.06221961975097656, 0.0649271011352539, 0.06763458251953125, 0.0703420639038086, 0.07304954528808594, 0.07575702667236328, 0.07846450805664062, 0.08117198944091797, 0.08387947082519531, 0.08658695220947266, 0.08929443359375]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 5.0, 3.0, 3.0, 4.0, 5.0, 5.0, 10.0, 6.0, 14.0, 20.0, 18.0, 25.0, 39.0, 40.0, 67.0, 56.0, 80.0, 124.0, 105.0, 87.0, 73.0, 50.0, 26.0, 31.0, 22.0, 21.0, 11.0, 5.0, 11.0, 7.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 4.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0499267578125, -0.04836320877075195, -0.046799659729003906, -0.04523611068725586, -0.04367256164550781, -0.042109012603759766, -0.04054546356201172, -0.03898191452026367, -0.037418365478515625, -0.03585481643676758, -0.03429126739501953, -0.032727718353271484, -0.031164169311523438, -0.02960062026977539, -0.028037071228027344, -0.026473522186279297, -0.02490997314453125, -0.023346424102783203, -0.021782875061035156, -0.02021932601928711, -0.018655776977539062, -0.017092227935791016, -0.015528678894042969, -0.013965129852294922, -0.012401580810546875, -0.010838031768798828, -0.009274482727050781, -0.007710933685302734, -0.0061473846435546875, -0.004583835601806641, -0.0030202865600585938, -0.0014567375183105469, 0.0001068115234375, 0.0016703605651855469, 0.0032339096069335938, 0.004797458648681641, 0.0063610076904296875, 0.007924556732177734, 0.009488105773925781, 0.011051654815673828, 0.012615203857421875, 0.014178752899169922, 0.01574230194091797, 0.017305850982666016, 0.018869400024414062, 0.02043294906616211, 0.021996498107910156, 0.023560047149658203, 0.02512359619140625, 0.026687145233154297, 0.028250694274902344, 0.02981424331665039, 0.03137779235839844, 0.032941341400146484, 0.03450489044189453, 0.03606843948364258, 0.037631988525390625, 0.03919553756713867, 0.04075908660888672, 0.042322635650634766, 0.04388618469238281, 0.04544973373413086, 0.047013282775878906, 0.04857683181762695, 0.050140380859375]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 5.0, 10.0, 16.0, 31.0, 74.0, 119.0, 200.0, 192.0, 148.0, 96.0, 61.0, 34.0, 10.0, 6.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0467673540115356, -1.007058024406433, -0.9673486351966858, -0.9276392459869385, -0.8879299163818359, -0.8482205271720886, -0.8085111379623413, -0.7688018083572388, -0.7290924191474915, -0.6893830299377441, -0.6496737003326416, -0.6099643111228943, -0.570254921913147, -0.5305455923080444, -0.4908362030982971, -0.4511268436908722, -0.41141748428344727, -0.37170812487602234, -0.3319987654685974, -0.2922893762588501, -0.25258001685142517, -0.21287065744400024, -0.17316128313541412, -0.133451908826828, -0.09374254941940308, -0.05403318256139755, -0.014323815703392029, 0.025385551154613495, 0.06509491801261902, 0.10480427742004395, 0.14451365172863007, 0.1842230260372162, 0.22393250465393066, 0.2636418640613556, 0.3033512234687805, 0.34306061267852783, 0.38276997208595276, 0.4224793314933777, 0.462188720703125, 0.5018980503082275, 0.5416074395179749, 0.5813168287277222, 0.6210261583328247, 0.660735547542572, 0.7004449367523193, 0.7401542663574219, 0.7798636555671692, 0.8195730447769165, 0.859282374382019, 0.8989917635917664, 0.9387010931968689, 0.9784104824066162, 1.0181198120117188, 1.0578291416168213, 1.0975385904312134, 1.137247920036316, 1.176957368850708, 1.2166666984558105, 1.2563761472702026, 1.2960854768753052, 1.3357948064804077, 1.3755042552947998, 1.4152135848999023, 1.4549229145050049, 1.4946322441101074]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 4.0, 8.0, 7.0, 5.0, 6.0, 6.0, 17.0, 17.0, 18.0, 17.0, 26.0, 22.0, 28.0, 40.0, 24.0, 35.0, 52.0, 41.0, 36.0, 55.0, 50.0, 50.0, 35.0, 40.0, 47.0, 31.0, 34.0, 26.0, 36.0, 30.0, 26.0, 24.0, 14.0, 21.0, 16.0, 13.0, 16.0, 7.0, 6.0, 5.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.6149052381515503, -0.5975620746612549, -0.5802189111709595, -0.5628758072853088, -0.5455326437950134, -0.528189480304718, -0.5108463168144226, -0.4935031533241272, -0.4761600196361542, -0.45881685614585876, -0.44147372245788574, -0.42413055896759033, -0.4067873954772949, -0.3894442617893219, -0.3721010982990265, -0.35475796461105347, -0.33741480112075806, -0.32007163763046265, -0.3027285039424896, -0.2853853404521942, -0.2680422067642212, -0.2506990432739258, -0.23335587978363037, -0.21601273119449615, -0.19866958260536194, -0.18132643401622772, -0.1639832854270935, -0.1466401219367981, -0.12929697334766388, -0.11195382475852966, -0.09461066871881485, -0.07726751267910004, -0.05992436408996582, -0.042581211775541306, -0.02523805946111679, -0.007894907146692276, 0.009448245167732239, 0.026791393756866455, 0.04413454979658127, 0.06147770583629608, 0.0788208544254303, 0.09616400301456451, 0.11350715905427933, 0.13085031509399414, 0.14819346368312836, 0.16553661227226257, 0.18287977576255798, 0.2002229243516922, 0.21756607294082642, 0.23490922152996063, 0.25225237011909485, 0.26959553360939026, 0.2869386672973633, 0.3042818307876587, 0.3216249942779541, 0.3389681577682495, 0.35631129145622253, 0.37365445494651794, 0.39099758863449097, 0.4083407521247864, 0.4256839156150818, 0.4430270493030548, 0.4603702127933502, 0.47771334648132324, 0.49505650997161865]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 6.0, 3.0, 6.0, 7.0, 17.0, 18.0, 20.0, 23.0, 41.0, 43.0, 52.0, 61.0, 94.0, 150.0, 178.0, 255.0, 320.0, 482.0, 841.0, 1347.0, 2506.0, 4625.0, 1021404.0, 8392.0, 4050.0, 2072.0, 1191.0, 787.0, 469.0, 280.0, 203.0, 162.0, 98.0, 101.0, 72.0, 47.0, 38.0, 35.0, 29.0, 18.0, 25.0, 9.0, 9.0, 5.0, 7.0, 6.0, 7.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.598320722579956, -0.5776081085205078, -0.5568954944610596, -0.5361828804016113, -0.5154702663421631, -0.49475765228271484, -0.474045068025589, -0.45333245396614075, -0.4326198399066925, -0.41190722584724426, -0.391194611787796, -0.3704819977283478, -0.3497694134712219, -0.3290567994117737, -0.30834418535232544, -0.2876315712928772, -0.26691895723342896, -0.2462063431739807, -0.22549372911453247, -0.20478112995624542, -0.18406851589679718, -0.16335590183734894, -0.1426433026790619, -0.12193068861961365, -0.1012180745601654, -0.08050546050071716, -0.05979285389184952, -0.039080243557691574, -0.01836763322353363, 0.002344980835914612, 0.023057587444782257, 0.0437701940536499, 0.06448280811309814, 0.08519542217254639, 0.10590802878141403, 0.12662063539028168, 0.14733324944972992, 0.16804586350917816, 0.1887584626674652, 0.20947107672691345, 0.2301836907863617, 0.25089630484580994, 0.2716089189052582, 0.2923215329647064, 0.3130341172218323, 0.3337467312812805, 0.35445934534072876, 0.375171959400177, 0.39588457345962524, 0.4165971875190735, 0.43730980157852173, 0.45802241563796997, 0.4787350296974182, 0.49944764375686646, 0.5201602578163147, 0.5408728122711182, 0.5615854263305664, 0.5822980403900146, 0.6030106544494629, 0.6237232685089111, 0.6444358825683594, 0.6651484966278076, 0.6858611106872559, 0.7065737247467041, 0.7272863388061523]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 7.0, 8.0, 8.0, 17.0, 49.0, 110.0, 287.0, 835.0, 2415.0, 51457048.0, 7208.0, 1436.0, 539.0, 218.0, 74.0, 32.0, 19.0, 2.0, 7.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.43700122833252, -13.050508499145508, -12.664015769958496, -12.277523040771484, -11.891031265258789, -11.504538536071777, -11.118045806884766, -10.731553077697754, -10.345060348510742, -9.95856761932373, -9.572074890136719, -9.185583114624023, -8.799090385437012, -8.41259765625, -8.026104927062988, -7.639612197875977, -7.253120422363281, -6.8666276931762695, -6.480135440826416, -6.093642711639404, -5.707150459289551, -5.320657730102539, -4.934165000915527, -4.547672271728516, -4.161180019378662, -3.7746875286102295, -3.388195037841797, -3.001702308654785, -2.6152098178863525, -2.22871732711792, -1.8422245979309082, -1.4557321071624756, -1.069239616394043, -0.6827470660209656, -0.2962545156478882, 0.09023809432983398, 0.4767305850982666, 0.8632230758666992, 1.249715805053711, 1.6362082958221436, 2.022700786590576, 2.409193277359009, 2.7956857681274414, 3.182178497314453, 3.5686709880828857, 3.9551634788513184, 4.34165620803833, 4.728148460388184, 5.114641189575195, 5.501133918762207, 5.8876261711120605, 6.274118900299072, 6.660611152648926, 7.0471038818359375, 7.433596611022949, 7.820089340209961, 8.206581115722656, 8.593073844909668, 8.97956657409668, 9.366058349609375, 9.752551078796387, 10.139043807983398, 10.52553653717041, 10.912029266357422, 11.298521995544434]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 5.0, 7.0, 26.0, 31.0, 40.0, 80.0, 113.0, 169.0, 290.0, 456.0, 789.0, 1298.0, 2087.0, 3590.0, 5904.0, 9991.0, 17003.0, 28016.0, 46827.0, 75334.0, 119186.0, 182364.0, 260300.0, 349174.0, 981586.0, 2930900.0, 400247.0, 292167.0, 210462.0, 142143.0, 90403.0, 55916.0, 33896.0, 20592.0, 12346.0, 7159.0, 4241.0, 2559.0, 1474.0, 899.0, 537.0, 319.0, 198.0, 112.0, 74.0, 53.0, 19.0, 21.0, 15.0, 10.0, 5.0, 3.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.27587890625, -0.2675666809082031, -0.25925445556640625, -0.2509422302246094, -0.2426300048828125, -0.23431777954101562, -0.22600555419921875, -0.21769332885742188, -0.209381103515625, -0.20106887817382812, -0.19275665283203125, -0.18444442749023438, -0.1761322021484375, -0.16781997680664062, -0.15950775146484375, -0.15119552612304688, -0.14288330078125, -0.13457107543945312, -0.12625885009765625, -0.11794662475585938, -0.1096343994140625, -0.10132217407226562, -0.09300994873046875, -0.08469772338867188, -0.076385498046875, -0.06807327270507812, -0.05976104736328125, -0.051448822021484375, -0.0431365966796875, -0.034824371337890625, -0.02651214599609375, -0.018199920654296875, -0.0098876953125, -0.001575469970703125, 0.00673675537109375, 0.015048980712890625, 0.0233612060546875, 0.031673431396484375, 0.03998565673828125, 0.048297882080078125, 0.056610107421875, 0.06492233276367188, 0.07323455810546875, 0.08154678344726562, 0.0898590087890625, 0.09817123413085938, 0.10648345947265625, 0.11479568481445312, 0.12310791015625, 0.13142013549804688, 0.13973236083984375, 0.14804458618164062, 0.1563568115234375, 0.16466903686523438, 0.17298126220703125, 0.18129348754882812, 0.189605712890625, 0.19791793823242188, 0.20623016357421875, 0.21454238891601562, 0.2228546142578125, 0.23116683959960938, 0.23947906494140625, 0.24779129028320312, 0.256103515625]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 0.0, 4.0, 8.0, 5.0, 9.0, 11.0, 17.0, 14.0, 20.0, 21.0, 31.0, 16.0, 22.0, 41.0, 24.0, 37.0, 43.0, 46.0, 56.0, 83.0, 560.0, 502.0, 58.0, 42.0, 48.0, 30.0, 36.0, 32.0, 30.0, 29.0, 35.0, 15.0, 17.0, 17.0, 15.0, 13.0, 11.0, 7.0, 4.0, 5.0, 4.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.619140625, -2.537261962890625, -2.45538330078125, -2.373504638671875, -2.2916259765625, -2.209747314453125, -2.12786865234375, -2.045989990234375, -1.964111328125, -1.882232666015625, -1.80035400390625, -1.718475341796875, -1.6365966796875, -1.554718017578125, -1.47283935546875, -1.390960693359375, -1.30908203125, -1.227203369140625, -1.14532470703125, -1.063446044921875, -0.9815673828125, -0.899688720703125, -0.81781005859375, -0.735931396484375, -0.654052734375, -0.572174072265625, -0.49029541015625, -0.408416748046875, -0.3265380859375, -0.244659423828125, -0.16278076171875, -0.080902099609375, 0.0009765625, 0.082855224609375, 0.16473388671875, 0.246612548828125, 0.3284912109375, 0.410369873046875, 0.49224853515625, 0.574127197265625, 0.656005859375, 0.737884521484375, 0.81976318359375, 0.901641845703125, 0.9835205078125, 1.065399169921875, 1.14727783203125, 1.229156494140625, 1.31103515625, 1.392913818359375, 1.47479248046875, 1.556671142578125, 1.6385498046875, 1.720428466796875, 1.80230712890625, 1.884185791015625, 1.966064453125, 2.047943115234375, 2.12982177734375, 2.211700439453125, 2.2935791015625, 2.375457763671875, 2.45733642578125, 2.539215087890625, 2.62109375]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 6.0, 4.0, 9.0, 8.0, 8.0, 23.0, 41.0, 69.0, 105.0, 126.0, 207.0, 404.0, 626.0, 1020.0, 1639.0, 2763.0, 4350.0, 7211.0, 11875.0, 18737.0, 29771.0, 46302.0, 69195.0, 102150.0, 142590.0, 193614.0, 244099.0, 290772.0, 721321.0, 3048997.0, 330798.0, 269988.0, 219103.0, 168145.0, 122947.0, 85462.0, 57096.0, 37135.0, 23672.0, 15004.0, 9398.0, 5662.0, 3393.0, 2095.0, 1357.0, 837.0, 501.0, 319.0, 196.0, 137.0, 62.0, 36.0, 14.0, 18.0, 10.0, 7.0, 5.0, 3.0, 7.0], "bins": [-0.184814453125, -0.17942047119140625, -0.1740264892578125, -0.16863250732421875, -0.163238525390625, -0.15784454345703125, -0.1524505615234375, -0.14705657958984375, -0.14166259765625, -0.13626861572265625, -0.1308746337890625, -0.12548065185546875, -0.120086669921875, -0.11469268798828125, -0.1092987060546875, -0.10390472412109375, -0.0985107421875, -0.09311676025390625, -0.0877227783203125, -0.08232879638671875, -0.076934814453125, -0.07154083251953125, -0.0661468505859375, -0.06075286865234375, -0.05535888671875, -0.04996490478515625, -0.0445709228515625, -0.03917694091796875, -0.033782958984375, -0.02838897705078125, -0.0229949951171875, -0.01760101318359375, -0.01220703125, -0.00681304931640625, -0.0014190673828125, 0.00397491455078125, 0.009368896484375, 0.01476287841796875, 0.0201568603515625, 0.02555084228515625, 0.03094482421875, 0.03633880615234375, 0.0417327880859375, 0.04712677001953125, 0.052520751953125, 0.05791473388671875, 0.0633087158203125, 0.06870269775390625, 0.0740966796875, 0.07949066162109375, 0.0848846435546875, 0.09027862548828125, 0.095672607421875, 0.10106658935546875, 0.1064605712890625, 0.11185455322265625, 0.11724853515625, 0.12264251708984375, 0.1280364990234375, 0.13343048095703125, 0.138824462890625, 0.14421844482421875, 0.1496124267578125, 0.15500640869140625, 0.160400390625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 7.0, 5.0, 2.0, 4.0, 9.0, 16.0, 9.0, 16.0, 16.0, 20.0, 21.0, 18.0, 17.0, 30.0, 31.0, 38.0, 29.0, 44.0, 31.0, 30.0, 53.0, 484.0, 595.0, 61.0, 48.0, 40.0, 41.0, 36.0, 38.0, 28.0, 33.0, 27.0, 21.0, 19.0, 11.0, 21.0, 24.0, 15.0, 10.0, 3.0, 6.0, 8.0, 6.0, 4.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.060546875, -1.98968505859375, -1.9188232421875, -1.84796142578125, -1.777099609375, -1.70623779296875, -1.6353759765625, -1.56451416015625, -1.49365234375, -1.42279052734375, -1.3519287109375, -1.28106689453125, -1.210205078125, -1.13934326171875, -1.0684814453125, -0.99761962890625, -0.9267578125, -0.85589599609375, -0.7850341796875, -0.71417236328125, -0.643310546875, -0.57244873046875, -0.5015869140625, -0.43072509765625, -0.35986328125, -0.28900146484375, -0.2181396484375, -0.14727783203125, -0.076416015625, -0.00555419921875, 0.0653076171875, 0.13616943359375, 0.20703125, 0.27789306640625, 0.3487548828125, 0.41961669921875, 0.490478515625, 0.56134033203125, 0.6322021484375, 0.70306396484375, 0.77392578125, 0.84478759765625, 0.9156494140625, 0.98651123046875, 1.057373046875, 1.12823486328125, 1.1990966796875, 1.26995849609375, 1.3408203125, 1.41168212890625, 1.4825439453125, 1.55340576171875, 1.624267578125, 1.69512939453125, 1.7659912109375, 1.83685302734375, 1.90771484375, 1.97857666015625, 2.0494384765625, 2.12030029296875, 2.191162109375, 2.26202392578125, 2.3328857421875, 2.40374755859375, 2.474609375]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 3.0, 3.0, 3.0, 5.0, 9.0, 10.0, 16.0, 17.0, 18.0, 41.0, 55.0, 65.0, 91.0, 136.0, 143.0, 218.0, 301.0, 404.0, 527.0, 759.0, 1052.0, 1574.0, 2616.0, 4539.0, 8963.0, 17606.0, 35698.0, 72037.0, 145264.0, 5531812.0, 276233.0, 93245.0, 47226.0, 23388.0, 11646.0, 6079.0, 3302.0, 2035.0, 1286.0, 855.0, 596.0, 424.0, 285.0, 226.0, 168.0, 125.0, 95.0, 57.0, 51.0, 44.0, 32.0, 19.0, 12.0, 14.0, 8.0, 2.0, 6.0, 3.0, 1.0, 1.0, 3.0], "bins": [-0.72900390625, -0.7067108154296875, -0.684417724609375, -0.6621246337890625, -0.63983154296875, -0.6175384521484375, -0.595245361328125, -0.5729522705078125, -0.5506591796875, -0.5283660888671875, -0.506072998046875, -0.4837799072265625, -0.46148681640625, -0.4391937255859375, -0.416900634765625, -0.3946075439453125, -0.372314453125, -0.3500213623046875, -0.327728271484375, -0.3054351806640625, -0.28314208984375, -0.2608489990234375, -0.238555908203125, -0.2162628173828125, -0.1939697265625, -0.1716766357421875, -0.149383544921875, -0.1270904541015625, -0.10479736328125, -0.0825042724609375, -0.060211181640625, -0.0379180908203125, -0.015625, 0.0066680908203125, 0.028961181640625, 0.0512542724609375, 0.07354736328125, 0.0958404541015625, 0.118133544921875, 0.1404266357421875, 0.1627197265625, 0.1850128173828125, 0.207305908203125, 0.2295989990234375, 0.25189208984375, 0.2741851806640625, 0.296478271484375, 0.3187713623046875, 0.341064453125, 0.3633575439453125, 0.385650634765625, 0.4079437255859375, 0.43023681640625, 0.4525299072265625, 0.474822998046875, 0.4971160888671875, 0.5194091796875, 0.5417022705078125, 0.563995361328125, 0.5862884521484375, 0.60858154296875, 0.6308746337890625, 0.653167724609375, 0.6754608154296875, 0.69775390625]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 5.0, 6.0, 2.0, 10.0, 8.0, 7.0, 13.0, 9.0, 13.0, 25.0, 36.0, 39.0, 38.0, 37.0, 44.0, 42.0, 39.0, 42.0, 98.0, 1012.0, 62.0, 58.0, 44.0, 48.0, 49.0, 40.0, 30.0, 25.0, 19.0, 29.0, 24.0, 21.0, 16.0, 7.0, 5.0, 5.0, 7.0, 5.0, 2.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.099609375, -3.0069580078125, -2.914306640625, -2.8216552734375, -2.72900390625, -2.6363525390625, -2.543701171875, -2.4510498046875, -2.3583984375, -2.2657470703125, -2.173095703125, -2.0804443359375, -1.98779296875, -1.8951416015625, -1.802490234375, -1.7098388671875, -1.6171875, -1.5245361328125, -1.431884765625, -1.3392333984375, -1.24658203125, -1.1539306640625, -1.061279296875, -0.9686279296875, -0.8759765625, -0.7833251953125, -0.690673828125, -0.5980224609375, -0.50537109375, -0.4127197265625, -0.320068359375, -0.2274169921875, -0.134765625, -0.0421142578125, 0.050537109375, 0.1431884765625, 0.23583984375, 0.3284912109375, 0.421142578125, 0.5137939453125, 0.6064453125, 0.6990966796875, 0.791748046875, 0.8843994140625, 0.97705078125, 1.0697021484375, 1.162353515625, 1.2550048828125, 1.34765625, 1.4403076171875, 1.532958984375, 1.6256103515625, 1.71826171875, 1.8109130859375, 1.903564453125, 1.9962158203125, 2.0888671875, 2.1815185546875, 2.274169921875, 2.3668212890625, 2.45947265625, 2.5521240234375, 2.644775390625, 2.7374267578125, 2.830078125]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 1.0, 2.0, 2.0, 2.0, 3.0, 15.0, 19.0, 35.0, 80.0, 170.0, 284.0, 210.0, 100.0, 49.0, 23.0, 4.0, 4.0, 6.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.863334655761719, -15.454010009765625, -15.044686317443848, -14.635361671447754, -14.22603702545166, -13.816713333129883, -13.407388687133789, -12.998064041137695, -12.588739395141602, -12.179414749145508, -11.77009105682373, -11.360766410827637, -10.951441764831543, -10.542118072509766, -10.132793426513672, -9.723468780517578, -9.3141450881958, -8.904820442199707, -8.49549674987793, -8.086172103881836, -7.676847457885742, -7.267523288726807, -6.858199119567871, -6.448874473571777, -6.039550304412842, -5.630226135253906, -5.2209014892578125, -4.811577320098877, -4.402253150939941, -3.9929285049438477, -3.583604335784912, -3.1742799282073975, -2.764955520629883, -2.355631113052368, -1.946306824684143, -1.536982536315918, -1.1276581287384033, -0.7183337211608887, -0.3090095520019531, 0.10031485557556152, 0.5096392631530762, 0.918963611125946, 1.328287959098816, 1.737612247467041, 2.1469366550445557, 2.5562610626220703, 2.965585231781006, 3.3749096393585205, 3.784234046936035, 4.193558216094971, 4.6028828620910645, 5.01220703125, 5.421531677246094, 5.830855846405029, 6.240180015563965, 6.649504661560059, 7.058828830718994, 7.46815299987793, 7.877477645874023, 8.286802291870117, 8.696125984191895, 9.105450630187988, 9.514774322509766, 9.92409896850586, 10.333423614501953]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 5.0, 0.0, 4.0, 6.0, 7.0, 12.0, 8.0, 11.0, 12.0, 20.0, 20.0, 33.0, 28.0, 33.0, 34.0, 43.0, 53.0, 60.0, 68.0, 85.0, 49.0, 65.0, 58.0, 52.0, 37.0, 26.0, 27.0, 22.0, 22.0, 15.0, 14.0, 9.0, 12.0, 15.0, 11.0, 6.0, 5.0, 3.0, 3.0, 5.0, 3.0, 1.0, 2.0, 0.0, 4.0, 1.0], "bins": [-10.555952072143555, -10.27237606048584, -9.988801002502441, -9.705224990844727, -9.421649932861328, -9.138073921203613, -8.854498863220215, -8.5709228515625, -8.287347793579102, -8.003771781921387, -7.720196723937988, -7.436621189117432, -7.153045654296875, -6.86946964263916, -6.5858941078186035, -6.302318572998047, -6.018742561340332, -5.735167026519775, -5.451591491699219, -5.168015956878662, -4.8844404220581055, -4.600864410400391, -4.317288875579834, -4.033713340759277, -3.7501378059387207, -3.466562271118164, -3.1829867362976074, -2.8994109630584717, -2.615835428237915, -2.3322598934173584, -2.0486841201782227, -1.765108585357666, -1.4815325736999512, -1.1979570388793945, -0.9143813848495483, -0.6308057904243469, -0.3472301959991455, -0.06365466117858887, 0.21992099285125732, 0.5034966468811035, 0.7870721817016602, 1.0706477165222168, 1.354223370552063, 1.6377990245819092, 1.9213745594024658, 2.2049500942230225, 2.488525867462158, 2.772101402282715, 3.0556769371032715, 3.339252471923828, 3.6228280067443848, 3.9064037799835205, 4.189979553222656, 4.473554611206055, 4.7571306228637695, 5.040706157684326, 5.324281692504883, 5.6078572273254395, 5.891432762145996, 6.175008296966553, 6.458583831787109, 6.742159843444824, 7.025735378265381, 7.3093109130859375, 7.592886447906494]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 9.0, 3.0, 12.0, 6.0, 16.0, 10.0, 28.0, 50.0, 53.0, 93.0, 107.0, 169.0, 271.0, 530.0, 845.0, 1435.0, 2789.0, 5394.0, 12519.0, 39522.0, 3574427.0, 498296.0, 34967.0, 11670.0, 5179.0, 2553.0, 1339.0, 762.0, 444.0, 289.0, 173.0, 94.0, 73.0, 41.0, 41.0, 21.0, 15.0, 12.0, 7.0, 8.0, 5.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08148193359375, -0.07900810241699219, -0.07653427124023438, -0.07406044006347656, -0.07158660888671875, -0.06911277770996094, -0.06663894653320312, -0.06416511535644531, -0.0616912841796875, -0.05921745300292969, -0.056743621826171875, -0.05426979064941406, -0.05179595947265625, -0.04932212829589844, -0.046848297119140625, -0.04437446594238281, -0.041900634765625, -0.03942680358886719, -0.036952972412109375, -0.03447914123535156, -0.03200531005859375, -0.029531478881835938, -0.027057647705078125, -0.024583816528320312, -0.0221099853515625, -0.019636154174804688, -0.017162322998046875, -0.014688491821289062, -0.01221466064453125, -0.009740829467773438, -0.007266998291015625, -0.0047931671142578125, -0.0023193359375, 0.0001544952392578125, 0.002628326416015625, 0.0051021575927734375, 0.00757598876953125, 0.010049819946289062, 0.012523651123046875, 0.014997482299804688, 0.0174713134765625, 0.019945144653320312, 0.022418975830078125, 0.024892807006835938, 0.02736663818359375, 0.029840469360351562, 0.032314300537109375, 0.03478813171386719, 0.037261962890625, 0.03973579406738281, 0.042209625244140625, 0.04468345642089844, 0.04715728759765625, 0.04963111877441406, 0.052104949951171875, 0.05457878112792969, 0.0570526123046875, 0.05952644348144531, 0.062000274658203125, 0.06447410583496094, 0.06694793701171875, 0.06942176818847656, 0.07189559936523438, 0.07436943054199219, 0.07684326171875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 7.0, 3.0, 1.0, 0.0, 5.0, 5.0, 9.0, 4.0, 7.0, 9.0, 11.0, 18.0, 19.0, 30.0, 63.0, 439.0, 168.0, 52.0, 30.0, 17.0, 8.0, 10.0, 13.0, 12.0, 6.0, 3.0, 4.0, 8.0, 7.0, 6.0, 3.0, 4.0, 1.0, 4.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0225067138671875, -0.021802902221679688, -0.021099090576171875, -0.020395278930664062, -0.01969146728515625, -0.018987655639648438, -0.018283843994140625, -0.017580032348632812, -0.016876220703125, -0.016172409057617188, -0.015468597412109375, -0.014764785766601562, -0.01406097412109375, -0.013357162475585938, -0.012653350830078125, -0.011949539184570312, -0.0112457275390625, -0.010541915893554688, -0.009838104248046875, -0.009134292602539062, -0.00843048095703125, -0.0077266693115234375, -0.007022857666015625, -0.0063190460205078125, -0.005615234375, -0.0049114227294921875, -0.004207611083984375, -0.0035037994384765625, -0.00279998779296875, -0.0020961761474609375, -0.001392364501953125, -0.0006885528564453125, 1.52587890625e-05, 0.0007190704345703125, 0.001422882080078125, 0.0021266937255859375, 0.00283050537109375, 0.0035343170166015625, 0.004238128662109375, 0.0049419403076171875, 0.005645751953125, 0.0063495635986328125, 0.007053375244140625, 0.0077571868896484375, 0.00846099853515625, 0.009164810180664062, 0.009868621826171875, 0.010572433471679688, 0.0112762451171875, 0.011980056762695312, 0.012683868408203125, 0.013387680053710938, 0.01409149169921875, 0.014795303344726562, 0.015499114990234375, 0.016202926635742188, 0.01690673828125, 0.017610549926757812, 0.018314361572265625, 0.019018173217773438, 0.01972198486328125, 0.020425796508789062, 0.021129608154296875, 0.021833419799804688, 0.0225372314453125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 6.0, 5.0, 3.0, 3.0, 5.0, 5.0, 6.0, 9.0, 15.0, 15.0, 19.0, 36.0, 63.0, 72.0, 158.0, 327.0, 636.0, 1399.0, 3245.0, 8679.0, 25848.0, 100798.0, 696303.0, 3055694.0, 229680.0, 48530.0, 14202.0, 4795.0, 1952.0, 867.0, 400.0, 219.0, 93.0, 61.0, 38.0, 28.0, 14.0, 16.0, 8.0, 7.0, 8.0, 2.0, 4.0, 3.0, 2.0, 1.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0577392578125, -0.055891990661621094, -0.05404472351074219, -0.05219745635986328, -0.050350189208984375, -0.04850292205810547, -0.04665565490722656, -0.044808387756347656, -0.04296112060546875, -0.041113853454589844, -0.03926658630371094, -0.03741931915283203, -0.035572052001953125, -0.03372478485107422, -0.03187751770019531, -0.030030250549316406, -0.0281829833984375, -0.026335716247558594, -0.024488449096679688, -0.02264118194580078, -0.020793914794921875, -0.01894664764404297, -0.017099380493164062, -0.015252113342285156, -0.01340484619140625, -0.011557579040527344, -0.009710311889648438, -0.007863044738769531, -0.006015777587890625, -0.004168510437011719, -0.0023212432861328125, -0.00047397613525390625, 0.001373291015625, 0.0032205581665039062, 0.0050678253173828125, 0.006915092468261719, 0.008762359619140625, 0.010609626770019531, 0.012456893920898438, 0.014304161071777344, 0.01615142822265625, 0.017998695373535156, 0.019845962524414062, 0.02169322967529297, 0.023540496826171875, 0.02538776397705078, 0.027235031127929688, 0.029082298278808594, 0.0309295654296875, 0.032776832580566406, 0.03462409973144531, 0.03647136688232422, 0.038318634033203125, 0.04016590118408203, 0.04201316833496094, 0.043860435485839844, 0.04570770263671875, 0.047554969787597656, 0.04940223693847656, 0.05124950408935547, 0.053096771240234375, 0.05494403839111328, 0.05679130554199219, 0.058638572692871094, 0.06048583984375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 2.0, 3.0, 2.0, 4.0, 1.0, 4.0, 5.0, 10.0, 6.0, 6.0, 19.0, 16.0, 24.0, 16.0, 22.0, 33.0, 48.0, 68.0, 91.0, 91.0, 174.0, 253.0, 498.0, 1151.0, 672.0, 266.0, 148.0, 104.0, 76.0, 56.0, 45.0, 38.0, 24.0, 25.0, 18.0, 13.0, 12.0, 7.0, 5.0, 2.0, 6.0, 2.0, 6.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0], "bins": [-0.0283660888671875, -0.02761244773864746, -0.026858806610107422, -0.026105165481567383, -0.025351524353027344, -0.024597883224487305, -0.023844242095947266, -0.023090600967407227, -0.022336959838867188, -0.02158331871032715, -0.02082967758178711, -0.02007603645324707, -0.01932239532470703, -0.018568754196166992, -0.017815113067626953, -0.017061471939086914, -0.016307830810546875, -0.015554189682006836, -0.014800548553466797, -0.014046907424926758, -0.013293266296386719, -0.01253962516784668, -0.01178598403930664, -0.011032342910766602, -0.010278701782226562, -0.009525060653686523, -0.008771419525146484, -0.008017778396606445, -0.007264137268066406, -0.006510496139526367, -0.005756855010986328, -0.005003213882446289, -0.00424957275390625, -0.003495931625366211, -0.002742290496826172, -0.001988649368286133, -0.0012350082397460938, -0.0004813671112060547, 0.0002722740173339844, 0.0010259151458740234, 0.0017795562744140625, 0.0025331974029541016, 0.0032868385314941406, 0.00404047966003418, 0.004794120788574219, 0.005547761917114258, 0.006301403045654297, 0.007055044174194336, 0.007808685302734375, 0.008562326431274414, 0.009315967559814453, 0.010069608688354492, 0.010823249816894531, 0.01157689094543457, 0.01233053207397461, 0.013084173202514648, 0.013837814331054688, 0.014591455459594727, 0.015345096588134766, 0.016098737716674805, 0.016852378845214844, 0.017606019973754883, 0.018359661102294922, 0.01911330223083496, 0.019866943359375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 14.0, 47.0, 151.0, 350.0, 310.0, 100.0, 22.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3096752166748047, -0.2989852726459503, -0.28829532861709595, -0.27760541439056396, -0.2669154703617096, -0.2562255263328552, -0.24553558230400085, -0.23484563827514648, -0.2241557091474533, -0.21346576511859894, -0.20277583599090576, -0.1920858919620514, -0.18139594793319702, -0.17070601880550385, -0.16001607477664948, -0.1493261456489563, -0.13863620162010193, -0.12794625759124756, -0.11725632846355438, -0.10656638443470001, -0.09587644785642624, -0.08518651127815247, -0.0744965672492981, -0.06380663067102432, -0.05311669409275055, -0.042426757514476776, -0.031736817210912704, -0.021046876907348633, -0.01035694032907486, 0.0003329962491989136, 0.011022940278053284, 0.021712876856327057, 0.03240281343460083, 0.0430927500128746, 0.053782690316438675, 0.06447263062000275, 0.07516256719827652, 0.08585250377655029, 0.09654244780540466, 0.10723238438367844, 0.11792232096195221, 0.12861226499080658, 0.13930219411849976, 0.14999213814735413, 0.1606820821762085, 0.17137201130390167, 0.18206195533275604, 0.19275188446044922, 0.2034418284893036, 0.21413177251815796, 0.22482170164585114, 0.2355116456747055, 0.24620157480239868, 0.25689151883125305, 0.2675814628601074, 0.2782714068889618, 0.28896135091781616, 0.29965129494667053, 0.3103412389755249, 0.3210311532020569, 0.33172109723091125, 0.3424110412597656, 0.35310098528862, 0.36379092931747437, 0.37448084354400635]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 7.0, 4.0, 8.0, 12.0, 22.0, 30.0, 30.0, 32.0, 37.0, 36.0, 37.0, 61.0, 77.0, 62.0, 86.0, 66.0, 65.0, 63.0, 45.0, 51.0, 41.0, 28.0, 21.0, 21.0, 18.0, 7.0, 11.0, 9.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.12411165237426758, -0.11969789862632751, -0.11528414487838745, -0.11087039113044739, -0.10645663738250732, -0.10204288363456726, -0.0976291373372078, -0.09321538358926773, -0.08880162984132767, -0.0843878760933876, -0.07997412234544754, -0.07556036859750748, -0.07114662230014801, -0.06673286855220795, -0.06231911480426788, -0.05790536105632782, -0.053491607308387756, -0.04907785356044769, -0.04466409981250763, -0.040250349789857864, -0.0358365960419178, -0.03142284229397774, -0.027009090408682823, -0.02259533852338791, -0.018181584775447845, -0.013767831958830357, -0.009354079142212868, -0.004940326325595379, -0.00052657350897789, 0.0038871802389621735, 0.008300932124257088, 0.012714684009552002, 0.017128437757492065, 0.02154219150543213, 0.025955943390727043, 0.030369695276021957, 0.03478344902396202, 0.039197202771902084, 0.04361095279455185, 0.04802470654249191, 0.052438460290431976, 0.05685221403837204, 0.0612659677863121, 0.06567972153425217, 0.07009346783161163, 0.0745072215795517, 0.07892097532749176, 0.08333472907543182, 0.08774848282337189, 0.09216223657131195, 0.09657599031925201, 0.10098974406719208, 0.10540349781513214, 0.1098172515630722, 0.11423099786043167, 0.11864475160837173, 0.1230585053563118, 0.12747225165367126, 0.13188600540161133, 0.1362997591495514, 0.14071351289749146, 0.14512726664543152, 0.14954102039337158, 0.15395477414131165, 0.1583685278892517]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 14.0, 10.0, 17.0, 23.0, 43.0, 38.0, 65.0, 78.0, 114.0, 181.0, 222.0, 352.0, 509.0, 640.0, 958.0, 1420.0, 2085.0, 3103.0, 4908.0, 7685.0, 13055.0, 23888.0, 56305.0, 718165.0, 134916.0, 34425.0, 17270.0, 9911.0, 6130.0, 3800.0, 2560.0, 1687.0, 1258.0, 808.0, 541.0, 386.0, 278.0, 217.0, 146.0, 104.0, 70.0, 50.0, 30.0, 24.0, 24.0, 17.0, 11.0, 9.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.0806884765625, -0.07822418212890625, -0.0757598876953125, -0.07329559326171875, -0.070831298828125, -0.06836700439453125, -0.0659027099609375, -0.06343841552734375, -0.06097412109375, -0.05850982666015625, -0.0560455322265625, -0.05358123779296875, -0.051116943359375, -0.04865264892578125, -0.0461883544921875, -0.04372406005859375, -0.041259765625, -0.03879547119140625, -0.0363311767578125, -0.03386688232421875, -0.031402587890625, -0.02893829345703125, -0.0264739990234375, -0.02400970458984375, -0.02154541015625, -0.01908111572265625, -0.0166168212890625, -0.01415252685546875, -0.011688232421875, -0.00922393798828125, -0.0067596435546875, -0.00429534912109375, -0.0018310546875, 0.00063323974609375, 0.0030975341796875, 0.00556182861328125, 0.008026123046875, 0.01049041748046875, 0.0129547119140625, 0.01541900634765625, 0.01788330078125, 0.02034759521484375, 0.0228118896484375, 0.02527618408203125, 0.027740478515625, 0.03020477294921875, 0.0326690673828125, 0.03513336181640625, 0.03759765625, 0.04006195068359375, 0.0425262451171875, 0.04499053955078125, 0.047454833984375, 0.04991912841796875, 0.0523834228515625, 0.05484771728515625, 0.05731201171875, 0.05977630615234375, 0.0622406005859375, 0.06470489501953125, 0.067169189453125, 0.06963348388671875, 0.0720977783203125, 0.07456207275390625, 0.0770263671875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 7.0, 1.0, 3.0, 5.0, 5.0, 7.0, 6.0, 9.0, 6.0, 14.0, 8.0, 21.0, 27.0, 49.0, 179.0, 395.0, 88.0, 35.0, 27.0, 17.0, 8.0, 10.0, 12.0, 7.0, 8.0, 4.0, 7.0, 5.0, 5.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.023895263671875, -0.023179292678833008, -0.022463321685791016, -0.021747350692749023, -0.02103137969970703, -0.02031540870666504, -0.019599437713623047, -0.018883466720581055, -0.018167495727539062, -0.01745152473449707, -0.016735553741455078, -0.016019582748413086, -0.015303611755371094, -0.014587640762329102, -0.01387166976928711, -0.013155698776245117, -0.012439727783203125, -0.011723756790161133, -0.01100778579711914, -0.010291814804077148, -0.009575843811035156, -0.008859872817993164, -0.008143901824951172, -0.00742793083190918, -0.0067119598388671875, -0.005995988845825195, -0.005280017852783203, -0.004564046859741211, -0.0038480758666992188, -0.0031321048736572266, -0.0024161338806152344, -0.0017001628875732422, -0.00098419189453125, -0.0002682209014892578, 0.0004477500915527344, 0.0011637210845947266, 0.0018796920776367188, 0.002595663070678711, 0.003311634063720703, 0.004027605056762695, 0.0047435760498046875, 0.00545954704284668, 0.006175518035888672, 0.006891489028930664, 0.007607460021972656, 0.008323431015014648, 0.00903940200805664, 0.009755373001098633, 0.010471343994140625, 0.011187314987182617, 0.01190328598022461, 0.012619256973266602, 0.013335227966308594, 0.014051198959350586, 0.014767169952392578, 0.01548314094543457, 0.016199111938476562, 0.016915082931518555, 0.017631053924560547, 0.01834702491760254, 0.01906299591064453, 0.019778966903686523, 0.020494937896728516, 0.021210908889770508, 0.0219268798828125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 6.0, 10.0, 6.0, 15.0, 13.0, 32.0, 41.0, 53.0, 74.0, 127.0, 166.0, 299.0, 566.0, 1166.0, 2743.0, 6846.0, 19184.0, 62834.0, 245335.0, 491939.0, 152666.0, 41298.0, 13608.0, 5198.0, 2133.0, 978.0, 484.0, 251.0, 138.0, 107.0, 69.0, 48.0, 40.0, 23.0, 18.0, 18.0, 7.0, 13.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0677490234375, -0.06565380096435547, -0.06355857849121094, -0.061463356018066406, -0.059368133544921875, -0.057272911071777344, -0.05517768859863281, -0.05308246612548828, -0.05098724365234375, -0.04889202117919922, -0.04679679870605469, -0.044701576232910156, -0.042606353759765625, -0.040511131286621094, -0.03841590881347656, -0.03632068634033203, -0.0342254638671875, -0.03213024139404297, -0.030035018920898438, -0.027939796447753906, -0.025844573974609375, -0.023749351501464844, -0.021654129028320312, -0.01955890655517578, -0.01746368408203125, -0.015368461608886719, -0.013273239135742188, -0.011178016662597656, -0.009082794189453125, -0.006987571716308594, -0.0048923492431640625, -0.0027971267700195312, -0.000701904296875, 0.0013933181762695312, 0.0034885406494140625, 0.005583763122558594, 0.007678985595703125, 0.009774208068847656, 0.011869430541992188, 0.013964653015136719, 0.01605987548828125, 0.01815509796142578, 0.020250320434570312, 0.022345542907714844, 0.024440765380859375, 0.026535987854003906, 0.028631210327148438, 0.03072643280029297, 0.0328216552734375, 0.03491687774658203, 0.03701210021972656, 0.039107322692871094, 0.041202545166015625, 0.043297767639160156, 0.04539299011230469, 0.04748821258544922, 0.04958343505859375, 0.05167865753173828, 0.05377388000488281, 0.055869102478027344, 0.057964324951171875, 0.060059547424316406, 0.06215476989746094, 0.06424999237060547, 0.06634521484375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 8.0, 3.0, 7.0, 11.0, 7.0, 9.0, 14.0, 20.0, 19.0, 31.0, 28.0, 43.0, 41.0, 36.0, 43.0, 51.0, 44.0, 48.0, 52.0, 58.0, 52.0, 41.0, 40.0, 39.0, 29.0, 39.0, 32.0, 19.0, 26.0, 20.0, 20.0, 19.0, 11.0, 13.0, 11.0, 6.0, 10.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10394287109375, -0.1006765365600586, -0.09741020202636719, -0.09414386749267578, -0.09087753295898438, -0.08761119842529297, -0.08434486389160156, -0.08107852935791016, -0.07781219482421875, -0.07454586029052734, -0.07127952575683594, -0.06801319122314453, -0.06474685668945312, -0.06148052215576172, -0.05821418762207031, -0.054947853088378906, -0.0516815185546875, -0.048415184020996094, -0.04514884948730469, -0.04188251495361328, -0.038616180419921875, -0.03534984588623047, -0.03208351135253906, -0.028817176818847656, -0.02555084228515625, -0.022284507751464844, -0.019018173217773438, -0.01575183868408203, -0.012485504150390625, -0.009219169616699219, -0.0059528350830078125, -0.0026865005493164062, 0.000579833984375, 0.0038461685180664062, 0.0071125030517578125, 0.010378837585449219, 0.013645172119140625, 0.01691150665283203, 0.020177841186523438, 0.023444175720214844, 0.02671051025390625, 0.029976844787597656, 0.03324317932128906, 0.03650951385498047, 0.039775848388671875, 0.04304218292236328, 0.04630851745605469, 0.049574851989746094, 0.0528411865234375, 0.056107521057128906, 0.05937385559082031, 0.06264019012451172, 0.06590652465820312, 0.06917285919189453, 0.07243919372558594, 0.07570552825927734, 0.07897186279296875, 0.08223819732666016, 0.08550453186035156, 0.08877086639404297, 0.09203720092773438, 0.09530353546142578, 0.09856986999511719, 0.1018362045288086, 0.1051025390625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 2.0, 3.0, 4.0, 2.0, 10.0, 13.0, 14.0, 28.0, 30.0, 38.0, 59.0, 82.0, 119.0, 188.0, 274.0, 412.0, 659.0, 1197.0, 2343.0, 5048.0, 13056.0, 49009.0, 410631.0, 483938.0, 55844.0, 14437.0, 5299.0, 2516.0, 1275.0, 732.0, 462.0, 275.0, 171.0, 111.0, 76.0, 71.0, 33.0, 37.0, 7.0, 13.0, 10.0, 9.0, 7.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.06402587890625, -0.062198638916015625, -0.06037139892578125, -0.058544158935546875, -0.0567169189453125, -0.054889678955078125, -0.05306243896484375, -0.051235198974609375, -0.049407958984375, -0.047580718994140625, -0.04575347900390625, -0.043926239013671875, -0.0420989990234375, -0.040271759033203125, -0.03844451904296875, -0.036617279052734375, -0.0347900390625, -0.032962799072265625, -0.03113555908203125, -0.029308319091796875, -0.0274810791015625, -0.025653839111328125, -0.02382659912109375, -0.021999359130859375, -0.020172119140625, -0.018344879150390625, -0.01651763916015625, -0.014690399169921875, -0.0128631591796875, -0.011035919189453125, -0.00920867919921875, -0.007381439208984375, -0.00555419921875, -0.003726959228515625, -0.00189971923828125, -7.2479248046875e-05, 0.0017547607421875, 0.003582000732421875, 0.00540924072265625, 0.007236480712890625, 0.009063720703125, 0.010890960693359375, 0.01271820068359375, 0.014545440673828125, 0.0163726806640625, 0.018199920654296875, 0.02002716064453125, 0.021854400634765625, 0.023681640625, 0.025508880615234375, 0.02733612060546875, 0.029163360595703125, 0.0309906005859375, 0.032817840576171875, 0.03464508056640625, 0.036472320556640625, 0.038299560546875, 0.040126800537109375, 0.04195404052734375, 0.043781280517578125, 0.0456085205078125, 0.047435760498046875, 0.04926300048828125, 0.051090240478515625, 0.05291748046875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 4.0, 7.0, 2.0, 8.0, 9.0, 17.0, 12.0, 20.0, 30.0, 17.0, 30.0, 40.0, 47.0, 58.0, 69.0, 64.0, 69.0, 66.0, 78.0, 76.0, 53.0, 27.0, 34.0, 34.0, 21.0, 21.0, 19.0, 12.0, 17.0, 13.0, 7.0, 5.0, 4.0, 4.0, 0.0, 3.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.6716461181640625e-05, -3.569386899471283e-05, -3.4671276807785034e-05, -3.364868462085724e-05, -3.262609243392944e-05, -3.160350024700165e-05, -3.058090806007385e-05, -2.9558315873146057e-05, -2.8535723686218262e-05, -2.7513131499290466e-05, -2.649053931236267e-05, -2.5467947125434875e-05, -2.444535493850708e-05, -2.3422762751579285e-05, -2.240017056465149e-05, -2.1377578377723694e-05, -2.03549861907959e-05, -1.9332394003868103e-05, -1.8309801816940308e-05, -1.7287209630012512e-05, -1.6264617443084717e-05, -1.5242025256156921e-05, -1.4219433069229126e-05, -1.319684088230133e-05, -1.2174248695373535e-05, -1.115165650844574e-05, -1.0129064321517944e-05, -9.106472134590149e-06, -8.083879947662354e-06, -7.061287760734558e-06, -6.038695573806763e-06, -5.016103386878967e-06, -3.993511199951172e-06, -2.9709190130233765e-06, -1.948326826095581e-06, -9.257346391677856e-07, 9.685754776000977e-08, 1.1194497346878052e-06, 2.1420419216156006e-06, 3.164634108543396e-06, 4.187226295471191e-06, 5.209818482398987e-06, 6.232410669326782e-06, 7.255002856254578e-06, 8.277595043182373e-06, 9.300187230110168e-06, 1.0322779417037964e-05, 1.134537160396576e-05, 1.2367963790893555e-05, 1.339055597782135e-05, 1.4413148164749146e-05, 1.543574035167694e-05, 1.6458332538604736e-05, 1.7480924725532532e-05, 1.8503516912460327e-05, 1.9526109099388123e-05, 2.0548701286315918e-05, 2.1571293473243713e-05, 2.259388566017151e-05, 2.3616477847099304e-05, 2.46390700340271e-05, 2.5661662220954895e-05, 2.668425440788269e-05, 2.7706846594810486e-05, 2.872943878173828e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 5.0, 7.0, 9.0, 13.0, 26.0, 29.0, 44.0, 64.0, 112.0, 222.0, 371.0, 803.0, 1736.0, 4696.0, 17187.0, 112636.0, 727424.0, 152853.0, 20949.0, 5502.0, 2009.0, 856.0, 412.0, 210.0, 123.0, 83.0, 52.0, 41.0, 16.0, 15.0, 15.0, 5.0, 9.0, 3.0, 5.0, 3.0, 1.0, 1.0, 3.0, 3.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.055389404296875, -0.053304195404052734, -0.05121898651123047, -0.0491337776184082, -0.04704856872558594, -0.04496335983276367, -0.042878150939941406, -0.04079294204711914, -0.038707733154296875, -0.03662252426147461, -0.034537315368652344, -0.03245210647583008, -0.030366897583007812, -0.028281688690185547, -0.02619647979736328, -0.024111270904541016, -0.02202606201171875, -0.019940853118896484, -0.01785564422607422, -0.015770435333251953, -0.013685226440429688, -0.011600017547607422, -0.009514808654785156, -0.007429599761962891, -0.005344390869140625, -0.0032591819763183594, -0.0011739730834960938, 0.0009112358093261719, 0.0029964447021484375, 0.005081653594970703, 0.007166862487792969, 0.009252071380615234, 0.0113372802734375, 0.013422489166259766, 0.015507698059082031, 0.017592906951904297, 0.019678115844726562, 0.021763324737548828, 0.023848533630371094, 0.02593374252319336, 0.028018951416015625, 0.03010416030883789, 0.032189369201660156, 0.03427457809448242, 0.03635978698730469, 0.03844499588012695, 0.04053020477294922, 0.042615413665771484, 0.04470062255859375, 0.046785831451416016, 0.04887104034423828, 0.05095624923706055, 0.05304145812988281, 0.05512666702270508, 0.057211875915527344, 0.05929708480834961, 0.061382293701171875, 0.06346750259399414, 0.0655527114868164, 0.06763792037963867, 0.06972312927246094, 0.0718083381652832, 0.07389354705810547, 0.07597875595092773, 0.07806396484375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 1.0, 5.0, 1.0, 1.0, 4.0, 5.0, 4.0, 4.0, 10.0, 6.0, 7.0, 21.0, 20.0, 22.0, 32.0, 40.0, 48.0, 50.0, 56.0, 77.0, 66.0, 79.0, 77.0, 66.0, 65.0, 42.0, 44.0, 31.0, 24.0, 23.0, 17.0, 12.0, 3.0, 7.0, 12.0, 5.0, 5.0, 1.0, 2.0, 6.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.032379150390625, -0.031101703643798828, -0.029824256896972656, -0.028546810150146484, -0.027269363403320312, -0.02599191665649414, -0.02471446990966797, -0.023437023162841797, -0.022159576416015625, -0.020882129669189453, -0.01960468292236328, -0.01832723617553711, -0.017049789428710938, -0.015772342681884766, -0.014494895935058594, -0.013217449188232422, -0.01194000244140625, -0.010662555694580078, -0.009385108947753906, -0.008107662200927734, -0.0068302154541015625, -0.005552768707275391, -0.004275321960449219, -0.002997875213623047, -0.001720428466796875, -0.0004429817199707031, 0.0008344650268554688, 0.0021119117736816406, 0.0033893585205078125, 0.004666805267333984, 0.005944252014160156, 0.007221698760986328, 0.0084991455078125, 0.009776592254638672, 0.011054039001464844, 0.012331485748291016, 0.013608932495117188, 0.01488637924194336, 0.01616382598876953, 0.017441272735595703, 0.018718719482421875, 0.019996166229248047, 0.02127361297607422, 0.02255105972290039, 0.023828506469726562, 0.025105953216552734, 0.026383399963378906, 0.027660846710205078, 0.02893829345703125, 0.030215740203857422, 0.031493186950683594, 0.032770633697509766, 0.03404808044433594, 0.03532552719116211, 0.03660297393798828, 0.03788042068481445, 0.039157867431640625, 0.0404353141784668, 0.04171276092529297, 0.04299020767211914, 0.04426765441894531, 0.045545101165771484, 0.046822547912597656, 0.04809999465942383, 0.04937744140625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 16.0, 15.0, 30.0, 75.0, 153.0, 248.0, 213.0, 124.0, 55.0, 28.0, 15.0, 11.0, 4.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.48074230551719666, -0.4563523232936859, -0.4319623112678528, -0.40757232904434204, -0.3831823468208313, -0.35879236459732056, -0.3344023525714874, -0.3100123703479767, -0.28562235832214355, -0.2612323760986328, -0.23684237897396088, -0.21245238184928894, -0.1880623996257782, -0.16367240250110626, -0.13928240537643433, -0.11489242315292358, -0.09050244092941284, -0.0661124512553215, -0.041722457855939865, -0.017332464456558228, 0.007057525217533112, 0.03144751489162445, 0.05583751201629639, 0.08022749423980713, 0.10461749136447906, 0.129007488489151, 0.15339747071266174, 0.17778746783733368, 0.20217746496200562, 0.22656744718551636, 0.2509574294090271, 0.27534741163253784, 0.2997373938560486, 0.3241273760795593, 0.34851738810539246, 0.3729073703289032, 0.39729735255241394, 0.42168736457824707, 0.4460773468017578, 0.47046732902526855, 0.4948573112487793, 0.51924729347229, 0.5436372756958008, 0.5680272579193115, 0.592417299747467, 0.6168072819709778, 0.6411972641944885, 0.6655872464179993, 0.6899772882461548, 0.7143672704696655, 0.7387572526931763, 0.763147234916687, 0.7875372767448425, 0.8119272589683533, 0.836317241191864, 0.8607072234153748, 0.8850972056388855, 0.9094871878623962, 0.933877170085907, 0.9582672119140625, 0.9826571941375732, 1.007047176361084, 1.0314371585845947, 1.0558271408081055, 1.0802171230316162]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 4.0, 4.0, 8.0, 7.0, 7.0, 14.0, 24.0, 33.0, 49.0, 76.0, 135.0, 184.0, 145.0, 103.0, 75.0, 39.0, 16.0, 12.0, 9.0, 5.0, 5.0, 7.0, 6.0, 3.0, 3.0, 3.0, 2.0, 6.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.504492998123169, -1.4502655267715454, -1.3960381746292114, -1.341810703277588, -1.287583351135254, -1.2333558797836304, -1.1791284084320068, -1.1249010562896729, -1.0706737041473389, -1.0164462327957153, -0.9622188806533813, -0.9079914093017578, -0.8537640571594238, -0.7995365858078003, -0.7453091740608215, -0.6910817623138428, -0.6368542909622192, -0.5826268792152405, -0.5283994674682617, -0.47417202591896057, -0.4199446141719818, -0.36571720242500305, -0.3114897608757019, -0.25726234912872314, -0.20303493738174438, -0.14880752563476562, -0.09458009898662567, -0.04035267233848572, 0.013874739408493042, 0.0681021511554718, 0.12232959270477295, 0.1765570044517517, 0.23078429698944092, 0.2850117087364197, 0.33923912048339844, 0.3934665620326996, 0.44769397377967834, 0.5019214153289795, 0.5561488270759583, 0.610376238822937, 0.6646036505699158, 0.7188310623168945, 0.7730584740638733, 0.827285885810852, 0.8815133571624756, 0.9357407093048096, 0.9899681806564331, 1.0441956520080566, 1.0984230041503906, 1.1526504755020142, 1.2068778276443481, 1.2611052989959717, 1.3153326511383057, 1.3695601224899292, 1.4237875938415527, 1.4780149459838867, 1.5322422981262207, 1.5864697694778442, 1.6406971216201782, 1.6949245929718018, 1.7491519451141357, 1.8033794164657593, 1.8576068878173828, 1.9118342399597168, 1.9660617113113403]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 7.0, 5.0, 10.0, 1.0, 11.0, 21.0, 24.0, 27.0, 37.0, 56.0, 91.0, 115.0, 191.0, 275.0, 419.0, 726.0, 1367.0, 2560.0, 5466.0, 14162.0, 56692.0, 3786349.0, 270691.0, 33308.0, 11213.0, 4703.0, 2427.0, 1362.0, 768.0, 410.0, 280.0, 170.0, 120.0, 58.0, 46.0, 30.0, 23.0, 20.0, 22.0, 5.0, 5.0, 6.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.2022705078125, -0.1964588165283203, -0.19064712524414062, -0.18483543395996094, -0.17902374267578125, -0.17321205139160156, -0.16740036010742188, -0.1615886688232422, -0.1557769775390625, -0.1499652862548828, -0.14415359497070312, -0.13834190368652344, -0.13253021240234375, -0.12671852111816406, -0.12090682983398438, -0.11509513854980469, -0.109283447265625, -0.10347175598144531, -0.09766006469726562, -0.09184837341308594, -0.08603668212890625, -0.08022499084472656, -0.07441329956054688, -0.06860160827636719, -0.0627899169921875, -0.05697822570800781, -0.051166534423828125, -0.04535484313964844, -0.03954315185546875, -0.03373146057128906, -0.027919769287109375, -0.022108078002929688, -0.01629638671875, -0.010484695434570312, -0.004673004150390625, 0.0011386871337890625, 0.00695037841796875, 0.012762069702148438, 0.018573760986328125, 0.024385452270507812, 0.0301971435546875, 0.03600883483886719, 0.041820526123046875, 0.04763221740722656, 0.05344390869140625, 0.05925559997558594, 0.06506729125976562, 0.07087898254394531, 0.076690673828125, 0.08250236511230469, 0.08831405639648438, 0.09412574768066406, 0.09993743896484375, 0.10574913024902344, 0.11156082153320312, 0.11737251281738281, 0.1231842041015625, 0.1289958953857422, 0.13480758666992188, 0.14061927795410156, 0.14643096923828125, 0.15224266052246094, 0.15805435180664062, 0.1638660430908203, 0.169677734375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 2.0, 7.0, 2.0, 6.0, 7.0, 8.0, 20.0, 15.0, 26.0, 49.0, 127.0, 237.0, 203.0, 108.0, 45.0, 33.0, 21.0, 15.0, 3.0, 12.0, 6.0, 10.0, 8.0, 8.0, 3.0, 2.0, 3.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.023956298828125, -0.023235797882080078, -0.022515296936035156, -0.021794795989990234, -0.021074295043945312, -0.02035379409790039, -0.01963329315185547, -0.018912792205810547, -0.018192291259765625, -0.017471790313720703, -0.01675128936767578, -0.01603078842163086, -0.015310287475585938, -0.014589786529541016, -0.013869285583496094, -0.013148784637451172, -0.01242828369140625, -0.011707782745361328, -0.010987281799316406, -0.010266780853271484, -0.009546279907226562, -0.00882577896118164, -0.008105278015136719, -0.007384777069091797, -0.006664276123046875, -0.005943775177001953, -0.005223274230957031, -0.004502773284912109, -0.0037822723388671875, -0.0030617713928222656, -0.0023412704467773438, -0.0016207695007324219, -0.0009002685546875, -0.00017976760864257812, 0.0005407333374023438, 0.0012612342834472656, 0.0019817352294921875, 0.0027022361755371094, 0.0034227371215820312, 0.004143238067626953, 0.004863739013671875, 0.005584239959716797, 0.006304740905761719, 0.007025241851806641, 0.0077457427978515625, 0.008466243743896484, 0.009186744689941406, 0.009907245635986328, 0.01062774658203125, 0.011348247528076172, 0.012068748474121094, 0.012789249420166016, 0.013509750366210938, 0.01423025131225586, 0.014950752258300781, 0.015671253204345703, 0.016391754150390625, 0.017112255096435547, 0.01783275604248047, 0.01855325698852539, 0.019273757934570312, 0.019994258880615234, 0.020714759826660156, 0.021435260772705078, 0.02215576171875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0, 7.0, 6.0, 10.0, 3.0, 19.0, 22.0, 44.0, 44.0, 81.0, 135.0, 186.0, 357.0, 721.0, 1593.0, 4453.0, 14727.0, 71676.0, 1194717.0, 2791547.0, 88040.0, 16903.0, 5187.0, 1929.0, 819.0, 432.0, 227.0, 139.0, 77.0, 49.0, 52.0, 25.0, 20.0, 12.0, 9.0, 8.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15478515625, -0.14980125427246094, -0.14481735229492188, -0.1398334503173828, -0.13484954833984375, -0.1298656463623047, -0.12488174438476562, -0.11989784240722656, -0.1149139404296875, -0.10993003845214844, -0.10494613647460938, -0.09996223449707031, -0.09497833251953125, -0.08999443054199219, -0.08501052856445312, -0.08002662658691406, -0.075042724609375, -0.07005882263183594, -0.06507492065429688, -0.06009101867675781, -0.05510711669921875, -0.05012321472167969, -0.045139312744140625, -0.04015541076660156, -0.0351715087890625, -0.030187606811523438, -0.025203704833984375, -0.020219802856445312, -0.01523590087890625, -0.010251998901367188, -0.005268096923828125, -0.0002841949462890625, 0.00469970703125, 0.009683609008789062, 0.014667510986328125, 0.019651412963867188, 0.02463531494140625, 0.029619216918945312, 0.034603118896484375, 0.03958702087402344, 0.0445709228515625, 0.04955482482910156, 0.054538726806640625, 0.05952262878417969, 0.06450653076171875, 0.06949043273925781, 0.07447433471679688, 0.07945823669433594, 0.084442138671875, 0.08942604064941406, 0.09440994262695312, 0.09939384460449219, 0.10437774658203125, 0.10936164855957031, 0.11434555053710938, 0.11932945251464844, 0.1243133544921875, 0.12929725646972656, 0.13428115844726562, 0.1392650604248047, 0.14424896240234375, 0.1492328643798828, 0.15421676635742188, 0.15920066833496094, 0.1641845703125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 7.0, 9.0, 12.0, 16.0, 31.0, 28.0, 59.0, 83.0, 151.0, 274.0, 654.0, 1814.0, 453.0, 165.0, 103.0, 55.0, 34.0, 19.0, 20.0, 21.0, 6.0, 8.0, 10.0, 8.0, 10.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02874755859375, -0.02780008316040039, -0.02685260772705078, -0.025905132293701172, -0.024957656860351562, -0.024010181427001953, -0.023062705993652344, -0.022115230560302734, -0.021167755126953125, -0.020220279693603516, -0.019272804260253906, -0.018325328826904297, -0.017377853393554688, -0.016430377960205078, -0.015482902526855469, -0.01453542709350586, -0.01358795166015625, -0.01264047622680664, -0.011693000793457031, -0.010745525360107422, -0.009798049926757812, -0.008850574493408203, -0.007903099060058594, -0.006955623626708984, -0.006008148193359375, -0.005060672760009766, -0.004113197326660156, -0.003165721893310547, -0.0022182464599609375, -0.0012707710266113281, -0.00032329559326171875, 0.0006241798400878906, 0.0015716552734375, 0.0025191307067871094, 0.0034666061401367188, 0.004414081573486328, 0.0053615570068359375, 0.006309032440185547, 0.007256507873535156, 0.008203983306884766, 0.009151458740234375, 0.010098934173583984, 0.011046409606933594, 0.011993885040283203, 0.012941360473632812, 0.013888835906982422, 0.014836311340332031, 0.01578378677368164, 0.01673126220703125, 0.01767873764038086, 0.01862621307373047, 0.019573688507080078, 0.020521163940429688, 0.021468639373779297, 0.022416114807128906, 0.023363590240478516, 0.024311065673828125, 0.025258541107177734, 0.026206016540527344, 0.027153491973876953, 0.028100967407226562, 0.029048442840576172, 0.02999591827392578, 0.03094339370727539, 0.031890869140625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 1.0, 9.0, 19.0, 70.0, 206.0, 328.0, 238.0, 72.0, 34.0, 18.0, 6.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16206994652748108, -0.15288899838924408, -0.1437080353498459, -0.1345270872116089, -0.1253461241722107, -0.1161651760339737, -0.1069842278957367, -0.0978032723069191, -0.0886223167181015, -0.0794413611292839, -0.07026040554046631, -0.06107945740222931, -0.05189850181341171, -0.042717546224594116, -0.03353659436106682, -0.02435564249753952, -0.015174686908721924, -0.005993733182549477, 0.0031872205436229706, 0.012368174269795418, 0.021549127995967865, 0.03073008358478546, 0.03991103544831276, 0.04909198731184006, 0.058272942900657654, 0.06745389848947525, 0.07663485407829285, 0.08581580221652985, 0.09499675780534744, 0.10417771339416504, 0.11335866153240204, 0.12253961712121964, 0.13172060251235962, 0.14090155065059662, 0.1500825136899948, 0.1592634618282318, 0.16844442486763, 0.177625373005867, 0.186806321144104, 0.1959872841835022, 0.2051682323217392, 0.2143491804599762, 0.2235301434993744, 0.2327110916376114, 0.2418920397758484, 0.2510730028152466, 0.2602539658546448, 0.2694348990917206, 0.2786158621311188, 0.28779682517051697, 0.2969777584075928, 0.30615872144699097, 0.31533968448638916, 0.32452064752578735, 0.33370158076286316, 0.34288254380226135, 0.35206347703933716, 0.36124444007873535, 0.37042537331581116, 0.37960633635520935, 0.38878729939460754, 0.39796823263168335, 0.40714919567108154, 0.41633015871047974, 0.42551112174987793]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 2.0, 3.0, 0.0, 3.0, 1.0, 4.0, 4.0, 5.0, 7.0, 5.0, 12.0, 16.0, 17.0, 15.0, 26.0, 39.0, 34.0, 64.0, 42.0, 53.0, 42.0, 66.0, 59.0, 63.0, 59.0, 66.0, 52.0, 55.0, 44.0, 19.0, 29.0, 18.0, 22.0, 12.0, 12.0, 9.0, 6.0, 4.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1099323034286499, -0.10628964006900787, -0.10264697670936584, -0.09900431334972382, -0.09536164999008179, -0.09171898663043976, -0.08807633072137833, -0.0844336673617363, -0.08079100400209427, -0.07714834064245224, -0.07350567728281021, -0.06986301392316818, -0.06622035801410675, -0.06257769465446472, -0.05893503129482269, -0.055292367935180664, -0.051649704575538635, -0.048007041215896606, -0.04436437785625458, -0.04072171822190285, -0.03707905486226082, -0.03343639150261879, -0.02979373000562191, -0.02615106850862503, -0.022508405148983, -0.018865741789340973, -0.015223080292344093, -0.011580417864024639, -0.007937755435705185, -0.004295092076063156, -0.0006524305790662766, 0.002990230917930603, 0.006632894277572632, 0.010275556705892086, 0.01391821913421154, 0.01756088063120842, 0.02120354399085045, 0.024846207350492477, 0.028488868847489357, 0.03213153034448624, 0.035774193704128265, 0.039416857063770294, 0.04305952042341232, 0.04670218005776405, 0.05034484341740608, 0.05398750677704811, 0.05763016641139984, 0.06127282977104187, 0.0649154931306839, 0.06855815649032593, 0.07220081984996796, 0.07584348320960999, 0.07948614656925201, 0.08312880992889404, 0.08677146583795547, 0.0904141291975975, 0.09405679255723953, 0.09769945591688156, 0.10134211927652359, 0.10498478263616562, 0.10862743854522705, 0.11227010190486908, 0.11591276526451111, 0.11955542862415314, 0.12319809198379517]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 7.0, 5.0, 9.0, 7.0, 13.0, 7.0, 20.0, 24.0, 40.0, 44.0, 67.0, 68.0, 102.0, 141.0, 232.0, 327.0, 454.0, 664.0, 989.0, 1458.0, 2444.0, 4106.0, 6912.0, 13391.0, 28538.0, 84743.0, 525136.0, 278415.0, 53481.0, 21099.0, 10471.0, 5726.0, 3341.0, 1983.0, 1304.0, 831.0, 605.0, 441.0, 249.0, 164.0, 126.0, 115.0, 75.0, 52.0, 39.0, 27.0, 20.0, 13.0, 13.0, 10.0, 3.0, 6.0, 4.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.08612060546875, -0.08332633972167969, -0.08053207397460938, -0.07773780822753906, -0.07494354248046875, -0.07214927673339844, -0.06935501098632812, -0.06656074523925781, -0.0637664794921875, -0.06097221374511719, -0.058177947998046875, -0.05538368225097656, -0.05258941650390625, -0.04979515075683594, -0.047000885009765625, -0.04420661926269531, -0.041412353515625, -0.03861808776855469, -0.035823822021484375, -0.03302955627441406, -0.03023529052734375, -0.027441024780273438, -0.024646759033203125, -0.021852493286132812, -0.0190582275390625, -0.016263961791992188, -0.013469696044921875, -0.010675430297851562, -0.00788116455078125, -0.0050868988037109375, -0.002292633056640625, 0.0005016326904296875, 0.0032958984375, 0.0060901641845703125, 0.008884429931640625, 0.011678695678710938, 0.01447296142578125, 0.017267227172851562, 0.020061492919921875, 0.022855758666992188, 0.0256500244140625, 0.028444290161132812, 0.031238555908203125, 0.03403282165527344, 0.03682708740234375, 0.03962135314941406, 0.042415618896484375, 0.04520988464355469, 0.048004150390625, 0.05079841613769531, 0.053592681884765625, 0.05638694763183594, 0.05918121337890625, 0.06197547912597656, 0.06476974487304688, 0.06756401062011719, 0.0703582763671875, 0.07315254211425781, 0.07594680786132812, 0.07874107360839844, 0.08153533935546875, 0.08432960510253906, 0.08712387084960938, 0.08991813659667969, 0.09271240234375]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 5.0, 3.0, 5.0, 4.0, 12.0, 16.0, 15.0, 30.0, 37.0, 71.0, 132.0, 224.0, 169.0, 106.0, 52.0, 27.0, 21.0, 10.0, 12.0, 10.0, 7.0, 9.0, 3.0, 6.0, 1.0, 4.0, 5.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0228424072265625, -0.02212667465209961, -0.02141094207763672, -0.020695209503173828, -0.019979476928710938, -0.019263744354248047, -0.018548011779785156, -0.017832279205322266, -0.017116546630859375, -0.016400814056396484, -0.015685081481933594, -0.014969348907470703, -0.014253616333007812, -0.013537883758544922, -0.012822151184082031, -0.01210641860961914, -0.01139068603515625, -0.01067495346069336, -0.009959220886230469, -0.009243488311767578, -0.008527755737304688, -0.007812023162841797, -0.007096290588378906, -0.006380558013916016, -0.005664825439453125, -0.004949092864990234, -0.004233360290527344, -0.003517627716064453, -0.0028018951416015625, -0.002086162567138672, -0.0013704299926757812, -0.0006546974182128906, 6.103515625e-05, 0.0007767677307128906, 0.0014925003051757812, 0.002208232879638672, 0.0029239654541015625, 0.003639698028564453, 0.004355430603027344, 0.005071163177490234, 0.005786895751953125, 0.006502628326416016, 0.007218360900878906, 0.007934093475341797, 0.008649826049804688, 0.009365558624267578, 0.010081291198730469, 0.01079702377319336, 0.01151275634765625, 0.01222848892211914, 0.012944221496582031, 0.013659954071044922, 0.014375686645507812, 0.015091419219970703, 0.015807151794433594, 0.016522884368896484, 0.017238616943359375, 0.017954349517822266, 0.018670082092285156, 0.019385814666748047, 0.020101547241210938, 0.020817279815673828, 0.02153301239013672, 0.02224874496459961, 0.0229644775390625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 6.0, 5.0, 8.0, 11.0, 9.0, 22.0, 24.0, 37.0, 46.0, 65.0, 85.0, 142.0, 254.0, 422.0, 765.0, 1273.0, 2724.0, 5852.0, 15100.0, 46549.0, 179485.0, 480183.0, 225930.0, 58014.0, 18188.0, 6823.0, 2950.0, 1506.0, 811.0, 420.0, 268.0, 165.0, 132.0, 63.0, 60.0, 34.0, 34.0, 24.0, 18.0, 12.0, 11.0, 9.0, 4.0, 3.0, 1.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.060211181640625, -0.05817556381225586, -0.05613994598388672, -0.05410432815551758, -0.05206871032714844, -0.0500330924987793, -0.047997474670410156, -0.045961856842041016, -0.043926239013671875, -0.041890621185302734, -0.039855003356933594, -0.03781938552856445, -0.03578376770019531, -0.03374814987182617, -0.03171253204345703, -0.02967691421508789, -0.02764129638671875, -0.02560567855834961, -0.02357006072998047, -0.021534442901611328, -0.019498825073242188, -0.017463207244873047, -0.015427589416503906, -0.013391971588134766, -0.011356353759765625, -0.009320735931396484, -0.007285118103027344, -0.005249500274658203, -0.0032138824462890625, -0.0011782646179199219, 0.0008573532104492188, 0.0028929710388183594, 0.0049285888671875, 0.006964206695556641, 0.008999824523925781, 0.011035442352294922, 0.013071060180664062, 0.015106678009033203, 0.017142295837402344, 0.019177913665771484, 0.021213531494140625, 0.023249149322509766, 0.025284767150878906, 0.027320384979248047, 0.029356002807617188, 0.03139162063598633, 0.03342723846435547, 0.03546285629272461, 0.03749847412109375, 0.03953409194946289, 0.04156970977783203, 0.04360532760620117, 0.04564094543457031, 0.04767656326293945, 0.049712181091308594, 0.051747798919677734, 0.053783416748046875, 0.055819034576416016, 0.057854652404785156, 0.0598902702331543, 0.06192588806152344, 0.06396150588989258, 0.06599712371826172, 0.06803274154663086, 0.070068359375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 6.0, 6.0, 4.0, 6.0, 12.0, 9.0, 16.0, 17.0, 17.0, 24.0, 23.0, 33.0, 31.0, 31.0, 45.0, 32.0, 42.0, 45.0, 52.0, 52.0, 39.0, 48.0, 43.0, 38.0, 39.0, 39.0, 51.0, 36.0, 20.0, 29.0, 27.0, 13.0, 20.0, 8.0, 9.0, 11.0, 7.0, 8.0, 7.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.052032470703125, -0.0501704216003418, -0.048308372497558594, -0.04644632339477539, -0.04458427429199219, -0.042722225189208984, -0.04086017608642578, -0.03899812698364258, -0.037136077880859375, -0.03527402877807617, -0.03341197967529297, -0.031549930572509766, -0.029687881469726562, -0.02782583236694336, -0.025963783264160156, -0.024101734161376953, -0.02223968505859375, -0.020377635955810547, -0.018515586853027344, -0.01665353775024414, -0.014791488647460938, -0.012929439544677734, -0.011067390441894531, -0.009205341339111328, -0.007343292236328125, -0.005481243133544922, -0.0036191940307617188, -0.0017571449279785156, 0.0001049041748046875, 0.0019669532775878906, 0.0038290023803710938, 0.005691051483154297, 0.0075531005859375, 0.009415149688720703, 0.011277198791503906, 0.01313924789428711, 0.015001296997070312, 0.016863346099853516, 0.01872539520263672, 0.020587444305419922, 0.022449493408203125, 0.024311542510986328, 0.02617359161376953, 0.028035640716552734, 0.029897689819335938, 0.03175973892211914, 0.033621788024902344, 0.03548383712768555, 0.03734588623046875, 0.03920793533325195, 0.041069984436035156, 0.04293203353881836, 0.04479408264160156, 0.046656131744384766, 0.04851818084716797, 0.05038022994995117, 0.052242279052734375, 0.05410432815551758, 0.05596637725830078, 0.057828426361083984, 0.05969047546386719, 0.06155252456665039, 0.0634145736694336, 0.0652766227722168, 0.067138671875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 0.0, 8.0, 4.0, 7.0, 6.0, 17.0, 29.0, 31.0, 51.0, 83.0, 157.0, 403.0, 1145.0, 4900.0, 36008.0, 757701.0, 230296.0, 13914.0, 2484.0, 666.0, 295.0, 136.0, 81.0, 43.0, 32.0, 20.0, 7.0, 4.0, 5.0, 3.0, 6.0, 5.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12646484375, -0.12114906311035156, -0.11583328247070312, -0.11051750183105469, -0.10520172119140625, -0.09988594055175781, -0.09457015991210938, -0.08925437927246094, -0.0839385986328125, -0.07862281799316406, -0.07330703735351562, -0.06799125671386719, -0.06267547607421875, -0.05735969543457031, -0.052043914794921875, -0.04672813415527344, -0.041412353515625, -0.03609657287597656, -0.030780792236328125, -0.025465011596679688, -0.02014923095703125, -0.014833450317382812, -0.009517669677734375, -0.0042018890380859375, 0.0011138916015625, 0.0064296722412109375, 0.011745452880859375, 0.017061233520507812, 0.02237701416015625, 0.027692794799804688, 0.033008575439453125, 0.03832435607910156, 0.04364013671875, 0.04895591735839844, 0.054271697998046875, 0.05958747863769531, 0.06490325927734375, 0.07021903991699219, 0.07553482055664062, 0.08085060119628906, 0.0861663818359375, 0.09148216247558594, 0.09679794311523438, 0.10211372375488281, 0.10742950439453125, 0.11274528503417969, 0.11806106567382812, 0.12337684631347656, 0.128692626953125, 0.13400840759277344, 0.13932418823242188, 0.1446399688720703, 0.14995574951171875, 0.1552715301513672, 0.16058731079101562, 0.16590309143066406, 0.1712188720703125, 0.17653465270996094, 0.18185043334960938, 0.1871662139892578, 0.19248199462890625, 0.1977977752685547, 0.20311355590820312, 0.20842933654785156, 0.2137451171875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 5.0, 9.0, 4.0, 14.0, 16.0, 13.0, 22.0, 26.0, 32.0, 45.0, 48.0, 66.0, 85.0, 99.0, 89.0, 86.0, 74.0, 65.0, 37.0, 37.0, 31.0, 27.0, 20.0, 16.0, 8.0, 5.0, 4.0, 6.0, 4.0, 3.0, 3.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.561113357543945e-05, -5.383603274822235e-05, -5.206093192100525e-05, -5.028583109378815e-05, -4.8510730266571045e-05, -4.673562943935394e-05, -4.496052861213684e-05, -4.318542778491974e-05, -4.141032695770264e-05, -3.9635226130485535e-05, -3.786012530326843e-05, -3.608502447605133e-05, -3.430992364883423e-05, -3.2534822821617126e-05, -3.0759721994400024e-05, -2.8984621167182922e-05, -2.720952033996582e-05, -2.5434419512748718e-05, -2.3659318685531616e-05, -2.1884217858314514e-05, -2.0109117031097412e-05, -1.833401620388031e-05, -1.6558915376663208e-05, -1.4783814549446106e-05, -1.3008713722229004e-05, -1.1233612895011902e-05, -9.4585120677948e-06, -7.683411240577698e-06, -5.908310413360596e-06, -4.133209586143494e-06, -2.3581087589263916e-06, -5.830079317092896e-07, 1.1920928955078125e-06, 2.9671937227249146e-06, 4.742294549942017e-06, 6.517395377159119e-06, 8.29249620437622e-06, 1.0067597031593323e-05, 1.1842697858810425e-05, 1.3617798686027527e-05, 1.539289951324463e-05, 1.716800034046173e-05, 1.8943101167678833e-05, 2.0718201994895935e-05, 2.2493302822113037e-05, 2.426840364933014e-05, 2.604350447654724e-05, 2.7818605303764343e-05, 2.9593706130981445e-05, 3.136880695819855e-05, 3.314390778541565e-05, 3.491900861263275e-05, 3.6694109439849854e-05, 3.8469210267066956e-05, 4.024431109428406e-05, 4.201941192150116e-05, 4.379451274871826e-05, 4.5569613575935364e-05, 4.7344714403152466e-05, 4.911981523036957e-05, 5.089491605758667e-05, 5.267001688480377e-05, 5.4445117712020874e-05, 5.6220218539237976e-05, 5.799531936645508e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 0.0, 3.0, 5.0, 4.0, 9.0, 17.0, 20.0, 40.0, 58.0, 85.0, 213.0, 371.0, 868.0, 2138.0, 6459.0, 27412.0, 198763.0, 658308.0, 125903.0, 19544.0, 5062.0, 1780.0, 744.0, 354.0, 161.0, 97.0, 49.0, 34.0, 18.0, 17.0, 5.0, 9.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1051025390625, -0.10221481323242188, -0.09932708740234375, -0.09643936157226562, -0.0935516357421875, -0.09066390991210938, -0.08777618408203125, -0.08488845825195312, -0.082000732421875, -0.07911300659179688, -0.07622528076171875, -0.07333755493164062, -0.0704498291015625, -0.06756210327148438, -0.06467437744140625, -0.061786651611328125, -0.05889892578125, -0.056011199951171875, -0.05312347412109375, -0.050235748291015625, -0.0473480224609375, -0.044460296630859375, -0.04157257080078125, -0.038684844970703125, -0.035797119140625, -0.032909393310546875, -0.03002166748046875, -0.027133941650390625, -0.0242462158203125, -0.021358489990234375, -0.01847076416015625, -0.015583038330078125, -0.0126953125, -0.009807586669921875, -0.00691986083984375, -0.004032135009765625, -0.0011444091796875, 0.001743316650390625, 0.00463104248046875, 0.007518768310546875, 0.010406494140625, 0.013294219970703125, 0.01618194580078125, 0.019069671630859375, 0.0219573974609375, 0.024845123291015625, 0.02773284912109375, 0.030620574951171875, 0.03350830078125, 0.036396026611328125, 0.03928375244140625, 0.042171478271484375, 0.0450592041015625, 0.047946929931640625, 0.05083465576171875, 0.053722381591796875, 0.056610107421875, 0.059497833251953125, 0.06238555908203125, 0.06527328491210938, 0.0681610107421875, 0.07104873657226562, 0.07393646240234375, 0.07682418823242188, 0.0797119140625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 9.0, 7.0, 11.0, 16.0, 27.0, 35.0, 50.0, 76.0, 117.0, 120.0, 163.0, 124.0, 78.0, 51.0, 38.0, 26.0, 21.0, 11.0, 13.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.09039306640625, -0.08788681030273438, -0.08538055419921875, -0.08287429809570312, -0.0803680419921875, -0.07786178588867188, -0.07535552978515625, -0.07284927368164062, -0.070343017578125, -0.06783676147460938, -0.06533050537109375, -0.06282424926757812, -0.0603179931640625, -0.057811737060546875, -0.05530548095703125, -0.052799224853515625, -0.05029296875, -0.047786712646484375, -0.04528045654296875, -0.042774200439453125, -0.0402679443359375, -0.037761688232421875, -0.03525543212890625, -0.032749176025390625, -0.030242919921875, -0.027736663818359375, -0.02523040771484375, -0.022724151611328125, -0.0202178955078125, -0.017711639404296875, -0.01520538330078125, -0.012699127197265625, -0.01019287109375, -0.007686614990234375, -0.00518035888671875, -0.002674102783203125, -0.0001678466796875, 0.002338409423828125, 0.00484466552734375, 0.007350921630859375, 0.009857177734375, 0.012363433837890625, 0.01486968994140625, 0.017375946044921875, 0.0198822021484375, 0.022388458251953125, 0.02489471435546875, 0.027400970458984375, 0.0299072265625, 0.032413482666015625, 0.03491973876953125, 0.037425994873046875, 0.0399322509765625, 0.042438507080078125, 0.04494476318359375, 0.047451019287109375, 0.049957275390625, 0.052463531494140625, 0.05496978759765625, 0.057476043701171875, 0.0599822998046875, 0.062488555908203125, 0.06499481201171875, 0.06750106811523438, 0.07000732421875]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 6.0, 10.0, 45.0, 344.0, 462.0, 107.0, 23.0, 10.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4232504367828369, -0.3711588382720947, -0.3190672695636749, -0.26697567105293274, -0.21488408744335175, -0.16279250383377075, -0.11070090532302856, -0.058609336614608765, -0.006517738103866577, 0.045573849231004715, 0.09766543656587601, 0.1497570276260376, 0.2018486112356186, 0.2539401948451996, 0.3060317933559418, 0.3581233620643616, 0.41021496057510376, 0.46230655908584595, 0.5143981575965881, 0.5664896965026855, 0.6185812950134277, 0.6706728935241699, 0.7227644920349121, 0.7748560905456543, 0.8269476890563965, 0.8790392875671387, 0.9311308860778809, 0.983222484588623, 1.0353140830993652, 1.0874056816101074, 1.1394972801208496, 1.1915887594223022, 1.2436803579330444, 1.2957719564437866, 1.3478635549545288, 1.399955153465271, 1.4520467519760132, 1.5041382312774658, 1.556229829788208, 1.6083214282989502, 1.6604130268096924, 1.7125046253204346, 1.7645962238311768, 1.816687822341919, 1.8687794208526611, 1.9208710193634033, 1.9729626178741455, 2.0250542163848877, 2.07714581489563, 2.129237413406372, 2.1813290119171143, 2.2334206104278564, 2.2855122089385986, 2.337603807449341, 2.389695405960083, 2.441787004470825, 2.4938783645629883, 2.5459699630737305, 2.5980615615844727, 2.650153160095215, 2.702244758605957, 2.754336357116699, 2.8064279556274414, 2.8585195541381836, 2.910611152648926]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 1.0, 5.0, 1.0, 5.0, 6.0, 9.0, 6.0, 15.0, 11.0, 23.0, 35.0, 44.0, 60.0, 69.0, 97.0, 75.0, 104.0, 85.0, 89.0, 59.0, 55.0, 41.0, 25.0, 22.0, 16.0, 12.0, 8.0, 8.0, 8.0, 4.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7189944386482239, -0.696451723575592, -0.6739090085029602, -0.6513662338256836, -0.6288235187530518, -0.6062808036804199, -0.5837380886077881, -0.5611953735351562, -0.5386526584625244, -0.5161099433898926, -0.49356719851493835, -0.4710244834423065, -0.4484817385673523, -0.42593902349472046, -0.4033963084220886, -0.3808535933494568, -0.3583108186721802, -0.33576810359954834, -0.3132253587245941, -0.2906826436519623, -0.26813989877700806, -0.24559718370437622, -0.22305446863174438, -0.20051173865795135, -0.17796900868415833, -0.1554262787103653, -0.13288354873657227, -0.11034083366394043, -0.0877981036901474, -0.06525537371635437, -0.042712658643722534, -0.020169928669929504, 0.0023728609085083008, 0.024915587157011032, 0.04745831340551376, 0.0700010359287262, 0.09254376590251923, 0.11508649587631226, 0.1376292109489441, 0.16017194092273712, 0.18271467089653015, 0.20525740087032318, 0.2278001308441162, 0.25034284591674805, 0.2728855609893799, 0.2954283058643341, 0.31797102093696594, 0.34051376581192017, 0.363056480884552, 0.38559919595718384, 0.40814194083213806, 0.4306846559047699, 0.4532274007797241, 0.47577011585235596, 0.4983128309249878, 0.5208555459976196, 0.5433982610702515, 0.5659409761428833, 0.5884836912155151, 0.611026406288147, 0.6335691809654236, 0.6561118960380554, 0.6786546111106873, 0.7011973261833191, 0.7237401008605957]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 8.0, 3.0, 13.0, 11.0, 15.0, 25.0, 22.0, 38.0, 37.0, 62.0, 73.0, 101.0, 107.0, 160.0, 235.0, 322.0, 506.0, 829.0, 1438.0, 2797.0, 5954.0, 16258.0, 70799.0, 3752701.0, 287989.0, 32747.0, 10082.0, 4424.0, 2343.0, 1405.0, 887.0, 614.0, 397.0, 293.0, 182.0, 111.0, 101.0, 69.0, 44.0, 29.0, 20.0, 16.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.25048828125, -0.2434844970703125, -0.236480712890625, -0.2294769287109375, -0.22247314453125, -0.2154693603515625, -0.208465576171875, -0.2014617919921875, -0.1944580078125, -0.1874542236328125, -0.180450439453125, -0.1734466552734375, -0.16644287109375, -0.1594390869140625, -0.152435302734375, -0.1454315185546875, -0.138427734375, -0.1314239501953125, -0.124420166015625, -0.1174163818359375, -0.11041259765625, -0.1034088134765625, -0.096405029296875, -0.0894012451171875, -0.0823974609375, -0.0753936767578125, -0.068389892578125, -0.0613861083984375, -0.05438232421875, -0.0473785400390625, -0.040374755859375, -0.0333709716796875, -0.0263671875, -0.0193634033203125, -0.012359619140625, -0.0053558349609375, 0.00164794921875, 0.0086517333984375, 0.015655517578125, 0.0226593017578125, 0.0296630859375, 0.0366668701171875, 0.043670654296875, 0.0506744384765625, 0.05767822265625, 0.0646820068359375, 0.071685791015625, 0.0786895751953125, 0.085693359375, 0.0926971435546875, 0.099700927734375, 0.1067047119140625, 0.11370849609375, 0.1207122802734375, 0.127716064453125, 0.1347198486328125, 0.1417236328125, 0.1487274169921875, 0.155731201171875, 0.1627349853515625, 0.16973876953125, 0.1767425537109375, 0.183746337890625, 0.1907501220703125, 0.19775390625]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 5.0, 5.0, 10.0, 11.0, 18.0, 33.0, 61.0, 101.0, 118.0, 187.0, 170.0, 93.0, 61.0, 29.0, 20.0, 13.0, 7.0, 6.0, 17.0, 4.0, 6.0, 2.0, 2.0, 5.0, 7.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.025299072265625, -0.02457261085510254, -0.023846149444580078, -0.023119688034057617, -0.022393226623535156, -0.021666765213012695, -0.020940303802490234, -0.020213842391967773, -0.019487380981445312, -0.01876091957092285, -0.01803445816040039, -0.01730799674987793, -0.01658153533935547, -0.015855073928833008, -0.015128612518310547, -0.014402151107788086, -0.013675689697265625, -0.012949228286743164, -0.012222766876220703, -0.011496305465698242, -0.010769844055175781, -0.01004338264465332, -0.00931692123413086, -0.008590459823608398, -0.007863998413085938, -0.0071375370025634766, -0.006411075592041016, -0.005684614181518555, -0.004958152770996094, -0.004231691360473633, -0.003505229949951172, -0.002778768539428711, -0.00205230712890625, -0.001325845718383789, -0.0005993843078613281, 0.0001270771026611328, 0.0008535385131835938, 0.0015799999237060547, 0.0023064613342285156, 0.0030329227447509766, 0.0037593841552734375, 0.0044858455657958984, 0.005212306976318359, 0.00593876838684082, 0.006665229797363281, 0.007391691207885742, 0.008118152618408203, 0.008844614028930664, 0.009571075439453125, 0.010297536849975586, 0.011023998260498047, 0.011750459671020508, 0.012476921081542969, 0.01320338249206543, 0.01392984390258789, 0.014656305313110352, 0.015382766723632812, 0.016109228134155273, 0.016835689544677734, 0.017562150955200195, 0.018288612365722656, 0.019015073776245117, 0.019741535186767578, 0.02046799659729004, 0.0211944580078125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 5.0, 7.0, 13.0, 16.0, 26.0, 25.0, 71.0, 117.0, 223.0, 537.0, 1433.0, 5316.0, 26481.0, 338320.0, 3699938.0, 103256.0, 13556.0, 3121.0, 989.0, 368.0, 185.0, 115.0, 56.0, 39.0, 18.0, 9.0, 16.0, 11.0, 3.0, 0.0, 4.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.270263671875, -0.26260948181152344, -0.2549552917480469, -0.2473011016845703, -0.23964691162109375, -0.2319927215576172, -0.22433853149414062, -0.21668434143066406, -0.2090301513671875, -0.20137596130371094, -0.19372177124023438, -0.1860675811767578, -0.17841339111328125, -0.1707592010498047, -0.16310501098632812, -0.15545082092285156, -0.147796630859375, -0.14014244079589844, -0.13248825073242188, -0.12483406066894531, -0.11717987060546875, -0.10952568054199219, -0.10187149047851562, -0.09421730041503906, -0.0865631103515625, -0.07890892028808594, -0.07125473022460938, -0.06360054016113281, -0.05594635009765625, -0.04829216003417969, -0.040637969970703125, -0.03298377990722656, -0.02532958984375, -0.017675399780273438, -0.010021209716796875, -0.0023670196533203125, 0.00528717041015625, 0.012941360473632812, 0.020595550537109375, 0.028249740600585938, 0.0359039306640625, 0.04355812072753906, 0.051212310791015625, 0.05886650085449219, 0.06652069091796875, 0.07417488098144531, 0.08182907104492188, 0.08948326110839844, 0.097137451171875, 0.10479164123535156, 0.11244583129882812, 0.12010002136230469, 0.12775421142578125, 0.1354084014892578, 0.14306259155273438, 0.15071678161621094, 0.1583709716796875, 0.16602516174316406, 0.17367935180664062, 0.1813335418701172, 0.18898773193359375, 0.1966419219970703, 0.20429611206054688, 0.21195030212402344, 0.2196044921875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 4.0, 7.0, 6.0, 1.0, 9.0, 5.0, 23.0, 29.0, 23.0, 41.0, 70.0, 73.0, 136.0, 205.0, 395.0, 1474.0, 721.0, 322.0, 170.0, 113.0, 71.0, 35.0, 34.0, 28.0, 8.0, 14.0, 12.0, 13.0, 9.0, 8.0, 5.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0222320556640625, -0.02136969566345215, -0.020507335662841797, -0.019644975662231445, -0.018782615661621094, -0.017920255661010742, -0.01705789566040039, -0.01619553565979004, -0.015333175659179688, -0.014470815658569336, -0.013608455657958984, -0.012746095657348633, -0.011883735656738281, -0.01102137565612793, -0.010159015655517578, -0.009296655654907227, -0.008434295654296875, -0.0075719356536865234, -0.006709575653076172, -0.00584721565246582, -0.004984855651855469, -0.004122495651245117, -0.0032601356506347656, -0.002397775650024414, -0.0015354156494140625, -0.0006730556488037109, 0.00018930435180664062, 0.0010516643524169922, 0.0019140243530273438, 0.0027763843536376953, 0.003638744354248047, 0.0045011043548583984, 0.00536346435546875, 0.0062258243560791016, 0.007088184356689453, 0.007950544357299805, 0.008812904357910156, 0.009675264358520508, 0.01053762435913086, 0.011399984359741211, 0.012262344360351562, 0.013124704360961914, 0.013987064361572266, 0.014849424362182617, 0.01571178436279297, 0.01657414436340332, 0.017436504364013672, 0.018298864364624023, 0.019161224365234375, 0.020023584365844727, 0.020885944366455078, 0.02174830436706543, 0.02261066436767578, 0.023473024368286133, 0.024335384368896484, 0.025197744369506836, 0.026060104370117188, 0.02692246437072754, 0.02778482437133789, 0.028647184371948242, 0.029509544372558594, 0.030371904373168945, 0.031234264373779297, 0.03209662437438965, 0.032958984375]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 30.0, 72.0, 242.0, 314.0, 204.0, 89.0, 30.0, 10.0, 3.0, 6.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09958233684301376, -0.08903111517429352, -0.07847990095615387, -0.06792868673801422, -0.057377465069293976, -0.04682624712586403, -0.03627502918243408, -0.025723807513713837, -0.015172593295574188, -0.004621375352144241, 0.005929842591285706, 0.016481060534715652, 0.0270322784781456, 0.037583496421575546, 0.04813471436500549, 0.05868593603372574, 0.06923715025186539, 0.07978837192058563, 0.09033958613872528, 0.10089080035686493, 0.11144202202558517, 0.12199324369430542, 0.13254445791244507, 0.14309567213058472, 0.15364688634872437, 0.164198100566864, 0.17474931478500366, 0.1853005439043045, 0.19585175812244415, 0.2064029723405838, 0.21695420145988464, 0.2275054156780243, 0.23805665969848633, 0.24860787391662598, 0.2591590881347656, 0.2697103023529053, 0.2802615165710449, 0.29081276059150696, 0.3013639748096466, 0.31191518902778625, 0.3224664032459259, 0.33301761746406555, 0.3435688316822052, 0.35412004590034485, 0.3646712899208069, 0.37522250413894653, 0.3857737183570862, 0.39632493257522583, 0.4068761467933655, 0.4174273610115051, 0.4279785752296448, 0.4385297894477844, 0.4490810036659241, 0.4596322476863861, 0.47018346190452576, 0.4807346761226654, 0.49128589034080505, 0.5018371343612671, 0.5123883485794067, 0.5229395627975464, 0.533490777015686, 0.5440419912338257, 0.5545932054519653, 0.565144419670105, 0.5756956338882446]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 4.0, 2.0, 0.0, 8.0, 5.0, 6.0, 10.0, 11.0, 14.0, 26.0, 28.0, 33.0, 50.0, 43.0, 52.0, 53.0, 55.0, 64.0, 88.0, 54.0, 64.0, 53.0, 45.0, 50.0, 39.0, 32.0, 27.0, 19.0, 15.0, 10.0, 19.0, 7.0, 8.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.12629568576812744, -0.12237454950809479, -0.11845341324806213, -0.11453226953744888, -0.11061113327741623, -0.10668999701738358, -0.10276885330677032, -0.09884771704673767, -0.09492658078670502, -0.09100544452667236, -0.08708430826663971, -0.08316316455602646, -0.0792420282959938, -0.07532089203596115, -0.0713997483253479, -0.06747861206531525, -0.06355747580528259, -0.05963633954524994, -0.05571519955992699, -0.051794059574604034, -0.04787292331457138, -0.04395178705453873, -0.040030647069215775, -0.03610950708389282, -0.03218837082386017, -0.028267232701182365, -0.024346094578504562, -0.02042495645582676, -0.016503818333148956, -0.012582680210471153, -0.00866154208779335, -0.004740403965115547, -0.0008192658424377441, 0.003101872280240059, 0.007023010402917862, 0.010944148525595665, 0.014865286648273468, 0.01878642477095127, 0.022707562893629074, 0.026628701016306877, 0.03054983913898468, 0.034470975399017334, 0.038392115384340286, 0.04231325536966324, 0.04623439162969589, 0.050155527889728546, 0.0540766678750515, 0.05799780786037445, 0.061918944120407104, 0.06584008038043976, 0.06976121664047241, 0.07368236035108566, 0.07760349661111832, 0.08152463287115097, 0.08544577658176422, 0.08936691284179688, 0.09328804910182953, 0.09720918536186218, 0.10113032162189484, 0.10505146533250809, 0.10897260159254074, 0.1128937378525734, 0.11681488156318665, 0.1207360178232193, 0.12465715408325195]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 3.0, 5.0, 8.0, 10.0, 16.0, 17.0, 39.0, 50.0, 78.0, 85.0, 159.0, 249.0, 388.0, 704.0, 1138.0, 2099.0, 4163.0, 9525.0, 27606.0, 127409.0, 635826.0, 182371.0, 34853.0, 11550.0, 4773.0, 2284.0, 1227.0, 722.0, 423.0, 267.0, 169.0, 107.0, 74.0, 48.0, 34.0, 25.0, 14.0, 8.0, 12.0, 8.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1458740234375, -0.14125633239746094, -0.13663864135742188, -0.1320209503173828, -0.12740325927734375, -0.12278556823730469, -0.11816787719726562, -0.11355018615722656, -0.1089324951171875, -0.10431480407714844, -0.09969711303710938, -0.09507942199707031, -0.09046173095703125, -0.08584403991699219, -0.08122634887695312, -0.07660865783691406, -0.071990966796875, -0.06737327575683594, -0.06275558471679688, -0.05813789367675781, -0.05352020263671875, -0.04890251159667969, -0.044284820556640625, -0.03966712951660156, -0.0350494384765625, -0.030431747436523438, -0.025814056396484375, -0.021196365356445312, -0.01657867431640625, -0.011960983276367188, -0.007343292236328125, -0.0027256011962890625, 0.00189208984375, 0.0065097808837890625, 0.011127471923828125, 0.015745162963867188, 0.02036285400390625, 0.024980545043945312, 0.029598236083984375, 0.03421592712402344, 0.0388336181640625, 0.04345130920410156, 0.048069000244140625, 0.05268669128417969, 0.05730438232421875, 0.06192207336425781, 0.06653976440429688, 0.07115745544433594, 0.075775146484375, 0.08039283752441406, 0.08501052856445312, 0.08962821960449219, 0.09424591064453125, 0.09886360168457031, 0.10348129272460938, 0.10809898376464844, 0.1127166748046875, 0.11733436584472656, 0.12195205688476562, 0.1265697479248047, 0.13118743896484375, 0.1358051300048828, 0.14042282104492188, 0.14504051208496094, 0.149658203125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 4.0, 1.0, 0.0, 5.0, 3.0, 7.0, 17.0, 25.0, 34.0, 51.0, 102.0, 126.0, 188.0, 131.0, 103.0, 75.0, 35.0, 27.0, 10.0, 13.0, 11.0, 11.0, 9.0, 6.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0243988037109375, -0.023699283599853516, -0.02299976348876953, -0.022300243377685547, -0.021600723266601562, -0.020901203155517578, -0.020201683044433594, -0.01950216293334961, -0.018802642822265625, -0.01810312271118164, -0.017403602600097656, -0.016704082489013672, -0.016004562377929688, -0.015305042266845703, -0.014605522155761719, -0.013906002044677734, -0.01320648193359375, -0.012506961822509766, -0.011807441711425781, -0.011107921600341797, -0.010408401489257812, -0.009708881378173828, -0.009009361267089844, -0.00830984115600586, -0.007610321044921875, -0.006910800933837891, -0.006211280822753906, -0.005511760711669922, -0.0048122406005859375, -0.004112720489501953, -0.0034132003784179688, -0.0027136802673339844, -0.00201416015625, -0.0013146400451660156, -0.0006151199340820312, 8.440017700195312e-05, 0.0007839202880859375, 0.0014834403991699219, 0.0021829605102539062, 0.0028824806213378906, 0.003582000732421875, 0.004281520843505859, 0.004981040954589844, 0.005680561065673828, 0.0063800811767578125, 0.007079601287841797, 0.007779121398925781, 0.008478641510009766, 0.00917816162109375, 0.009877681732177734, 0.010577201843261719, 0.011276721954345703, 0.011976242065429688, 0.012675762176513672, 0.013375282287597656, 0.01407480239868164, 0.014774322509765625, 0.01547384262084961, 0.016173362731933594, 0.016872882843017578, 0.017572402954101562, 0.018271923065185547, 0.01897144317626953, 0.019670963287353516, 0.0203704833984375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 1.0, 1.0, 1.0, 5.0, 5.0, 5.0, 5.0, 5.0, 8.0, 21.0, 29.0, 23.0, 39.0, 57.0, 98.0, 121.0, 179.0, 260.0, 405.0, 647.0, 1173.0, 2587.0, 7146.0, 24591.0, 109258.0, 455568.0, 345090.0, 73038.0, 17991.0, 5412.0, 2035.0, 1041.0, 546.0, 340.0, 243.0, 160.0, 112.0, 75.0, 71.0, 45.0, 30.0, 25.0, 21.0, 7.0, 10.0, 6.0, 5.0, 3.0, 6.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.1275634765625, -0.12368202209472656, -0.11980056762695312, -0.11591911315917969, -0.11203765869140625, -0.10815620422363281, -0.10427474975585938, -0.10039329528808594, -0.0965118408203125, -0.09263038635253906, -0.08874893188476562, -0.08486747741699219, -0.08098602294921875, -0.07710456848144531, -0.07322311401367188, -0.06934165954589844, -0.065460205078125, -0.06157875061035156, -0.057697296142578125, -0.05381584167480469, -0.04993438720703125, -0.04605293273925781, -0.042171478271484375, -0.03829002380371094, -0.0344085693359375, -0.030527114868164062, -0.026645660400390625, -0.022764205932617188, -0.01888275146484375, -0.015001296997070312, -0.011119842529296875, -0.0072383880615234375, -0.00335693359375, 0.0005245208740234375, 0.004405975341796875, 0.008287429809570312, 0.01216888427734375, 0.016050338745117188, 0.019931793212890625, 0.023813247680664062, 0.0276947021484375, 0.03157615661621094, 0.035457611083984375, 0.03933906555175781, 0.04322052001953125, 0.04710197448730469, 0.050983428955078125, 0.05486488342285156, 0.058746337890625, 0.06262779235839844, 0.06650924682617188, 0.07039070129394531, 0.07427215576171875, 0.07815361022949219, 0.08203506469726562, 0.08591651916503906, 0.0897979736328125, 0.09367942810058594, 0.09756088256835938, 0.10144233703613281, 0.10532379150390625, 0.10920524597167969, 0.11308670043945312, 0.11696815490722656, 0.120849609375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 0.0, 3.0, 0.0, 3.0, 2.0, 4.0, 3.0, 1.0, 2.0, 3.0, 7.0, 5.0, 6.0, 7.0, 13.0, 13.0, 14.0, 24.0, 26.0, 24.0, 26.0, 34.0, 37.0, 38.0, 36.0, 40.0, 38.0, 38.0, 43.0, 45.0, 45.0, 44.0, 35.0, 34.0, 41.0, 37.0, 28.0, 26.0, 24.0, 21.0, 21.0, 21.0, 16.0, 14.0, 7.0, 11.0, 12.0, 7.0, 9.0, 4.0, 7.0, 4.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.0611572265625, -0.05928516387939453, -0.05741310119628906, -0.055541038513183594, -0.053668975830078125, -0.051796913146972656, -0.04992485046386719, -0.04805278778076172, -0.04618072509765625, -0.04430866241455078, -0.04243659973144531, -0.040564537048339844, -0.038692474365234375, -0.036820411682128906, -0.03494834899902344, -0.03307628631591797, -0.0312042236328125, -0.02933216094970703, -0.027460098266601562, -0.025588035583496094, -0.023715972900390625, -0.021843910217285156, -0.019971847534179688, -0.01809978485107422, -0.01622772216796875, -0.014355659484863281, -0.012483596801757812, -0.010611534118652344, -0.008739471435546875, -0.006867408752441406, -0.0049953460693359375, -0.0031232833862304688, -0.001251220703125, 0.0006208419799804688, 0.0024929046630859375, 0.004364967346191406, 0.006237030029296875, 0.008109092712402344, 0.009981155395507812, 0.011853218078613281, 0.01372528076171875, 0.015597343444824219, 0.017469406127929688, 0.019341468811035156, 0.021213531494140625, 0.023085594177246094, 0.024957656860351562, 0.02682971954345703, 0.0287017822265625, 0.03057384490966797, 0.03244590759277344, 0.034317970275878906, 0.036190032958984375, 0.038062095642089844, 0.03993415832519531, 0.04180622100830078, 0.04367828369140625, 0.04555034637451172, 0.04742240905761719, 0.049294471740722656, 0.051166534423828125, 0.053038597106933594, 0.05491065979003906, 0.05678272247314453, 0.05865478515625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 0.0, 5.0, 4.0, 3.0, 9.0, 11.0, 18.0, 14.0, 26.0, 41.0, 48.0, 81.0, 146.0, 201.0, 317.0, 498.0, 839.0, 1413.0, 2582.0, 4923.0, 10884.0, 28084.0, 90444.0, 325958.0, 397777.0, 122222.0, 35966.0, 13087.0, 5812.0, 2910.0, 1657.0, 958.0, 581.0, 346.0, 233.0, 161.0, 89.0, 56.0, 54.0, 31.0, 20.0, 18.0, 9.0, 7.0, 5.0, 6.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.063232421875, -0.06120014190673828, -0.05916786193847656, -0.057135581970214844, -0.055103302001953125, -0.053071022033691406, -0.05103874206542969, -0.04900646209716797, -0.04697418212890625, -0.04494190216064453, -0.04290962219238281, -0.040877342224121094, -0.038845062255859375, -0.036812782287597656, -0.03478050231933594, -0.03274822235107422, -0.0307159423828125, -0.02868366241455078, -0.026651382446289062, -0.024619102478027344, -0.022586822509765625, -0.020554542541503906, -0.018522262573242188, -0.01648998260498047, -0.01445770263671875, -0.012425422668457031, -0.010393142700195312, -0.008360862731933594, -0.006328582763671875, -0.004296302795410156, -0.0022640228271484375, -0.00023174285888671875, 0.001800537109375, 0.0038328170776367188, 0.0058650970458984375, 0.007897377014160156, 0.009929656982421875, 0.011961936950683594, 0.013994216918945312, 0.01602649688720703, 0.01805877685546875, 0.02009105682373047, 0.022123336791992188, 0.024155616760253906, 0.026187896728515625, 0.028220176696777344, 0.030252456665039062, 0.03228473663330078, 0.0343170166015625, 0.03634929656982422, 0.03838157653808594, 0.040413856506347656, 0.042446136474609375, 0.044478416442871094, 0.04651069641113281, 0.04854297637939453, 0.05057525634765625, 0.05260753631591797, 0.05463981628417969, 0.056672096252441406, 0.058704376220703125, 0.060736656188964844, 0.06276893615722656, 0.06480121612548828, 0.06683349609375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 4.0, 5.0, 12.0, 9.0, 19.0, 14.0, 12.0, 35.0, 39.0, 51.0, 62.0, 52.0, 71.0, 83.0, 86.0, 68.0, 59.0, 63.0, 51.0, 39.0, 34.0, 27.0, 22.0, 13.0, 17.0, 16.0, 7.0, 8.0, 4.0, 6.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.03795051574707e-05, -5.8525241911411285e-05, -5.667097866535187e-05, -5.481671541929245e-05, -5.296245217323303e-05, -5.1108188927173615e-05, -4.92539256811142e-05, -4.739966243505478e-05, -4.554539918899536e-05, -4.3691135942935944e-05, -4.1836872696876526e-05, -3.998260945081711e-05, -3.812834620475769e-05, -3.627408295869827e-05, -3.4419819712638855e-05, -3.256555646657944e-05, -3.071129322052002e-05, -2.8857029974460602e-05, -2.7002766728401184e-05, -2.5148503482341766e-05, -2.329424023628235e-05, -2.143997699022293e-05, -1.9585713744163513e-05, -1.7731450498104095e-05, -1.5877187252044678e-05, -1.402292400598526e-05, -1.2168660759925842e-05, -1.0314397513866425e-05, -8.460134267807007e-06, -6.605871021747589e-06, -4.751607775688171e-06, -2.8973445296287537e-06, -1.043081283569336e-06, 8.111819624900818e-07, 2.6654452085494995e-06, 4.519708454608917e-06, 6.373971700668335e-06, 8.228234946727753e-06, 1.008249819278717e-05, 1.1936761438846588e-05, 1.3791024684906006e-05, 1.5645287930965424e-05, 1.749955117702484e-05, 1.935381442308426e-05, 2.1208077669143677e-05, 2.3062340915203094e-05, 2.4916604161262512e-05, 2.677086740732193e-05, 2.8625130653381348e-05, 3.0479393899440765e-05, 3.233365714550018e-05, 3.41879203915596e-05, 3.604218363761902e-05, 3.7896446883678436e-05, 3.9750710129737854e-05, 4.160497337579727e-05, 4.345923662185669e-05, 4.531349986791611e-05, 4.7167763113975525e-05, 4.902202636003494e-05, 5.087628960609436e-05, 5.273055285215378e-05, 5.4584816098213196e-05, 5.6439079344272614e-05, 5.829334259033203e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 13.0, 5.0, 15.0, 13.0, 25.0, 42.0, 49.0, 78.0, 152.0, 255.0, 488.0, 968.0, 2151.0, 6628.0, 27793.0, 181395.0, 643250.0, 151123.0, 24288.0, 5870.0, 2082.0, 838.0, 434.0, 246.0, 142.0, 74.0, 43.0, 38.0, 19.0, 3.0, 9.0, 10.0, 5.0, 3.0, 2.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.10699462890625, -0.10397720336914062, -0.10095977783203125, -0.09794235229492188, -0.0949249267578125, -0.09190750122070312, -0.08889007568359375, -0.08587265014648438, -0.082855224609375, -0.07983779907226562, -0.07682037353515625, -0.07380294799804688, -0.0707855224609375, -0.06776809692382812, -0.06475067138671875, -0.061733245849609375, -0.0587158203125, -0.055698394775390625, -0.05268096923828125, -0.049663543701171875, -0.0466461181640625, -0.043628692626953125, -0.04061126708984375, -0.037593841552734375, -0.034576416015625, -0.031558990478515625, -0.02854156494140625, -0.025524139404296875, -0.0225067138671875, -0.019489288330078125, -0.01647186279296875, -0.013454437255859375, -0.01043701171875, -0.007419586181640625, -0.00440216064453125, -0.001384735107421875, 0.0016326904296875, 0.004650115966796875, 0.00766754150390625, 0.010684967041015625, 0.013702392578125, 0.016719818115234375, 0.01973724365234375, 0.022754669189453125, 0.0257720947265625, 0.028789520263671875, 0.03180694580078125, 0.034824371337890625, 0.037841796875, 0.040859222412109375, 0.04387664794921875, 0.046894073486328125, 0.0499114990234375, 0.052928924560546875, 0.05594635009765625, 0.058963775634765625, 0.061981201171875, 0.06499862670898438, 0.06801605224609375, 0.07103347778320312, 0.0740509033203125, 0.07706832885742188, 0.08008575439453125, 0.08310317993164062, 0.08612060546875]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 6.0, 5.0, 11.0, 5.0, 8.0, 12.0, 19.0, 21.0, 29.0, 33.0, 34.0, 47.0, 54.0, 66.0, 69.0, 56.0, 83.0, 57.0, 65.0, 57.0, 39.0, 43.0, 41.0, 28.0, 28.0, 26.0, 16.0, 11.0, 6.0, 11.0, 5.0, 3.0, 6.0, 1.0, 2.0, 2.0, 2.0, 3.0], "bins": [-0.046600341796875, -0.045503854751586914, -0.04440736770629883, -0.04331088066101074, -0.042214393615722656, -0.04111790657043457, -0.040021419525146484, -0.0389249324798584, -0.03782844543457031, -0.03673195838928223, -0.03563547134399414, -0.034538984298706055, -0.03344249725341797, -0.03234601020812988, -0.031249523162841797, -0.03015303611755371, -0.029056549072265625, -0.02796006202697754, -0.026863574981689453, -0.025767087936401367, -0.02467060089111328, -0.023574113845825195, -0.02247762680053711, -0.021381139755249023, -0.020284652709960938, -0.01918816566467285, -0.018091678619384766, -0.01699519157409668, -0.015898704528808594, -0.014802217483520508, -0.013705730438232422, -0.012609243392944336, -0.01151275634765625, -0.010416269302368164, -0.009319782257080078, -0.008223295211791992, -0.007126808166503906, -0.00603032112121582, -0.004933834075927734, -0.0038373470306396484, -0.0027408599853515625, -0.0016443729400634766, -0.0005478858947753906, 0.0005486011505126953, 0.0016450881958007812, 0.002741575241088867, 0.003838062286376953, 0.004934549331665039, 0.006031036376953125, 0.007127523422241211, 0.008224010467529297, 0.009320497512817383, 0.010416984558105469, 0.011513471603393555, 0.01260995864868164, 0.013706445693969727, 0.014802932739257812, 0.0158994197845459, 0.016995906829833984, 0.01809239387512207, 0.019188880920410156, 0.020285367965698242, 0.021381855010986328, 0.022478342056274414, 0.0235748291015625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 4.0, 8.0, 44.0, 156.0, 360.0, 304.0, 98.0, 21.0, 9.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.775293231010437, -0.715581476688385, -0.655869722366333, -0.5961580276489258, -0.5364462733268738, -0.4767345190048218, -0.41702279448509216, -0.35731106996536255, -0.29759931564331055, -0.23788757622241974, -0.17817583680152893, -0.11846409738063812, -0.058752357959747314, 0.0009593963623046875, 0.0606711208820343, 0.12038284540176392, 0.18009459972381592, 0.23980633914470673, 0.29951807856559753, 0.35922980308532715, 0.41894155740737915, 0.47865331172943115, 0.5383650064468384, 0.5980767607688904, 0.6577885150909424, 0.7175002694129944, 0.7772120237350464, 0.8369237184524536, 0.8966354727745056, 0.9563472270965576, 1.0160589218139648, 1.075770616531372, 1.1354823112487793, 1.1951940059661865, 1.2549058198928833, 1.3146175146102905, 1.3743293285369873, 1.4340410232543945, 1.4937527179718018, 1.553464412689209, 1.6131762266159058, 1.672887921333313, 1.7325997352600098, 1.792311429977417, 1.8520231246948242, 1.911734938621521, 1.9714466333389282, 2.031158447265625, 2.0908701419830322, 2.1505818367004395, 2.2102935314178467, 2.270005464553833, 2.3297171592712402, 2.3894288539886475, 2.4491405487060547, 2.508852243423462, 2.568563938140869, 2.6282756328582764, 2.6879873275756836, 2.74769926071167, 2.807410955429077, 2.8671226501464844, 2.9268343448638916, 2.986546039581299, 3.046257972717285]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 8.0, 8.0, 8.0, 12.0, 24.0, 15.0, 22.0, 23.0, 23.0, 31.0, 34.0, 39.0, 36.0, 38.0, 40.0, 65.0, 59.0, 65.0, 48.0, 56.0, 62.0, 42.0, 38.0, 34.0, 33.0, 32.0, 17.0, 14.0, 17.0, 12.0, 10.0, 11.0, 6.0, 4.0, 5.0, 2.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5495665073394775, -0.5306557416915894, -0.5117449760437012, -0.4928342401981354, -0.4739234745502472, -0.455012708902359, -0.4361019730567932, -0.41719120740890503, -0.39828044176101685, -0.37936967611312866, -0.3604589104652405, -0.3415481746196747, -0.3226374089717865, -0.3037266433238983, -0.2848159074783325, -0.26590514183044434, -0.24699437618255615, -0.22808361053466797, -0.20917285978794098, -0.190262109041214, -0.1713513433933258, -0.15244057774543762, -0.13352982699871063, -0.11461907625198364, -0.09570831060409546, -0.07679755240678787, -0.057886794209480286, -0.0389760360121727, -0.020065277814865112, -0.0011545196175575256, 0.01775623857975006, 0.03666698932647705, 0.055577754974365234, 0.07448851317167282, 0.09339927136898041, 0.112310029566288, 0.13122078776359558, 0.15013155341148376, 0.16904230415821075, 0.18795305490493774, 0.20686382055282593, 0.2257745862007141, 0.2446853369474411, 0.2635960876941681, 0.2825068533420563, 0.30141761898994446, 0.32032835483551025, 0.33923912048339844, 0.3581498861312866, 0.3770606517791748, 0.395971417427063, 0.4148821532726288, 0.43379291892051697, 0.45270368456840515, 0.47161442041397095, 0.49052518606185913, 0.5094359517097473, 0.5283467173576355, 0.5472574830055237, 0.5661682486534119, 0.5850789546966553, 0.6039897203445435, 0.6229004859924316, 0.6418112516403198, 0.660722017288208]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 4.0, 7.0, 6.0, 9.0, 17.0, 30.0, 41.0, 87.0, 160.0, 330.0, 902.0, 3219.0, 24182.0, 4015332.0, 139540.0, 7654.0, 1659.0, 580.0, 226.0, 117.0, 76.0, 39.0, 21.0, 18.0, 3.0, 9.0, 7.0, 5.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47314453125, -0.4582366943359375, -0.443328857421875, -0.4284210205078125, -0.41351318359375, -0.3986053466796875, -0.383697509765625, -0.3687896728515625, -0.3538818359375, -0.3389739990234375, -0.324066162109375, -0.3091583251953125, -0.29425048828125, -0.2793426513671875, -0.264434814453125, -0.2495269775390625, -0.234619140625, -0.2197113037109375, -0.204803466796875, -0.1898956298828125, -0.17498779296875, -0.1600799560546875, -0.145172119140625, -0.1302642822265625, -0.1153564453125, -0.1004486083984375, -0.085540771484375, -0.0706329345703125, -0.05572509765625, -0.0408172607421875, -0.025909423828125, -0.0110015869140625, 0.00390625, 0.0188140869140625, 0.033721923828125, 0.0486297607421875, 0.06353759765625, 0.0784454345703125, 0.093353271484375, 0.1082611083984375, 0.1231689453125, 0.1380767822265625, 0.152984619140625, 0.1678924560546875, 0.18280029296875, 0.1977081298828125, 0.212615966796875, 0.2275238037109375, 0.242431640625, 0.2573394775390625, 0.272247314453125, 0.2871551513671875, 0.30206298828125, 0.3169708251953125, 0.331878662109375, 0.3467864990234375, 0.3616943359375, 0.3766021728515625, 0.391510009765625, 0.4064178466796875, 0.42132568359375, 0.4362335205078125, 0.451141357421875, 0.4660491943359375, 0.48095703125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 5.0, 7.0, 20.0, 31.0, 29.0, 45.0, 75.0, 127.0, 129.0, 122.0, 120.0, 72.0, 69.0, 38.0, 29.0, 27.0, 14.0, 7.0, 7.0, 9.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02581787109375, -0.024997949600219727, -0.024178028106689453, -0.02335810661315918, -0.022538185119628906, -0.021718263626098633, -0.02089834213256836, -0.020078420639038086, -0.019258499145507812, -0.01843857765197754, -0.017618656158447266, -0.016798734664916992, -0.01597881317138672, -0.015158891677856445, -0.014338970184326172, -0.013519048690795898, -0.012699127197265625, -0.011879205703735352, -0.011059284210205078, -0.010239362716674805, -0.009419441223144531, -0.008599519729614258, -0.007779598236083984, -0.006959676742553711, -0.0061397552490234375, -0.005319833755493164, -0.004499912261962891, -0.003679990768432617, -0.0028600692749023438, -0.0020401477813720703, -0.0012202262878417969, -0.00040030479431152344, 0.00041961669921875, 0.0012395381927490234, 0.002059459686279297, 0.0028793811798095703, 0.0036993026733398438, 0.004519224166870117, 0.005339145660400391, 0.006159067153930664, 0.0069789886474609375, 0.007798910140991211, 0.008618831634521484, 0.009438753128051758, 0.010258674621582031, 0.011078596115112305, 0.011898517608642578, 0.012718439102172852, 0.013538360595703125, 0.014358282089233398, 0.015178203582763672, 0.015998125076293945, 0.01681804656982422, 0.017637968063354492, 0.018457889556884766, 0.01927781105041504, 0.020097732543945312, 0.020917654037475586, 0.02173757553100586, 0.022557497024536133, 0.023377418518066406, 0.02419734001159668, 0.025017261505126953, 0.025837182998657227, 0.0266571044921875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 2.0, 5.0, 7.0, 6.0, 5.0, 8.0, 22.0, 15.0, 32.0, 53.0, 73.0, 114.0, 213.0, 340.0, 582.0, 1201.0, 2616.0, 7066.0, 25439.0, 160390.0, 3504243.0, 429401.0, 44930.0, 10640.0, 3595.0, 1494.0, 745.0, 405.0, 230.0, 129.0, 99.0, 46.0, 47.0, 28.0, 18.0, 12.0, 5.0, 12.0, 7.0, 6.0, 4.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.171875, -0.1662731170654297, -0.16067123413085938, -0.15506935119628906, -0.14946746826171875, -0.14386558532714844, -0.13826370239257812, -0.1326618194580078, -0.1270599365234375, -0.12145805358886719, -0.11585617065429688, -0.11025428771972656, -0.10465240478515625, -0.09905052185058594, -0.09344863891601562, -0.08784675598144531, -0.082244873046875, -0.07664299011230469, -0.07104110717773438, -0.06543922424316406, -0.05983734130859375, -0.05423545837402344, -0.048633575439453125, -0.04303169250488281, -0.0374298095703125, -0.03182792663574219, -0.026226043701171875, -0.020624160766601562, -0.01502227783203125, -0.009420394897460938, -0.003818511962890625, 0.0017833709716796875, 0.00738525390625, 0.012987136840820312, 0.018589019775390625, 0.024190902709960938, 0.02979278564453125, 0.03539466857910156, 0.040996551513671875, 0.04659843444824219, 0.0522003173828125, 0.05780220031738281, 0.06340408325195312, 0.06900596618652344, 0.07460784912109375, 0.08020973205566406, 0.08581161499023438, 0.09141349792480469, 0.097015380859375, 0.10261726379394531, 0.10821914672851562, 0.11382102966308594, 0.11942291259765625, 0.12502479553222656, 0.13062667846679688, 0.1362285614013672, 0.1418304443359375, 0.1474323272705078, 0.15303421020507812, 0.15863609313964844, 0.16423797607421875, 0.16983985900878906, 0.17544174194335938, 0.1810436248779297, 0.1866455078125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 4.0, 5.0, 8.0, 13.0, 10.0, 21.0, 20.0, 29.0, 49.0, 83.0, 141.0, 269.0, 627.0, 1798.0, 429.0, 239.0, 123.0, 55.0, 41.0, 35.0, 13.0, 19.0, 11.0, 9.0, 7.0, 2.0, 3.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.032501220703125, -0.03126859664916992, -0.030035972595214844, -0.028803348541259766, -0.027570724487304688, -0.02633810043334961, -0.02510547637939453, -0.023872852325439453, -0.022640228271484375, -0.021407604217529297, -0.02017498016357422, -0.01894235610961914, -0.017709732055664062, -0.016477108001708984, -0.015244483947753906, -0.014011859893798828, -0.01277923583984375, -0.011546611785888672, -0.010313987731933594, -0.009081363677978516, -0.007848739624023438, -0.006616115570068359, -0.005383491516113281, -0.004150867462158203, -0.002918243408203125, -0.0016856193542480469, -0.00045299530029296875, 0.0007796287536621094, 0.0020122528076171875, 0.0032448768615722656, 0.004477500915527344, 0.005710124969482422, 0.0069427490234375, 0.008175373077392578, 0.009407997131347656, 0.010640621185302734, 0.011873245239257812, 0.01310586929321289, 0.014338493347167969, 0.015571117401123047, 0.016803741455078125, 0.018036365509033203, 0.01926898956298828, 0.02050161361694336, 0.021734237670898438, 0.022966861724853516, 0.024199485778808594, 0.025432109832763672, 0.02666473388671875, 0.027897357940673828, 0.029129981994628906, 0.030362606048583984, 0.03159523010253906, 0.03282785415649414, 0.03406047821044922, 0.0352931022644043, 0.036525726318359375, 0.03775835037231445, 0.03899097442626953, 0.04022359848022461, 0.04145622253417969, 0.042688846588134766, 0.043921470642089844, 0.04515409469604492, 0.04638671875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 2.0, 6.0, 9.0, 14.0, 22.0, 46.0, 70.0, 121.0, 140.0, 146.0, 134.0, 117.0, 73.0, 46.0, 18.0, 12.0, 12.0, 6.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2676220238208771, -0.2612111270427704, -0.2548002600669861, -0.2483893632888794, -0.2419784665107727, -0.2355675846338272, -0.2291567027568817, -0.22274580597877502, -0.21633490920066833, -0.20992402732372284, -0.20351313054561615, -0.19710224866867065, -0.19069135189056396, -0.18428047001361847, -0.17786958813667297, -0.17145869135856628, -0.1650478094816208, -0.1586369276046753, -0.1522260308265686, -0.1458151489496231, -0.13940425217151642, -0.13299337029457092, -0.12658247351646423, -0.12017159163951874, -0.11376070231199265, -0.10734981298446655, -0.10093892365694046, -0.09452803432941437, -0.08811715245246887, -0.08170625567436218, -0.07529537379741669, -0.0688844844698906, -0.062473610043525696, -0.0560627207159996, -0.04965183138847351, -0.04324094578623772, -0.036830056458711624, -0.03041916713118553, -0.024008281528949738, -0.017597392201423645, -0.011186502873897552, -0.004775614477694035, 0.0016352739185094833, 0.008046161383390427, 0.01445705071091652, 0.02086794003844261, 0.027278825640678406, 0.0336897149682045, 0.04010060429573059, 0.04651149362325668, 0.052922382950782776, 0.05933326855301857, 0.06574416160583496, 0.07215504348278046, 0.07856593281030655, 0.08497682213783264, 0.09138771146535873, 0.09779860079288483, 0.10420949012041092, 0.11062037944793701, 0.11703126132488251, 0.1234421581029892, 0.1298530399799347, 0.13626393675804138, 0.14267481863498688]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 1.0, 3.0, 3.0, 4.0, 15.0, 7.0, 11.0, 10.0, 7.0, 15.0, 15.0, 19.0, 14.0, 27.0, 34.0, 36.0, 37.0, 41.0, 41.0, 51.0, 52.0, 44.0, 48.0, 47.0, 44.0, 40.0, 33.0, 44.0, 24.0, 37.0, 38.0, 23.0, 19.0, 13.0, 26.0, 14.0, 20.0, 13.0, 13.0, 10.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.12018674612045288, -0.11640593409538269, -0.1126251146197319, -0.10884430259466171, -0.10506348311901093, -0.10128267109394073, -0.09750185906887054, -0.09372104704380035, -0.08994022756814957, -0.08615941554307938, -0.08237859606742859, -0.0785977840423584, -0.07481697201728821, -0.07103615254163742, -0.06725534051656723, -0.06347452104091644, -0.05969370901584625, -0.055912893265485764, -0.052132077515125275, -0.048351265490055084, -0.044570449739694595, -0.040789633989334106, -0.037008821964263916, -0.03322800621390343, -0.029447190463542938, -0.02566637471318245, -0.02188556082546711, -0.01810474693775177, -0.014323931187391281, -0.010543115437030792, -0.006762301549315453, -0.002981487661600113, 0.000799328088760376, 0.00458014290779829, 0.008360957726836205, 0.012141772545874119, 0.015922587364912033, 0.019703403115272522, 0.02348421700298786, 0.0272650308907032, 0.03104584664106369, 0.03482666239142418, 0.03860747814178467, 0.04238829016685486, 0.04616910591721535, 0.049949921667575836, 0.05373073369264603, 0.057511549443006516, 0.061292365193367004, 0.0650731772184372, 0.06885399669408798, 0.07263480871915817, 0.07641562819480896, 0.08019644021987915, 0.08397725224494934, 0.08775806427001953, 0.09153888374567032, 0.09531969577074051, 0.0991005152463913, 0.10288132727146149, 0.10666213929653168, 0.11044295877218246, 0.11422377079725266, 0.11800459027290344, 0.12178540229797363]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 6.0, 2.0, 2.0, 1.0, 7.0, 4.0, 6.0, 11.0, 14.0, 24.0, 33.0, 38.0, 79.0, 95.0, 199.0, 320.0, 490.0, 926.0, 1610.0, 3394.0, 7932.0, 25434.0, 104829.0, 445859.0, 348406.0, 76432.0, 19620.0, 6541.0, 2841.0, 1419.0, 790.0, 441.0, 256.0, 179.0, 107.0, 81.0, 31.0, 34.0, 15.0, 13.0, 11.0, 9.0, 2.0, 7.0, 3.0, 8.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1279296875, -0.12378883361816406, -0.11964797973632812, -0.11550712585449219, -0.11136627197265625, -0.10722541809082031, -0.10308456420898438, -0.09894371032714844, -0.0948028564453125, -0.09066200256347656, -0.08652114868164062, -0.08238029479980469, -0.07823944091796875, -0.07409858703613281, -0.06995773315429688, -0.06581687927246094, -0.061676025390625, -0.05753517150878906, -0.053394317626953125, -0.04925346374511719, -0.04511260986328125, -0.04097175598144531, -0.036830902099609375, -0.03269004821777344, -0.0285491943359375, -0.024408340454101562, -0.020267486572265625, -0.016126632690429688, -0.01198577880859375, -0.007844924926757812, -0.003704071044921875, 0.0004367828369140625, 0.00457763671875, 0.008718490600585938, 0.012859344482421875, 0.017000198364257812, 0.02114105224609375, 0.025281906127929688, 0.029422760009765625, 0.03356361389160156, 0.0377044677734375, 0.04184532165527344, 0.045986175537109375, 0.05012702941894531, 0.05426788330078125, 0.05840873718261719, 0.06254959106445312, 0.06669044494628906, 0.070831298828125, 0.07497215270996094, 0.07911300659179688, 0.08325386047363281, 0.08739471435546875, 0.09153556823730469, 0.09567642211914062, 0.09981727600097656, 0.1039581298828125, 0.10809898376464844, 0.11223983764648438, 0.11638069152832031, 0.12052154541015625, 0.12466239929199219, 0.12880325317382812, 0.13294410705566406, 0.1370849609375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 8.0, 14.0, 17.0, 23.0, 46.0, 62.0, 102.0, 112.0, 113.0, 102.0, 101.0, 80.0, 62.0, 44.0, 33.0, 25.0, 21.0, 10.0, 8.0, 6.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0260467529296875, -0.02523946762084961, -0.02443218231201172, -0.023624897003173828, -0.022817611694335938, -0.022010326385498047, -0.021203041076660156, -0.020395755767822266, -0.019588470458984375, -0.018781185150146484, -0.017973899841308594, -0.017166614532470703, -0.016359329223632812, -0.015552043914794922, -0.014744758605957031, -0.01393747329711914, -0.01313018798828125, -0.01232290267944336, -0.011515617370605469, -0.010708332061767578, -0.009901046752929688, -0.009093761444091797, -0.008286476135253906, -0.007479190826416016, -0.006671905517578125, -0.005864620208740234, -0.005057334899902344, -0.004250049591064453, -0.0034427642822265625, -0.002635478973388672, -0.0018281936645507812, -0.0010209083557128906, -0.000213623046875, 0.0005936622619628906, 0.0014009475708007812, 0.002208232879638672, 0.0030155181884765625, 0.003822803497314453, 0.004630088806152344, 0.005437374114990234, 0.006244659423828125, 0.007051944732666016, 0.007859230041503906, 0.008666515350341797, 0.009473800659179688, 0.010281085968017578, 0.011088371276855469, 0.01189565658569336, 0.01270294189453125, 0.01351022720336914, 0.014317512512207031, 0.015124797821044922, 0.015932083129882812, 0.016739368438720703, 0.017546653747558594, 0.018353939056396484, 0.019161224365234375, 0.019968509674072266, 0.020775794982910156, 0.021583080291748047, 0.022390365600585938, 0.023197650909423828, 0.02400493621826172, 0.02481222152709961, 0.0256195068359375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 4.0, 6.0, 8.0, 16.0, 23.0, 23.0, 21.0, 51.0, 60.0, 98.0, 124.0, 123.0, 177.0, 229.0, 367.0, 479.0, 816.0, 1438.0, 2919.0, 7003.0, 20810.0, 67895.0, 218052.0, 432687.0, 200212.0, 62715.0, 19135.0, 6450.0, 2742.0, 1302.0, 780.0, 450.0, 388.0, 268.0, 170.0, 138.0, 89.0, 73.0, 53.0, 37.0, 36.0, 28.0, 12.0, 14.0, 8.0, 9.0, 6.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10113525390625, -0.09792137145996094, -0.09470748901367188, -0.09149360656738281, -0.08827972412109375, -0.08506584167480469, -0.08185195922851562, -0.07863807678222656, -0.0754241943359375, -0.07221031188964844, -0.06899642944335938, -0.06578254699707031, -0.06256866455078125, -0.05935478210449219, -0.056140899658203125, -0.05292701721191406, -0.049713134765625, -0.04649925231933594, -0.043285369873046875, -0.04007148742675781, -0.03685760498046875, -0.03364372253417969, -0.030429840087890625, -0.027215957641601562, -0.0240020751953125, -0.020788192749023438, -0.017574310302734375, -0.014360427856445312, -0.01114654541015625, -0.007932662963867188, -0.004718780517578125, -0.0015048980712890625, 0.001708984375, 0.0049228668212890625, 0.008136749267578125, 0.011350631713867188, 0.01456451416015625, 0.017778396606445312, 0.020992279052734375, 0.024206161499023438, 0.0274200439453125, 0.030633926391601562, 0.033847808837890625, 0.03706169128417969, 0.04027557373046875, 0.04348945617675781, 0.046703338623046875, 0.04991722106933594, 0.053131103515625, 0.05634498596191406, 0.059558868408203125, 0.06277275085449219, 0.06598663330078125, 0.06920051574707031, 0.07241439819335938, 0.07562828063964844, 0.0788421630859375, 0.08205604553222656, 0.08526992797851562, 0.08848381042480469, 0.09169769287109375, 0.09491157531738281, 0.09812545776367188, 0.10133934020996094, 0.10455322265625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 6.0, 3.0, 4.0, 2.0, 9.0, 8.0, 14.0, 18.0, 22.0, 25.0, 16.0, 30.0, 25.0, 28.0, 43.0, 37.0, 51.0, 40.0, 41.0, 53.0, 54.0, 50.0, 43.0, 52.0, 48.0, 32.0, 31.0, 43.0, 28.0, 28.0, 20.0, 18.0, 16.0, 16.0, 8.0, 12.0, 5.0, 5.0, 8.0, 7.0, 3.0, 3.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08087158203125, -0.07817745208740234, -0.07548332214355469, -0.07278919219970703, -0.07009506225585938, -0.06740093231201172, -0.06470680236816406, -0.062012672424316406, -0.05931854248046875, -0.056624412536621094, -0.05393028259277344, -0.05123615264892578, -0.048542022705078125, -0.04584789276123047, -0.04315376281738281, -0.040459632873535156, -0.0377655029296875, -0.035071372985839844, -0.03237724304199219, -0.02968311309814453, -0.026988983154296875, -0.02429485321044922, -0.021600723266601562, -0.018906593322753906, -0.01621246337890625, -0.013518333435058594, -0.010824203491210938, -0.008130073547363281, -0.005435943603515625, -0.0027418136596679688, -4.76837158203125e-05, 0.0026464462280273438, 0.005340576171875, 0.008034706115722656, 0.010728836059570312, 0.013422966003417969, 0.016117095947265625, 0.01881122589111328, 0.021505355834960938, 0.024199485778808594, 0.02689361572265625, 0.029587745666503906, 0.03228187561035156, 0.03497600555419922, 0.037670135498046875, 0.04036426544189453, 0.04305839538574219, 0.045752525329589844, 0.0484466552734375, 0.051140785217285156, 0.05383491516113281, 0.05652904510498047, 0.059223175048828125, 0.06191730499267578, 0.06461143493652344, 0.0673055648803711, 0.06999969482421875, 0.0726938247680664, 0.07538795471191406, 0.07808208465576172, 0.08077621459960938, 0.08347034454345703, 0.08616447448730469, 0.08885860443115234, 0.091552734375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 5.0, 6.0, 15.0, 12.0, 12.0, 23.0, 64.0, 43.0, 80.0, 120.0, 207.0, 312.0, 538.0, 877.0, 1467.0, 2516.0, 4450.0, 8202.0, 16136.0, 33305.0, 76734.0, 211720.0, 385615.0, 178420.0, 66548.0, 29460.0, 14317.0, 7544.0, 4135.0, 2280.0, 1275.0, 788.0, 454.0, 314.0, 179.0, 126.0, 76.0, 53.0, 53.0, 16.0, 10.0, 15.0, 10.0, 9.0, 3.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.049163818359375, -0.04743385314941406, -0.045703887939453125, -0.04397392272949219, -0.04224395751953125, -0.04051399230957031, -0.038784027099609375, -0.03705406188964844, -0.0353240966796875, -0.03359413146972656, -0.031864166259765625, -0.030134201049804688, -0.02840423583984375, -0.026674270629882812, -0.024944305419921875, -0.023214340209960938, -0.021484375, -0.019754409790039062, -0.018024444580078125, -0.016294479370117188, -0.01456451416015625, -0.012834548950195312, -0.011104583740234375, -0.009374618530273438, -0.0076446533203125, -0.0059146881103515625, -0.004184722900390625, -0.0024547576904296875, -0.00072479248046875, 0.0010051727294921875, 0.002735137939453125, 0.0044651031494140625, 0.006195068359375, 0.007925033569335938, 0.009654998779296875, 0.011384963989257812, 0.01311492919921875, 0.014844894409179688, 0.016574859619140625, 0.018304824829101562, 0.0200347900390625, 0.021764755249023438, 0.023494720458984375, 0.025224685668945312, 0.02695465087890625, 0.028684616088867188, 0.030414581298828125, 0.03214454650878906, 0.03387451171875, 0.03560447692871094, 0.037334442138671875, 0.03906440734863281, 0.04079437255859375, 0.04252433776855469, 0.044254302978515625, 0.04598426818847656, 0.0477142333984375, 0.04944419860839844, 0.051174163818359375, 0.05290412902832031, 0.05463409423828125, 0.05636405944824219, 0.058094024658203125, 0.05982398986816406, 0.061553955078125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 12.0, 15.0, 17.0, 26.0, 33.0, 37.0, 45.0, 44.0, 73.0, 92.0, 111.0, 72.0, 77.0, 76.0, 61.0, 33.0, 46.0, 29.0, 23.0, 12.0, 13.0, 15.0, 8.0, 7.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.118680953979492e-05, -3.96091490983963e-05, -3.803148865699768e-05, -3.645382821559906e-05, -3.487616777420044e-05, -3.329850733280182e-05, -3.17208468914032e-05, -3.0143186450004578e-05, -2.8565526008605957e-05, -2.6987865567207336e-05, -2.5410205125808716e-05, -2.3832544684410095e-05, -2.2254884243011475e-05, -2.0677223801612854e-05, -1.9099563360214233e-05, -1.7521902918815613e-05, -1.5944242477416992e-05, -1.4366582036018372e-05, -1.2788921594619751e-05, -1.121126115322113e-05, -9.63360071182251e-06, -8.05594027042389e-06, -6.4782798290252686e-06, -4.900619387626648e-06, -3.3229589462280273e-06, -1.7452985048294067e-06, -1.6763806343078613e-07, 1.4100223779678345e-06, 2.987682819366455e-06, 4.565343260765076e-06, 6.143003702163696e-06, 7.720664143562317e-06, 9.298324584960938e-06, 1.0875985026359558e-05, 1.2453645467758179e-05, 1.40313059091568e-05, 1.560896635055542e-05, 1.718662679195404e-05, 1.876428723335266e-05, 2.0341947674751282e-05, 2.1919608116149902e-05, 2.3497268557548523e-05, 2.5074928998947144e-05, 2.6652589440345764e-05, 2.8230249881744385e-05, 2.9807910323143005e-05, 3.1385570764541626e-05, 3.2963231205940247e-05, 3.454089164733887e-05, 3.611855208873749e-05, 3.769621253013611e-05, 3.927387297153473e-05, 4.085153341293335e-05, 4.242919385433197e-05, 4.400685429573059e-05, 4.558451473712921e-05, 4.716217517852783e-05, 4.873983561992645e-05, 5.031749606132507e-05, 5.1895156502723694e-05, 5.3472816944122314e-05, 5.5050477385520935e-05, 5.6628137826919556e-05, 5.8205798268318176e-05, 5.97834587097168e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 1.0, 5.0, 7.0, 11.0, 9.0, 15.0, 25.0, 30.0, 38.0, 70.0, 114.0, 148.0, 245.0, 428.0, 840.0, 1932.0, 5304.0, 20321.0, 105762.0, 669688.0, 198657.0, 32078.0, 7812.0, 2570.0, 1090.0, 523.0, 280.0, 162.0, 120.0, 69.0, 63.0, 32.0, 30.0, 20.0, 12.0, 10.0, 10.0, 9.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0], "bins": [-0.137939453125, -0.13417625427246094, -0.13041305541992188, -0.1266498565673828, -0.12288665771484375, -0.11912345886230469, -0.11536026000976562, -0.11159706115722656, -0.1078338623046875, -0.10407066345214844, -0.10030746459960938, -0.09654426574707031, -0.09278106689453125, -0.08901786804199219, -0.08525466918945312, -0.08149147033691406, -0.077728271484375, -0.07396507263183594, -0.07020187377929688, -0.06643867492675781, -0.06267547607421875, -0.05891227722167969, -0.055149078369140625, -0.05138587951660156, -0.0476226806640625, -0.04385948181152344, -0.040096282958984375, -0.03633308410644531, -0.03256988525390625, -0.028806686401367188, -0.025043487548828125, -0.021280288696289062, -0.01751708984375, -0.013753890991210938, -0.009990692138671875, -0.0062274932861328125, -0.00246429443359375, 0.0012989044189453125, 0.005062103271484375, 0.008825302124023438, 0.0125885009765625, 0.016351699829101562, 0.020114898681640625, 0.023878097534179688, 0.02764129638671875, 0.03140449523925781, 0.035167694091796875, 0.03893089294433594, 0.042694091796875, 0.04645729064941406, 0.050220489501953125, 0.05398368835449219, 0.05774688720703125, 0.06151008605957031, 0.06527328491210938, 0.06903648376464844, 0.0727996826171875, 0.07656288146972656, 0.08032608032226562, 0.08408927917480469, 0.08785247802734375, 0.09161567687988281, 0.09537887573242188, 0.09914207458496094, 0.1029052734375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 8.0, 2.0, 11.0, 7.0, 8.0, 14.0, 12.0, 11.0, 23.0, 24.0, 23.0, 29.0, 42.0, 54.0, 66.0, 73.0, 78.0, 78.0, 84.0, 57.0, 63.0, 54.0, 24.0, 31.0, 20.0, 18.0, 23.0, 10.0, 13.0, 10.0, 5.0, 3.0, 8.0, 5.0, 4.0, 4.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.051788330078125, -0.050187110900878906, -0.04858589172363281, -0.04698467254638672, -0.045383453369140625, -0.04378223419189453, -0.04218101501464844, -0.040579795837402344, -0.03897857666015625, -0.037377357482910156, -0.03577613830566406, -0.03417491912841797, -0.032573699951171875, -0.03097248077392578, -0.029371261596679688, -0.027770042419433594, -0.0261688232421875, -0.024567604064941406, -0.022966384887695312, -0.02136516571044922, -0.019763946533203125, -0.01816272735595703, -0.016561508178710938, -0.014960289001464844, -0.01335906982421875, -0.011757850646972656, -0.010156631469726562, -0.008555412292480469, -0.006954193115234375, -0.005352973937988281, -0.0037517547607421875, -0.0021505355834960938, -0.00054931640625, 0.0010519027709960938, 0.0026531219482421875, 0.004254341125488281, 0.005855560302734375, 0.007456779479980469, 0.009057998657226562, 0.010659217834472656, 0.01226043701171875, 0.013861656188964844, 0.015462875366210938, 0.01706409454345703, 0.018665313720703125, 0.02026653289794922, 0.021867752075195312, 0.023468971252441406, 0.0250701904296875, 0.026671409606933594, 0.028272628784179688, 0.02987384796142578, 0.031475067138671875, 0.03307628631591797, 0.03467750549316406, 0.036278724670410156, 0.03787994384765625, 0.039481163024902344, 0.04108238220214844, 0.04268360137939453, 0.044284820556640625, 0.04588603973388672, 0.04748725891113281, 0.049088478088378906, 0.050689697265625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 5.0, 9.0, 22.0, 52.0, 123.0, 203.0, 250.0, 168.0, 98.0, 40.0, 18.0, 9.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1698739528656006, -1.1302838325500488, -1.090693712234497, -1.0511035919189453, -1.0115134716033936, -0.971923291683197, -0.9323331117630005, -0.8927429914474487, -0.853152871131897, -0.8135627508163452, -0.7739726305007935, -0.7343824505805969, -0.6947923302650452, -0.6552022099494934, -0.6156120300292969, -0.5760219097137451, -0.5364317893981934, -0.4968416690826416, -0.45725151896476746, -0.4176613688468933, -0.37807124853134155, -0.3384811282157898, -0.29889097809791565, -0.2593008279800415, -0.21971070766448975, -0.1801205724477768, -0.14053043723106384, -0.10094030201435089, -0.06135016679763794, -0.021760031580924988, 0.017830103635787964, 0.05742025375366211, 0.09701037406921387, 0.13660050928592682, 0.17619064450263977, 0.21578077971935272, 0.2553709149360657, 0.29496103525161743, 0.3345511853694916, 0.3741413354873657, 0.4137314558029175, 0.45332157611846924, 0.4929117262363434, 0.5325018763542175, 0.5720919966697693, 0.611682116985321, 0.6512722969055176, 0.6908624172210693, 0.7304525375366211, 0.7700426578521729, 0.8096327781677246, 0.8492229580879211, 0.8888130784034729, 0.9284031987190247, 0.9679933786392212, 1.007583498954773, 1.0471736192703247, 1.0867637395858765, 1.1263538599014282, 1.16594398021698, 1.2055342197418213, 1.245124340057373, 1.2847144603729248, 1.3243045806884766, 1.3638947010040283]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 2.0, 4.0, 3.0, 2.0, 2.0, 7.0, 7.0, 8.0, 8.0, 12.0, 21.0, 14.0, 15.0, 13.0, 15.0, 12.0, 21.0, 23.0, 28.0, 22.0, 36.0, 28.0, 30.0, 43.0, 44.0, 40.0, 33.0, 33.0, 40.0, 41.0, 46.0, 34.0, 50.0, 26.0, 27.0, 31.0, 33.0, 23.0, 19.0, 21.0, 16.0, 14.0, 10.0, 10.0, 10.0, 9.0, 8.0, 5.0, 6.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 4.0], "bins": [-0.49877625703811646, -0.48435696959495544, -0.46993765234947205, -0.45551836490631104, -0.44109907746315, -0.426679790019989, -0.4122604727745056, -0.3978411853313446, -0.3834218978881836, -0.3690026104450226, -0.3545832931995392, -0.3401640057563782, -0.32574471831321716, -0.31132543087005615, -0.29690611362457275, -0.28248682618141174, -0.26806750893592834, -0.25364822149276733, -0.23922891914844513, -0.22480961680412292, -0.21039032936096191, -0.1959710270166397, -0.1815517246723175, -0.1671324372291565, -0.1527131348848343, -0.13829383254051208, -0.12387454509735107, -0.10945524275302887, -0.09503594785928726, -0.08061665296554565, -0.06619735062122345, -0.05177805572748184, -0.037358760833740234, -0.022939464077353477, -0.00852016732096672, 0.0058991312980651855, 0.020318426191806793, 0.0347377210855484, 0.049157023429870605, 0.06357631832361221, 0.07799561321735382, 0.09241490811109543, 0.10683420300483704, 0.12125350534915924, 0.13567280769348145, 0.15009209513664246, 0.16451139748096466, 0.17893069982528687, 0.19334998726844788, 0.20776928961277008, 0.2221885770559311, 0.2366078794002533, 0.2510271668434143, 0.2654464840888977, 0.2798657715320587, 0.2942850589752197, 0.3087043762207031, 0.32312366366386414, 0.33754298090934753, 0.35196226835250854, 0.36638155579566956, 0.38080084323883057, 0.39522016048431396, 0.409639447927475, 0.424058735370636]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 4.0, 4.0, 9.0, 12.0, 13.0, 11.0, 21.0, 38.0, 43.0, 101.0, 127.0, 197.0, 431.0, 750.0, 1434.0, 3176.0, 8837.0, 35862.0, 374283.0, 3648371.0, 93867.0, 17015.0, 5278.0, 2095.0, 979.0, 532.0, 299.0, 157.0, 109.0, 72.0, 56.0, 20.0, 19.0, 12.0, 13.0, 7.0, 6.0, 6.0, 5.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16650390625, -0.1608104705810547, -0.15511703491210938, -0.14942359924316406, -0.14373016357421875, -0.13803672790527344, -0.13234329223632812, -0.1266498565673828, -0.1209564208984375, -0.11526298522949219, -0.10956954956054688, -0.10387611389160156, -0.09818267822265625, -0.09248924255371094, -0.08679580688476562, -0.08110237121582031, -0.075408935546875, -0.06971549987792969, -0.06402206420898438, -0.05832862854003906, -0.05263519287109375, -0.04694175720214844, -0.041248321533203125, -0.03555488586425781, -0.0298614501953125, -0.024168014526367188, -0.018474578857421875, -0.012781143188476562, -0.00708770751953125, -0.0013942718505859375, 0.004299163818359375, 0.009992599487304688, 0.01568603515625, 0.021379470825195312, 0.027072906494140625, 0.03276634216308594, 0.03845977783203125, 0.04415321350097656, 0.049846649169921875, 0.05554008483886719, 0.0612335205078125, 0.06692695617675781, 0.07262039184570312, 0.07831382751464844, 0.08400726318359375, 0.08970069885253906, 0.09539413452148438, 0.10108757019042969, 0.106781005859375, 0.11247444152832031, 0.11816787719726562, 0.12386131286621094, 0.12955474853515625, 0.13524818420410156, 0.14094161987304688, 0.1466350555419922, 0.1523284912109375, 0.1580219268798828, 0.16371536254882812, 0.16940879821777344, 0.17510223388671875, 0.18079566955566406, 0.18648910522460938, 0.1921825408935547, 0.1978759765625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 7.0, 9.0, 12.0, 19.0, 24.0, 31.0, 39.0, 54.0, 74.0, 75.0, 83.0, 98.0, 96.0, 86.0, 62.0, 55.0, 42.0, 36.0, 31.0, 31.0, 11.0, 10.0, 3.0, 3.0, 2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.02899169921875, -0.028154850006103516, -0.02731800079345703, -0.026481151580810547, -0.025644302368164062, -0.024807453155517578, -0.023970603942871094, -0.02313375473022461, -0.022296905517578125, -0.02146005630493164, -0.020623207092285156, -0.019786357879638672, -0.018949508666992188, -0.018112659454345703, -0.01727581024169922, -0.016438961029052734, -0.01560211181640625, -0.014765262603759766, -0.013928413391113281, -0.013091564178466797, -0.012254714965820312, -0.011417865753173828, -0.010581016540527344, -0.00974416732788086, -0.008907318115234375, -0.00807046890258789, -0.007233619689941406, -0.006396770477294922, -0.0055599212646484375, -0.004723072052001953, -0.0038862228393554688, -0.0030493736267089844, -0.0022125244140625, -0.0013756752014160156, -0.0005388259887695312, 0.0002980232238769531, 0.0011348724365234375, 0.001971721649169922, 0.0028085708618164062, 0.0036454200744628906, 0.004482269287109375, 0.005319118499755859, 0.006155967712402344, 0.006992816925048828, 0.007829666137695312, 0.008666515350341797, 0.009503364562988281, 0.010340213775634766, 0.01117706298828125, 0.012013912200927734, 0.012850761413574219, 0.013687610626220703, 0.014524459838867188, 0.015361309051513672, 0.016198158264160156, 0.01703500747680664, 0.017871856689453125, 0.01870870590209961, 0.019545555114746094, 0.020382404327392578, 0.021219253540039062, 0.022056102752685547, 0.02289295196533203, 0.023729801177978516, 0.024566650390625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 4.0, 0.0, 4.0, 7.0, 7.0, 2.0, 9.0, 15.0, 16.0, 19.0, 32.0, 59.0, 50.0, 111.0, 177.0, 302.0, 518.0, 834.0, 1729.0, 3797.0, 12447.0, 72911.0, 2629886.0, 1389578.0, 63571.0, 11353.0, 3541.0, 1476.0, 753.0, 380.0, 249.0, 163.0, 103.0, 61.0, 41.0, 26.0, 13.0, 10.0, 13.0, 4.0, 8.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1793212890625, -0.17353057861328125, -0.1677398681640625, -0.16194915771484375, -0.156158447265625, -0.15036773681640625, -0.1445770263671875, -0.13878631591796875, -0.13299560546875, -0.12720489501953125, -0.1214141845703125, -0.11562347412109375, -0.109832763671875, -0.10404205322265625, -0.0982513427734375, -0.09246063232421875, -0.086669921875, -0.08087921142578125, -0.0750885009765625, -0.06929779052734375, -0.063507080078125, -0.05771636962890625, -0.0519256591796875, -0.04613494873046875, -0.04034423828125, -0.03455352783203125, -0.0287628173828125, -0.02297210693359375, -0.017181396484375, -0.01139068603515625, -0.0055999755859375, 0.00019073486328125, 0.0059814453125, 0.01177215576171875, 0.0175628662109375, 0.02335357666015625, 0.029144287109375, 0.03493499755859375, 0.0407257080078125, 0.04651641845703125, 0.05230712890625, 0.05809783935546875, 0.0638885498046875, 0.06967926025390625, 0.075469970703125, 0.08126068115234375, 0.0870513916015625, 0.09284210205078125, 0.0986328125, 0.10442352294921875, 0.1102142333984375, 0.11600494384765625, 0.121795654296875, 0.12758636474609375, 0.1333770751953125, 0.13916778564453125, 0.14495849609375, 0.15074920654296875, 0.1565399169921875, 0.16233062744140625, 0.168121337890625, 0.17391204833984375, 0.1797027587890625, 0.18549346923828125, 0.1912841796875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 9.0, 14.0, 21.0, 43.0, 74.0, 173.0, 453.0, 2218.0, 625.0, 207.0, 93.0, 57.0, 21.0, 28.0, 10.0, 5.0, 6.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.078125, -0.07615423202514648, -0.07418346405029297, -0.07221269607543945, -0.07024192810058594, -0.06827116012573242, -0.0663003921508789, -0.06432962417602539, -0.062358856201171875, -0.06038808822631836, -0.058417320251464844, -0.05644655227661133, -0.05447578430175781, -0.0525050163269043, -0.05053424835205078, -0.048563480377197266, -0.04659271240234375, -0.044621944427490234, -0.04265117645263672, -0.0406804084777832, -0.03870964050292969, -0.03673887252807617, -0.034768104553222656, -0.03279733657836914, -0.030826568603515625, -0.02885580062866211, -0.026885032653808594, -0.024914264678955078, -0.022943496704101562, -0.020972728729248047, -0.01900196075439453, -0.017031192779541016, -0.0150604248046875, -0.013089656829833984, -0.011118888854980469, -0.009148120880126953, -0.0071773529052734375, -0.005206584930419922, -0.0032358169555664062, -0.0012650489807128906, 0.000705718994140625, 0.0026764869689941406, 0.004647254943847656, 0.006618022918701172, 0.008588790893554688, 0.010559558868408203, 0.012530326843261719, 0.014501094818115234, 0.01647186279296875, 0.018442630767822266, 0.02041339874267578, 0.022384166717529297, 0.024354934692382812, 0.026325702667236328, 0.028296470642089844, 0.03026723861694336, 0.032238006591796875, 0.03420877456665039, 0.036179542541503906, 0.03815031051635742, 0.04012107849121094, 0.04209184646606445, 0.04406261444091797, 0.046033382415771484, 0.048004150390625]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 6.0, 4.0, 4.0, 12.0, 6.0, 16.0, 26.0, 43.0, 59.0, 93.0, 128.0, 134.0, 123.0, 94.0, 88.0, 73.0, 39.0, 29.0, 10.0, 5.0, 6.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1828184276819229, -0.17528069019317627, -0.16774295270442963, -0.16020521521568298, -0.15266746282577515, -0.1451297402381897, -0.13759198784828186, -0.13005425035953522, -0.12251651287078857, -0.11497877538204193, -0.10744103789329529, -0.09990329295396805, -0.0923655554652214, -0.08482781797647476, -0.07729007303714752, -0.06975233554840088, -0.062214598059654236, -0.05467686057090759, -0.04713911935687065, -0.03960137814283371, -0.03206364065408707, -0.024525903165340424, -0.016988161951303482, -0.00945042073726654, -0.0019126832485198975, 0.005625056102871895, 0.013162795454263687, 0.02070053480565548, 0.02823827415704727, 0.035776011645793915, 0.043313752859830856, 0.0508514940738678, 0.058389246463775635, 0.06592698395252228, 0.07346472144126892, 0.08100246638059616, 0.0885402038693428, 0.09607794135808945, 0.10361568629741669, 0.11115342378616333, 0.11869116127490997, 0.12622889876365662, 0.13376663625240326, 0.1413043737411499, 0.14884212613105774, 0.1563798487186432, 0.16391760110855103, 0.17145533859729767, 0.1789930760860443, 0.18653081357479095, 0.1940685510635376, 0.20160628855228424, 0.20914402604103088, 0.21668177843093872, 0.22421951591968536, 0.231757253408432, 0.23929499089717865, 0.2468327283859253, 0.25437048077583313, 0.2619082033634186, 0.2694459557533264, 0.27698367834091187, 0.2845214307308197, 0.29205918312072754, 0.299596905708313]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 2.0, 2.0, 4.0, 7.0, 5.0, 2.0, 5.0, 11.0, 15.0, 17.0, 10.0, 20.0, 24.0, 23.0, 21.0, 23.0, 31.0, 30.0, 33.0, 36.0, 39.0, 29.0, 33.0, 43.0, 38.0, 34.0, 44.0, 34.0, 32.0, 30.0, 27.0, 25.0, 26.0, 19.0, 28.0, 21.0, 29.0, 24.0, 21.0, 26.0, 14.0, 9.0, 13.0, 9.0, 5.0, 11.0, 5.0, 8.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0], "bins": [-0.1259007453918457, -0.12195496261119843, -0.11800917983055115, -0.11406338959932327, -0.110117606818676, -0.10617182403802872, -0.10222603380680084, -0.09828025102615356, -0.09433446824550629, -0.09038868546485901, -0.08644290268421173, -0.08249711245298386, -0.07855132967233658, -0.0746055468916893, -0.07065975666046143, -0.06671397387981415, -0.06276819109916687, -0.05882240831851959, -0.054876621812582016, -0.05093083530664444, -0.04698505252599716, -0.043039269745349884, -0.03909348323941231, -0.03514769673347473, -0.031201913952827454, -0.027256129309535027, -0.0233103446662426, -0.019364560022950172, -0.015418775379657745, -0.011472990736365318, -0.007527206093072891, -0.003581421449780464, 0.0003643631935119629, 0.00431014783680439, 0.008255932480096817, 0.012201717123389244, 0.01614750176668167, 0.020093286409974098, 0.024039071053266525, 0.027984855696558952, 0.03193064033985138, 0.03587642312049866, 0.039822209626436234, 0.04376799613237381, 0.04771377891302109, 0.051659561693668365, 0.05560534819960594, 0.05955113470554352, 0.0634969174861908, 0.06744270026683807, 0.07138848304748535, 0.07533427327871323, 0.0792800560593605, 0.08322583884000778, 0.08717162907123566, 0.09111741185188293, 0.09506319463253021, 0.09900897741317749, 0.10295476019382477, 0.10690055042505264, 0.11084633320569992, 0.1147921159863472, 0.11873790621757507, 0.12268368899822235, 0.12662947177886963]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 4.0, 8.0, 7.0, 9.0, 15.0, 17.0, 26.0, 30.0, 43.0, 80.0, 103.0, 160.0, 201.0, 332.0, 528.0, 903.0, 1438.0, 2802.0, 5378.0, 10782.0, 23174.0, 52400.0, 120483.0, 258893.0, 298215.0, 150503.0, 65724.0, 28819.0, 13349.0, 6346.0, 3173.0, 1782.0, 993.0, 630.0, 360.0, 257.0, 177.0, 117.0, 84.0, 45.0, 44.0, 43.0, 23.0, 17.0, 7.0, 8.0, 5.0, 9.0, 4.0, 4.0, 2.0, 3.0, 2.0], "bins": [-0.079345703125, -0.07708740234375, -0.0748291015625, -0.07257080078125, -0.0703125, -0.06805419921875, -0.0657958984375, -0.06353759765625, -0.061279296875, -0.05902099609375, -0.0567626953125, -0.05450439453125, -0.05224609375, -0.04998779296875, -0.0477294921875, -0.04547119140625, -0.043212890625, -0.04095458984375, -0.0386962890625, -0.03643798828125, -0.0341796875, -0.03192138671875, -0.0296630859375, -0.02740478515625, -0.025146484375, -0.02288818359375, -0.0206298828125, -0.01837158203125, -0.01611328125, -0.01385498046875, -0.0115966796875, -0.00933837890625, -0.007080078125, -0.00482177734375, -0.0025634765625, -0.00030517578125, 0.001953125, 0.00421142578125, 0.0064697265625, 0.00872802734375, 0.010986328125, 0.01324462890625, 0.0155029296875, 0.01776123046875, 0.02001953125, 0.02227783203125, 0.0245361328125, 0.02679443359375, 0.029052734375, 0.03131103515625, 0.0335693359375, 0.03582763671875, 0.0380859375, 0.04034423828125, 0.0426025390625, 0.04486083984375, 0.047119140625, 0.04937744140625, 0.0516357421875, 0.05389404296875, 0.05615234375, 0.05841064453125, 0.0606689453125, 0.06292724609375, 0.065185546875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 10.0, 13.0, 12.0, 22.0, 26.0, 42.0, 47.0, 50.0, 82.0, 69.0, 91.0, 83.0, 81.0, 63.0, 68.0, 56.0, 45.0, 35.0, 39.0, 18.0, 14.0, 11.0, 8.0, 4.0, 5.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0287628173828125, -0.027905941009521484, -0.02704906463623047, -0.026192188262939453, -0.025335311889648438, -0.024478435516357422, -0.023621559143066406, -0.02276468276977539, -0.021907806396484375, -0.02105093002319336, -0.020194053649902344, -0.019337177276611328, -0.018480300903320312, -0.017623424530029297, -0.01676654815673828, -0.015909671783447266, -0.01505279541015625, -0.014195919036865234, -0.013339042663574219, -0.012482166290283203, -0.011625289916992188, -0.010768413543701172, -0.009911537170410156, -0.00905466079711914, -0.008197784423828125, -0.007340908050537109, -0.006484031677246094, -0.005627155303955078, -0.0047702789306640625, -0.003913402557373047, -0.0030565261840820312, -0.0021996498107910156, -0.0013427734375, -0.0004858970642089844, 0.00037097930908203125, 0.0012278556823730469, 0.0020847320556640625, 0.002941608428955078, 0.0037984848022460938, 0.004655361175537109, 0.005512237548828125, 0.006369113922119141, 0.007225990295410156, 0.008082866668701172, 0.008939743041992188, 0.009796619415283203, 0.010653495788574219, 0.011510372161865234, 0.01236724853515625, 0.013224124908447266, 0.014081001281738281, 0.014937877655029297, 0.015794754028320312, 0.016651630401611328, 0.017508506774902344, 0.01836538314819336, 0.019222259521484375, 0.02007913589477539, 0.020936012268066406, 0.021792888641357422, 0.022649765014648438, 0.023506641387939453, 0.02436351776123047, 0.025220394134521484, 0.0260772705078125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 6.0, 1.0, 2.0, 7.0, 5.0, 10.0, 8.0, 16.0, 21.0, 18.0, 41.0, 48.0, 69.0, 81.0, 130.0, 184.0, 223.0, 322.0, 536.0, 810.0, 1290.0, 2461.0, 5613.0, 13960.0, 41784.0, 133899.0, 370809.0, 316134.0, 105077.0, 33268.0, 11459.0, 4637.0, 2169.0, 1178.0, 735.0, 463.0, 312.0, 230.0, 139.0, 118.0, 63.0, 54.0, 38.0, 43.0, 25.0, 24.0, 14.0, 6.0, 9.0, 4.0, 3.0, 5.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.097412109375, -0.0944509506225586, -0.09148979187011719, -0.08852863311767578, -0.08556747436523438, -0.08260631561279297, -0.07964515686035156, -0.07668399810791016, -0.07372283935546875, -0.07076168060302734, -0.06780052185058594, -0.06483936309814453, -0.061878204345703125, -0.05891704559326172, -0.05595588684082031, -0.052994728088378906, -0.0500335693359375, -0.047072410583496094, -0.04411125183105469, -0.04115009307861328, -0.038188934326171875, -0.03522777557373047, -0.03226661682128906, -0.029305458068847656, -0.02634429931640625, -0.023383140563964844, -0.020421981811523438, -0.01746082305908203, -0.014499664306640625, -0.011538505554199219, -0.008577346801757812, -0.005616188049316406, -0.002655029296875, 0.00030612945556640625, 0.0032672882080078125, 0.006228446960449219, 0.009189605712890625, 0.012150764465332031, 0.015111923217773438, 0.018073081970214844, 0.02103424072265625, 0.023995399475097656, 0.026956558227539062, 0.02991771697998047, 0.032878875732421875, 0.03584003448486328, 0.03880119323730469, 0.041762351989746094, 0.0447235107421875, 0.047684669494628906, 0.05064582824707031, 0.05360698699951172, 0.056568145751953125, 0.05952930450439453, 0.06249046325683594, 0.06545162200927734, 0.06841278076171875, 0.07137393951416016, 0.07433509826660156, 0.07729625701904297, 0.08025741577148438, 0.08321857452392578, 0.08617973327636719, 0.0891408920288086, 0.09210205078125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 3.0, 4.0, 8.0, 8.0, 9.0, 15.0, 19.0, 23.0, 30.0, 21.0, 35.0, 30.0, 42.0, 44.0, 45.0, 55.0, 65.0, 58.0, 49.0, 43.0, 61.0, 52.0, 52.0, 30.0, 23.0, 34.0, 22.0, 22.0, 21.0, 18.0, 13.0, 16.0, 9.0, 5.0, 4.0, 3.0, 3.0, 3.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.11798095703125, -0.11449813842773438, -0.11101531982421875, -0.10753250122070312, -0.1040496826171875, -0.10056686401367188, -0.09708404541015625, -0.09360122680664062, -0.090118408203125, -0.08663558959960938, -0.08315277099609375, -0.07966995239257812, -0.0761871337890625, -0.07270431518554688, -0.06922149658203125, -0.06573867797851562, -0.062255859375, -0.058773040771484375, -0.05529022216796875, -0.051807403564453125, -0.0483245849609375, -0.044841766357421875, -0.04135894775390625, -0.037876129150390625, -0.034393310546875, -0.030910491943359375, -0.02742767333984375, -0.023944854736328125, -0.0204620361328125, -0.016979217529296875, -0.01349639892578125, -0.010013580322265625, -0.00653076171875, -0.003047943115234375, 0.00043487548828125, 0.003917694091796875, 0.0074005126953125, 0.010883331298828125, 0.01436614990234375, 0.017848968505859375, 0.021331787109375, 0.024814605712890625, 0.02829742431640625, 0.031780242919921875, 0.0352630615234375, 0.038745880126953125, 0.04222869873046875, 0.045711517333984375, 0.0491943359375, 0.052677154541015625, 0.05615997314453125, 0.059642791748046875, 0.0631256103515625, 0.06660842895507812, 0.07009124755859375, 0.07357406616210938, 0.077056884765625, 0.08053970336914062, 0.08402252197265625, 0.08750534057617188, 0.0909881591796875, 0.09447097778320312, 0.09795379638671875, 0.10143661499023438, 0.10491943359375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 5.0, 1.0, 3.0, 15.0, 11.0, 13.0, 22.0, 42.0, 63.0, 94.0, 125.0, 219.0, 377.0, 704.0, 1184.0, 2353.0, 4775.0, 10342.0, 25200.0, 72515.0, 296114.0, 460401.0, 111637.0, 35675.0, 13895.0, 6163.0, 2990.0, 1569.0, 830.0, 447.0, 266.0, 180.0, 104.0, 70.0, 57.0, 29.0, 21.0, 20.0, 6.0, 11.0, 7.0, 1.0, 0.0, 7.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.056793212890625, -0.0547032356262207, -0.052613258361816406, -0.05052328109741211, -0.04843330383300781, -0.046343326568603516, -0.04425334930419922, -0.04216337203979492, -0.040073394775390625, -0.03798341751098633, -0.03589344024658203, -0.033803462982177734, -0.03171348571777344, -0.02962350845336914, -0.027533531188964844, -0.025443553924560547, -0.02335357666015625, -0.021263599395751953, -0.019173622131347656, -0.01708364486694336, -0.014993667602539062, -0.012903690338134766, -0.010813713073730469, -0.008723735809326172, -0.006633758544921875, -0.004543781280517578, -0.0024538040161132812, -0.0003638267517089844, 0.0017261505126953125, 0.0038161277770996094, 0.005906105041503906, 0.007996082305908203, 0.0100860595703125, 0.012176036834716797, 0.014266014099121094, 0.01635599136352539, 0.018445968627929688, 0.020535945892333984, 0.02262592315673828, 0.024715900421142578, 0.026805877685546875, 0.028895854949951172, 0.03098583221435547, 0.033075809478759766, 0.03516578674316406, 0.03725576400756836, 0.039345741271972656, 0.04143571853637695, 0.04352569580078125, 0.04561567306518555, 0.047705650329589844, 0.04979562759399414, 0.05188560485839844, 0.053975582122802734, 0.05606555938720703, 0.05815553665161133, 0.060245513916015625, 0.06233549118041992, 0.06442546844482422, 0.06651544570922852, 0.06860542297363281, 0.07069540023803711, 0.0727853775024414, 0.0748753547668457, 0.07696533203125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 5.0, 5.0, 6.0, 8.0, 17.0, 22.0, 32.0, 47.0, 72.0, 63.0, 78.0, 97.0, 114.0, 103.0, 78.0, 71.0, 61.0, 39.0, 21.0, 21.0, 18.0, 10.0, 7.0, 5.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2319297790527344e-05, -4.043988883495331e-05, -3.856047987937927e-05, -3.668107092380524e-05, -3.48016619682312e-05, -3.2922253012657166e-05, -3.104284405708313e-05, -2.9163435101509094e-05, -2.728402614593506e-05, -2.5404617190361023e-05, -2.3525208234786987e-05, -2.164579927921295e-05, -1.9766390323638916e-05, -1.788698136806488e-05, -1.6007572412490845e-05, -1.4128163456916809e-05, -1.2248754501342773e-05, -1.0369345545768738e-05, -8.489936590194702e-06, -6.6105276346206665e-06, -4.731118679046631e-06, -2.8517097234725952e-06, -9.723007678985596e-07, 9.071081876754761e-07, 2.7865171432495117e-06, 4.665926098823547e-06, 6.545335054397583e-06, 8.424744009971619e-06, 1.0304152965545654e-05, 1.218356192111969e-05, 1.4062970876693726e-05, 1.594237983226776e-05, 1.7821788787841797e-05, 1.9701197743415833e-05, 2.1580606698989868e-05, 2.3460015654563904e-05, 2.533942461013794e-05, 2.7218833565711975e-05, 2.909824252128601e-05, 3.0977651476860046e-05, 3.285706043243408e-05, 3.473646938800812e-05, 3.661587834358215e-05, 3.849528729915619e-05, 4.0374696254730225e-05, 4.225410521030426e-05, 4.4133514165878296e-05, 4.601292312145233e-05, 4.789233207702637e-05, 4.97717410326004e-05, 5.165114998817444e-05, 5.3530558943748474e-05, 5.540996789932251e-05, 5.7289376854896545e-05, 5.916878581047058e-05, 6.104819476604462e-05, 6.292760372161865e-05, 6.480701267719269e-05, 6.668642163276672e-05, 6.856583058834076e-05, 7.04452395439148e-05, 7.232464849948883e-05, 7.420405745506287e-05, 7.60834664106369e-05, 7.796287536621094e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 4.0, 3.0, 11.0, 13.0, 10.0, 12.0, 22.0, 26.0, 38.0, 56.0, 77.0, 114.0, 180.0, 266.0, 520.0, 847.0, 1827.0, 4155.0, 10959.0, 33791.0, 141930.0, 610947.0, 181656.0, 39563.0, 12376.0, 4771.0, 1966.0, 987.0, 495.0, 305.0, 180.0, 113.0, 71.0, 77.0, 51.0, 26.0, 24.0, 26.0, 14.0, 7.0, 6.0, 11.0, 6.0, 6.0, 3.0, 2.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.07562255859375, -0.0732269287109375, -0.070831298828125, -0.0684356689453125, -0.0660400390625, -0.0636444091796875, -0.061248779296875, -0.0588531494140625, -0.05645751953125, -0.0540618896484375, -0.051666259765625, -0.0492706298828125, -0.046875, -0.0444793701171875, -0.042083740234375, -0.0396881103515625, -0.03729248046875, -0.0348968505859375, -0.032501220703125, -0.0301055908203125, -0.0277099609375, -0.0253143310546875, -0.022918701171875, -0.0205230712890625, -0.01812744140625, -0.0157318115234375, -0.013336181640625, -0.0109405517578125, -0.008544921875, -0.0061492919921875, -0.003753662109375, -0.0013580322265625, 0.00103759765625, 0.0034332275390625, 0.005828857421875, 0.0082244873046875, 0.0106201171875, 0.0130157470703125, 0.015411376953125, 0.0178070068359375, 0.02020263671875, 0.0225982666015625, 0.024993896484375, 0.0273895263671875, 0.02978515625, 0.0321807861328125, 0.034576416015625, 0.0369720458984375, 0.03936767578125, 0.0417633056640625, 0.044158935546875, 0.0465545654296875, 0.0489501953125, 0.0513458251953125, 0.053741455078125, 0.0561370849609375, 0.05853271484375, 0.0609283447265625, 0.063323974609375, 0.0657196044921875, 0.068115234375, 0.0705108642578125, 0.072906494140625, 0.0753021240234375, 0.07769775390625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 7.0, 5.0, 4.0, 7.0, 6.0, 11.0, 8.0, 10.0, 14.0, 21.0, 23.0, 30.0, 31.0, 46.0, 57.0, 85.0, 94.0, 92.0, 98.0, 71.0, 76.0, 50.0, 34.0, 22.0, 16.0, 20.0, 14.0, 11.0, 4.0, 9.0, 4.0, 5.0, 4.0, 3.0, 5.0, 1.0, 6.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.0531005859375, -0.051512718200683594, -0.04992485046386719, -0.04833698272705078, -0.046749114990234375, -0.04516124725341797, -0.04357337951660156, -0.041985511779785156, -0.04039764404296875, -0.038809776306152344, -0.03722190856933594, -0.03563404083251953, -0.034046173095703125, -0.03245830535888672, -0.030870437622070312, -0.029282569885253906, -0.0276947021484375, -0.026106834411621094, -0.024518966674804688, -0.02293109893798828, -0.021343231201171875, -0.01975536346435547, -0.018167495727539062, -0.016579627990722656, -0.01499176025390625, -0.013403892517089844, -0.011816024780273438, -0.010228157043457031, -0.008640289306640625, -0.007052421569824219, -0.0054645538330078125, -0.0038766860961914062, -0.002288818359375, -0.0007009506225585938, 0.0008869171142578125, 0.0024747848510742188, 0.004062652587890625, 0.005650520324707031, 0.0072383880615234375, 0.008826255798339844, 0.01041412353515625, 0.012001991271972656, 0.013589859008789062, 0.015177726745605469, 0.016765594482421875, 0.01835346221923828, 0.019941329956054688, 0.021529197692871094, 0.0231170654296875, 0.024704933166503906, 0.026292800903320312, 0.02788066864013672, 0.029468536376953125, 0.03105640411376953, 0.03264427185058594, 0.034232139587402344, 0.03582000732421875, 0.037407875061035156, 0.03899574279785156, 0.04058361053466797, 0.042171478271484375, 0.04375934600830078, 0.04534721374511719, 0.046935081481933594, 0.04852294921875]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 4.0, 17.0, 37.0, 60.0, 130.0, 164.0, 197.0, 179.0, 111.0, 61.0, 23.0, 9.0, 7.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36662888526916504, -0.3313409984111786, -0.29605311155319214, -0.2607652544975281, -0.22547736763954163, -0.19018948078155518, -0.15490160882472992, -0.11961373686790466, -0.08432585000991821, -0.04903797060251236, -0.013750091195106506, 0.021537788212299347, 0.0568256676197052, 0.09211355447769165, 0.1274014264345169, 0.16268929839134216, 0.1979771852493286, 0.23326507210731506, 0.2685529589653015, 0.3038408160209656, 0.339128702878952, 0.3744165897369385, 0.40970444679260254, 0.444992333650589, 0.48028022050857544, 0.5155680775642395, 0.5508559942245483, 0.5861438512802124, 0.6214317083358765, 0.6567196249961853, 0.6920074820518494, 0.7272953987121582, 0.7625832557678223, 0.7978711128234863, 0.8331590294837952, 0.8684468865394592, 0.9037348031997681, 0.9390226602554321, 0.9743105173110962, 1.0095983743667603, 1.0448863506317139, 1.080174207687378, 1.115462064743042, 1.1507500410079956, 1.1860378980636597, 1.2213257551193237, 1.2566136121749878, 1.2919014692306519, 1.327189326286316, 1.36247718334198, 1.397765040397644, 1.4330530166625977, 1.4683408737182617, 1.5036287307739258, 1.5389165878295898, 1.574204444885254, 1.609492301940918, 1.644780158996582, 1.680068016052246, 1.7153559923171997, 1.7506438493728638, 1.7859317064285278, 1.821219563484192, 1.856507420539856, 1.8917953968048096]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 5.0, 13.0, 12.0, 8.0, 27.0, 20.0, 23.0, 26.0, 40.0, 36.0, 49.0, 50.0, 69.0, 54.0, 61.0, 65.0, 62.0, 56.0, 44.0, 48.0, 49.0, 43.0, 27.0, 25.0, 22.0, 18.0, 10.0, 11.0, 8.0, 9.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6638667583465576, -0.6416358947753906, -0.6194049715995789, -0.5971741080284119, -0.5749431848526001, -0.5527123212814331, -0.5304814577102661, -0.5082505345344543, -0.48601964116096497, -0.4637887477874756, -0.4415578544139862, -0.4193269610404968, -0.39709609746932983, -0.37486517429351807, -0.3526343107223511, -0.3304034173488617, -0.3081725239753723, -0.28594163060188293, -0.26371073722839355, -0.24147985875606537, -0.219248965382576, -0.1970180720090866, -0.17478719353675842, -0.15255630016326904, -0.13032540678977966, -0.10809451341629028, -0.0858636274933815, -0.06363274157047272, -0.04140184819698334, -0.019170954823493958, 0.0030599236488342285, 0.02529081702232361, 0.047521770000457764, 0.06975266337394714, 0.09198354929685593, 0.11421443521976471, 0.1364453285932541, 0.15867622196674347, 0.18090710043907166, 0.20313799381256104, 0.22536888718605042, 0.2475997805595398, 0.2698306739330292, 0.29206156730651855, 0.31429243087768555, 0.3365233540534973, 0.3587542176246643, 0.3809851109981537, 0.40321600437164307, 0.42544689774513245, 0.4476777911186218, 0.4699086546897888, 0.4921395778656006, 0.5143704414367676, 0.5366013050079346, 0.5588322281837463, 0.5810631513595581, 0.6032940149307251, 0.6255249381065369, 0.6477558016777039, 0.6699867248535156, 0.6922175884246826, 0.7144484519958496, 0.7366793751716614, 0.7589102387428284]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 10.0, 8.0, 11.0, 23.0, 32.0, 54.0, 93.0, 194.0, 348.0, 739.0, 1737.0, 5003.0, 21371.0, 176554.0, 3826009.0, 135625.0, 18810.0, 4659.0, 1604.0, 707.0, 332.0, 146.0, 105.0, 40.0, 33.0, 14.0, 11.0, 5.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1778564453125, -0.17201614379882812, -0.16617584228515625, -0.16033554077148438, -0.1544952392578125, -0.14865493774414062, -0.14281463623046875, -0.13697433471679688, -0.131134033203125, -0.12529373168945312, -0.11945343017578125, -0.11361312866210938, -0.1077728271484375, -0.10193252563476562, -0.09609222412109375, -0.09025192260742188, -0.08441162109375, -0.07857131958007812, -0.07273101806640625, -0.06689071655273438, -0.0610504150390625, -0.055210113525390625, -0.04936981201171875, -0.043529510498046875, -0.037689208984375, -0.031848907470703125, -0.02600860595703125, -0.020168304443359375, -0.0143280029296875, -0.008487701416015625, -0.00264739990234375, 0.003192901611328125, 0.009033203125, 0.014873504638671875, 0.02071380615234375, 0.026554107666015625, 0.0323944091796875, 0.038234710693359375, 0.04407501220703125, 0.049915313720703125, 0.055755615234375, 0.061595916748046875, 0.06743621826171875, 0.07327651977539062, 0.0791168212890625, 0.08495712280273438, 0.09079742431640625, 0.09663772583007812, 0.10247802734375, 0.10831832885742188, 0.11415863037109375, 0.11999893188476562, 0.1258392333984375, 0.13167953491210938, 0.13751983642578125, 0.14336013793945312, 0.149200439453125, 0.15504074096679688, 0.16088104248046875, 0.16672134399414062, 0.1725616455078125, 0.17840194702148438, 0.18424224853515625, 0.19008255004882812, 0.1959228515625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 8.0, 6.0, 9.0, 9.0, 23.0, 23.0, 27.0, 27.0, 53.0, 62.0, 63.0, 58.0, 82.0, 75.0, 83.0, 54.0, 61.0, 42.0, 62.0, 38.0, 38.0, 25.0, 22.0, 14.0, 10.0, 9.0, 6.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.02801513671875, -0.027231693267822266, -0.02644824981689453, -0.025664806365966797, -0.024881362915039062, -0.024097919464111328, -0.023314476013183594, -0.02253103256225586, -0.021747589111328125, -0.02096414566040039, -0.020180702209472656, -0.019397258758544922, -0.018613815307617188, -0.017830371856689453, -0.01704692840576172, -0.016263484954833984, -0.01548004150390625, -0.014696598052978516, -0.013913154602050781, -0.013129711151123047, -0.012346267700195312, -0.011562824249267578, -0.010779380798339844, -0.00999593734741211, -0.009212493896484375, -0.00842905044555664, -0.007645606994628906, -0.006862163543701172, -0.0060787200927734375, -0.005295276641845703, -0.004511833190917969, -0.0037283897399902344, -0.0029449462890625, -0.0021615028381347656, -0.0013780593872070312, -0.0005946159362792969, 0.0001888275146484375, 0.0009722709655761719, 0.0017557144165039062, 0.0025391578674316406, 0.003322601318359375, 0.004106044769287109, 0.004889488220214844, 0.005672931671142578, 0.0064563751220703125, 0.007239818572998047, 0.008023262023925781, 0.008806705474853516, 0.00959014892578125, 0.010373592376708984, 0.011157035827636719, 0.011940479278564453, 0.012723922729492188, 0.013507366180419922, 0.014290809631347656, 0.01507425308227539, 0.015857696533203125, 0.01664113998413086, 0.017424583435058594, 0.018208026885986328, 0.018991470336914062, 0.019774913787841797, 0.02055835723876953, 0.021341800689697266, 0.022125244140625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 1.0, 2.0, 1.0, 3.0, 4.0, 9.0, 8.0, 11.0, 8.0, 21.0, 18.0, 33.0, 32.0, 38.0, 37.0, 54.0, 82.0, 157.0, 344.0, 1037.0, 4337.0, 31020.0, 2887850.0, 1235929.0, 27547.0, 3995.0, 987.0, 344.0, 117.0, 74.0, 47.0, 24.0, 22.0, 25.0, 13.0, 13.0, 13.0, 10.0, 5.0, 6.0, 8.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.317626953125, -0.3073692321777344, -0.29711151123046875, -0.2868537902832031, -0.2765960693359375, -0.2663383483886719, -0.25608062744140625, -0.24582290649414062, -0.235565185546875, -0.22530746459960938, -0.21504974365234375, -0.20479202270507812, -0.1945343017578125, -0.18427658081054688, -0.17401885986328125, -0.16376113891601562, -0.15350341796875, -0.14324569702148438, -0.13298797607421875, -0.12273025512695312, -0.1124725341796875, -0.10221481323242188, -0.09195709228515625, -0.08169937133789062, -0.071441650390625, -0.061183929443359375, -0.05092620849609375, -0.040668487548828125, -0.0304107666015625, -0.020153045654296875, -0.00989532470703125, 0.000362396240234375, 0.0106201171875, 0.020877838134765625, 0.03113555908203125, 0.041393280029296875, 0.0516510009765625, 0.061908721923828125, 0.07216644287109375, 0.08242416381835938, 0.092681884765625, 0.10293960571289062, 0.11319732666015625, 0.12345504760742188, 0.1337127685546875, 0.14397048950195312, 0.15422821044921875, 0.16448593139648438, 0.17474365234375, 0.18500137329101562, 0.19525909423828125, 0.20551681518554688, 0.2157745361328125, 0.22603225708007812, 0.23628997802734375, 0.24654769897460938, 0.256805419921875, 0.2670631408691406, 0.27732086181640625, 0.2875785827636719, 0.2978363037109375, 0.3080940246582031, 0.31835174560546875, 0.3286094665527344, 0.3388671875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 7.0, 9.0, 20.0, 25.0, 91.0, 188.0, 715.0, 2356.0, 381.0, 149.0, 48.0, 39.0, 23.0, 13.0, 8.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.142333984375, -0.1393880844116211, -0.1364421844482422, -0.13349628448486328, -0.13055038452148438, -0.12760448455810547, -0.12465858459472656, -0.12171268463134766, -0.11876678466796875, -0.11582088470458984, -0.11287498474121094, -0.10992908477783203, -0.10698318481445312, -0.10403728485107422, -0.10109138488769531, -0.0981454849243164, -0.0951995849609375, -0.0922536849975586, -0.08930778503417969, -0.08636188507080078, -0.08341598510742188, -0.08047008514404297, -0.07752418518066406, -0.07457828521728516, -0.07163238525390625, -0.06868648529052734, -0.06574058532714844, -0.06279468536376953, -0.059848785400390625, -0.05690288543701172, -0.05395698547363281, -0.051011085510253906, -0.048065185546875, -0.045119285583496094, -0.04217338562011719, -0.03922748565673828, -0.036281585693359375, -0.03333568572998047, -0.030389785766601562, -0.027443885803222656, -0.02449798583984375, -0.021552085876464844, -0.018606185913085938, -0.01566028594970703, -0.012714385986328125, -0.009768486022949219, -0.0068225860595703125, -0.0038766860961914062, -0.0009307861328125, 0.0020151138305664062, 0.0049610137939453125, 0.007906913757324219, 0.010852813720703125, 0.013798713684082031, 0.016744613647460938, 0.019690513610839844, 0.02263641357421875, 0.025582313537597656, 0.028528213500976562, 0.03147411346435547, 0.034420013427734375, 0.03736591339111328, 0.04031181335449219, 0.043257713317871094, 0.04620361328125]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 7.0, 9.0, 14.0, 30.0, 61.0, 88.0, 140.0, 168.0, 161.0, 133.0, 93.0, 65.0, 24.0, 11.0, 6.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18401604890823364, -0.17166294157505035, -0.15930983424186707, -0.14695671200752258, -0.1346036046743393, -0.122250497341156, -0.10989739000797272, -0.09754427522420883, -0.08519116789102554, -0.07283806055784225, -0.06048494577407837, -0.04813183844089508, -0.035778727382421494, -0.023425616323947906, -0.011072508990764618, 0.0012806057929992676, 0.013633713126182556, 0.025986824184656143, 0.03833993524312973, 0.05069304257631302, 0.0630461573600769, 0.07539926469326019, 0.08775237202644348, 0.10010548681020737, 0.11245859414339066, 0.12481170147657394, 0.13716481626033783, 0.14951792359352112, 0.1618710309267044, 0.1742241382598877, 0.18657726049423218, 0.19893036782741547, 0.21128347516059875, 0.22363658249378204, 0.23598968982696533, 0.24834281206130981, 0.2606959044933319, 0.2730490267276764, 0.2854021191596985, 0.29775524139404297, 0.31010836362838745, 0.32246148586273193, 0.33481457829475403, 0.3471677005290985, 0.3595207929611206, 0.3718739151954651, 0.38422703742980957, 0.39658012986183167, 0.40893322229385376, 0.42128634452819824, 0.43363943696022034, 0.4459925591945648, 0.4583456516265869, 0.4706987738609314, 0.4830518960952759, 0.495404988527298, 0.5077581405639648, 0.5201112627983093, 0.5324643850326538, 0.5448174476623535, 0.557170569896698, 0.5695236921310425, 0.581876814365387, 0.5942299365997314, 0.6065829992294312]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 0.0, 2.0, 1.0, 6.0, 5.0, 8.0, 10.0, 11.0, 5.0, 18.0, 23.0, 24.0, 28.0, 30.0, 28.0, 23.0, 35.0, 50.0, 46.0, 40.0, 36.0, 32.0, 51.0, 42.0, 34.0, 44.0, 37.0, 45.0, 35.0, 41.0, 29.0, 19.0, 25.0, 20.0, 21.0, 12.0, 19.0, 9.0, 7.0, 14.0, 6.0, 6.0, 9.0, 7.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.16341900825500488, -0.1584937572479248, -0.15356852114200592, -0.14864327013492584, -0.14371801912784576, -0.13879278302192688, -0.1338675320148468, -0.12894228100776672, -0.12401703745126724, -0.11909179389476776, -0.11416654288768768, -0.1092412993311882, -0.10431605577468872, -0.09939080476760864, -0.09446556121110916, -0.08954031765460968, -0.0846150666475296, -0.07968982309103012, -0.07476457208395004, -0.06983932852745056, -0.06491407752037048, -0.059988833963871, -0.05506359040737152, -0.05013834312558174, -0.04521309584379196, -0.04028784856200218, -0.0353626012802124, -0.03043735772371292, -0.02551211044192314, -0.020586863160133362, -0.01566161774098873, -0.010736372321844101, -0.005811125040054321, -0.0008858786895871162, 0.004039367660880089, 0.008964614011347294, 0.013889860361814499, 0.01881510764360428, 0.02374035306274891, 0.02866559848189354, 0.03359084576368332, 0.0385160930454731, 0.04344134032726288, 0.04836658388376236, 0.05329183116555214, 0.05821707844734192, 0.0631423220038414, 0.06806756556034088, 0.07299281656742096, 0.07791806012392044, 0.08284331113100052, 0.0877685546875, 0.09269380569458008, 0.09761904925107956, 0.10254429280757904, 0.10746954381465912, 0.1123947873711586, 0.11732003092765808, 0.12224528193473816, 0.12717053294181824, 0.13209576904773712, 0.1370210200548172, 0.14194627106189728, 0.14687150716781616, 0.15179675817489624]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 1.0, 6.0, 9.0, 9.0, 18.0, 23.0, 33.0, 43.0, 80.0, 133.0, 191.0, 314.0, 570.0, 972.0, 1916.0, 3876.0, 7944.0, 17487.0, 41180.0, 97913.0, 230820.0, 340556.0, 174744.0, 72925.0, 30731.0, 13254.0, 6154.0, 3024.0, 1556.0, 838.0, 513.0, 248.0, 187.0, 80.0, 77.0, 50.0, 31.0, 18.0, 12.0, 7.0, 3.0, 5.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.0860595703125, -0.08362388610839844, -0.08118820190429688, -0.07875251770019531, -0.07631683349609375, -0.07388114929199219, -0.07144546508789062, -0.06900978088378906, -0.0665740966796875, -0.06413841247558594, -0.061702728271484375, -0.05926704406738281, -0.05683135986328125, -0.05439567565917969, -0.051959991455078125, -0.04952430725097656, -0.047088623046875, -0.04465293884277344, -0.042217254638671875, -0.03978157043457031, -0.03734588623046875, -0.03491020202636719, -0.032474517822265625, -0.030038833618164062, -0.0276031494140625, -0.025167465209960938, -0.022731781005859375, -0.020296096801757812, -0.01786041259765625, -0.015424728393554688, -0.012989044189453125, -0.010553359985351562, -0.00811767578125, -0.0056819915771484375, -0.003246307373046875, -0.0008106231689453125, 0.00162506103515625, 0.0040607452392578125, 0.006496429443359375, 0.008932113647460938, 0.0113677978515625, 0.013803482055664062, 0.016239166259765625, 0.018674850463867188, 0.02111053466796875, 0.023546218872070312, 0.025981903076171875, 0.028417587280273438, 0.030853271484375, 0.03328895568847656, 0.035724639892578125, 0.03816032409667969, 0.04059600830078125, 0.04303169250488281, 0.045467376708984375, 0.04790306091308594, 0.0503387451171875, 0.05277442932128906, 0.055210113525390625, 0.05764579772949219, 0.06008148193359375, 0.06251716613769531, 0.06495285034179688, 0.06738853454589844, 0.06982421875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 7.0, 3.0, 6.0, 5.0, 13.0, 11.0, 31.0, 22.0, 40.0, 39.0, 48.0, 48.0, 55.0, 68.0, 90.0, 69.0, 62.0, 49.0, 62.0, 49.0, 51.0, 36.0, 32.0, 36.0, 18.0, 17.0, 7.0, 10.0, 7.0, 4.0, 3.0, 1.0, 6.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0295867919921875, -0.028775691986083984, -0.02796459197998047, -0.027153491973876953, -0.026342391967773438, -0.025531291961669922, -0.024720191955566406, -0.02390909194946289, -0.023097991943359375, -0.02228689193725586, -0.021475791931152344, -0.020664691925048828, -0.019853591918945312, -0.019042491912841797, -0.01823139190673828, -0.017420291900634766, -0.01660919189453125, -0.015798091888427734, -0.014986991882324219, -0.014175891876220703, -0.013364791870117188, -0.012553691864013672, -0.011742591857910156, -0.01093149185180664, -0.010120391845703125, -0.00930929183959961, -0.008498191833496094, -0.007687091827392578, -0.0068759918212890625, -0.006064891815185547, -0.005253791809082031, -0.004442691802978516, -0.003631591796875, -0.0028204917907714844, -0.0020093917846679688, -0.0011982917785644531, -0.0003871917724609375, 0.0004239082336425781, 0.0012350082397460938, 0.0020461082458496094, 0.002857208251953125, 0.0036683082580566406, 0.004479408264160156, 0.005290508270263672, 0.0061016082763671875, 0.006912708282470703, 0.007723808288574219, 0.008534908294677734, 0.00934600830078125, 0.010157108306884766, 0.010968208312988281, 0.011779308319091797, 0.012590408325195312, 0.013401508331298828, 0.014212608337402344, 0.01502370834350586, 0.015834808349609375, 0.01664590835571289, 0.017457008361816406, 0.018268108367919922, 0.019079208374023438, 0.019890308380126953, 0.02070140838623047, 0.021512508392333984, 0.0223236083984375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 4.0, 9.0, 11.0, 11.0, 11.0, 17.0, 40.0, 51.0, 76.0, 136.0, 231.0, 354.0, 774.0, 1513.0, 3769.0, 14688.0, 87902.0, 525238.0, 347483.0, 51292.0, 9468.0, 2770.0, 1209.0, 610.0, 338.0, 211.0, 122.0, 88.0, 51.0, 30.0, 18.0, 13.0, 11.0, 3.0, 6.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1396484375, -0.1348094940185547, -0.12997055053710938, -0.12513160705566406, -0.12029266357421875, -0.11545372009277344, -0.11061477661132812, -0.10577583312988281, -0.1009368896484375, -0.09609794616699219, -0.09125900268554688, -0.08642005920410156, -0.08158111572265625, -0.07674217224121094, -0.07190322875976562, -0.06706428527832031, -0.062225341796875, -0.05738639831542969, -0.052547454833984375, -0.04770851135253906, -0.04286956787109375, -0.03803062438964844, -0.033191680908203125, -0.028352737426757812, -0.0235137939453125, -0.018674850463867188, -0.013835906982421875, -0.008996963500976562, -0.00415802001953125, 0.0006809234619140625, 0.005519866943359375, 0.010358810424804688, 0.01519775390625, 0.020036697387695312, 0.024875640869140625, 0.029714584350585938, 0.03455352783203125, 0.03939247131347656, 0.044231414794921875, 0.04907035827636719, 0.0539093017578125, 0.05874824523925781, 0.06358718872070312, 0.06842613220214844, 0.07326507568359375, 0.07810401916503906, 0.08294296264648438, 0.08778190612792969, 0.092620849609375, 0.09745979309082031, 0.10229873657226562, 0.10713768005371094, 0.11197662353515625, 0.11681556701660156, 0.12165451049804688, 0.1264934539794922, 0.1313323974609375, 0.1361713409423828, 0.14101028442382812, 0.14584922790527344, 0.15068817138671875, 0.15552711486816406, 0.16036605834960938, 0.1652050018310547, 0.1700439453125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 0.0, 8.0, 7.0, 3.0, 11.0, 14.0, 24.0, 20.0, 25.0, 36.0, 48.0, 26.0, 43.0, 29.0, 44.0, 74.0, 56.0, 59.0, 57.0, 48.0, 47.0, 47.0, 46.0, 29.0, 43.0, 27.0, 37.0, 16.0, 15.0, 12.0, 15.0, 15.0, 5.0, 5.0, 5.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10943603515625, -0.10591697692871094, -0.10239791870117188, -0.09887886047363281, -0.09535980224609375, -0.09184074401855469, -0.08832168579101562, -0.08480262756347656, -0.0812835693359375, -0.07776451110839844, -0.07424545288085938, -0.07072639465332031, -0.06720733642578125, -0.06368827819824219, -0.060169219970703125, -0.05665016174316406, -0.053131103515625, -0.04961204528808594, -0.046092987060546875, -0.04257392883300781, -0.03905487060546875, -0.03553581237792969, -0.032016754150390625, -0.028497695922851562, -0.0249786376953125, -0.021459579467773438, -0.017940521240234375, -0.014421463012695312, -0.01090240478515625, -0.0073833465576171875, -0.003864288330078125, -0.0003452301025390625, 0.003173828125, 0.0066928863525390625, 0.010211944580078125, 0.013731002807617188, 0.01725006103515625, 0.020769119262695312, 0.024288177490234375, 0.027807235717773438, 0.0313262939453125, 0.03484535217285156, 0.038364410400390625, 0.04188346862792969, 0.04540252685546875, 0.04892158508300781, 0.052440643310546875, 0.05595970153808594, 0.059478759765625, 0.06299781799316406, 0.06651687622070312, 0.07003593444824219, 0.07355499267578125, 0.07707405090332031, 0.08059310913085938, 0.08411216735839844, 0.0876312255859375, 0.09115028381347656, 0.09466934204101562, 0.09818840026855469, 0.10170745849609375, 0.10522651672363281, 0.10874557495117188, 0.11226463317871094, 0.11578369140625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 3.0, 4.0, 15.0, 17.0, 23.0, 26.0, 51.0, 70.0, 119.0, 177.0, 309.0, 480.0, 880.0, 1657.0, 3136.0, 6487.0, 14612.0, 41046.0, 180104.0, 594953.0, 143502.0, 35331.0, 13194.0, 5841.0, 2952.0, 1511.0, 809.0, 457.0, 284.0, 148.0, 118.0, 86.0, 49.0, 40.0, 18.0, 13.0, 13.0, 4.0, 10.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.085205078125, -0.08286666870117188, -0.08052825927734375, -0.07818984985351562, -0.0758514404296875, -0.07351303100585938, -0.07117462158203125, -0.06883621215820312, -0.066497802734375, -0.06415939331054688, -0.06182098388671875, -0.059482574462890625, -0.0571441650390625, -0.054805755615234375, -0.05246734619140625, -0.050128936767578125, -0.04779052734375, -0.045452117919921875, -0.04311370849609375, -0.040775299072265625, -0.0384368896484375, -0.036098480224609375, -0.03376007080078125, -0.031421661376953125, -0.029083251953125, -0.026744842529296875, -0.02440643310546875, -0.022068023681640625, -0.0197296142578125, -0.017391204833984375, -0.01505279541015625, -0.012714385986328125, -0.0103759765625, -0.008037567138671875, -0.00569915771484375, -0.003360748291015625, -0.0010223388671875, 0.001316070556640625, 0.00365447998046875, 0.005992889404296875, 0.008331298828125, 0.010669708251953125, 0.01300811767578125, 0.015346527099609375, 0.0176849365234375, 0.020023345947265625, 0.02236175537109375, 0.024700164794921875, 0.02703857421875, 0.029376983642578125, 0.03171539306640625, 0.034053802490234375, 0.0363922119140625, 0.038730621337890625, 0.04106903076171875, 0.043407440185546875, 0.045745849609375, 0.048084259033203125, 0.05042266845703125, 0.052761077880859375, 0.0550994873046875, 0.057437896728515625, 0.05977630615234375, 0.062114715576171875, 0.064453125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 4.0, 13.0, 13.0, 19.0, 33.0, 60.0, 101.0, 128.0, 184.0, 164.0, 116.0, 75.0, 41.0, 14.0, 18.0, 6.0, 8.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.091594696044922e-05, -5.781091749668121e-05, -5.470588803291321e-05, -5.16008585691452e-05, -4.84958291053772e-05, -4.539079964160919e-05, -4.2285770177841187e-05, -3.918074071407318e-05, -3.6075711250305176e-05, -3.297068178653717e-05, -2.9865652322769165e-05, -2.676062285900116e-05, -2.3655593395233154e-05, -2.055056393146515e-05, -1.7445534467697144e-05, -1.4340505003929138e-05, -1.1235475540161133e-05, -8.130446076393127e-06, -5.025416612625122e-06, -1.9203871488571167e-06, 1.1846423149108887e-06, 4.289671778678894e-06, 7.394701242446899e-06, 1.0499730706214905e-05, 1.360476016998291e-05, 1.6709789633750916e-05, 1.981481909751892e-05, 2.2919848561286926e-05, 2.602487802505493e-05, 2.9129907488822937e-05, 3.223493695259094e-05, 3.533996641635895e-05, 3.844499588012695e-05, 4.155002534389496e-05, 4.4655054807662964e-05, 4.776008427143097e-05, 5.0865113735198975e-05, 5.397014319896698e-05, 5.7075172662734985e-05, 6.018020212650299e-05, 6.3285231590271e-05, 6.6390261054039e-05, 6.949529051780701e-05, 7.260031998157501e-05, 7.570534944534302e-05, 7.881037890911102e-05, 8.191540837287903e-05, 8.502043783664703e-05, 8.812546730041504e-05, 9.123049676418304e-05, 9.433552622795105e-05, 9.744055569171906e-05, 0.00010054558515548706, 0.00010365061461925507, 0.00010675564408302307, 0.00010986067354679108, 0.00011296570301055908, 0.00011607073247432709, 0.00011917576193809509, 0.0001222807914018631, 0.0001253858208656311, 0.0001284908503293991, 0.00013159587979316711, 0.00013470090925693512, 0.00013780593872070312]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 7.0, 8.0, 9.0, 11.0, 14.0, 14.0, 14.0, 26.0, 36.0, 53.0, 85.0, 154.0, 256.0, 463.0, 985.0, 2175.0, 5539.0, 17410.0, 82048.0, 652068.0, 237791.0, 33767.0, 9375.0, 3332.0, 1381.0, 670.0, 345.0, 181.0, 103.0, 73.0, 54.0, 29.0, 25.0, 16.0, 18.0, 10.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09228515625, -0.08928298950195312, -0.08628082275390625, -0.08327865600585938, -0.0802764892578125, -0.07727432250976562, -0.07427215576171875, -0.07126998901367188, -0.068267822265625, -0.06526565551757812, -0.06226348876953125, -0.059261322021484375, -0.0562591552734375, -0.053256988525390625, -0.05025482177734375, -0.047252655029296875, -0.04425048828125, -0.041248321533203125, -0.03824615478515625, -0.035243988037109375, -0.0322418212890625, -0.029239654541015625, -0.02623748779296875, -0.023235321044921875, -0.020233154296875, -0.017230987548828125, -0.01422882080078125, -0.011226654052734375, -0.0082244873046875, -0.005222320556640625, -0.00222015380859375, 0.000782012939453125, 0.0037841796875, 0.006786346435546875, 0.00978851318359375, 0.012790679931640625, 0.0157928466796875, 0.018795013427734375, 0.02179718017578125, 0.024799346923828125, 0.027801513671875, 0.030803680419921875, 0.03380584716796875, 0.036808013916015625, 0.0398101806640625, 0.042812347412109375, 0.04581451416015625, 0.048816680908203125, 0.05181884765625, 0.054821014404296875, 0.05782318115234375, 0.060825347900390625, 0.0638275146484375, 0.06682968139648438, 0.06983184814453125, 0.07283401489257812, 0.075836181640625, 0.07883834838867188, 0.08184051513671875, 0.08484268188476562, 0.0878448486328125, 0.09084701538085938, 0.09384918212890625, 0.09685134887695312, 0.099853515625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 4.0, 4.0, 7.0, 6.0, 9.0, 11.0, 21.0, 14.0, 18.0, 38.0, 55.0, 65.0, 119.0, 110.0, 112.0, 109.0, 70.0, 50.0, 42.0, 41.0, 19.0, 20.0, 14.0, 8.0, 11.0, 6.0, 4.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0], "bins": [-0.08099365234375, -0.0790705680847168, -0.0771474838256836, -0.07522439956665039, -0.07330131530761719, -0.07137823104858398, -0.06945514678955078, -0.06753206253051758, -0.06560897827148438, -0.06368589401245117, -0.06176280975341797, -0.059839725494384766, -0.05791664123535156, -0.05599355697631836, -0.054070472717285156, -0.05214738845825195, -0.05022430419921875, -0.04830121994018555, -0.046378135681152344, -0.04445505142211914, -0.04253196716308594, -0.040608882904052734, -0.03868579864501953, -0.03676271438598633, -0.034839630126953125, -0.03291654586791992, -0.03099346160888672, -0.029070377349853516, -0.027147293090820312, -0.02522420883178711, -0.023301124572753906, -0.021378040313720703, -0.0194549560546875, -0.017531871795654297, -0.015608787536621094, -0.01368570327758789, -0.011762619018554688, -0.009839534759521484, -0.007916450500488281, -0.005993366241455078, -0.004070281982421875, -0.002147197723388672, -0.00022411346435546875, 0.0016989707946777344, 0.0036220550537109375, 0.005545139312744141, 0.007468223571777344, 0.009391307830810547, 0.01131439208984375, 0.013237476348876953, 0.015160560607910156, 0.01708364486694336, 0.019006729125976562, 0.020929813385009766, 0.02285289764404297, 0.024775981903076172, 0.026699066162109375, 0.028622150421142578, 0.03054523468017578, 0.032468318939208984, 0.03439140319824219, 0.03631448745727539, 0.038237571716308594, 0.0401606559753418, 0.042083740234375]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 13.0, 29.0, 73.0, 141.0, 238.0, 213.0, 161.0, 73.0, 48.0, 6.0, 7.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3839235305786133, -0.3415030539035797, -0.29908257722854614, -0.25666213035583496, -0.2142416536808014, -0.17182117700576782, -0.12940073013305664, -0.08698025345802307, -0.0445597767829895, -0.0021393075585365295, 0.04028116166591644, 0.08270162343978882, 0.1251221001148224, 0.16754257678985596, 0.20996302366256714, 0.2523835003376007, 0.2948039770126343, 0.33722445368766785, 0.3796449303627014, 0.4220653772354126, 0.46448585391044617, 0.5069063305854797, 0.5493267774581909, 0.5917472839355469, 0.6341677308082581, 0.6765881776809692, 0.7190086841583252, 0.7614291310310364, 0.8038495779037476, 0.8462700843811035, 0.8886905312538147, 0.9311109781265259, 0.9735314846038818, 1.0159519910812378, 1.0583723783493042, 1.1007928848266602, 1.1432133913040161, 1.185633897781372, 1.2280542850494385, 1.2704747915267944, 1.3128952980041504, 1.3553158044815063, 1.3977361917495728, 1.4401566982269287, 1.4825772047042847, 1.5249977111816406, 1.567418098449707, 1.609838604927063, 1.6522589921951294, 1.6946794986724854, 1.7370998859405518, 1.7795203924179077, 1.8219408988952637, 1.86436128616333, 1.906781792640686, 1.949202299118042, 1.9916226863861084, 2.034043073654175, 2.0764636993408203, 2.1188840866088867, 2.161304473876953, 2.2037250995635986, 2.246145486831665, 2.2885658740997314, 2.330986499786377]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 6.0, 4.0, 4.0, 6.0, 10.0, 9.0, 21.0, 16.0, 19.0, 37.0, 29.0, 31.0, 26.0, 46.0, 29.0, 32.0, 48.0, 52.0, 37.0, 38.0, 57.0, 38.0, 46.0, 47.0, 41.0, 38.0, 35.0, 17.0, 31.0, 25.0, 22.0, 19.0, 18.0, 14.0, 9.0, 5.0, 8.0, 9.0, 7.0, 4.0, 3.0, 2.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.47896742820739746, -0.46249446272850037, -0.44602149724960327, -0.4295485019683838, -0.4130755364894867, -0.3966025710105896, -0.3801296055316925, -0.3636566400527954, -0.3471836447715759, -0.33071067929267883, -0.31423771381378174, -0.29776471853256226, -0.28129175305366516, -0.26481878757476807, -0.24834582209587097, -0.23187285661697388, -0.21539989113807678, -0.1989269256591797, -0.1824539452791214, -0.1659809798002243, -0.14950799942016602, -0.13303503394126892, -0.11656206846237183, -0.10008909553289413, -0.08361612260341644, -0.06714314967393875, -0.05067018046975136, -0.034197211265563965, -0.017724238336086273, -0.0012512654066085815, 0.015221700072288513, 0.031694673001766205, 0.048167645931243896, 0.06464061886072159, 0.08111359179019928, 0.09758655726909637, 0.11405953019857407, 0.13053250312805176, 0.14700546860694885, 0.16347843408584595, 0.17995141446590424, 0.19642437994480133, 0.21289736032485962, 0.2293703258037567, 0.2458432912826538, 0.2623162865638733, 0.278789222240448, 0.2952622175216675, 0.3117351830005646, 0.32820814847946167, 0.34468111395835876, 0.36115407943725586, 0.37762707471847534, 0.39410004019737244, 0.41057300567626953, 0.4270459711551666, 0.4435189366340637, 0.4599919021129608, 0.4764648675918579, 0.4929378628730774, 0.5094107985496521, 0.5258837938308716, 0.5423567295074463, 0.5588297247886658, 0.5753027200698853]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 6.0, 10.0, 10.0, 13.0, 13.0, 26.0, 36.0, 60.0, 63.0, 97.0, 160.0, 253.0, 381.0, 577.0, 997.0, 1750.0, 3053.0, 5866.0, 12166.0, 28015.0, 81229.0, 398437.0, 3217664.0, 321066.0, 71780.0, 25910.0, 11417.0, 5647.0, 3115.0, 1716.0, 1019.0, 617.0, 385.0, 249.0, 155.0, 118.0, 61.0, 49.0, 39.0, 15.0, 16.0, 11.0, 2.0, 5.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.08563232421875, -0.08290958404541016, -0.08018684387207031, -0.07746410369873047, -0.07474136352539062, -0.07201862335205078, -0.06929588317871094, -0.0665731430053711, -0.06385040283203125, -0.061127662658691406, -0.05840492248535156, -0.05568218231201172, -0.052959442138671875, -0.05023670196533203, -0.04751396179199219, -0.044791221618652344, -0.0420684814453125, -0.039345741271972656, -0.03662300109863281, -0.03390026092529297, -0.031177520751953125, -0.02845478057861328, -0.025732040405273438, -0.023009300231933594, -0.02028656005859375, -0.017563819885253906, -0.014841079711914062, -0.012118339538574219, -0.009395599365234375, -0.006672859191894531, -0.0039501190185546875, -0.0012273788452148438, 0.001495361328125, 0.004218101501464844, 0.0069408416748046875, 0.009663581848144531, 0.012386322021484375, 0.015109062194824219, 0.017831802368164062, 0.020554542541503906, 0.02327728271484375, 0.026000022888183594, 0.028722763061523438, 0.03144550323486328, 0.034168243408203125, 0.03689098358154297, 0.03961372375488281, 0.042336463928222656, 0.0450592041015625, 0.047781944274902344, 0.05050468444824219, 0.05322742462158203, 0.055950164794921875, 0.05867290496826172, 0.06139564514160156, 0.0641183853149414, 0.06684112548828125, 0.0695638656616211, 0.07228660583496094, 0.07500934600830078, 0.07773208618164062, 0.08045482635498047, 0.08317756652832031, 0.08590030670166016, 0.088623046875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 4.0, 8.0, 12.0, 12.0, 15.0, 28.0, 35.0, 33.0, 49.0, 39.0, 69.0, 63.0, 58.0, 79.0, 74.0, 49.0, 57.0, 57.0, 56.0, 49.0, 31.0, 28.0, 24.0, 20.0, 10.0, 9.0, 8.0, 10.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0264434814453125, -0.02564382553100586, -0.02484416961669922, -0.024044513702392578, -0.023244857788085938, -0.022445201873779297, -0.021645545959472656, -0.020845890045166016, -0.020046234130859375, -0.019246578216552734, -0.018446922302246094, -0.017647266387939453, -0.016847610473632812, -0.016047954559326172, -0.015248298645019531, -0.01444864273071289, -0.01364898681640625, -0.01284933090209961, -0.012049674987792969, -0.011250019073486328, -0.010450363159179688, -0.009650707244873047, -0.008851051330566406, -0.008051395416259766, -0.007251739501953125, -0.006452083587646484, -0.005652427673339844, -0.004852771759033203, -0.0040531158447265625, -0.003253459930419922, -0.0024538040161132812, -0.0016541481018066406, -0.0008544921875, -5.4836273193359375e-05, 0.0007448196411132812, 0.0015444755554199219, 0.0023441314697265625, 0.003143787384033203, 0.003943443298339844, 0.004743099212646484, 0.005542755126953125, 0.006342411041259766, 0.007142066955566406, 0.007941722869873047, 0.008741378784179688, 0.009541034698486328, 0.010340690612792969, 0.01114034652709961, 0.01194000244140625, 0.01273965835571289, 0.013539314270019531, 0.014338970184326172, 0.015138626098632812, 0.015938282012939453, 0.016737937927246094, 0.017537593841552734, 0.018337249755859375, 0.019136905670166016, 0.019936561584472656, 0.020736217498779297, 0.021535873413085938, 0.022335529327392578, 0.02313518524169922, 0.02393484115600586, 0.0247344970703125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 0.0, 3.0, 8.0, 6.0, 9.0, 14.0, 26.0, 22.0, 27.0, 42.0, 47.0, 80.0, 115.0, 226.0, 436.0, 928.0, 2623.0, 9960.0, 62440.0, 1356542.0, 2660067.0, 82842.0, 12506.0, 3115.0, 1095.0, 440.0, 242.0, 154.0, 87.0, 47.0, 36.0, 31.0, 24.0, 15.0, 8.0, 10.0, 1.0, 5.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1849365234375, -0.17898178100585938, -0.17302703857421875, -0.16707229614257812, -0.1611175537109375, -0.15516281127929688, -0.14920806884765625, -0.14325332641601562, -0.137298583984375, -0.13134384155273438, -0.12538909912109375, -0.11943435668945312, -0.1134796142578125, -0.10752487182617188, -0.10157012939453125, -0.09561538696289062, -0.08966064453125, -0.08370590209960938, -0.07775115966796875, -0.07179641723632812, -0.0658416748046875, -0.059886932373046875, -0.05393218994140625, -0.047977447509765625, -0.042022705078125, -0.036067962646484375, -0.03011322021484375, -0.024158477783203125, -0.0182037353515625, -0.012248992919921875, -0.00629425048828125, -0.000339508056640625, 0.005615234375, 0.011569976806640625, 0.01752471923828125, 0.023479461669921875, 0.0294342041015625, 0.035388946533203125, 0.04134368896484375, 0.047298431396484375, 0.053253173828125, 0.059207916259765625, 0.06516265869140625, 0.07111740112304688, 0.0770721435546875, 0.08302688598632812, 0.08898162841796875, 0.09493637084960938, 0.10089111328125, 0.10684585571289062, 0.11280059814453125, 0.11875534057617188, 0.1247100830078125, 0.13066482543945312, 0.13661956787109375, 0.14257431030273438, 0.148529052734375, 0.15448379516601562, 0.16043853759765625, 0.16639328002929688, 0.1723480224609375, 0.17830276489257812, 0.18425750732421875, 0.19021224975585938, 0.1961669921875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 5.0, 10.0, 12.0, 32.0, 51.0, 96.0, 208.0, 527.0, 1680.0, 842.0, 298.0, 124.0, 78.0, 35.0, 35.0, 8.0, 11.0, 7.0, 8.0, 4.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10662841796875, -0.10387325286865234, -0.10111808776855469, -0.09836292266845703, -0.09560775756835938, -0.09285259246826172, -0.09009742736816406, -0.0873422622680664, -0.08458709716796875, -0.0818319320678711, -0.07907676696777344, -0.07632160186767578, -0.07356643676757812, -0.07081127166748047, -0.06805610656738281, -0.06530094146728516, -0.0625457763671875, -0.059790611267089844, -0.05703544616699219, -0.05428028106689453, -0.051525115966796875, -0.04876995086669922, -0.04601478576660156, -0.043259620666503906, -0.04050445556640625, -0.037749290466308594, -0.03499412536621094, -0.03223896026611328, -0.029483795166015625, -0.02672863006591797, -0.023973464965820312, -0.021218299865722656, -0.018463134765625, -0.015707969665527344, -0.012952804565429688, -0.010197639465332031, -0.007442474365234375, -0.004687309265136719, -0.0019321441650390625, 0.0008230209350585938, 0.00357818603515625, 0.006333351135253906, 0.009088516235351562, 0.011843681335449219, 0.014598846435546875, 0.01735401153564453, 0.020109176635742188, 0.022864341735839844, 0.0256195068359375, 0.028374671936035156, 0.031129837036132812, 0.03388500213623047, 0.036640167236328125, 0.03939533233642578, 0.04215049743652344, 0.044905662536621094, 0.04766082763671875, 0.050415992736816406, 0.05317115783691406, 0.05592632293701172, 0.058681488037109375, 0.06143665313720703, 0.06419181823730469, 0.06694698333740234, 0.0697021484375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 9.0, 16.0, 76.0, 146.0, 265.0, 271.0, 135.0, 59.0, 25.0, 7.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.453777015209198, -0.42830225825309753, -0.40282750129699707, -0.377352774143219, -0.35187798738479614, -0.32640326023101807, -0.3009285032749176, -0.27545374631881714, -0.24997898936271667, -0.2245042324066162, -0.19902947545051575, -0.17355473339557648, -0.148079976439476, -0.12260521948337555, -0.09713047742843628, -0.07165572047233582, -0.04618096351623535, -0.020706210285425186, 0.004768542945384979, 0.030243292450904846, 0.05571804940700531, 0.08119280636310577, 0.10666754841804504, 0.1321423053741455, 0.15761706233024597, 0.18309181928634644, 0.2085665762424469, 0.23404131829738617, 0.25951606035232544, 0.2849908471107483, 0.31046557426452637, 0.33594033122062683, 0.3614150285720825, 0.386889785528183, 0.41236454248428345, 0.4378392696380615, 0.4633140563964844, 0.48878878355026245, 0.5142635107040405, 0.5397382974624634, 0.5652130842208862, 0.5906878113746643, 0.6161625981330872, 0.6416373252868652, 0.6671121120452881, 0.6925868391990662, 0.7180615663528442, 0.7435363531112671, 0.7690110802650452, 0.7944858074188232, 0.8199605941772461, 0.8454353213310242, 0.870910108089447, 0.8963848352432251, 0.921859622001648, 0.947334349155426, 0.9728090763092041, 0.9982838034629822, 1.0237585306167603, 1.049233317375183, 1.074708104133606, 1.1001828908920288, 1.125657558441162, 1.151132345199585, 1.1766071319580078]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 4.0, 5.0, 0.0, 7.0, 8.0, 13.0, 16.0, 21.0, 22.0, 22.0, 19.0, 31.0, 45.0, 28.0, 34.0, 49.0, 53.0, 40.0, 53.0, 35.0, 34.0, 51.0, 37.0, 31.0, 43.0, 45.0, 46.0, 36.0, 25.0, 29.0, 27.0, 24.0, 16.0, 13.0, 10.0, 13.0, 8.0, 3.0, 3.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20565760135650635, -0.19885583221912384, -0.19205406308174133, -0.18525227904319763, -0.17845050990581512, -0.17164874076843262, -0.16484695672988892, -0.1580451875925064, -0.1512434184551239, -0.1444416493177414, -0.1376398801803589, -0.13083809614181519, -0.12403632700443268, -0.11723455786705017, -0.11043278127908707, -0.10363100469112396, -0.09682923555374146, -0.09002746641635895, -0.08322568982839584, -0.07642391324043274, -0.06962214410305023, -0.06282037496566772, -0.05601859837770462, -0.049216825515031815, -0.04241505265235901, -0.0356132797896862, -0.028811506927013397, -0.02200973406434059, -0.015207961201667786, -0.00840618833899498, -0.001604415476322174, 0.005197357386350632, 0.011999130249023438, 0.018800903111696243, 0.02560267597436905, 0.032404448837041855, 0.03920622169971466, 0.046007994562387466, 0.05280976742506027, 0.05961154028773308, 0.06641331315040588, 0.07321508228778839, 0.0800168588757515, 0.0868186354637146, 0.0936204046010971, 0.10042217373847961, 0.10722395032644272, 0.11402572691440582, 0.12082749605178833, 0.12762926518917084, 0.13443103432655334, 0.14123281836509705, 0.14803458750247955, 0.15483635663986206, 0.16163814067840576, 0.16843990981578827, 0.17524167895317078, 0.18204344809055328, 0.1888452172279358, 0.1956470012664795, 0.202448770403862, 0.2092505395412445, 0.2160523235797882, 0.22285409271717072, 0.22965586185455322]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 5.0, 10.0, 16.0, 23.0, 33.0, 57.0, 87.0, 133.0, 186.0, 353.0, 624.0, 1080.0, 1971.0, 3932.0, 8020.0, 17929.0, 39986.0, 94038.0, 258315.0, 376774.0, 139915.0, 57486.0, 25152.0, 11153.0, 5298.0, 2611.0, 1439.0, 775.0, 441.0, 246.0, 175.0, 89.0, 76.0, 45.0, 29.0, 18.0, 11.0, 8.0, 5.0, 6.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.095703125, -0.0926370620727539, -0.08957099914550781, -0.08650493621826172, -0.08343887329101562, -0.08037281036376953, -0.07730674743652344, -0.07424068450927734, -0.07117462158203125, -0.06810855865478516, -0.06504249572753906, -0.06197643280029297, -0.058910369873046875, -0.05584430694580078, -0.05277824401855469, -0.049712181091308594, -0.0466461181640625, -0.043580055236816406, -0.04051399230957031, -0.03744792938232422, -0.034381866455078125, -0.03131580352783203, -0.028249740600585938, -0.025183677673339844, -0.02211761474609375, -0.019051551818847656, -0.015985488891601562, -0.012919425964355469, -0.009853363037109375, -0.006787300109863281, -0.0037212371826171875, -0.0006551742553710938, 0.002410888671875, 0.005476951599121094, 0.008543014526367188, 0.011609077453613281, 0.014675140380859375, 0.01774120330810547, 0.020807266235351562, 0.023873329162597656, 0.02693939208984375, 0.030005455017089844, 0.03307151794433594, 0.03613758087158203, 0.039203643798828125, 0.04226970672607422, 0.04533576965332031, 0.048401832580566406, 0.0514678955078125, 0.054533958435058594, 0.05760002136230469, 0.06066608428955078, 0.06373214721679688, 0.06679821014404297, 0.06986427307128906, 0.07293033599853516, 0.07599639892578125, 0.07906246185302734, 0.08212852478027344, 0.08519458770751953, 0.08826065063476562, 0.09132671356201172, 0.09439277648925781, 0.0974588394165039, 0.10052490234375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 2.0, 8.0, 3.0, 8.0, 17.0, 19.0, 23.0, 31.0, 22.0, 36.0, 39.0, 39.0, 56.0, 45.0, 55.0, 66.0, 75.0, 66.0, 51.0, 56.0, 55.0, 36.0, 37.0, 37.0, 29.0, 19.0, 14.0, 16.0, 10.0, 7.0, 3.0, 6.0, 6.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0244903564453125, -0.02372908592224121, -0.022967815399169922, -0.022206544876098633, -0.021445274353027344, -0.020684003829956055, -0.019922733306884766, -0.019161462783813477, -0.018400192260742188, -0.0176389217376709, -0.01687765121459961, -0.01611638069152832, -0.015355110168457031, -0.014593839645385742, -0.013832569122314453, -0.013071298599243164, -0.012310028076171875, -0.011548757553100586, -0.010787487030029297, -0.010026216506958008, -0.009264945983886719, -0.00850367546081543, -0.007742404937744141, -0.0069811344146728516, -0.0062198638916015625, -0.0054585933685302734, -0.004697322845458984, -0.003936052322387695, -0.0031747817993164062, -0.002413511276245117, -0.0016522407531738281, -0.0008909702301025391, -0.00012969970703125, 0.0006315708160400391, 0.0013928413391113281, 0.002154111862182617, 0.0029153823852539062, 0.0036766529083251953, 0.004437923431396484, 0.0051991939544677734, 0.0059604644775390625, 0.0067217350006103516, 0.007483005523681641, 0.00824427604675293, 0.009005546569824219, 0.009766817092895508, 0.010528087615966797, 0.011289358139038086, 0.012050628662109375, 0.012811899185180664, 0.013573169708251953, 0.014334440231323242, 0.015095710754394531, 0.01585698127746582, 0.01661825180053711, 0.0173795223236084, 0.018140792846679688, 0.018902063369750977, 0.019663333892822266, 0.020424604415893555, 0.021185874938964844, 0.021947145462036133, 0.022708415985107422, 0.02346968650817871, 0.02423095703125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 5.0, 4.0, 12.0, 12.0, 21.0, 34.0, 41.0, 52.0, 76.0, 109.0, 174.0, 233.0, 318.0, 524.0, 954.0, 1895.0, 3884.0, 9881.0, 27873.0, 88781.0, 356294.0, 404812.0, 101579.0, 31174.0, 10726.0, 4361.0, 2016.0, 983.0, 578.0, 378.0, 241.0, 159.0, 93.0, 74.0, 73.0, 37.0, 21.0, 20.0, 21.0, 8.0, 8.0, 6.0, 2.0, 5.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1236572265625, -0.120025634765625, -0.11639404296875, -0.112762451171875, -0.109130859375, -0.105499267578125, -0.10186767578125, -0.098236083984375, -0.0946044921875, -0.090972900390625, -0.08734130859375, -0.083709716796875, -0.080078125, -0.076446533203125, -0.07281494140625, -0.069183349609375, -0.0655517578125, -0.061920166015625, -0.05828857421875, -0.054656982421875, -0.051025390625, -0.047393798828125, -0.04376220703125, -0.040130615234375, -0.0364990234375, -0.032867431640625, -0.02923583984375, -0.025604248046875, -0.02197265625, -0.018341064453125, -0.01470947265625, -0.011077880859375, -0.0074462890625, -0.003814697265625, -0.00018310546875, 0.003448486328125, 0.007080078125, 0.010711669921875, 0.01434326171875, 0.017974853515625, 0.0216064453125, 0.025238037109375, 0.02886962890625, 0.032501220703125, 0.0361328125, 0.039764404296875, 0.04339599609375, 0.047027587890625, 0.0506591796875, 0.054290771484375, 0.05792236328125, 0.061553955078125, 0.065185546875, 0.068817138671875, 0.07244873046875, 0.076080322265625, 0.0797119140625, 0.083343505859375, 0.08697509765625, 0.090606689453125, 0.09423828125, 0.097869873046875, 0.10150146484375, 0.105133056640625, 0.1087646484375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 3.0, 0.0, 2.0, 5.0, 5.0, 10.0, 11.0, 9.0, 14.0, 17.0, 21.0, 27.0, 29.0, 30.0, 42.0, 36.0, 44.0, 47.0, 40.0, 48.0, 52.0, 54.0, 47.0, 46.0, 43.0, 47.0, 52.0, 38.0, 42.0, 26.0, 17.0, 16.0, 14.0, 15.0, 16.0, 11.0, 8.0, 9.0, 2.0, 5.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0966796875, -0.09312629699707031, -0.08957290649414062, -0.08601951599121094, -0.08246612548828125, -0.07891273498535156, -0.07535934448242188, -0.07180595397949219, -0.0682525634765625, -0.06469917297363281, -0.061145782470703125, -0.05759239196777344, -0.05403900146484375, -0.05048561096191406, -0.046932220458984375, -0.04337882995605469, -0.039825439453125, -0.03627204895019531, -0.032718658447265625, -0.029165267944335938, -0.02561187744140625, -0.022058486938476562, -0.018505096435546875, -0.014951705932617188, -0.0113983154296875, -0.007844924926757812, -0.004291534423828125, -0.0007381439208984375, 0.00281524658203125, 0.0063686370849609375, 0.009922027587890625, 0.013475418090820312, 0.01702880859375, 0.020582199096679688, 0.024135589599609375, 0.027688980102539062, 0.03124237060546875, 0.03479576110839844, 0.038349151611328125, 0.04190254211425781, 0.0454559326171875, 0.04900932312011719, 0.052562713623046875, 0.05611610412597656, 0.05966949462890625, 0.06322288513183594, 0.06677627563476562, 0.07032966613769531, 0.073883056640625, 0.07743644714355469, 0.08098983764648438, 0.08454322814941406, 0.08809661865234375, 0.09165000915527344, 0.09520339965820312, 0.09875679016113281, 0.1023101806640625, 0.10586357116699219, 0.10941696166992188, 0.11297035217285156, 0.11652374267578125, 0.12007713317871094, 0.12363052368164062, 0.1271839141845703, 0.1307373046875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 5.0, 10.0, 11.0, 14.0, 34.0, 48.0, 68.0, 95.0, 191.0, 239.0, 531.0, 1054.0, 2345.0, 6162.0, 22586.0, 126141.0, 690588.0, 159301.0, 27021.0, 7087.0, 2612.0, 1129.0, 527.0, 307.0, 148.0, 98.0, 61.0, 46.0, 31.0, 14.0, 21.0, 4.0, 9.0, 5.0, 5.0, 7.0, 1.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10693359375, -0.10290718078613281, -0.09888076782226562, -0.09485435485839844, -0.09082794189453125, -0.08680152893066406, -0.08277511596679688, -0.07874870300292969, -0.0747222900390625, -0.07069587707519531, -0.06666946411132812, -0.06264305114746094, -0.05861663818359375, -0.05459022521972656, -0.050563812255859375, -0.04653739929199219, -0.042510986328125, -0.03848457336425781, -0.034458160400390625, -0.030431747436523438, -0.02640533447265625, -0.022378921508789062, -0.018352508544921875, -0.014326095581054688, -0.0102996826171875, -0.0062732696533203125, -0.002246856689453125, 0.0017795562744140625, 0.00580596923828125, 0.009832382202148438, 0.013858795166015625, 0.017885208129882812, 0.02191162109375, 0.025938034057617188, 0.029964447021484375, 0.03399085998535156, 0.03801727294921875, 0.04204368591308594, 0.046070098876953125, 0.05009651184082031, 0.0541229248046875, 0.05814933776855469, 0.062175750732421875, 0.06620216369628906, 0.07022857666015625, 0.07425498962402344, 0.07828140258789062, 0.08230781555175781, 0.086334228515625, 0.09036064147949219, 0.09438705444335938, 0.09841346740722656, 0.10243988037109375, 0.10646629333496094, 0.11049270629882812, 0.11451911926269531, 0.1185455322265625, 0.12257194519042969, 0.12659835815429688, 0.13062477111816406, 0.13465118408203125, 0.13867759704589844, 0.14270401000976562, 0.1467304229736328, 0.1507568359375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 3.0, 5.0, 4.0, 10.0, 10.0, 15.0, 13.0, 12.0, 22.0, 35.0, 45.0, 48.0, 50.0, 59.0, 71.0, 61.0, 78.0, 75.0, 67.0, 82.0, 39.0, 42.0, 25.0, 29.0, 16.0, 14.0, 12.0, 16.0, 11.0, 8.0, 5.0, 4.0, 3.0, 3.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.029273986816406e-05, -3.8689933717250824e-05, -3.7087127566337585e-05, -3.548432141542435e-05, -3.388151526451111e-05, -3.227870911359787e-05, -3.067590296268463e-05, -2.9073096811771393e-05, -2.7470290660858154e-05, -2.5867484509944916e-05, -2.4264678359031677e-05, -2.266187220811844e-05, -2.10590660572052e-05, -1.945625990629196e-05, -1.7853453755378723e-05, -1.6250647604465485e-05, -1.4647841453552246e-05, -1.3045035302639008e-05, -1.1442229151725769e-05, -9.83942300081253e-06, -8.236616849899292e-06, -6.6338106989860535e-06, -5.031004548072815e-06, -3.4281983971595764e-06, -1.8253922462463379e-06, -2.2258609533309937e-07, 1.3802200555801392e-06, 2.9830262064933777e-06, 4.585832357406616e-06, 6.188638508319855e-06, 7.791444659233093e-06, 9.394250810146332e-06, 1.099705696105957e-05, 1.2599863111972809e-05, 1.4202669262886047e-05, 1.5805475413799286e-05, 1.7408281564712524e-05, 1.9011087715625763e-05, 2.0613893866539e-05, 2.221670001745224e-05, 2.381950616836548e-05, 2.5422312319278717e-05, 2.7025118470191956e-05, 2.8627924621105194e-05, 3.0230730772018433e-05, 3.183353692293167e-05, 3.343634307384491e-05, 3.503914922475815e-05, 3.664195537567139e-05, 3.8244761526584625e-05, 3.9847567677497864e-05, 4.14503738284111e-05, 4.305317997932434e-05, 4.465598613023758e-05, 4.625879228115082e-05, 4.7861598432064056e-05, 4.9464404582977295e-05, 5.1067210733890533e-05, 5.267001688480377e-05, 5.427282303571701e-05, 5.587562918663025e-05, 5.747843533754349e-05, 5.9081241488456726e-05, 6.0684047639369965e-05, 6.22868537902832e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 4.0, 10.0, 15.0, 12.0, 24.0, 23.0, 30.0, 55.0, 59.0, 106.0, 121.0, 190.0, 300.0, 518.0, 943.0, 1970.0, 4132.0, 9323.0, 24855.0, 81671.0, 370543.0, 417370.0, 90700.0, 26846.0, 9908.0, 4311.0, 1945.0, 1055.0, 528.0, 321.0, 212.0, 135.0, 85.0, 63.0, 43.0, 33.0, 22.0, 16.0, 12.0, 18.0, 7.0, 9.0, 4.0, 2.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.071044921875, -0.0686798095703125, -0.066314697265625, -0.0639495849609375, -0.06158447265625, -0.0592193603515625, -0.056854248046875, -0.0544891357421875, -0.0521240234375, -0.0497589111328125, -0.047393798828125, -0.0450286865234375, -0.04266357421875, -0.0402984619140625, -0.037933349609375, -0.0355682373046875, -0.033203125, -0.0308380126953125, -0.028472900390625, -0.0261077880859375, -0.02374267578125, -0.0213775634765625, -0.019012451171875, -0.0166473388671875, -0.0142822265625, -0.0119171142578125, -0.009552001953125, -0.0071868896484375, -0.00482177734375, -0.0024566650390625, -9.1552734375e-05, 0.0022735595703125, 0.004638671875, 0.0070037841796875, 0.009368896484375, 0.0117340087890625, 0.01409912109375, 0.0164642333984375, 0.018829345703125, 0.0211944580078125, 0.0235595703125, 0.0259246826171875, 0.028289794921875, 0.0306549072265625, 0.03302001953125, 0.0353851318359375, 0.037750244140625, 0.0401153564453125, 0.04248046875, 0.0448455810546875, 0.047210693359375, 0.0495758056640625, 0.05194091796875, 0.0543060302734375, 0.056671142578125, 0.0590362548828125, 0.0614013671875, 0.0637664794921875, 0.066131591796875, 0.0684967041015625, 0.07086181640625, 0.0732269287109375, 0.075592041015625, 0.0779571533203125, 0.080322265625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 5.0, 0.0, 6.0, 5.0, 7.0, 3.0, 9.0, 10.0, 7.0, 11.0, 23.0, 31.0, 32.0, 33.0, 40.0, 58.0, 87.0, 116.0, 113.0, 82.0, 74.0, 62.0, 35.0, 32.0, 23.0, 20.0, 15.0, 8.0, 11.0, 6.0, 7.0, 7.0, 6.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.05633544921875, -0.05446052551269531, -0.052585601806640625, -0.05071067810058594, -0.04883575439453125, -0.04696083068847656, -0.045085906982421875, -0.04321098327636719, -0.0413360595703125, -0.03946113586425781, -0.037586212158203125, -0.03571128845214844, -0.03383636474609375, -0.03196144104003906, -0.030086517333984375, -0.028211593627929688, -0.026336669921875, -0.024461746215820312, -0.022586822509765625, -0.020711898803710938, -0.01883697509765625, -0.016962051391601562, -0.015087127685546875, -0.013212203979492188, -0.0113372802734375, -0.009462356567382812, -0.007587432861328125, -0.0057125091552734375, -0.00383758544921875, -0.0019626617431640625, -8.7738037109375e-05, 0.0017871856689453125, 0.003662109375, 0.0055370330810546875, 0.007411956787109375, 0.009286880493164062, 0.01116180419921875, 0.013036727905273438, 0.014911651611328125, 0.016786575317382812, 0.0186614990234375, 0.020536422729492188, 0.022411346435546875, 0.024286270141601562, 0.02616119384765625, 0.028036117553710938, 0.029911041259765625, 0.03178596496582031, 0.033660888671875, 0.03553581237792969, 0.037410736083984375, 0.03928565979003906, 0.04116058349609375, 0.04303550720214844, 0.044910430908203125, 0.04678535461425781, 0.0486602783203125, 0.05053520202636719, 0.052410125732421875, 0.05428504943847656, 0.05615997314453125, 0.05803489685058594, 0.059909820556640625, 0.06178474426269531, 0.06365966796875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 7.0, 13.0, 17.0, 32.0, 42.0, 64.0, 101.0, 136.0, 126.0, 137.0, 99.0, 100.0, 54.0, 32.0, 12.0, 13.0, 10.0, 10.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.45304882526397705, -0.4243328273296356, -0.3956168293952942, -0.36690086126327515, -0.3381848633289337, -0.3094688653945923, -0.28075286746025085, -0.2520368695259094, -0.2233208864927292, -0.19460488855838776, -0.16588890552520752, -0.1371729075908661, -0.10845691710710526, -0.07974092662334442, -0.05102492868900299, -0.022308945655822754, 0.006407052278518677, 0.03512304276227951, 0.06383903324604034, 0.09255503118038177, 0.12127102166414261, 0.14998701214790344, 0.17870301008224487, 0.2074189931154251, 0.23613499104976654, 0.2648509740829468, 0.2935669720172882, 0.32228296995162964, 0.35099896788597107, 0.3797149658203125, 0.40843093395233154, 0.437146931886673, 0.4658629298210144, 0.49457892775535583, 0.5232949256896973, 0.5520108938217163, 0.5807269215583801, 0.6094428896903992, 0.638158917427063, 0.666874885559082, 0.6955908536911011, 0.7243068218231201, 0.7530228495597839, 0.781738817691803, 0.8104548454284668, 0.8391708135604858, 0.8678867816925049, 0.8966028094291687, 0.9253188371658325, 0.9540348052978516, 0.9827508330345154, 1.0114668607711792, 1.0401828289031982, 1.0688987970352173, 1.0976147651672363, 1.1263307332992554, 1.1550467014312744, 1.1837626695632935, 1.2124786376953125, 1.241194725036621, 1.2699106931686401, 1.2986266613006592, 1.3273426294326782, 1.3560585975646973, 1.3847746849060059]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 10.0, 4.0, 4.0, 15.0, 3.0, 14.0, 5.0, 26.0, 17.0, 22.0, 22.0, 32.0, 34.0, 26.0, 43.0, 25.0, 43.0, 41.0, 42.0, 46.0, 42.0, 46.0, 29.0, 43.0, 40.0, 50.0, 35.0, 38.0, 31.0, 24.0, 21.0, 25.0, 20.0, 17.0, 18.0, 6.0, 10.0, 5.0, 7.0, 8.0, 6.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0], "bins": [-0.6243494153022766, -0.6065165400505066, -0.5886836647987366, -0.5708507895469666, -0.5530179142951965, -0.5351850390434265, -0.5173521637916565, -0.4995192885398865, -0.48168641328811646, -0.46385353803634644, -0.4460206627845764, -0.4281877875328064, -0.4103549122810364, -0.39252203702926636, -0.37468916177749634, -0.3568562865257263, -0.3390234410762787, -0.32119056582450867, -0.30335769057273865, -0.28552481532096863, -0.2676919400691986, -0.2498590648174286, -0.23202620446681976, -0.21419332921504974, -0.19636045396327972, -0.1785275787115097, -0.16069470345973969, -0.14286184310913086, -0.12502896785736084, -0.10719608515501022, -0.0893632173538208, -0.07153034210205078, -0.05369746685028076, -0.03586459159851074, -0.01803172007203102, -0.00019884854555130005, 0.01763402670621872, 0.03546690195798874, 0.05329976975917816, 0.07113264501094818, 0.0889655202627182, 0.10679839551448822, 0.12463127076625824, 0.14246413111686707, 0.16029700636863708, 0.1781298816204071, 0.19596275687217712, 0.21379563212394714, 0.23162850737571716, 0.24946138262748718, 0.2672942578792572, 0.2851271331310272, 0.30296000838279724, 0.32079288363456726, 0.3386257290840149, 0.3564586043357849, 0.37429147958755493, 0.39212435483932495, 0.40995723009109497, 0.427790105342865, 0.445622980594635, 0.46345585584640503, 0.48128873109817505, 0.49912160634994507, 0.5169544816017151]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 3.0, 2.0, 1.0, 5.0, 10.0, 5.0, 7.0, 8.0, 9.0, 19.0, 26.0, 36.0, 55.0, 95.0, 121.0, 201.0, 324.0, 453.0, 749.0, 1308.0, 2158.0, 3917.0, 7088.0, 14270.0, 31409.0, 82453.0, 347514.0, 3228096.0, 332643.0, 80347.0, 30450.0, 13848.0, 7079.0, 3866.0, 2226.0, 1307.0, 794.0, 518.0, 305.0, 196.0, 122.0, 81.0, 57.0, 34.0, 26.0, 13.0, 12.0, 14.0, 3.0, 3.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.078369140625, -0.07579898834228516, -0.07322883605957031, -0.07065868377685547, -0.06808853149414062, -0.06551837921142578, -0.06294822692871094, -0.060378074645996094, -0.05780792236328125, -0.055237770080566406, -0.05266761779785156, -0.05009746551513672, -0.047527313232421875, -0.04495716094970703, -0.04238700866699219, -0.039816856384277344, -0.0372467041015625, -0.034676551818847656, -0.03210639953613281, -0.02953624725341797, -0.026966094970703125, -0.02439594268798828, -0.021825790405273438, -0.019255638122558594, -0.01668548583984375, -0.014115333557128906, -0.011545181274414062, -0.008975028991699219, -0.006404876708984375, -0.0038347244262695312, -0.0012645721435546875, 0.0013055801391601562, 0.003875732421875, 0.006445884704589844, 0.009016036987304688, 0.011586189270019531, 0.014156341552734375, 0.01672649383544922, 0.019296646118164062, 0.021866798400878906, 0.02443695068359375, 0.027007102966308594, 0.029577255249023438, 0.03214740753173828, 0.034717559814453125, 0.03728771209716797, 0.03985786437988281, 0.042428016662597656, 0.0449981689453125, 0.047568321228027344, 0.05013847351074219, 0.05270862579345703, 0.055278778076171875, 0.05784893035888672, 0.06041908264160156, 0.0629892349243164, 0.06555938720703125, 0.0681295394897461, 0.07069969177246094, 0.07326984405517578, 0.07583999633789062, 0.07841014862060547, 0.08098030090332031, 0.08355045318603516, 0.08612060546875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 2.0, 6.0, 4.0, 10.0, 4.0, 14.0, 14.0, 14.0, 19.0, 29.0, 31.0, 23.0, 29.0, 33.0, 39.0, 45.0, 51.0, 55.0, 55.0, 45.0, 46.0, 42.0, 61.0, 47.0, 41.0, 35.0, 32.0, 25.0, 39.0, 16.0, 17.0, 13.0, 17.0, 13.0, 6.0, 6.0, 4.0, 4.0, 5.0, 2.0, 1.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.0236358642578125, -0.022953510284423828, -0.022271156311035156, -0.021588802337646484, -0.020906448364257812, -0.02022409439086914, -0.01954174041748047, -0.018859386444091797, -0.018177032470703125, -0.017494678497314453, -0.01681232452392578, -0.01612997055053711, -0.015447616577148438, -0.014765262603759766, -0.014082908630371094, -0.013400554656982422, -0.01271820068359375, -0.012035846710205078, -0.011353492736816406, -0.010671138763427734, -0.009988784790039062, -0.00930643081665039, -0.008624076843261719, -0.007941722869873047, -0.007259368896484375, -0.006577014923095703, -0.005894660949707031, -0.005212306976318359, -0.0045299530029296875, -0.0038475990295410156, -0.0031652450561523438, -0.002482891082763672, -0.001800537109375, -0.0011181831359863281, -0.00043582916259765625, 0.0002465248107910156, 0.0009288787841796875, 0.0016112327575683594, 0.0022935867309570312, 0.002975940704345703, 0.003658294677734375, 0.004340648651123047, 0.005023002624511719, 0.005705356597900391, 0.0063877105712890625, 0.007070064544677734, 0.007752418518066406, 0.008434772491455078, 0.00911712646484375, 0.009799480438232422, 0.010481834411621094, 0.011164188385009766, 0.011846542358398438, 0.01252889633178711, 0.013211250305175781, 0.013893604278564453, 0.014575958251953125, 0.015258312225341797, 0.01594066619873047, 0.01662302017211914, 0.017305374145507812, 0.017987728118896484, 0.018670082092285156, 0.019352436065673828, 0.0200347900390625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 5.0, 7.0, 6.0, 3.0, 13.0, 19.0, 32.0, 32.0, 51.0, 68.0, 122.0, 172.0, 235.0, 375.0, 602.0, 962.0, 1728.0, 3417.0, 7404.0, 19207.0, 58651.0, 264351.0, 3190667.0, 510964.0, 88674.0, 26631.0, 10131.0, 4415.0, 2155.0, 1184.0, 652.0, 426.0, 303.0, 206.0, 126.0, 95.0, 63.0, 40.0, 30.0, 21.0, 19.0, 11.0, 5.0, 0.0, 1.0, 3.0, 0.0, 4.0, 2.0, 3.0, 0.0, 2.0], "bins": [-0.15625, -0.15174102783203125, -0.1472320556640625, -0.14272308349609375, -0.138214111328125, -0.13370513916015625, -0.1291961669921875, -0.12468719482421875, -0.12017822265625, -0.11566925048828125, -0.1111602783203125, -0.10665130615234375, -0.102142333984375, -0.09763336181640625, -0.0931243896484375, -0.08861541748046875, -0.0841064453125, -0.07959747314453125, -0.0750885009765625, -0.07057952880859375, -0.066070556640625, -0.06156158447265625, -0.0570526123046875, -0.05254364013671875, -0.04803466796875, -0.04352569580078125, -0.0390167236328125, -0.03450775146484375, -0.029998779296875, -0.02548980712890625, -0.0209808349609375, -0.01647186279296875, -0.011962890625, -0.00745391845703125, -0.0029449462890625, 0.00156402587890625, 0.006072998046875, 0.01058197021484375, 0.0150909423828125, 0.01959991455078125, 0.02410888671875, 0.02861785888671875, 0.0331268310546875, 0.03763580322265625, 0.042144775390625, 0.04665374755859375, 0.0511627197265625, 0.05567169189453125, 0.0601806640625, 0.06468963623046875, 0.0691986083984375, 0.07370758056640625, 0.078216552734375, 0.08272552490234375, 0.0872344970703125, 0.09174346923828125, 0.09625244140625, 0.10076141357421875, 0.1052703857421875, 0.10977935791015625, 0.114288330078125, 0.11879730224609375, 0.1233062744140625, 0.12781524658203125, 0.13232421875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 5.0, 3.0, 1.0, 2.0, 11.0, 7.0, 6.0, 20.0, 27.0, 43.0, 48.0, 97.0, 203.0, 442.0, 1797.0, 689.0, 286.0, 135.0, 100.0, 55.0, 43.0, 17.0, 15.0, 8.0, 5.0, 2.0, 4.0, 5.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08624267578125, -0.08368206024169922, -0.08112144470214844, -0.07856082916259766, -0.07600021362304688, -0.0734395980834961, -0.07087898254394531, -0.06831836700439453, -0.06575775146484375, -0.06319713592529297, -0.06063652038574219, -0.058075904846191406, -0.055515289306640625, -0.052954673767089844, -0.05039405822753906, -0.04783344268798828, -0.0452728271484375, -0.04271221160888672, -0.04015159606933594, -0.037590980529785156, -0.035030364990234375, -0.032469749450683594, -0.029909133911132812, -0.02734851837158203, -0.02478790283203125, -0.02222728729248047, -0.019666671752929688, -0.017106056213378906, -0.014545440673828125, -0.011984825134277344, -0.009424209594726562, -0.006863594055175781, -0.004302978515625, -0.0017423629760742188, 0.0008182525634765625, 0.0033788681030273438, 0.005939483642578125, 0.008500099182128906, 0.011060714721679688, 0.013621330261230469, 0.01618194580078125, 0.01874256134033203, 0.021303176879882812, 0.023863792419433594, 0.026424407958984375, 0.028985023498535156, 0.03154563903808594, 0.03410625457763672, 0.0366668701171875, 0.03922748565673828, 0.04178810119628906, 0.044348716735839844, 0.046909332275390625, 0.049469947814941406, 0.05203056335449219, 0.05459117889404297, 0.05715179443359375, 0.05971240997314453, 0.06227302551269531, 0.0648336410522461, 0.06739425659179688, 0.06995487213134766, 0.07251548767089844, 0.07507610321044922, 0.07763671875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 9.0, 31.0, 87.0, 192.0, 267.0, 242.0, 112.0, 48.0, 8.0, 6.0, 1.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5530012249946594, -0.5230609178543091, -0.49312061071395874, -0.4631803035736084, -0.43323999643325806, -0.4032996892929077, -0.3733593821525574, -0.34341907501220703, -0.3134787678718567, -0.28353846073150635, -0.253598153591156, -0.22365784645080566, -0.19371753931045532, -0.16377723217010498, -0.13383692502975464, -0.1038966178894043, -0.07395631074905396, -0.04401600360870361, -0.014075696468353271, 0.01586461067199707, 0.04580491781234741, 0.07574522495269775, 0.1056855320930481, 0.13562583923339844, 0.16556614637374878, 0.19550645351409912, 0.22544676065444946, 0.2553870677947998, 0.28532737493515015, 0.3152676820755005, 0.34520798921585083, 0.37514829635620117, 0.4050886631011963, 0.43502897024154663, 0.464969277381897, 0.4949095845222473, 0.5248498916625977, 0.554790198802948, 0.5847305059432983, 0.6146708130836487, 0.644611120223999, 0.6745514273643494, 0.7044917345046997, 0.73443204164505, 0.7643723487854004, 0.7943126559257507, 0.8242529630661011, 0.8541932702064514, 0.8841335773468018, 0.9140738844871521, 0.9440141916275024, 0.9739544987678528, 1.0038948059082031, 1.0338351726531982, 1.0637754201889038, 1.0937156677246094, 1.1236560344696045, 1.1535964012145996, 1.1835366487503052, 1.2134768962860107, 1.2434172630310059, 1.273357629776001, 1.3032978773117065, 1.333238124847412, 1.3631784915924072]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 5.0, 6.0, 6.0, 6.0, 6.0, 11.0, 10.0, 10.0, 15.0, 28.0, 14.0, 21.0, 37.0, 32.0, 42.0, 38.0, 34.0, 35.0, 36.0, 40.0, 46.0, 47.0, 45.0, 38.0, 38.0, 42.0, 31.0, 35.0, 36.0, 19.0, 31.0, 22.0, 22.0, 19.0, 10.0, 12.0, 12.0, 14.0, 12.0, 8.0, 9.0, 4.0, 4.0, 6.0, 2.0, 3.0, 6.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.20667040348052979, -0.19992177188396454, -0.1931731402873993, -0.18642450869083405, -0.1796758770942688, -0.17292724549770355, -0.1661786139011383, -0.15942999720573425, -0.1526813507080078, -0.14593271911144257, -0.13918408751487732, -0.13243545591831207, -0.12568682432174683, -0.11893819272518158, -0.11218956857919693, -0.10544093698263168, -0.09869231283664703, -0.09194368124008179, -0.08519504964351654, -0.0784464180469513, -0.07169778645038605, -0.0649491548538208, -0.05820053070783615, -0.051451899111270905, -0.04470326751470566, -0.03795463591814041, -0.031206006184220314, -0.024457376450300217, -0.01770874485373497, -0.010960113257169724, -0.004211485385894775, 0.002537146210670471, 0.009285777807235718, 0.016034409403800964, 0.02278303913772106, 0.02953166887164116, 0.036280300468206406, 0.04302893206477165, 0.0497775599360466, 0.05652619153261185, 0.0632748231291771, 0.07002345472574234, 0.07677208632230759, 0.08352071046829224, 0.09026934206485748, 0.09701797366142273, 0.10376660525798798, 0.11051523685455322, 0.11726386845111847, 0.12401250004768372, 0.13076113164424896, 0.1375097632408142, 0.14425839483737946, 0.1510070264339447, 0.15775564312934875, 0.1645042896270752, 0.17125290632247925, 0.1780015379190445, 0.18475016951560974, 0.191498801112175, 0.19824743270874023, 0.20499606430530548, 0.21174469590187073, 0.21849331259727478, 0.22524195909500122]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 8.0, 8.0, 11.0, 28.0, 25.0, 46.0, 62.0, 111.0, 175.0, 251.0, 347.0, 602.0, 939.0, 1554.0, 2488.0, 4323.0, 7165.0, 12326.0, 21456.0, 36904.0, 64043.0, 115578.0, 229409.0, 253454.0, 128815.0, 70663.0, 40944.0, 23226.0, 13731.0, 7911.0, 4626.0, 2834.0, 1695.0, 1036.0, 646.0, 408.0, 252.0, 158.0, 96.0, 88.0, 26.0, 25.0, 22.0, 12.0, 8.0, 8.0, 5.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.071533203125, -0.06915569305419922, -0.06677818298339844, -0.06440067291259766, -0.062023162841796875, -0.059645652770996094, -0.05726814270019531, -0.05489063262939453, -0.05251312255859375, -0.05013561248779297, -0.04775810241699219, -0.045380592346191406, -0.043003082275390625, -0.040625572204589844, -0.03824806213378906, -0.03587055206298828, -0.0334930419921875, -0.03111553192138672, -0.028738021850585938, -0.026360511779785156, -0.023983001708984375, -0.021605491638183594, -0.019227981567382812, -0.01685047149658203, -0.01447296142578125, -0.012095451354980469, -0.009717941284179688, -0.007340431213378906, -0.004962921142578125, -0.0025854110717773438, -0.0002079010009765625, 0.0021696090698242188, 0.004547119140625, 0.006924629211425781, 0.009302139282226562, 0.011679649353027344, 0.014057159423828125, 0.016434669494628906, 0.018812179565429688, 0.02118968963623047, 0.02356719970703125, 0.02594470977783203, 0.028322219848632812, 0.030699729919433594, 0.033077239990234375, 0.035454750061035156, 0.03783226013183594, 0.04020977020263672, 0.0425872802734375, 0.04496479034423828, 0.04734230041503906, 0.049719810485839844, 0.052097320556640625, 0.054474830627441406, 0.05685234069824219, 0.05922985076904297, 0.06160736083984375, 0.06398487091064453, 0.06636238098144531, 0.0687398910522461, 0.07111740112304688, 0.07349491119384766, 0.07587242126464844, 0.07824993133544922, 0.08062744140625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 6.0, 8.0, 5.0, 12.0, 5.0, 13.0, 18.0, 23.0, 15.0, 19.0, 22.0, 18.0, 35.0, 31.0, 36.0, 35.0, 38.0, 43.0, 43.0, 43.0, 42.0, 52.0, 33.0, 53.0, 41.0, 36.0, 30.0, 32.0, 29.0, 22.0, 26.0, 27.0, 18.0, 17.0, 10.0, 9.0, 9.0, 6.0, 9.0, 7.0, 8.0, 4.0, 3.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.0221099853515625, -0.021448612213134766, -0.02078723907470703, -0.020125865936279297, -0.019464492797851562, -0.018803119659423828, -0.018141746520996094, -0.01748037338256836, -0.016819000244140625, -0.01615762710571289, -0.015496253967285156, -0.014834880828857422, -0.014173507690429688, -0.013512134552001953, -0.012850761413574219, -0.012189388275146484, -0.01152801513671875, -0.010866641998291016, -0.010205268859863281, -0.009543895721435547, -0.008882522583007812, -0.008221149444580078, -0.007559776306152344, -0.006898403167724609, -0.006237030029296875, -0.005575656890869141, -0.004914283752441406, -0.004252910614013672, -0.0035915374755859375, -0.002930164337158203, -0.0022687911987304688, -0.0016074180603027344, -0.000946044921875, -0.0002846717834472656, 0.00037670135498046875, 0.0010380744934082031, 0.0016994476318359375, 0.002360820770263672, 0.0030221939086914062, 0.0036835670471191406, 0.004344940185546875, 0.005006313323974609, 0.005667686462402344, 0.006329059600830078, 0.0069904327392578125, 0.007651805877685547, 0.008313179016113281, 0.008974552154541016, 0.00963592529296875, 0.010297298431396484, 0.010958671569824219, 0.011620044708251953, 0.012281417846679688, 0.012942790985107422, 0.013604164123535156, 0.01426553726196289, 0.014926910400390625, 0.01558828353881836, 0.016249656677246094, 0.016911029815673828, 0.017572402954101562, 0.018233776092529297, 0.01889514923095703, 0.019556522369384766, 0.0202178955078125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 6.0, 6.0, 4.0, 8.0, 14.0, 21.0, 27.0, 44.0, 55.0, 101.0, 176.0, 308.0, 455.0, 819.0, 1565.0, 3591.0, 10891.0, 44515.0, 255486.0, 601776.0, 97470.0, 20538.0, 5886.0, 2225.0, 1076.0, 535.0, 338.0, 216.0, 132.0, 103.0, 56.0, 44.0, 20.0, 16.0, 13.0, 8.0, 7.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.21923828125, -0.21264266967773438, -0.20604705810546875, -0.19945144653320312, -0.1928558349609375, -0.18626022338867188, -0.17966461181640625, -0.17306900024414062, -0.166473388671875, -0.15987777709960938, -0.15328216552734375, -0.14668655395507812, -0.1400909423828125, -0.13349533081054688, -0.12689971923828125, -0.12030410766601562, -0.11370849609375, -0.10711288452148438, -0.10051727294921875, -0.09392166137695312, -0.0873260498046875, -0.08073043823242188, -0.07413482666015625, -0.06753921508789062, -0.060943603515625, -0.054347991943359375, -0.04775238037109375, -0.041156768798828125, -0.0345611572265625, -0.027965545654296875, -0.02136993408203125, -0.014774322509765625, -0.0081787109375, -0.001583099365234375, 0.00501251220703125, 0.011608123779296875, 0.0182037353515625, 0.024799346923828125, 0.03139495849609375, 0.037990570068359375, 0.044586181640625, 0.051181793212890625, 0.05777740478515625, 0.06437301635742188, 0.0709686279296875, 0.07756423950195312, 0.08415985107421875, 0.09075546264648438, 0.09735107421875, 0.10394668579101562, 0.11054229736328125, 0.11713790893554688, 0.1237335205078125, 0.13032913208007812, 0.13692474365234375, 0.14352035522460938, 0.150115966796875, 0.15671157836914062, 0.16330718994140625, 0.16990280151367188, 0.1764984130859375, 0.18309402465820312, 0.18968963623046875, 0.19628524780273438, 0.202880859375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 5.0, 7.0, 4.0, 13.0, 17.0, 12.0, 15.0, 24.0, 29.0, 26.0, 45.0, 41.0, 41.0, 52.0, 55.0, 54.0, 62.0, 52.0, 60.0, 52.0, 51.0, 49.0, 35.0, 40.0, 24.0, 24.0, 27.0, 13.0, 19.0, 13.0, 16.0, 10.0, 4.0, 3.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1402587890625, -0.13572311401367188, -0.13118743896484375, -0.12665176391601562, -0.1221160888671875, -0.11758041381835938, -0.11304473876953125, -0.10850906372070312, -0.103973388671875, -0.09943771362304688, -0.09490203857421875, -0.09036636352539062, -0.0858306884765625, -0.08129501342773438, -0.07675933837890625, -0.07222366333007812, -0.06768798828125, -0.06315231323242188, -0.05861663818359375, -0.054080963134765625, -0.0495452880859375, -0.045009613037109375, -0.04047393798828125, -0.035938262939453125, -0.031402587890625, -0.026866912841796875, -0.02233123779296875, -0.017795562744140625, -0.0132598876953125, -0.008724212646484375, -0.00418853759765625, 0.000347137451171875, 0.0048828125, 0.009418487548828125, 0.01395416259765625, 0.018489837646484375, 0.0230255126953125, 0.027561187744140625, 0.03209686279296875, 0.036632537841796875, 0.041168212890625, 0.045703887939453125, 0.05023956298828125, 0.054775238037109375, 0.0593109130859375, 0.06384658813476562, 0.06838226318359375, 0.07291793823242188, 0.07745361328125, 0.08198928833007812, 0.08652496337890625, 0.09106063842773438, 0.0955963134765625, 0.10013198852539062, 0.10466766357421875, 0.10920333862304688, 0.113739013671875, 0.11827468872070312, 0.12281036376953125, 0.12734603881835938, 0.1318817138671875, 0.13641738891601562, 0.14095306396484375, 0.14548873901367188, 0.1500244140625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 4.0, 3.0, 4.0, 10.0, 15.0, 12.0, 24.0, 23.0, 46.0, 46.0, 91.0, 182.0, 400.0, 1393.0, 8778.0, 374379.0, 649929.0, 10607.0, 1606.0, 519.0, 197.0, 93.0, 51.0, 34.0, 31.0, 21.0, 22.0, 16.0, 8.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.490478515625, -0.4764823913574219, -0.46248626708984375, -0.4484901428222656, -0.4344940185546875, -0.4204978942871094, -0.40650177001953125, -0.3925056457519531, -0.378509521484375, -0.3645133972167969, -0.35051727294921875, -0.3365211486816406, -0.3225250244140625, -0.3085289001464844, -0.29453277587890625, -0.2805366516113281, -0.26654052734375, -0.2525444030761719, -0.23854827880859375, -0.22455215454101562, -0.2105560302734375, -0.19655990600585938, -0.18256378173828125, -0.16856765747070312, -0.154571533203125, -0.14057540893554688, -0.12657928466796875, -0.11258316040039062, -0.0985870361328125, -0.08459091186523438, -0.07059478759765625, -0.056598663330078125, -0.0426025390625, -0.028606414794921875, -0.01461029052734375, -0.000614166259765625, 0.0133819580078125, 0.027378082275390625, 0.04137420654296875, 0.055370330810546875, 0.069366455078125, 0.08336257934570312, 0.09735870361328125, 0.11135482788085938, 0.1253509521484375, 0.13934707641601562, 0.15334320068359375, 0.16733932495117188, 0.18133544921875, 0.19533157348632812, 0.20932769775390625, 0.22332382202148438, 0.2373199462890625, 0.2513160705566406, 0.26531219482421875, 0.2793083190917969, 0.293304443359375, 0.3073005676269531, 0.32129669189453125, 0.3352928161621094, 0.3492889404296875, 0.3632850646972656, 0.37728118896484375, 0.3912773132324219, 0.4052734375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 5.0, 7.0, 13.0, 5.0, 18.0, 22.0, 28.0, 44.0, 62.0, 79.0, 100.0, 85.0, 100.0, 65.0, 90.0, 74.0, 56.0, 42.0, 25.0, 30.0, 14.0, 10.0, 10.0, 5.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.429983139038086e-05, -5.22444024682045e-05, -5.018897354602814e-05, -4.8133544623851776e-05, -4.6078115701675415e-05, -4.4022686779499054e-05, -4.196725785732269e-05, -3.991182893514633e-05, -3.785640001296997e-05, -3.580097109079361e-05, -3.374554216861725e-05, -3.169011324644089e-05, -2.9634684324264526e-05, -2.7579255402088165e-05, -2.5523826479911804e-05, -2.3468397557735443e-05, -2.1412968635559082e-05, -1.935753971338272e-05, -1.730211079120636e-05, -1.5246681869029999e-05, -1.3191252946853638e-05, -1.1135824024677277e-05, -9.080395102500916e-06, -7.0249661803245544e-06, -4.969537258148193e-06, -2.9141083359718323e-06, -8.586794137954712e-07, 1.1967495083808899e-06, 3.252178430557251e-06, 5.307607352733612e-06, 7.363036274909973e-06, 9.418465197086334e-06, 1.1473894119262695e-05, 1.3529323041439056e-05, 1.5584751963615417e-05, 1.764018088579178e-05, 1.969560980796814e-05, 2.17510387301445e-05, 2.3806467652320862e-05, 2.5861896574497223e-05, 2.7917325496673584e-05, 2.9972754418849945e-05, 3.2028183341026306e-05, 3.408361226320267e-05, 3.613904118537903e-05, 3.819447010755539e-05, 4.024989902973175e-05, 4.230532795190811e-05, 4.436075687408447e-05, 4.6416185796260834e-05, 4.8471614718437195e-05, 5.0527043640613556e-05, 5.258247256278992e-05, 5.463790148496628e-05, 5.669333040714264e-05, 5.8748759329319e-05, 6.080418825149536e-05, 6.285961717367172e-05, 6.491504609584808e-05, 6.697047501802444e-05, 6.90259039402008e-05, 7.108133286237717e-05, 7.313676178455353e-05, 7.519219070672989e-05, 7.724761962890625e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 4.0, 4.0, 6.0, 6.0, 9.0, 18.0, 11.0, 23.0, 33.0, 49.0, 50.0, 86.0, 132.0, 217.0, 460.0, 871.0, 1874.0, 5280.0, 27694.0, 739424.0, 250553.0, 15071.0, 3631.0, 1421.0, 652.0, 339.0, 216.0, 133.0, 84.0, 45.0, 47.0, 28.0, 19.0, 21.0, 13.0, 7.0, 5.0, 2.0, 1.0, 6.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 4.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2119140625, -0.20402145385742188, -0.19612884521484375, -0.18823623657226562, -0.1803436279296875, -0.17245101928710938, -0.16455841064453125, -0.15666580200195312, -0.148773193359375, -0.14088058471679688, -0.13298797607421875, -0.12509536743164062, -0.1172027587890625, -0.10931015014648438, -0.10141754150390625, -0.09352493286132812, -0.08563232421875, -0.07773971557617188, -0.06984710693359375, -0.061954498291015625, -0.0540618896484375, -0.046169281005859375, -0.03827667236328125, -0.030384063720703125, -0.022491455078125, -0.014598846435546875, -0.00670623779296875, 0.001186370849609375, 0.0090789794921875, 0.016971588134765625, 0.02486419677734375, 0.032756805419921875, 0.0406494140625, 0.048542022705078125, 0.05643463134765625, 0.06432723999023438, 0.0722198486328125, 0.08011245727539062, 0.08800506591796875, 0.09589767456054688, 0.103790283203125, 0.11168289184570312, 0.11957550048828125, 0.12746810913085938, 0.1353607177734375, 0.14325332641601562, 0.15114593505859375, 0.15903854370117188, 0.16693115234375, 0.17482376098632812, 0.18271636962890625, 0.19060897827148438, 0.1985015869140625, 0.20639419555664062, 0.21428680419921875, 0.22217941284179688, 0.230072021484375, 0.23796463012695312, 0.24585723876953125, 0.2537498474121094, 0.2616424560546875, 0.2695350646972656, 0.27742767333984375, 0.2853202819824219, 0.293212890625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 7.0, 13.0, 9.0, 37.0, 38.0, 84.0, 121.0, 208.0, 205.0, 112.0, 63.0, 30.0, 19.0, 12.0, 6.0, 7.0, 4.0, 4.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.2017822265625, -0.19672775268554688, -0.19167327880859375, -0.18661880493164062, -0.1815643310546875, -0.17650985717773438, -0.17145538330078125, -0.16640090942382812, -0.161346435546875, -0.15629196166992188, -0.15123748779296875, -0.14618301391601562, -0.1411285400390625, -0.13607406616210938, -0.13101959228515625, -0.12596511840820312, -0.12091064453125, -0.11585617065429688, -0.11080169677734375, -0.10574722290039062, -0.1006927490234375, -0.09563827514648438, -0.09058380126953125, -0.08552932739257812, -0.080474853515625, -0.07542037963867188, -0.07036590576171875, -0.06531143188476562, -0.0602569580078125, -0.055202484130859375, -0.05014801025390625, -0.045093536376953125, -0.0400390625, -0.034984588623046875, -0.02993011474609375, -0.024875640869140625, -0.0198211669921875, -0.014766693115234375, -0.00971221923828125, -0.004657745361328125, 0.000396728515625, 0.005451202392578125, 0.01050567626953125, 0.015560150146484375, 0.0206146240234375, 0.025669097900390625, 0.03072357177734375, 0.035778045654296875, 0.04083251953125, 0.045886993408203125, 0.05094146728515625, 0.055995941162109375, 0.0610504150390625, 0.06610488891601562, 0.07115936279296875, 0.07621383666992188, 0.081268310546875, 0.08632278442382812, 0.09137725830078125, 0.09643173217773438, 0.1014862060546875, 0.10654067993164062, 0.11159515380859375, 0.11664962768554688, 0.1217041015625]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 9.0, 20.0, 26.0, 55.0, 86.0, 144.0, 191.0, 166.0, 151.0, 69.0, 40.0, 22.0, 14.0, 6.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.904351830482483, -1.8404170274734497, -1.776482343673706, -1.7125475406646729, -1.6486128568649292, -1.584678053855896, -1.5207433700561523, -1.4568085670471191, -1.392873764038086, -1.3289389610290527, -1.265004277229309, -1.2010694742202759, -1.1371347904205322, -1.073199987411499, -1.0092651844024658, -0.9453305006027222, -0.8813958168029785, -0.8174610733985901, -0.7535263299942017, -0.6895915269851685, -0.6256568431854248, -0.5617220401763916, -0.4977872967720032, -0.43385255336761475, -0.3699178099632263, -0.3059830665588379, -0.24204830825328827, -0.17811354994773865, -0.11417880654335022, -0.05024406313896179, 0.013690710067749023, 0.07762545347213745, 0.14156031608581543, 0.20549505949020386, 0.2694298028945923, 0.3333645761013031, 0.39729931950569153, 0.46123406291007996, 0.5251688361167908, 0.5891035795211792, 0.6530383229255676, 0.716973066329956, 0.7809078097343445, 0.8448425531387329, 0.9087773561477661, 0.9727120399475098, 1.036646842956543, 1.1005816459655762, 1.1645163297653198, 1.228451132774353, 1.2923858165740967, 1.3563206195831299, 1.4202553033828735, 1.4841901063919067, 1.5481247901916504, 1.6120595932006836, 1.6759943962097168, 1.73992919921875, 1.8038638830184937, 1.8677986860275269, 1.9317333698272705, 1.9956681728363037, 2.059602975845337, 2.123537540435791, 2.187472343444824]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 5.0, 1.0, 11.0, 8.0, 15.0, 12.0, 14.0, 23.0, 18.0, 26.0, 32.0, 40.0, 43.0, 48.0, 46.0, 55.0, 51.0, 76.0, 58.0, 55.0, 46.0, 37.0, 46.0, 32.0, 34.0, 34.0, 29.0, 18.0, 22.0, 16.0, 17.0, 8.0, 7.0, 4.0, 5.0, 2.0, 6.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.694084107875824, -0.6658458113670349, -0.6376074552536011, -0.609369158744812, -0.581130862236023, -0.5528925061225891, -0.5246542096138, -0.4964158833026886, -0.46817755699157715, -0.4399392306804657, -0.41170090436935425, -0.3834626078605652, -0.35522428154945374, -0.3269859552383423, -0.2987476587295532, -0.2705093324184418, -0.24227100610733032, -0.21403267979621887, -0.18579436838626862, -0.15755605697631836, -0.1293177306652069, -0.10107940435409546, -0.0728410929441452, -0.044602781534194946, -0.016364455223083496, 0.011873863637447357, 0.04011218249797821, 0.06835050135850906, 0.09658882021903992, 0.12482714653015137, 0.15306545794010162, 0.18130376935005188, 0.20954203605651855, 0.23778036236763, 0.26601868867874146, 0.2942569851875305, 0.32249531149864197, 0.3507336378097534, 0.3789719343185425, 0.40721026062965393, 0.4354485869407654, 0.46368691325187683, 0.4919252395629883, 0.5201635360717773, 0.5484018325805664, 0.5766401886940002, 0.6048784852027893, 0.6331168413162231, 0.6613551378250122, 0.6895934343338013, 0.7178317904472351, 0.7460700869560242, 0.774308443069458, 0.8025467395782471, 0.8307850360870361, 0.8590233325958252, 0.887261688709259, 0.9154999852180481, 0.9437383413314819, 0.971976637840271, 1.00021493434906, 1.0284533500671387, 1.0566916465759277, 1.0849299430847168, 1.1131682395935059]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 3.0, 7.0, 11.0, 15.0, 26.0, 42.0, 47.0, 80.0, 114.0, 209.0, 342.0, 544.0, 959.0, 1677.0, 3120.0, 6173.0, 13961.0, 34089.0, 101128.0, 525630.0, 3132314.0, 259427.0, 67353.0, 24888.0, 10825.0, 5152.0, 2608.0, 1434.0, 826.0, 487.0, 285.0, 162.0, 121.0, 68.0, 64.0, 33.0, 19.0, 11.0, 12.0, 6.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1170654296875, -0.11365509033203125, -0.1102447509765625, -0.10683441162109375, -0.103424072265625, -0.10001373291015625, -0.0966033935546875, -0.09319305419921875, -0.08978271484375, -0.08637237548828125, -0.0829620361328125, -0.07955169677734375, -0.076141357421875, -0.07273101806640625, -0.0693206787109375, -0.06591033935546875, -0.0625, -0.05908966064453125, -0.0556793212890625, -0.05226898193359375, -0.048858642578125, -0.04544830322265625, -0.0420379638671875, -0.03862762451171875, -0.03521728515625, -0.03180694580078125, -0.0283966064453125, -0.02498626708984375, -0.021575927734375, -0.01816558837890625, -0.0147552490234375, -0.01134490966796875, -0.0079345703125, -0.00452423095703125, -0.0011138916015625, 0.00229644775390625, 0.005706787109375, 0.00911712646484375, 0.0125274658203125, 0.01593780517578125, 0.01934814453125, 0.02275848388671875, 0.0261688232421875, 0.02957916259765625, 0.032989501953125, 0.03639984130859375, 0.0398101806640625, 0.04322052001953125, 0.046630859375, 0.05004119873046875, 0.0534515380859375, 0.05686187744140625, 0.060272216796875, 0.06368255615234375, 0.0670928955078125, 0.07050323486328125, 0.07391357421875, 0.07732391357421875, 0.0807342529296875, 0.08414459228515625, 0.087554931640625, 0.09096527099609375, 0.0943756103515625, 0.09778594970703125, 0.1011962890625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 5.0, 4.0, 10.0, 11.0, 13.0, 18.0, 30.0, 29.0, 33.0, 39.0, 44.0, 58.0, 42.0, 71.0, 61.0, 49.0, 56.0, 59.0, 67.0, 53.0, 47.0, 46.0, 41.0, 30.0, 23.0, 14.0, 9.0, 5.0, 11.0, 6.0, 4.0, 8.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0290374755859375, -0.02801823616027832, -0.02699899673461914, -0.02597975730895996, -0.02496051788330078, -0.0239412784576416, -0.022922039031982422, -0.021902799606323242, -0.020883560180664062, -0.019864320755004883, -0.018845081329345703, -0.017825841903686523, -0.016806602478027344, -0.015787363052368164, -0.014768123626708984, -0.013748884201049805, -0.012729644775390625, -0.011710405349731445, -0.010691165924072266, -0.009671926498413086, -0.008652687072753906, -0.0076334476470947266, -0.006614208221435547, -0.005594968795776367, -0.0045757293701171875, -0.003556489944458008, -0.002537250518798828, -0.0015180110931396484, -0.0004987716674804688, 0.0005204677581787109, 0.0015397071838378906, 0.0025589466094970703, 0.00357818603515625, 0.00459742546081543, 0.005616664886474609, 0.006635904312133789, 0.007655143737792969, 0.008674383163452148, 0.009693622589111328, 0.010712862014770508, 0.011732101440429688, 0.012751340866088867, 0.013770580291748047, 0.014789819717407227, 0.015809059143066406, 0.016828298568725586, 0.017847537994384766, 0.018866777420043945, 0.019886016845703125, 0.020905256271362305, 0.021924495697021484, 0.022943735122680664, 0.023962974548339844, 0.024982213973999023, 0.026001453399658203, 0.027020692825317383, 0.028039932250976562, 0.029059171676635742, 0.030078411102294922, 0.0310976505279541, 0.03211688995361328, 0.03313612937927246, 0.03415536880493164, 0.03517460823059082, 0.03619384765625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 8.0, 10.0, 10.0, 11.0, 19.0, 19.0, 40.0, 65.0, 55.0, 122.0, 144.0, 253.0, 465.0, 728.0, 1412.0, 3045.0, 7997.0, 25504.0, 107731.0, 893390.0, 2896106.0, 196583.0, 40754.0, 11754.0, 4207.0, 1787.0, 855.0, 463.0, 277.0, 157.0, 97.0, 69.0, 56.0, 29.0, 23.0, 13.0, 4.0, 11.0, 8.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.127197265625, -0.12170791625976562, -0.11621856689453125, -0.11072921752929688, -0.1052398681640625, -0.09975051879882812, -0.09426116943359375, -0.08877182006835938, -0.083282470703125, -0.07779312133789062, -0.07230377197265625, -0.06681442260742188, -0.0613250732421875, -0.055835723876953125, -0.05034637451171875, -0.044857025146484375, -0.03936767578125, -0.033878326416015625, -0.02838897705078125, -0.022899627685546875, -0.0174102783203125, -0.011920928955078125, -0.00643157958984375, -0.000942230224609375, 0.004547119140625, 0.010036468505859375, 0.01552581787109375, 0.021015167236328125, 0.0265045166015625, 0.031993865966796875, 0.03748321533203125, 0.042972564697265625, 0.0484619140625, 0.053951263427734375, 0.05944061279296875, 0.06492996215820312, 0.0704193115234375, 0.07590866088867188, 0.08139801025390625, 0.08688735961914062, 0.092376708984375, 0.09786605834960938, 0.10335540771484375, 0.10884475708007812, 0.1143341064453125, 0.11982345581054688, 0.12531280517578125, 0.13080215454101562, 0.13629150390625, 0.14178085327148438, 0.14727020263671875, 0.15275955200195312, 0.1582489013671875, 0.16373825073242188, 0.16922760009765625, 0.17471694946289062, 0.180206298828125, 0.18569564819335938, 0.19118499755859375, 0.19667434692382812, 0.2021636962890625, 0.20765304565429688, 0.21314239501953125, 0.21863174438476562, 0.22412109375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 5.0, 7.0, 11.0, 27.0, 38.0, 44.0, 80.0, 115.0, 209.0, 446.0, 1300.0, 931.0, 329.0, 211.0, 117.0, 55.0, 44.0, 30.0, 19.0, 20.0, 10.0, 3.0, 9.0, 1.0, 7.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1265869140625, -0.123565673828125, -0.12054443359375, -0.117523193359375, -0.114501953125, -0.111480712890625, -0.10845947265625, -0.105438232421875, -0.1024169921875, -0.099395751953125, -0.09637451171875, -0.093353271484375, -0.09033203125, -0.087310791015625, -0.08428955078125, -0.081268310546875, -0.0782470703125, -0.075225830078125, -0.07220458984375, -0.069183349609375, -0.066162109375, -0.063140869140625, -0.06011962890625, -0.057098388671875, -0.0540771484375, -0.051055908203125, -0.04803466796875, -0.045013427734375, -0.0419921875, -0.038970947265625, -0.03594970703125, -0.032928466796875, -0.0299072265625, -0.026885986328125, -0.02386474609375, -0.020843505859375, -0.017822265625, -0.014801025390625, -0.01177978515625, -0.008758544921875, -0.0057373046875, -0.002716064453125, 0.00030517578125, 0.003326416015625, 0.00634765625, 0.009368896484375, 0.01239013671875, 0.015411376953125, 0.0184326171875, 0.021453857421875, 0.02447509765625, 0.027496337890625, 0.030517578125, 0.033538818359375, 0.03656005859375, 0.039581298828125, 0.0426025390625, 0.045623779296875, 0.04864501953125, 0.051666259765625, 0.0546875, 0.057708740234375, 0.06072998046875, 0.063751220703125, 0.0667724609375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 6.0, 13.0, 36.0, 88.0, 114.0, 182.0, 180.0, 167.0, 100.0, 74.0, 24.0, 11.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5478748679161072, -0.5223398208618164, -0.49680474400520325, -0.4712696671485901, -0.4457346200942993, -0.42019957304000854, -0.3946644961833954, -0.3691294193267822, -0.34359437227249146, -0.3180593252182007, -0.2925242483615875, -0.26698917150497437, -0.2414541244506836, -0.21591906249523163, -0.19038400053977966, -0.1648489385843277, -0.13931387662887573, -0.11377881467342377, -0.0882437527179718, -0.06270869076251984, -0.03717362880706787, -0.011638566851615906, 0.01389649510383606, 0.039431557059288025, 0.06496661901473999, 0.09050168097019196, 0.11603674292564392, 0.1415718048810959, 0.16710686683654785, 0.19264192879199982, 0.21817699074745178, 0.24371205270290375, 0.2692471742630005, 0.29478222131729126, 0.3203172981739044, 0.3458523750305176, 0.37138742208480835, 0.3969224691390991, 0.4224575459957123, 0.44799262285232544, 0.4735276699066162, 0.499062716960907, 0.5245977640151978, 0.5501328706741333, 0.5756679177284241, 0.6012029647827148, 0.6267380714416504, 0.6522731184959412, 0.6778081655502319, 0.7033432126045227, 0.7288782596588135, 0.754413366317749, 0.7799484133720398, 0.8054834604263306, 0.8310185670852661, 0.8565536141395569, 0.8820886611938477, 0.9076237082481384, 0.9331587553024292, 0.9586938619613647, 0.9842289090156555, 1.0097639560699463, 1.0352990627288818, 1.0608340501785278, 1.0863691568374634]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 4.0, 2.0, 3.0, 4.0, 9.0, 10.0, 6.0, 13.0, 16.0, 17.0, 17.0, 25.0, 32.0, 38.0, 30.0, 36.0, 45.0, 53.0, 49.0, 57.0, 43.0, 54.0, 48.0, 60.0, 54.0, 34.0, 44.0, 42.0, 32.0, 28.0, 19.0, 16.0, 23.0, 9.0, 12.0, 7.0, 3.0, 5.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29751962423324585, -0.28751102089881897, -0.2775024473667145, -0.2674938440322876, -0.2574852705001831, -0.24747666716575623, -0.23746807873249054, -0.22745949029922485, -0.21745088696479797, -0.2074422985315323, -0.1974337100982666, -0.18742510676383972, -0.17741651833057404, -0.16740792989730835, -0.15739934146404266, -0.14739075303077698, -0.1373821645975113, -0.1273735761642456, -0.11736498028039932, -0.10735639184713364, -0.09734779596328735, -0.08733920753002167, -0.07733061909675598, -0.0673220232129097, -0.05731343477964401, -0.04730484262108803, -0.03729625046253204, -0.027287662029266357, -0.017279069870710373, -0.007270477712154388, 0.0027381107211112976, 0.01274670660495758, 0.022755295038223267, 0.03276388719677925, 0.042772479355335236, 0.05278106778860092, 0.0627896636724472, 0.07279825210571289, 0.08280684053897858, 0.09281543642282486, 0.10282402485609055, 0.11283261328935623, 0.12284120917320251, 0.1328497976064682, 0.1428583860397339, 0.15286698937416077, 0.16287556290626526, 0.17288416624069214, 0.18289275467395782, 0.1929013431072235, 0.2029099315404892, 0.21291851997375488, 0.22292712330818176, 0.23293571174144745, 0.24294430017471313, 0.25295290350914, 0.2629614770412445, 0.2729700803756714, 0.2829786539077759, 0.29298725724220276, 0.30299583077430725, 0.31300443410873413, 0.3230130076408386, 0.3330216109752655, 0.3430302143096924]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 4.0, 5.0, 15.0, 14.0, 16.0, 35.0, 57.0, 77.0, 125.0, 232.0, 392.0, 633.0, 1131.0, 2213.0, 4325.0, 8629.0, 18492.0, 39487.0, 91106.0, 454644.0, 292754.0, 71002.0, 32700.0, 15295.0, 7212.0, 3590.0, 1873.0, 1048.0, 544.0, 325.0, 224.0, 105.0, 98.0, 59.0, 35.0, 19.0, 15.0, 11.0, 5.0, 6.0, 4.0, 0.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.131103515625, -0.12711524963378906, -0.12312698364257812, -0.11913871765136719, -0.11515045166015625, -0.11116218566894531, -0.10717391967773438, -0.10318565368652344, -0.0991973876953125, -0.09520912170410156, -0.09122085571289062, -0.08723258972167969, -0.08324432373046875, -0.07925605773925781, -0.07526779174804688, -0.07127952575683594, -0.067291259765625, -0.06330299377441406, -0.059314727783203125, -0.05532646179199219, -0.05133819580078125, -0.04734992980957031, -0.043361663818359375, -0.03937339782714844, -0.0353851318359375, -0.03139686584472656, -0.027408599853515625, -0.023420333862304688, -0.01943206787109375, -0.015443801879882812, -0.011455535888671875, -0.0074672698974609375, -0.00347900390625, 0.0005092620849609375, 0.004497528076171875, 0.008485794067382812, 0.01247406005859375, 0.016462326049804688, 0.020450592041015625, 0.024438858032226562, 0.0284271240234375, 0.03241539001464844, 0.036403656005859375, 0.04039192199707031, 0.04438018798828125, 0.04836845397949219, 0.052356719970703125, 0.05634498596191406, 0.060333251953125, 0.06432151794433594, 0.06830978393554688, 0.07229804992675781, 0.07628631591796875, 0.08027458190917969, 0.08426284790039062, 0.08825111389160156, 0.0922393798828125, 0.09622764587402344, 0.10021591186523438, 0.10420417785644531, 0.10819244384765625, 0.11218070983886719, 0.11616897583007812, 0.12015724182128906, 0.1241455078125]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 7.0, 5.0, 3.0, 5.0, 6.0, 7.0, 9.0, 6.0, 10.0, 15.0, 18.0, 15.0, 30.0, 30.0, 28.0, 27.0, 35.0, 33.0, 46.0, 35.0, 47.0, 34.0, 48.0, 39.0, 44.0, 38.0, 54.0, 40.0, 42.0, 33.0, 31.0, 32.0, 29.0, 24.0, 15.0, 14.0, 15.0, 11.0, 11.0, 10.0, 5.0, 8.0, 6.0, 2.0, 1.0, 1.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.02496337890625, -0.024183273315429688, -0.023403167724609375, -0.022623062133789062, -0.02184295654296875, -0.021062850952148438, -0.020282745361328125, -0.019502639770507812, -0.0187225341796875, -0.017942428588867188, -0.017162322998046875, -0.016382217407226562, -0.01560211181640625, -0.014822006225585938, -0.014041900634765625, -0.013261795043945312, -0.012481689453125, -0.011701583862304688, -0.010921478271484375, -0.010141372680664062, -0.00936126708984375, -0.008581161499023438, -0.007801055908203125, -0.0070209503173828125, -0.0062408447265625, -0.0054607391357421875, -0.004680633544921875, -0.0039005279541015625, -0.00312042236328125, -0.0023403167724609375, -0.001560211181640625, -0.0007801055908203125, 0.0, 0.0007801055908203125, 0.001560211181640625, 0.0023403167724609375, 0.00312042236328125, 0.0039005279541015625, 0.004680633544921875, 0.0054607391357421875, 0.0062408447265625, 0.0070209503173828125, 0.007801055908203125, 0.008581161499023438, 0.00936126708984375, 0.010141372680664062, 0.010921478271484375, 0.011701583862304688, 0.012481689453125, 0.013261795043945312, 0.014041900634765625, 0.014822006225585938, 0.01560211181640625, 0.016382217407226562, 0.017162322998046875, 0.017942428588867188, 0.0187225341796875, 0.019502639770507812, 0.020282745361328125, 0.021062850952148438, 0.02184295654296875, 0.022623062133789062, 0.023403167724609375, 0.024183273315429688, 0.02496337890625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 4.0, 8.0, 10.0, 6.0, 13.0, 23.0, 19.0, 31.0, 39.0, 56.0, 58.0, 73.0, 89.0, 146.0, 217.0, 280.0, 367.0, 633.0, 1118.0, 1925.0, 4037.0, 10661.0, 31264.0, 93729.0, 638720.0, 185822.0, 49795.0, 16896.0, 6171.0, 2583.0, 1301.0, 742.0, 431.0, 328.0, 234.0, 170.0, 142.0, 95.0, 74.0, 56.0, 47.0, 36.0, 23.0, 21.0, 21.0, 4.0, 10.0, 9.0, 9.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0], "bins": [-0.156982421875, -0.15218353271484375, -0.1473846435546875, -0.14258575439453125, -0.137786865234375, -0.13298797607421875, -0.1281890869140625, -0.12339019775390625, -0.11859130859375, -0.11379241943359375, -0.1089935302734375, -0.10419464111328125, -0.099395751953125, -0.09459686279296875, -0.0897979736328125, -0.08499908447265625, -0.0802001953125, -0.07540130615234375, -0.0706024169921875, -0.06580352783203125, -0.061004638671875, -0.05620574951171875, -0.0514068603515625, -0.04660797119140625, -0.04180908203125, -0.03701019287109375, -0.0322113037109375, -0.02741241455078125, -0.022613525390625, -0.01781463623046875, -0.0130157470703125, -0.00821685791015625, -0.00341796875, 0.00138092041015625, 0.0061798095703125, 0.01097869873046875, 0.015777587890625, 0.02057647705078125, 0.0253753662109375, 0.03017425537109375, 0.03497314453125, 0.03977203369140625, 0.0445709228515625, 0.04936981201171875, 0.054168701171875, 0.05896759033203125, 0.0637664794921875, 0.06856536865234375, 0.0733642578125, 0.07816314697265625, 0.0829620361328125, 0.08776092529296875, 0.092559814453125, 0.09735870361328125, 0.1021575927734375, 0.10695648193359375, 0.11175537109375, 0.11655426025390625, 0.1213531494140625, 0.12615203857421875, 0.130950927734375, 0.13574981689453125, 0.1405487060546875, 0.14534759521484375, 0.150146484375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 4.0, 4.0, 2.0, 5.0, 5.0, 8.0, 8.0, 19.0, 10.0, 21.0, 28.0, 46.0, 54.0, 55.0, 47.0, 59.0, 58.0, 60.0, 61.0, 52.0, 57.0, 62.0, 58.0, 45.0, 37.0, 28.0, 27.0, 18.0, 15.0, 15.0, 10.0, 8.0, 6.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1678466796875, -0.1627788543701172, -0.15771102905273438, -0.15264320373535156, -0.14757537841796875, -0.14250755310058594, -0.13743972778320312, -0.1323719024658203, -0.1273040771484375, -0.12223625183105469, -0.11716842651367188, -0.11210060119628906, -0.10703277587890625, -0.10196495056152344, -0.09689712524414062, -0.09182929992675781, -0.086761474609375, -0.08169364929199219, -0.07662582397460938, -0.07155799865722656, -0.06649017333984375, -0.06142234802246094, -0.056354522705078125, -0.05128669738769531, -0.0462188720703125, -0.04115104675292969, -0.036083221435546875, -0.031015396118164062, -0.02594757080078125, -0.020879745483398438, -0.015811920166015625, -0.010744094848632812, -0.00567626953125, -0.0006084442138671875, 0.004459381103515625, 0.009527206420898438, 0.01459503173828125, 0.019662857055664062, 0.024730682373046875, 0.029798507690429688, 0.0348663330078125, 0.03993415832519531, 0.045001983642578125, 0.05006980895996094, 0.05513763427734375, 0.06020545959472656, 0.06527328491210938, 0.07034111022949219, 0.075408935546875, 0.08047676086425781, 0.08554458618164062, 0.09061241149902344, 0.09568023681640625, 0.10074806213378906, 0.10581588745117188, 0.11088371276855469, 0.1159515380859375, 0.12101936340332031, 0.12608718872070312, 0.13115501403808594, 0.13622283935546875, 0.14129066467285156, 0.14635848999023438, 0.1514263153076172, 0.156494140625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 6.0, 5.0, 11.0, 10.0, 16.0, 18.0, 26.0, 53.0, 94.0, 189.0, 522.0, 2598.0, 29158.0, 941765.0, 68602.0, 4183.0, 723.0, 261.0, 127.0, 65.0, 49.0, 28.0, 23.0, 14.0, 7.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.405517578125, -0.394134521484375, -0.38275146484375, -0.371368408203125, -0.3599853515625, -0.348602294921875, -0.33721923828125, -0.325836181640625, -0.314453125, -0.303070068359375, -0.29168701171875, -0.280303955078125, -0.2689208984375, -0.257537841796875, -0.24615478515625, -0.234771728515625, -0.223388671875, -0.212005615234375, -0.20062255859375, -0.189239501953125, -0.1778564453125, -0.166473388671875, -0.15509033203125, -0.143707275390625, -0.13232421875, -0.120941162109375, -0.10955810546875, -0.098175048828125, -0.0867919921875, -0.075408935546875, -0.06402587890625, -0.052642822265625, -0.041259765625, -0.029876708984375, -0.01849365234375, -0.007110595703125, 0.0042724609375, 0.015655517578125, 0.02703857421875, 0.038421630859375, 0.0498046875, 0.061187744140625, 0.07257080078125, 0.083953857421875, 0.0953369140625, 0.106719970703125, 0.11810302734375, 0.129486083984375, 0.140869140625, 0.152252197265625, 0.16363525390625, 0.175018310546875, 0.1864013671875, 0.197784423828125, 0.20916748046875, 0.220550537109375, 0.23193359375, 0.243316650390625, 0.25469970703125, 0.266082763671875, 0.2774658203125, 0.288848876953125, 0.30023193359375, 0.311614990234375, 0.322998046875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 7.0, 10.0, 20.0, 31.0, 41.0, 78.0, 129.0, 138.0, 150.0, 142.0, 87.0, 61.0, 31.0, 25.0, 18.0, 11.0, 6.0, 7.0, 3.0, 4.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.930662155151367e-05, -5.6224875152111053e-05, -5.3143128752708435e-05, -5.006138235330582e-05, -4.69796359539032e-05, -4.389788955450058e-05, -4.081614315509796e-05, -3.773439675569534e-05, -3.4652650356292725e-05, -3.1570903956890106e-05, -2.8489157557487488e-05, -2.540741115808487e-05, -2.232566475868225e-05, -1.9243918359279633e-05, -1.6162171959877014e-05, -1.3080425560474396e-05, -9.998679161071777e-06, -6.916932761669159e-06, -3.8351863622665405e-06, -7.534399628639221e-07, 2.3283064365386963e-06, 5.410052835941315e-06, 8.491799235343933e-06, 1.1573545634746552e-05, 1.465529203414917e-05, 1.773703843355179e-05, 2.0818784832954407e-05, 2.3900531232357025e-05, 2.6982277631759644e-05, 3.0064024031162262e-05, 3.314577043056488e-05, 3.62275168299675e-05, 3.930926322937012e-05, 4.2391009628772736e-05, 4.5472756028175354e-05, 4.855450242757797e-05, 5.163624882698059e-05, 5.471799522638321e-05, 5.779974162578583e-05, 6.0881488025188446e-05, 6.396323442459106e-05, 6.704498082399368e-05, 7.01267272233963e-05, 7.320847362279892e-05, 7.629022002220154e-05, 7.937196642160416e-05, 8.245371282100677e-05, 8.55354592204094e-05, 8.861720561981201e-05, 9.169895201921463e-05, 9.478069841861725e-05, 9.786244481801987e-05, 0.00010094419121742249, 0.0001040259376168251, 0.00010710768401622772, 0.00011018943041563034, 0.00011327117681503296, 0.00011635292321443558, 0.0001194346696138382, 0.00012251641601324081, 0.00012559816241264343, 0.00012867990881204605, 0.00013176165521144867, 0.0001348434016108513, 0.0001379251480102539]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 8.0, 5.0, 15.0, 20.0, 22.0, 50.0, 62.0, 115.0, 191.0, 328.0, 757.0, 2540.0, 12395.0, 184138.0, 816426.0, 25448.0, 3885.0, 1081.0, 431.0, 238.0, 143.0, 88.0, 58.0, 39.0, 30.0, 10.0, 10.0, 7.0, 7.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2435302734375, -0.23595809936523438, -0.22838592529296875, -0.22081375122070312, -0.2132415771484375, -0.20566940307617188, -0.19809722900390625, -0.19052505493164062, -0.182952880859375, -0.17538070678710938, -0.16780853271484375, -0.16023635864257812, -0.1526641845703125, -0.14509201049804688, -0.13751983642578125, -0.12994766235351562, -0.12237548828125, -0.11480331420898438, -0.10723114013671875, -0.09965896606445312, -0.0920867919921875, -0.08451461791992188, -0.07694244384765625, -0.06937026977539062, -0.061798095703125, -0.054225921630859375, -0.04665374755859375, -0.039081573486328125, -0.0315093994140625, -0.023937225341796875, -0.01636505126953125, -0.008792877197265625, -0.001220703125, 0.006351470947265625, 0.01392364501953125, 0.021495819091796875, 0.0290679931640625, 0.036640167236328125, 0.04421234130859375, 0.051784515380859375, 0.059356689453125, 0.06692886352539062, 0.07450103759765625, 0.08207321166992188, 0.0896453857421875, 0.09721755981445312, 0.10478973388671875, 0.11236190795898438, 0.11993408203125, 0.12750625610351562, 0.13507843017578125, 0.14265060424804688, 0.1502227783203125, 0.15779495239257812, 0.16536712646484375, 0.17293930053710938, 0.180511474609375, 0.18808364868164062, 0.19565582275390625, 0.20322799682617188, 0.2108001708984375, 0.21837234497070312, 0.22594451904296875, 0.23351669311523438, 0.2410888671875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 1.0, 3.0, 6.0, 12.0, 12.0, 20.0, 19.0, 25.0, 43.0, 68.0, 163.0, 276.0, 162.0, 60.0, 24.0, 31.0, 22.0, 15.0, 11.0, 9.0, 6.0, 2.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1295166015625, -0.125762939453125, -0.12200927734375, -0.118255615234375, -0.114501953125, -0.110748291015625, -0.10699462890625, -0.103240966796875, -0.0994873046875, -0.095733642578125, -0.09197998046875, -0.088226318359375, -0.08447265625, -0.080718994140625, -0.07696533203125, -0.073211669921875, -0.0694580078125, -0.065704345703125, -0.06195068359375, -0.058197021484375, -0.054443359375, -0.050689697265625, -0.04693603515625, -0.043182373046875, -0.0394287109375, -0.035675048828125, -0.03192138671875, -0.028167724609375, -0.0244140625, -0.020660400390625, -0.01690673828125, -0.013153076171875, -0.0093994140625, -0.005645751953125, -0.00189208984375, 0.001861572265625, 0.005615234375, 0.009368896484375, 0.01312255859375, 0.016876220703125, 0.0206298828125, 0.024383544921875, 0.02813720703125, 0.031890869140625, 0.03564453125, 0.039398193359375, 0.04315185546875, 0.046905517578125, 0.0506591796875, 0.054412841796875, 0.05816650390625, 0.061920166015625, 0.065673828125, 0.069427490234375, 0.07318115234375, 0.076934814453125, 0.0806884765625, 0.084442138671875, 0.08819580078125, 0.091949462890625, 0.095703125, 0.099456787109375, 0.10321044921875, 0.106964111328125, 0.1107177734375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 7.0, 5.0, 21.0, 50.0, 123.0, 220.0, 256.0, 199.0, 85.0, 29.0, 13.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1755073070526123, -1.0989019870758057, -1.022296667098999, -0.9456912279129028, -0.8690859079360962, -0.7924805879592896, -0.7158752083778381, -0.6392698287963867, -0.5626645088195801, -0.48605915904045105, -0.409453809261322, -0.332848459482193, -0.25624310970306396, -0.17963775992393494, -0.10303241014480591, -0.026427030563354492, 0.05017828941345215, 0.12678363919258118, 0.2033889889717102, 0.27999433875083923, 0.35659968852996826, 0.4332050383090973, 0.5098103880882263, 0.5864157676696777, 0.6630210876464844, 0.739626407623291, 0.8162317872047424, 0.8928371667861938, 0.9694424867630005, 1.0460478067398071, 1.1226532459259033, 1.19925856590271, 1.2758641242980957, 1.3524694442749023, 1.429074764251709, 1.5056802034378052, 1.5822855234146118, 1.6588908433914185, 1.7354962825775146, 1.8121016025543213, 1.888706922531128, 1.9653122425079346, 2.041917562484741, 2.118522882461548, 2.1951284408569336, 2.2717337608337402, 2.348339080810547, 2.4249444007873535, 2.50154972076416, 2.578155040740967, 2.6547603607177734, 2.73136568069458, 2.8079710006713867, 2.8845765590667725, 2.961181879043579, 3.0377871990203857, 3.1143925189971924, 3.190997838973999, 3.2676031589508057, 3.3442084789276123, 3.420814037322998, 3.4974193572998047, 3.5740246772766113, 3.650629997253418, 3.7272353172302246]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 3.0, 6.0, 6.0, 10.0, 9.0, 14.0, 20.0, 14.0, 16.0, 24.0, 30.0, 23.0, 32.0, 25.0, 36.0, 45.0, 43.0, 44.0, 60.0, 52.0, 55.0, 45.0, 42.0, 56.0, 46.0, 41.0, 24.0, 26.0, 27.0, 20.0, 22.0, 25.0, 9.0, 15.0, 11.0, 9.0, 4.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.8387554287910461, -0.8171766996383667, -0.7955979108810425, -0.774019181728363, -0.7524404525756836, -0.7308617234230042, -0.7092829942703247, -0.6877042055130005, -0.666125476360321, -0.6445467472076416, -0.6229679584503174, -0.6013892292976379, -0.5798105001449585, -0.558231770992279, -0.5366530418395996, -0.5150742530822754, -0.49349552392959595, -0.4719167947769165, -0.4503380358219147, -0.42875927686691284, -0.4071805477142334, -0.38560181856155396, -0.3640230596065521, -0.3424443006515503, -0.32086557149887085, -0.2992868423461914, -0.2777080833911896, -0.25612932443618774, -0.2345505952835083, -0.21297185122966766, -0.19139310717582703, -0.1698143631219864, -0.14823567867279053, -0.1266569346189499, -0.10507819056510925, -0.08349944651126862, -0.06192070245742798, -0.04034195840358734, -0.018763214349746704, 0.002815529704093933, 0.02439427375793457, 0.04597301781177521, 0.06755176186561584, 0.08913050591945648, 0.11070924997329712, 0.13228799402713776, 0.1538667380809784, 0.17544548213481903, 0.19702422618865967, 0.2186029702425003, 0.24018171429634094, 0.2617604732513428, 0.2833392024040222, 0.30491793155670166, 0.3264966905117035, 0.3480754494667053, 0.36965417861938477, 0.3912329077720642, 0.41281166672706604, 0.43439042568206787, 0.4559691548347473, 0.47754788398742676, 0.4991266429424286, 0.5207054018974304, 0.5422841310501099]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 4.0, 5.0, 14.0, 8.0, 19.0, 26.0, 31.0, 54.0, 100.0, 142.0, 228.0, 389.0, 709.0, 1166.0, 2143.0, 4281.0, 8755.0, 19781.0, 51008.0, 173474.0, 3005724.0, 746496.0, 112258.0, 37534.0, 15310.0, 6829.0, 3472.0, 1798.0, 980.0, 613.0, 348.0, 220.0, 137.0, 74.0, 63.0, 27.0, 21.0, 18.0, 16.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13623046875, -0.1324300765991211, -0.1286296844482422, -0.12482929229736328, -0.12102890014648438, -0.11722850799560547, -0.11342811584472656, -0.10962772369384766, -0.10582733154296875, -0.10202693939208984, -0.09822654724121094, -0.09442615509033203, -0.09062576293945312, -0.08682537078857422, -0.08302497863769531, -0.0792245864868164, -0.0754241943359375, -0.0716238021850586, -0.06782341003417969, -0.06402301788330078, -0.060222625732421875, -0.05642223358154297, -0.05262184143066406, -0.048821449279785156, -0.04502105712890625, -0.041220664978027344, -0.03742027282714844, -0.03361988067626953, -0.029819488525390625, -0.02601909637451172, -0.022218704223632812, -0.018418312072753906, -0.014617919921875, -0.010817527770996094, -0.0070171356201171875, -0.0032167434692382812, 0.000583648681640625, 0.004384040832519531, 0.008184432983398438, 0.011984825134277344, 0.01578521728515625, 0.019585609436035156, 0.023386001586914062, 0.02718639373779297, 0.030986785888671875, 0.03478717803955078, 0.03858757019042969, 0.042387962341308594, 0.0461883544921875, 0.049988746643066406, 0.05378913879394531, 0.05758953094482422, 0.061389923095703125, 0.06519031524658203, 0.06899070739746094, 0.07279109954833984, 0.07659149169921875, 0.08039188385009766, 0.08419227600097656, 0.08799266815185547, 0.09179306030273438, 0.09559345245361328, 0.09939384460449219, 0.1031942367553711, 0.10699462890625]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 6.0, 6.0, 7.0, 6.0, 12.0, 8.0, 19.0, 20.0, 25.0, 23.0, 45.0, 40.0, 46.0, 53.0, 42.0, 56.0, 50.0, 63.0, 64.0, 52.0, 57.0, 61.0, 49.0, 42.0, 27.0, 26.0, 24.0, 19.0, 19.0, 11.0, 10.0, 6.0, 8.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.030792236328125, -0.029666900634765625, -0.02854156494140625, -0.027416229248046875, -0.0262908935546875, -0.025165557861328125, -0.02404022216796875, -0.022914886474609375, -0.02178955078125, -0.020664215087890625, -0.01953887939453125, -0.018413543701171875, -0.0172882080078125, -0.016162872314453125, -0.01503753662109375, -0.013912200927734375, -0.012786865234375, -0.011661529541015625, -0.01053619384765625, -0.009410858154296875, -0.0082855224609375, -0.007160186767578125, -0.00603485107421875, -0.004909515380859375, -0.0037841796875, -0.002658843994140625, -0.00153350830078125, -0.000408172607421875, 0.0007171630859375, 0.001842498779296875, 0.00296783447265625, 0.004093170166015625, 0.005218505859375, 0.006343841552734375, 0.00746917724609375, 0.008594512939453125, 0.0097198486328125, 0.010845184326171875, 0.01197052001953125, 0.013095855712890625, 0.01422119140625, 0.015346527099609375, 0.01647186279296875, 0.017597198486328125, 0.0187225341796875, 0.019847869873046875, 0.02097320556640625, 0.022098541259765625, 0.023223876953125, 0.024349212646484375, 0.02547454833984375, 0.026599884033203125, 0.0277252197265625, 0.028850555419921875, 0.02997589111328125, 0.031101226806640625, 0.0322265625, 0.033351898193359375, 0.03447723388671875, 0.035602569580078125, 0.0367279052734375, 0.037853240966796875, 0.03897857666015625, 0.040103912353515625, 0.041229248046875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 3.0, 6.0, 9.0, 13.0, 14.0, 22.0, 25.0, 27.0, 38.0, 66.0, 87.0, 109.0, 131.0, 222.0, 305.0, 570.0, 992.0, 1992.0, 4874.0, 14218.0, 54503.0, 358490.0, 3460041.0, 235746.0, 41751.0, 11720.0, 4092.0, 1743.0, 927.0, 470.0, 332.0, 195.0, 146.0, 92.0, 78.0, 69.0, 50.0, 25.0, 19.0, 20.0, 13.0, 10.0, 13.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.224853515625, -0.21831893920898438, -0.21178436279296875, -0.20524978637695312, -0.1987152099609375, -0.19218063354492188, -0.18564605712890625, -0.17911148071289062, -0.172576904296875, -0.16604232788085938, -0.15950775146484375, -0.15297317504882812, -0.1464385986328125, -0.13990402221679688, -0.13336944580078125, -0.12683486938476562, -0.12030029296875, -0.11376571655273438, -0.10723114013671875, -0.10069656372070312, -0.0941619873046875, -0.08762741088867188, -0.08109283447265625, -0.07455825805664062, -0.068023681640625, -0.061489105224609375, -0.05495452880859375, -0.048419952392578125, -0.0418853759765625, -0.035350799560546875, -0.02881622314453125, -0.022281646728515625, -0.0157470703125, -0.009212493896484375, -0.00267791748046875, 0.003856658935546875, 0.0103912353515625, 0.016925811767578125, 0.02346038818359375, 0.029994964599609375, 0.036529541015625, 0.043064117431640625, 0.04959869384765625, 0.056133270263671875, 0.0626678466796875, 0.06920242309570312, 0.07573699951171875, 0.08227157592773438, 0.08880615234375, 0.09534072875976562, 0.10187530517578125, 0.10840988159179688, 0.1149444580078125, 0.12147903442382812, 0.12801361083984375, 0.13454818725585938, 0.141082763671875, 0.14761734008789062, 0.15415191650390625, 0.16068649291992188, 0.1672210693359375, 0.17375564575195312, 0.18029022216796875, 0.18682479858398438, 0.193359375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 5.0, 6.0, 9.0, 14.0, 21.0, 39.0, 75.0, 134.0, 330.0, 1568.0, 1262.0, 303.0, 141.0, 62.0, 35.0, 21.0, 17.0, 11.0, 10.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11895751953125, -0.11498737335205078, -0.11101722717285156, -0.10704708099365234, -0.10307693481445312, -0.0991067886352539, -0.09513664245605469, -0.09116649627685547, -0.08719635009765625, -0.08322620391845703, -0.07925605773925781, -0.0752859115600586, -0.07131576538085938, -0.06734561920166016, -0.06337547302246094, -0.05940532684326172, -0.0554351806640625, -0.05146503448486328, -0.04749488830566406, -0.043524742126464844, -0.039554595947265625, -0.035584449768066406, -0.03161430358886719, -0.02764415740966797, -0.02367401123046875, -0.01970386505126953, -0.015733718872070312, -0.011763572692871094, -0.007793426513671875, -0.0038232803344726562, 0.0001468658447265625, 0.004117012023925781, 0.008087158203125, 0.012057304382324219, 0.016027450561523438, 0.019997596740722656, 0.023967742919921875, 0.027937889099121094, 0.03190803527832031, 0.03587818145751953, 0.03984832763671875, 0.04381847381591797, 0.04778861999511719, 0.051758766174316406, 0.055728912353515625, 0.059699058532714844, 0.06366920471191406, 0.06763935089111328, 0.0716094970703125, 0.07557964324951172, 0.07954978942871094, 0.08351993560791016, 0.08749008178710938, 0.0914602279663086, 0.09543037414550781, 0.09940052032470703, 0.10337066650390625, 0.10734081268310547, 0.11131095886230469, 0.1152811050415039, 0.11925125122070312, 0.12322139739990234, 0.12719154357910156, 0.13116168975830078, 0.1351318359375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 2.0, 8.0, 9.0, 24.0, 45.0, 85.0, 124.0, 184.0, 156.0, 133.0, 97.0, 55.0, 42.0, 20.0, 10.0, 3.0, 4.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.9729800820350647, -0.9513079524040222, -0.9296358227729797, -0.9079636931419373, -0.8862915635108948, -0.8646194338798523, -0.8429473638534546, -0.8212752342224121, -0.7996031045913696, -0.7779309749603271, -0.7562588453292847, -0.7345867156982422, -0.7129145860671997, -0.6912424564361572, -0.6695703268051147, -0.6478981971740723, -0.6262260675430298, -0.6045539379119873, -0.5828818082809448, -0.5612096786499023, -0.5395375490188599, -0.5178654193878174, -0.4961933195590973, -0.4745211899280548, -0.45284906029701233, -0.43117693066596985, -0.40950480103492737, -0.3878327012062073, -0.3661605715751648, -0.3444884419441223, -0.32281631231307983, -0.30114418268203735, -0.2794719934463501, -0.2577998638153076, -0.23612773418426514, -0.21445561945438385, -0.19278348982334137, -0.1711113601922989, -0.1494392454624176, -0.12776711583137512, -0.10609498620033264, -0.08442285656929016, -0.06275073438882828, -0.041078612208366394, -0.019406482577323914, 0.002265647053718567, 0.023937761783599854, 0.045609891414642334, 0.06728202104568481, 0.0889541506767273, 0.11062627285718918, 0.13229839503765106, 0.15397052466869354, 0.17564265429973602, 0.1973147690296173, 0.2189868986606598, 0.24065902829170227, 0.26233115792274475, 0.28400328755378723, 0.3056753873825073, 0.3273475170135498, 0.3490196466445923, 0.37069177627563477, 0.39236390590667725, 0.4140360355377197]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 5.0, 8.0, 11.0, 7.0, 9.0, 8.0, 16.0, 17.0, 17.0, 18.0, 25.0, 26.0, 28.0, 23.0, 27.0, 27.0, 35.0, 36.0, 44.0, 49.0, 48.0, 34.0, 48.0, 35.0, 33.0, 29.0, 36.0, 41.0, 27.0, 23.0, 32.0, 20.0, 23.0, 23.0, 16.0, 15.0, 17.0, 8.0, 10.0, 10.0, 9.0, 12.0, 10.0, 1.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.26798975467681885, -0.26048341393470764, -0.25297704339027405, -0.24547070264816284, -0.23796434700489044, -0.23045799136161804, -0.22295165061950684, -0.21544529497623444, -0.20793893933296204, -0.20043258368968964, -0.19292622804641724, -0.18541988730430603, -0.17791353166103363, -0.17040717601776123, -0.16290083527565002, -0.15539447963237762, -0.14788812398910522, -0.14038176834583282, -0.13287541270256042, -0.12536907196044922, -0.11786271631717682, -0.11035636067390442, -0.10285001248121262, -0.09534366428852081, -0.08783730864524841, -0.08033095300197601, -0.07282460480928421, -0.06531825661659241, -0.05781190097332001, -0.050305549055337906, -0.042799197137355804, -0.0352928452193737, -0.0277864933013916, -0.0202801413834095, -0.012773789465427399, -0.005267437547445297, 0.002238914370536804, 0.009745266288518906, 0.017251618206501007, 0.02475797012448311, 0.03226432204246521, 0.03977067396044731, 0.04727702587842941, 0.054783377796411514, 0.062289729714393616, 0.06979608535766602, 0.07730243355035782, 0.08480878174304962, 0.09231513738632202, 0.09982149302959442, 0.10732784122228622, 0.11483418941497803, 0.12234054505825043, 0.12984690070152283, 0.13735324144363403, 0.14485959708690643, 0.15236595273017883, 0.15987230837345123, 0.16737866401672363, 0.17488500475883484, 0.18239136040210724, 0.18989771604537964, 0.19740405678749084, 0.20491041243076324, 0.21241676807403564]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 8.0, 8.0, 4.0, 7.0, 10.0, 9.0, 27.0, 22.0, 29.0, 56.0, 72.0, 117.0, 163.0, 342.0, 667.0, 1390.0, 2952.0, 6621.0, 13703.0, 27959.0, 64459.0, 348127.0, 444951.0, 76440.0, 31025.0, 15369.0, 7416.0, 3417.0, 1532.0, 734.0, 371.0, 202.0, 111.0, 63.0, 42.0, 33.0, 33.0, 20.0, 16.0, 10.0, 7.0, 7.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.119140625, -0.11542606353759766, -0.11171150207519531, -0.10799694061279297, -0.10428237915039062, -0.10056781768798828, -0.09685325622558594, -0.0931386947631836, -0.08942413330078125, -0.0857095718383789, -0.08199501037597656, -0.07828044891357422, -0.07456588745117188, -0.07085132598876953, -0.06713676452636719, -0.06342220306396484, -0.0597076416015625, -0.055993080139160156, -0.05227851867675781, -0.04856395721435547, -0.044849395751953125, -0.04113483428955078, -0.03742027282714844, -0.033705711364746094, -0.02999114990234375, -0.026276588439941406, -0.022562026977539062, -0.01884746551513672, -0.015132904052734375, -0.011418342590332031, -0.0077037811279296875, -0.003989219665527344, -0.000274658203125, 0.0034399032592773438, 0.0071544647216796875, 0.010869026184082031, 0.014583587646484375, 0.01829814910888672, 0.022012710571289062, 0.025727272033691406, 0.02944183349609375, 0.033156394958496094, 0.03687095642089844, 0.04058551788330078, 0.044300079345703125, 0.04801464080810547, 0.05172920227050781, 0.055443763732910156, 0.0591583251953125, 0.06287288665771484, 0.06658744812011719, 0.07030200958251953, 0.07401657104492188, 0.07773113250732422, 0.08144569396972656, 0.0851602554321289, 0.08887481689453125, 0.0925893783569336, 0.09630393981933594, 0.10001850128173828, 0.10373306274414062, 0.10744762420654297, 0.11116218566894531, 0.11487674713134766, 0.11859130859375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 5.0, 1.0, 2.0, 5.0, 5.0, 7.0, 8.0, 9.0, 11.0, 16.0, 10.0, 15.0, 26.0, 15.0, 21.0, 28.0, 31.0, 24.0, 40.0, 22.0, 43.0, 27.0, 39.0, 43.0, 40.0, 44.0, 47.0, 35.0, 42.0, 33.0, 30.0, 42.0, 29.0, 37.0, 36.0, 18.0, 15.0, 17.0, 15.0, 7.0, 21.0, 6.0, 8.0, 14.0, 5.0, 4.0, 3.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0261993408203125, -0.025350570678710938, -0.024501800537109375, -0.023653030395507812, -0.02280426025390625, -0.021955490112304688, -0.021106719970703125, -0.020257949829101562, -0.0194091796875, -0.018560409545898438, -0.017711639404296875, -0.016862869262695312, -0.01601409912109375, -0.015165328979492188, -0.014316558837890625, -0.013467788696289062, -0.0126190185546875, -0.011770248413085938, -0.010921478271484375, -0.010072708129882812, -0.00922393798828125, -0.008375167846679688, -0.007526397705078125, -0.0066776275634765625, -0.005828857421875, -0.0049800872802734375, -0.004131317138671875, -0.0032825469970703125, -0.00243377685546875, -0.0015850067138671875, -0.000736236572265625, 0.0001125335693359375, 0.0009613037109375, 0.0018100738525390625, 0.002658843994140625, 0.0035076141357421875, 0.00435638427734375, 0.0052051544189453125, 0.006053924560546875, 0.0069026947021484375, 0.00775146484375, 0.008600234985351562, 0.009449005126953125, 0.010297775268554688, 0.01114654541015625, 0.011995315551757812, 0.012844085693359375, 0.013692855834960938, 0.0145416259765625, 0.015390396118164062, 0.016239166259765625, 0.017087936401367188, 0.01793670654296875, 0.018785476684570312, 0.019634246826171875, 0.020483016967773438, 0.021331787109375, 0.022180557250976562, 0.023029327392578125, 0.023878097534179688, 0.02472686767578125, 0.025575637817382812, 0.026424407958984375, 0.027273178100585938, 0.0281219482421875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 7.0, 10.0, 6.0, 10.0, 13.0, 20.0, 21.0, 36.0, 51.0, 88.0, 162.0, 208.0, 451.0, 941.0, 2422.0, 7056.0, 22383.0, 69406.0, 767240.0, 129440.0, 32029.0, 10460.0, 3450.0, 1285.0, 586.0, 298.0, 163.0, 114.0, 60.0, 40.0, 31.0, 22.0, 9.0, 8.0, 6.0, 12.0, 6.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.228271484375, -0.2220458984375, -0.2158203125, -0.2095947265625, -0.203369140625, -0.1971435546875, -0.19091796875, -0.1846923828125, -0.178466796875, -0.1722412109375, -0.166015625, -0.1597900390625, -0.153564453125, -0.1473388671875, -0.14111328125, -0.1348876953125, -0.128662109375, -0.1224365234375, -0.1162109375, -0.1099853515625, -0.103759765625, -0.0975341796875, -0.09130859375, -0.0850830078125, -0.078857421875, -0.0726318359375, -0.06640625, -0.0601806640625, -0.053955078125, -0.0477294921875, -0.04150390625, -0.0352783203125, -0.029052734375, -0.0228271484375, -0.0166015625, -0.0103759765625, -0.004150390625, 0.0020751953125, 0.00830078125, 0.0145263671875, 0.020751953125, 0.0269775390625, 0.033203125, 0.0394287109375, 0.045654296875, 0.0518798828125, 0.05810546875, 0.0643310546875, 0.070556640625, 0.0767822265625, 0.0830078125, 0.0892333984375, 0.095458984375, 0.1016845703125, 0.10791015625, 0.1141357421875, 0.120361328125, 0.1265869140625, 0.1328125, 0.1390380859375, 0.145263671875, 0.1514892578125, 0.15771484375, 0.1639404296875, 0.170166015625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 5.0, 4.0, 5.0, 2.0, 6.0, 5.0, 6.0, 17.0, 19.0, 23.0, 28.0, 32.0, 45.0, 53.0, 44.0, 54.0, 61.0, 74.0, 68.0, 71.0, 63.0, 45.0, 48.0, 43.0, 40.0, 28.0, 26.0, 16.0, 14.0, 16.0, 13.0, 6.0, 10.0, 6.0, 4.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2061767578125, -0.20047950744628906, -0.19478225708007812, -0.1890850067138672, -0.18338775634765625, -0.1776905059814453, -0.17199325561523438, -0.16629600524902344, -0.1605987548828125, -0.15490150451660156, -0.14920425415039062, -0.1435070037841797, -0.13780975341796875, -0.1321125030517578, -0.12641525268554688, -0.12071800231933594, -0.115020751953125, -0.10932350158691406, -0.10362625122070312, -0.09792900085449219, -0.09223175048828125, -0.08653450012207031, -0.08083724975585938, -0.07513999938964844, -0.0694427490234375, -0.06374549865722656, -0.058048248291015625, -0.05235099792480469, -0.04665374755859375, -0.04095649719238281, -0.035259246826171875, -0.029561996459960938, -0.02386474609375, -0.018167495727539062, -0.012470245361328125, -0.0067729949951171875, -0.00107574462890625, 0.0046215057373046875, 0.010318756103515625, 0.016016006469726562, 0.0217132568359375, 0.027410507202148438, 0.033107757568359375, 0.03880500793457031, 0.04450225830078125, 0.05019950866699219, 0.055896759033203125, 0.06159400939941406, 0.067291259765625, 0.07298851013183594, 0.07868576049804688, 0.08438301086425781, 0.09008026123046875, 0.09577751159667969, 0.10147476196289062, 0.10717201232910156, 0.1128692626953125, 0.11856651306152344, 0.12426376342773438, 0.1299610137939453, 0.13565826416015625, 0.1413555145263672, 0.14705276489257812, 0.15275001525878906, 0.158447265625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 4.0, 4.0, 11.0, 20.0, 23.0, 25.0, 38.0, 47.0, 95.0, 133.0, 203.0, 322.0, 563.0, 922.0, 1628.0, 2963.0, 6025.0, 12620.0, 28002.0, 69142.0, 606507.0, 233118.0, 46447.0, 20245.0, 9336.0, 4541.0, 2352.0, 1279.0, 744.0, 443.0, 265.0, 179.0, 90.0, 51.0, 44.0, 28.0, 31.0, 17.0, 14.0, 7.0, 8.0, 9.0, 6.0, 2.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0716552734375, -0.0695352554321289, -0.06741523742675781, -0.06529521942138672, -0.06317520141601562, -0.06105518341064453, -0.05893516540527344, -0.056815147399902344, -0.05469512939453125, -0.052575111389160156, -0.05045509338378906, -0.04833507537841797, -0.046215057373046875, -0.04409503936767578, -0.04197502136230469, -0.039855003356933594, -0.0377349853515625, -0.035614967346191406, -0.03349494934082031, -0.03137493133544922, -0.029254913330078125, -0.02713489532470703, -0.025014877319335938, -0.022894859313964844, -0.02077484130859375, -0.018654823303222656, -0.016534805297851562, -0.014414787292480469, -0.012294769287109375, -0.010174751281738281, -0.008054733276367188, -0.005934715270996094, -0.003814697265625, -0.0016946792602539062, 0.0004253387451171875, 0.0025453567504882812, 0.004665374755859375, 0.006785392761230469, 0.008905410766601562, 0.011025428771972656, 0.01314544677734375, 0.015265464782714844, 0.017385482788085938, 0.01950550079345703, 0.021625518798828125, 0.02374553680419922, 0.025865554809570312, 0.027985572814941406, 0.0301055908203125, 0.032225608825683594, 0.03434562683105469, 0.03646564483642578, 0.038585662841796875, 0.04070568084716797, 0.04282569885253906, 0.044945716857910156, 0.04706573486328125, 0.049185752868652344, 0.05130577087402344, 0.05342578887939453, 0.055545806884765625, 0.05766582489013672, 0.05978584289550781, 0.061905860900878906, 0.06402587890625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 8.0, 5.0, 8.0, 15.0, 14.0, 27.0, 38.0, 44.0, 66.0, 75.0, 93.0, 109.0, 119.0, 107.0, 81.0, 56.0, 29.0, 25.0, 17.0, 19.0, 10.0, 17.0, 1.0, 5.0, 7.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.645917892456055e-05, -6.464775651693344e-05, -6.283633410930634e-05, -6.102491170167923e-05, -5.9213489294052124e-05, -5.740206688642502e-05, -5.559064447879791e-05, -5.377922207117081e-05, -5.19677996635437e-05, -5.0156377255916595e-05, -4.834495484828949e-05, -4.6533532440662384e-05, -4.472211003303528e-05, -4.291068762540817e-05, -4.109926521778107e-05, -3.928784281015396e-05, -3.7476420402526855e-05, -3.566499799489975e-05, -3.3853575587272644e-05, -3.204215317964554e-05, -3.0230730772018433e-05, -2.8419308364391327e-05, -2.660788595676422e-05, -2.4796463549137115e-05, -2.298504114151001e-05, -2.1173618733882904e-05, -1.93621963262558e-05, -1.7550773918628693e-05, -1.5739351511001587e-05, -1.3927929103374481e-05, -1.2116506695747375e-05, -1.030508428812027e-05, -8.493661880493164e-06, -6.682239472866058e-06, -4.870817065238953e-06, -3.059394657611847e-06, -1.2479722499847412e-06, 5.634501576423645e-07, 2.3748725652694702e-06, 4.186294972896576e-06, 5.997717380523682e-06, 7.809139788150787e-06, 9.620562195777893e-06, 1.1431984603404999e-05, 1.3243407011032104e-05, 1.505482941865921e-05, 1.6866251826286316e-05, 1.867767423391342e-05, 2.0489096641540527e-05, 2.2300519049167633e-05, 2.411194145679474e-05, 2.5923363864421844e-05, 2.773478627204895e-05, 2.9546208679676056e-05, 3.135763108730316e-05, 3.316905349493027e-05, 3.498047590255737e-05, 3.679189831018448e-05, 3.8603320717811584e-05, 4.041474312543869e-05, 4.2226165533065796e-05, 4.40375879406929e-05, 4.584901034832001e-05, 4.766043275594711e-05, 4.947185516357422e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 11.0, 9.0, 9.0, 25.0, 42.0, 69.0, 151.0, 259.0, 593.0, 1562.0, 4633.0, 16197.0, 70088.0, 812799.0, 110708.0, 21933.0, 6041.0, 1968.0, 751.0, 342.0, 159.0, 85.0, 44.0, 30.0, 13.0, 13.0, 9.0, 5.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0906982421875, -0.08701324462890625, -0.0833282470703125, -0.07964324951171875, -0.075958251953125, -0.07227325439453125, -0.0685882568359375, -0.06490325927734375, -0.06121826171875, -0.05753326416015625, -0.0538482666015625, -0.05016326904296875, -0.046478271484375, -0.04279327392578125, -0.0391082763671875, -0.03542327880859375, -0.03173828125, -0.02805328369140625, -0.0243682861328125, -0.02068328857421875, -0.016998291015625, -0.01331329345703125, -0.0096282958984375, -0.00594329833984375, -0.00225830078125, 0.00142669677734375, 0.0051116943359375, 0.00879669189453125, 0.012481689453125, 0.01616668701171875, 0.0198516845703125, 0.02353668212890625, 0.0272216796875, 0.03090667724609375, 0.0345916748046875, 0.03827667236328125, 0.041961669921875, 0.04564666748046875, 0.0493316650390625, 0.05301666259765625, 0.05670166015625, 0.06038665771484375, 0.0640716552734375, 0.06775665283203125, 0.071441650390625, 0.07512664794921875, 0.0788116455078125, 0.08249664306640625, 0.086181640625, 0.08986663818359375, 0.0935516357421875, 0.09723663330078125, 0.100921630859375, 0.10460662841796875, 0.1082916259765625, 0.11197662353515625, 0.11566162109375, 0.11934661865234375, 0.1230316162109375, 0.12671661376953125, 0.130401611328125, 0.13408660888671875, 0.1377716064453125, 0.14145660400390625, 0.1451416015625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 1.0, 2.0, 1.0, 7.0, 6.0, 5.0, 7.0, 7.0, 6.0, 8.0, 14.0, 26.0, 26.0, 37.0, 96.0, 150.0, 203.0, 146.0, 81.0, 44.0, 25.0, 14.0, 18.0, 11.0, 12.0, 10.0, 9.0, 7.0, 3.0, 5.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.055267333984375, -0.0530095100402832, -0.050751686096191406, -0.04849386215209961, -0.04623603820800781, -0.043978214263916016, -0.04172039031982422, -0.03946256637573242, -0.037204742431640625, -0.03494691848754883, -0.03268909454345703, -0.030431270599365234, -0.028173446655273438, -0.02591562271118164, -0.023657798767089844, -0.021399974822998047, -0.01914215087890625, -0.016884326934814453, -0.014626502990722656, -0.01236867904663086, -0.010110855102539062, -0.007853031158447266, -0.005595207214355469, -0.003337383270263672, -0.001079559326171875, 0.0011782646179199219, 0.0034360885620117188, 0.005693912506103516, 0.007951736450195312, 0.01020956039428711, 0.012467384338378906, 0.014725208282470703, 0.0169830322265625, 0.019240856170654297, 0.021498680114746094, 0.02375650405883789, 0.026014328002929688, 0.028272151947021484, 0.03052997589111328, 0.03278779983520508, 0.035045623779296875, 0.03730344772338867, 0.03956127166748047, 0.041819095611572266, 0.04407691955566406, 0.04633474349975586, 0.048592567443847656, 0.05085039138793945, 0.05310821533203125, 0.05536603927612305, 0.057623863220214844, 0.05988168716430664, 0.06213951110839844, 0.06439733505249023, 0.06665515899658203, 0.06891298294067383, 0.07117080688476562, 0.07342863082885742, 0.07568645477294922, 0.07794427871704102, 0.08020210266113281, 0.08245992660522461, 0.0847177505493164, 0.0869755744934082, 0.0892333984375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 6.0, 5.0, 10.0, 10.0, 28.0, 40.0, 69.0, 95.0, 131.0, 152.0, 149.0, 121.0, 78.0, 47.0, 37.0, 23.0, 8.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.5589745044708252, -1.5216351747512817, -1.4842958450317383, -1.4469563961029053, -1.4096170663833618, -1.3722777366638184, -1.334938406944275, -1.2975990772247314, -1.2602596282958984, -1.222920298576355, -1.1855809688568115, -1.1482415199279785, -1.110902190208435, -1.0735628604888916, -1.0362235307693481, -0.9988842010498047, -0.9615448713302612, -0.9242055416107178, -0.8868661522865295, -0.8495268225669861, -0.8121874332427979, -0.7748481035232544, -0.7375087738037109, -0.7001694440841675, -0.6628300547599792, -0.6254907250404358, -0.5881513357162476, -0.5508120059967041, -0.5134726762771606, -0.4761332869529724, -0.43879395723342896, -0.4014545977115631, -0.3641153573989868, -0.32677599787712097, -0.2894366383552551, -0.25209730863571167, -0.21475794911384583, -0.17741858959197998, -0.14007924497127533, -0.10273990035057068, -0.06540054082870483, -0.028061188757419586, 0.009278163313865662, 0.04661751538515091, 0.08395686745643616, 0.121296226978302, 0.15863557159900665, 0.1959749162197113, 0.23331427574157715, 0.270653635263443, 0.30799299478530884, 0.3453323245048523, 0.38267168402671814, 0.420011043548584, 0.45735037326812744, 0.4946897327899933, 0.5320290923118591, 0.5693684220314026, 0.6067078113555908, 0.6440471410751343, 0.6813864707946777, 0.718725860118866, 0.7560651898384094, 0.7934045791625977, 0.8307439088821411]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 4.0, 1.0, 5.0, 7.0, 9.0, 8.0, 17.0, 11.0, 20.0, 15.0, 23.0, 30.0, 40.0, 18.0, 38.0, 33.0, 46.0, 47.0, 38.0, 30.0, 46.0, 50.0, 46.0, 50.0, 51.0, 45.0, 42.0, 35.0, 26.0, 22.0, 24.0, 31.0, 17.0, 15.0, 17.0, 10.0, 6.0, 7.0, 7.0, 7.0, 6.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0], "bins": [-0.7214030623435974, -0.7007407546043396, -0.680078387260437, -0.6594160795211792, -0.6387537717819214, -0.6180914044380188, -0.597429096698761, -0.5767667293548584, -0.5561044216156006, -0.5354421138763428, -0.5147797465324402, -0.4941174387931824, -0.4734551012516022, -0.452792763710022, -0.43213045597076416, -0.41146811842918396, -0.39080578088760376, -0.37014344334602356, -0.34948110580444336, -0.32881879806518555, -0.30815646052360535, -0.28749412298202515, -0.26683181524276733, -0.24616947770118713, -0.22550714015960693, -0.20484480261802673, -0.18418247997760773, -0.16352015733718872, -0.14285781979560852, -0.12219548970460892, -0.10153315961360931, -0.08087083697319031, -0.06020849943161011, -0.039546169340610504, -0.0188838392496109, 0.0017784908413887024, 0.022440820932388306, 0.04310315102338791, 0.06376548111438751, 0.08442780375480652, 0.10509014129638672, 0.12575247883796692, 0.14641480147838593, 0.16707712411880493, 0.18773946166038513, 0.20840179920196533, 0.22906412184238434, 0.24972644448280334, 0.27038878202438354, 0.29105111956596375, 0.31171345710754395, 0.33237576484680176, 0.35303810238838196, 0.37370043992996216, 0.39436274766921997, 0.41502508521080017, 0.43568742275238037, 0.45634976029396057, 0.47701209783554077, 0.4976744055747986, 0.5183367729187012, 0.538999080657959, 0.5596613883972168, 0.5803236961364746, 0.6009860634803772]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 3.0, 2.0, 5.0, 2.0, 10.0, 16.0, 26.0, 34.0, 55.0, 77.0, 144.0, 274.0, 506.0, 865.0, 1728.0, 3601.0, 8113.0, 20184.0, 60820.0, 303292.0, 3490451.0, 221863.0, 51017.0, 17356.0, 7174.0, 3221.0, 1584.0, 820.0, 445.0, 260.0, 141.0, 72.0, 58.0, 31.0, 16.0, 8.0, 7.0, 2.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1959228515625, -0.19054412841796875, -0.1851654052734375, -0.17978668212890625, -0.174407958984375, -0.16902923583984375, -0.1636505126953125, -0.15827178955078125, -0.15289306640625, -0.14751434326171875, -0.1421356201171875, -0.13675689697265625, -0.131378173828125, -0.12599945068359375, -0.1206207275390625, -0.11524200439453125, -0.10986328125, -0.10448455810546875, -0.0991058349609375, -0.09372711181640625, -0.088348388671875, -0.08296966552734375, -0.0775909423828125, -0.07221221923828125, -0.06683349609375, -0.06145477294921875, -0.0560760498046875, -0.05069732666015625, -0.045318603515625, -0.03993988037109375, -0.0345611572265625, -0.02918243408203125, -0.0238037109375, -0.01842498779296875, -0.0130462646484375, -0.00766754150390625, -0.002288818359375, 0.00308990478515625, 0.0084686279296875, 0.01384735107421875, 0.01922607421875, 0.02460479736328125, 0.0299835205078125, 0.03536224365234375, 0.040740966796875, 0.04611968994140625, 0.0514984130859375, 0.05687713623046875, 0.062255859375, 0.06763458251953125, 0.0730133056640625, 0.07839202880859375, 0.083770751953125, 0.08914947509765625, 0.0945281982421875, 0.09990692138671875, 0.10528564453125, 0.11066436767578125, 0.1160430908203125, 0.12142181396484375, 0.126800537109375, 0.13217926025390625, 0.1375579833984375, 0.14293670654296875, 0.1483154296875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 7.0, 3.0, 1.0, 6.0, 3.0, 10.0, 11.0, 11.0, 11.0, 15.0, 26.0, 35.0, 22.0, 29.0, 39.0, 49.0, 50.0, 44.0, 50.0, 60.0, 55.0, 51.0, 68.0, 51.0, 45.0, 36.0, 39.0, 39.0, 18.0, 27.0, 19.0, 28.0, 20.0, 9.0, 5.0, 7.0, 5.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03302001953125, -0.03185272216796875, -0.0306854248046875, -0.02951812744140625, -0.028350830078125, -0.02718353271484375, -0.0260162353515625, -0.02484893798828125, -0.023681640625, -0.02251434326171875, -0.0213470458984375, -0.02017974853515625, -0.019012451171875, -0.01784515380859375, -0.0166778564453125, -0.01551055908203125, -0.01434326171875, -0.01317596435546875, -0.0120086669921875, -0.01084136962890625, -0.009674072265625, -0.00850677490234375, -0.0073394775390625, -0.00617218017578125, -0.0050048828125, -0.00383758544921875, -0.0026702880859375, -0.00150299072265625, -0.000335693359375, 0.00083160400390625, 0.0019989013671875, 0.00316619873046875, 0.00433349609375, 0.00550079345703125, 0.0066680908203125, 0.00783538818359375, 0.009002685546875, 0.01016998291015625, 0.0113372802734375, 0.01250457763671875, 0.013671875, 0.01483917236328125, 0.0160064697265625, 0.01717376708984375, 0.018341064453125, 0.01950836181640625, 0.0206756591796875, 0.02184295654296875, 0.02301025390625, 0.02417755126953125, 0.0253448486328125, 0.02651214599609375, 0.027679443359375, 0.02884674072265625, 0.0300140380859375, 0.03118133544921875, 0.0323486328125, 0.03351593017578125, 0.0346832275390625, 0.03585052490234375, 0.037017822265625, 0.03818511962890625, 0.0393524169921875, 0.04051971435546875, 0.04168701171875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 9.0, 14.0, 19.0, 25.0, 21.0, 41.0, 45.0, 86.0, 128.0, 191.0, 274.0, 452.0, 607.0, 1046.0, 1724.0, 2981.0, 5692.0, 13342.0, 38869.0, 174722.0, 3342947.0, 497887.0, 73593.0, 21231.0, 8518.0, 3925.0, 2166.0, 1324.0, 795.0, 571.0, 345.0, 183.0, 159.0, 119.0, 67.0, 51.0, 38.0, 25.0, 13.0, 8.0, 6.0, 5.0, 8.0, 3.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2283935546875, -0.22071266174316406, -0.21303176879882812, -0.2053508758544922, -0.19766998291015625, -0.1899890899658203, -0.18230819702148438, -0.17462730407714844, -0.1669464111328125, -0.15926551818847656, -0.15158462524414062, -0.1439037322998047, -0.13622283935546875, -0.1285419464111328, -0.12086105346679688, -0.11318016052246094, -0.105499267578125, -0.09781837463378906, -0.09013748168945312, -0.08245658874511719, -0.07477569580078125, -0.06709480285644531, -0.059413909912109375, -0.05173301696777344, -0.0440521240234375, -0.03637123107910156, -0.028690338134765625, -0.021009445190429688, -0.01332855224609375, -0.0056476593017578125, 0.002033233642578125, 0.009714126586914062, 0.01739501953125, 0.025075912475585938, 0.032756805419921875, 0.04043769836425781, 0.04811859130859375, 0.05579948425292969, 0.06348037719726562, 0.07116127014160156, 0.0788421630859375, 0.08652305603027344, 0.09420394897460938, 0.10188484191894531, 0.10956573486328125, 0.11724662780761719, 0.12492752075195312, 0.13260841369628906, 0.140289306640625, 0.14797019958496094, 0.15565109252929688, 0.1633319854736328, 0.17101287841796875, 0.1786937713623047, 0.18637466430664062, 0.19405555725097656, 0.2017364501953125, 0.20941734313964844, 0.21709823608398438, 0.2247791290283203, 0.23246002197265625, 0.2401409149169922, 0.24782180786132812, 0.25550270080566406, 0.26318359375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 2.0, 3.0, 2.0, 3.0, 10.0, 5.0, 5.0, 15.0, 18.0, 21.0, 32.0, 51.0, 101.0, 155.0, 350.0, 2153.0, 596.0, 217.0, 129.0, 71.0, 31.0, 32.0, 18.0, 18.0, 7.0, 9.0, 2.0, 2.0, 4.0, 2.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1243896484375, -0.12058067321777344, -0.11677169799804688, -0.11296272277832031, -0.10915374755859375, -0.10534477233886719, -0.10153579711914062, -0.09772682189941406, -0.0939178466796875, -0.09010887145996094, -0.08629989624023438, -0.08249092102050781, -0.07868194580078125, -0.07487297058105469, -0.07106399536132812, -0.06725502014160156, -0.063446044921875, -0.05963706970214844, -0.055828094482421875, -0.05201911926269531, -0.04821014404296875, -0.04440116882324219, -0.040592193603515625, -0.03678321838378906, -0.0329742431640625, -0.029165267944335938, -0.025356292724609375, -0.021547317504882812, -0.01773834228515625, -0.013929367065429688, -0.010120391845703125, -0.0063114166259765625, -0.00250244140625, 0.0013065338134765625, 0.005115509033203125, 0.008924484252929688, 0.01273345947265625, 0.016542434692382812, 0.020351409912109375, 0.024160385131835938, 0.0279693603515625, 0.03177833557128906, 0.035587310791015625, 0.03939628601074219, 0.04320526123046875, 0.04701423645019531, 0.050823211669921875, 0.05463218688964844, 0.058441162109375, 0.06225013732910156, 0.06605911254882812, 0.06986808776855469, 0.07367706298828125, 0.07748603820800781, 0.08129501342773438, 0.08510398864746094, 0.0889129638671875, 0.09272193908691406, 0.09653091430664062, 0.10033988952636719, 0.10414886474609375, 0.10795783996582031, 0.11176681518554688, 0.11557579040527344, 0.119384765625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 8.0, 8.0, 31.0, 69.0, 116.0, 208.0, 217.0, 148.0, 105.0, 44.0, 23.0, 20.0, 8.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5500032901763916, -0.5155172944068909, -0.48103129863739014, -0.4465453028678894, -0.41205930709838867, -0.37757331132888794, -0.3430872857570648, -0.3086012899875641, -0.27411529421806335, -0.23962929844856262, -0.2051433026790619, -0.17065729200839996, -0.13617129623889923, -0.1016853004693985, -0.06719928979873657, -0.03271329402923584, 0.0017727017402648926, 0.03625870123505592, 0.07074470072984695, 0.10523070394992828, 0.13971669971942902, 0.17420269548892975, 0.20868870615959167, 0.2431747019290924, 0.27766069769859314, 0.31214669346809387, 0.3466326892375946, 0.3811187148094177, 0.41560471057891846, 0.4500907063484192, 0.4845767021179199, 0.5190626978874207, 0.5535486936569214, 0.5880346894264221, 0.6225206851959229, 0.6570066809654236, 0.6914926767349243, 0.725978672504425, 0.7604646682739258, 0.7949507236480713, 0.8294366598129272, 0.863922655582428, 0.8984086513519287, 0.9328946471214294, 0.9673806428909302, 1.0018666982650757, 1.0363526344299316, 1.0708386898040771, 1.1053247451782227, 1.1398108005523682, 1.1742967367172241, 1.2087827920913696, 1.2432687282562256, 1.277754783630371, 1.312240719795227, 1.3467267751693726, 1.3812127113342285, 1.415698766708374, 1.45018470287323, 1.4846707582473755, 1.5191566944122314, 1.553642749786377, 1.588128685951233, 1.6226147413253784, 1.6571006774902344]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 2.0, 9.0, 4.0, 7.0, 7.0, 20.0, 9.0, 14.0, 12.0, 22.0, 23.0, 31.0, 22.0, 24.0, 24.0, 22.0, 35.0, 22.0, 31.0, 35.0, 45.0, 51.0, 31.0, 41.0, 41.0, 45.0, 34.0, 31.0, 34.0, 27.0, 30.0, 31.0, 26.0, 27.0, 25.0, 20.0, 13.0, 16.0, 9.0, 4.0, 14.0, 5.0, 9.0, 7.0, 2.0, 2.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.3495801091194153, -0.33873802423477173, -0.32789596915245056, -0.317053884267807, -0.30621182918548584, -0.2953697443008423, -0.28452765941619873, -0.2736855745315552, -0.262843519449234, -0.25200143456459045, -0.2411593794822693, -0.23031729459762573, -0.21947522461414337, -0.208633154630661, -0.19779106974601746, -0.1869489997625351, -0.17610692977905273, -0.16526485979557037, -0.154422789812088, -0.14358070492744446, -0.1327386349439621, -0.12189656496047974, -0.11105448752641678, -0.10021241009235382, -0.08937034010887146, -0.0785282701253891, -0.06768619269132614, -0.05684411898255348, -0.04600204527378082, -0.03515997156500816, -0.024317897856235504, -0.013475820422172546, -0.0026337504386901855, 0.008208323270082474, 0.019050396978855133, 0.029892470687627792, 0.04073454439640045, 0.05157661810517311, 0.06241869181394577, 0.07326076924800873, 0.08410283923149109, 0.09494490921497345, 0.10578698664903641, 0.11662906408309937, 0.12747113406658173, 0.1383132040500641, 0.14915528893470764, 0.15999735891819, 0.17083942890167236, 0.18168149888515472, 0.19252356886863708, 0.20336565375328064, 0.214207723736763, 0.22504979372024536, 0.23589187860488892, 0.24673394858837128, 0.25757601857185364, 0.2684181034564972, 0.27926015853881836, 0.2901022434234619, 0.30094432830810547, 0.31178638339042664, 0.3226284682750702, 0.33347052335739136, 0.3443126082420349]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 5.0, 8.0, 8.0, 15.0, 31.0, 30.0, 41.0, 67.0, 97.0, 145.0, 191.0, 292.0, 469.0, 844.0, 1386.0, 2461.0, 4637.0, 8755.0, 16611.0, 30758.0, 56811.0, 104118.0, 219823.0, 296327.0, 141606.0, 74227.0, 41057.0, 22163.0, 11559.0, 6230.0, 3302.0, 1799.0, 953.0, 617.0, 364.0, 215.0, 172.0, 103.0, 71.0, 57.0, 33.0, 31.0, 25.0, 13.0, 9.0, 6.0, 6.0, 2.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.11309814453125, -0.109588623046875, -0.1060791015625, -0.102569580078125, -0.09906005859375, -0.095550537109375, -0.092041015625, -0.088531494140625, -0.08502197265625, -0.081512451171875, -0.0780029296875, -0.074493408203125, -0.07098388671875, -0.067474365234375, -0.06396484375, -0.060455322265625, -0.05694580078125, -0.053436279296875, -0.0499267578125, -0.046417236328125, -0.04290771484375, -0.039398193359375, -0.035888671875, -0.032379150390625, -0.02886962890625, -0.025360107421875, -0.0218505859375, -0.018341064453125, -0.01483154296875, -0.011322021484375, -0.0078125, -0.004302978515625, -0.00079345703125, 0.002716064453125, 0.0062255859375, 0.009735107421875, 0.01324462890625, 0.016754150390625, 0.020263671875, 0.023773193359375, 0.02728271484375, 0.030792236328125, 0.0343017578125, 0.037811279296875, 0.04132080078125, 0.044830322265625, 0.04833984375, 0.051849365234375, 0.05535888671875, 0.058868408203125, 0.0623779296875, 0.065887451171875, 0.06939697265625, 0.072906494140625, 0.076416015625, 0.079925537109375, 0.08343505859375, 0.086944580078125, 0.0904541015625, 0.093963623046875, 0.09747314453125, 0.100982666015625, 0.1044921875, 0.108001708984375, 0.11151123046875]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 4.0, 10.0, 11.0, 6.0, 12.0, 12.0, 8.0, 18.0, 22.0, 17.0, 23.0, 26.0, 33.0, 29.0, 27.0, 23.0, 26.0, 45.0, 55.0, 50.0, 40.0, 33.0, 39.0, 52.0, 47.0, 37.0, 30.0, 46.0, 36.0, 30.0, 15.0, 28.0, 23.0, 16.0, 13.0, 12.0, 14.0, 9.0, 8.0, 10.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.03515625, -0.0339818000793457, -0.032807350158691406, -0.03163290023803711, -0.030458450317382812, -0.029284000396728516, -0.02810955047607422, -0.026935100555419922, -0.025760650634765625, -0.024586200714111328, -0.02341175079345703, -0.022237300872802734, -0.021062850952148438, -0.01988840103149414, -0.018713951110839844, -0.017539501190185547, -0.01636505126953125, -0.015190601348876953, -0.014016151428222656, -0.01284170150756836, -0.011667251586914062, -0.010492801666259766, -0.009318351745605469, -0.008143901824951172, -0.006969451904296875, -0.005795001983642578, -0.004620552062988281, -0.0034461021423339844, -0.0022716522216796875, -0.0010972023010253906, 7.724761962890625e-05, 0.0012516975402832031, 0.0024261474609375, 0.003600597381591797, 0.004775047302246094, 0.005949497222900391, 0.0071239471435546875, 0.008298397064208984, 0.009472846984863281, 0.010647296905517578, 0.011821746826171875, 0.012996196746826172, 0.014170646667480469, 0.015345096588134766, 0.016519546508789062, 0.01769399642944336, 0.018868446350097656, 0.020042896270751953, 0.02121734619140625, 0.022391796112060547, 0.023566246032714844, 0.02474069595336914, 0.025915145874023438, 0.027089595794677734, 0.02826404571533203, 0.029438495635986328, 0.030612945556640625, 0.03178739547729492, 0.03296184539794922, 0.034136295318603516, 0.03531074523925781, 0.03648519515991211, 0.037659645080566406, 0.0388340950012207, 0.040008544921875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 6.0, 7.0, 6.0, 6.0, 13.0, 13.0, 15.0, 17.0, 24.0, 29.0, 52.0, 54.0, 79.0, 114.0, 155.0, 201.0, 280.0, 385.0, 563.0, 947.0, 1887.0, 4643.0, 13557.0, 44187.0, 145017.0, 562026.0, 188848.0, 56891.0, 17170.0, 5752.0, 2321.0, 1138.0, 613.0, 376.0, 311.0, 190.0, 153.0, 131.0, 104.0, 68.0, 55.0, 38.0, 29.0, 26.0, 19.0, 6.0, 15.0, 2.0, 1.0, 7.0, 3.0, 2.0, 0.0, 5.0, 1.0, 2.0, 2.0], "bins": [-0.22412109375, -0.21724700927734375, -0.2103729248046875, -0.20349884033203125, -0.196624755859375, -0.18975067138671875, -0.1828765869140625, -0.17600250244140625, -0.16912841796875, -0.16225433349609375, -0.1553802490234375, -0.14850616455078125, -0.141632080078125, -0.13475799560546875, -0.1278839111328125, -0.12100982666015625, -0.1141357421875, -0.10726165771484375, -0.1003875732421875, -0.09351348876953125, -0.086639404296875, -0.07976531982421875, -0.0728912353515625, -0.06601715087890625, -0.05914306640625, -0.05226898193359375, -0.0453948974609375, -0.03852081298828125, -0.031646728515625, -0.02477264404296875, -0.0178985595703125, -0.01102447509765625, -0.004150390625, 0.00272369384765625, 0.0095977783203125, 0.01647186279296875, 0.023345947265625, 0.03022003173828125, 0.0370941162109375, 0.04396820068359375, 0.05084228515625, 0.05771636962890625, 0.0645904541015625, 0.07146453857421875, 0.078338623046875, 0.08521270751953125, 0.0920867919921875, 0.09896087646484375, 0.1058349609375, 0.11270904541015625, 0.1195831298828125, 0.12645721435546875, 0.133331298828125, 0.14020538330078125, 0.1470794677734375, 0.15395355224609375, 0.16082763671875, 0.16770172119140625, 0.1745758056640625, 0.18144989013671875, 0.188323974609375, 0.19519805908203125, 0.2020721435546875, 0.20894622802734375, 0.2158203125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 10.0, 3.0, 7.0, 7.0, 7.0, 15.0, 12.0, 19.0, 17.0, 17.0, 22.0, 37.0, 33.0, 35.0, 44.0, 35.0, 47.0, 57.0, 51.0, 54.0, 39.0, 57.0, 51.0, 39.0, 40.0, 21.0, 22.0, 32.0, 23.0, 25.0, 26.0, 18.0, 9.0, 11.0, 15.0, 5.0, 12.0, 3.0, 2.0, 1.0, 4.0, 4.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.2347412109375, -0.22794151306152344, -0.22114181518554688, -0.2143421173095703, -0.20754241943359375, -0.2007427215576172, -0.19394302368164062, -0.18714332580566406, -0.1803436279296875, -0.17354393005371094, -0.16674423217773438, -0.1599445343017578, -0.15314483642578125, -0.1463451385498047, -0.13954544067382812, -0.13274574279785156, -0.125946044921875, -0.11914634704589844, -0.11234664916992188, -0.10554695129394531, -0.09874725341796875, -0.09194755554199219, -0.08514785766601562, -0.07834815979003906, -0.0715484619140625, -0.06474876403808594, -0.057949066162109375, -0.05114936828613281, -0.04434967041015625, -0.03754997253417969, -0.030750274658203125, -0.023950576782226562, -0.01715087890625, -0.010351181030273438, -0.003551483154296875, 0.0032482147216796875, 0.01004791259765625, 0.016847610473632812, 0.023647308349609375, 0.030447006225585938, 0.0372467041015625, 0.04404640197753906, 0.050846099853515625, 0.05764579772949219, 0.06444549560546875, 0.07124519348144531, 0.07804489135742188, 0.08484458923339844, 0.091644287109375, 0.09844398498535156, 0.10524368286132812, 0.11204338073730469, 0.11884307861328125, 0.1256427764892578, 0.13244247436523438, 0.13924217224121094, 0.1460418701171875, 0.15284156799316406, 0.15964126586914062, 0.1664409637451172, 0.17324066162109375, 0.1800403594970703, 0.18684005737304688, 0.19363975524902344, 0.200439453125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 9.0, 9.0, 7.0, 10.0, 24.0, 29.0, 48.0, 65.0, 127.0, 272.0, 600.0, 1663.0, 7778.0, 111757.0, 869151.0, 49852.0, 4997.0, 1217.0, 423.0, 192.0, 106.0, 69.0, 32.0, 36.0, 30.0, 19.0, 9.0, 5.0, 10.0, 3.0, 1.0, 1.0, 4.0, 5.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.426513671875, -0.4159507751464844, -0.40538787841796875, -0.3948249816894531, -0.3842620849609375, -0.3736991882324219, -0.36313629150390625, -0.3525733947753906, -0.342010498046875, -0.3314476013183594, -0.32088470458984375, -0.3103218078613281, -0.2997589111328125, -0.2891960144042969, -0.27863311767578125, -0.2680702209472656, -0.25750732421875, -0.24694442749023438, -0.23638153076171875, -0.22581863403320312, -0.2152557373046875, -0.20469284057617188, -0.19412994384765625, -0.18356704711914062, -0.173004150390625, -0.16244125366210938, -0.15187835693359375, -0.14131546020507812, -0.1307525634765625, -0.12018966674804688, -0.10962677001953125, -0.09906387329101562, -0.0885009765625, -0.07793807983398438, -0.06737518310546875, -0.056812286376953125, -0.0462493896484375, -0.035686492919921875, -0.02512359619140625, -0.014560699462890625, -0.003997802734375, 0.006565093994140625, 0.01712799072265625, 0.027690887451171875, 0.0382537841796875, 0.048816680908203125, 0.05937957763671875, 0.06994247436523438, 0.08050537109375, 0.09106826782226562, 0.10163116455078125, 0.11219406127929688, 0.1227569580078125, 0.13331985473632812, 0.14388275146484375, 0.15444564819335938, 0.165008544921875, 0.17557144165039062, 0.18613433837890625, 0.19669723510742188, 0.2072601318359375, 0.21782302856445312, 0.22838592529296875, 0.23894882202148438, 0.24951171875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 9.0, 6.0, 8.0, 10.0, 19.0, 18.0, 31.0, 50.0, 60.0, 88.0, 102.0, 114.0, 126.0, 99.0, 68.0, 61.0, 39.0, 34.0, 12.0, 18.0, 14.0, 7.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.772445678710938e-05, -7.520057260990143e-05, -7.267668843269348e-05, -7.015280425548553e-05, -6.762892007827759e-05, -6.510503590106964e-05, -6.25811517238617e-05, -6.005726754665375e-05, -5.75333833694458e-05, -5.5009499192237854e-05, -5.248561501502991e-05, -4.996173083782196e-05, -4.7437846660614014e-05, -4.491396248340607e-05, -4.239007830619812e-05, -3.986619412899017e-05, -3.7342309951782227e-05, -3.481842577457428e-05, -3.229454159736633e-05, -2.9770657420158386e-05, -2.724677324295044e-05, -2.4722889065742493e-05, -2.2199004888534546e-05, -1.96751207113266e-05, -1.7151236534118652e-05, -1.4627352356910706e-05, -1.2103468179702759e-05, -9.579584002494812e-06, -7.055699825286865e-06, -4.5318156480789185e-06, -2.0079314708709717e-06, 5.159527063369751e-07, 3.039836883544922e-06, 5.563721060752869e-06, 8.087605237960815e-06, 1.0611489415168762e-05, 1.3135373592376709e-05, 1.5659257769584656e-05, 1.8183141946792603e-05, 2.070702612400055e-05, 2.3230910301208496e-05, 2.5754794478416443e-05, 2.827867865562439e-05, 3.0802562832832336e-05, 3.332644701004028e-05, 3.585033118724823e-05, 3.837421536445618e-05, 4.0898099541664124e-05, 4.342198371887207e-05, 4.594586789608002e-05, 4.8469752073287964e-05, 5.099363625049591e-05, 5.351752042770386e-05, 5.6041404604911804e-05, 5.856528878211975e-05, 6.10891729593277e-05, 6.361305713653564e-05, 6.613694131374359e-05, 6.866082549095154e-05, 7.118470966815948e-05, 7.370859384536743e-05, 7.623247802257538e-05, 7.875636219978333e-05, 8.128024637699127e-05, 8.380413055419922e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 1.0, 3.0, 6.0, 10.0, 17.0, 16.0, 19.0, 22.0, 52.0, 88.0, 121.0, 216.0, 311.0, 580.0, 1134.0, 2575.0, 6361.0, 27516.0, 310319.0, 633411.0, 50336.0, 9045.0, 3175.0, 1482.0, 749.0, 388.0, 240.0, 116.0, 82.0, 57.0, 36.0, 23.0, 11.0, 9.0, 8.0, 4.0, 3.0, 7.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.2322998046875, -0.2254962921142578, -0.21869277954101562, -0.21188926696777344, -0.20508575439453125, -0.19828224182128906, -0.19147872924804688, -0.1846752166748047, -0.1778717041015625, -0.1710681915283203, -0.16426467895507812, -0.15746116638183594, -0.15065765380859375, -0.14385414123535156, -0.13705062866210938, -0.1302471160888672, -0.123443603515625, -0.11664009094238281, -0.10983657836914062, -0.10303306579589844, -0.09622955322265625, -0.08942604064941406, -0.08262252807617188, -0.07581901550292969, -0.0690155029296875, -0.06221199035644531, -0.055408477783203125, -0.04860496520996094, -0.04180145263671875, -0.03499794006347656, -0.028194427490234375, -0.021390914916992188, -0.01458740234375, -0.0077838897705078125, -0.000980377197265625, 0.0058231353759765625, 0.01262664794921875, 0.019430160522460938, 0.026233673095703125, 0.03303718566894531, 0.0398406982421875, 0.04664421081542969, 0.053447723388671875, 0.06025123596191406, 0.06705474853515625, 0.07385826110839844, 0.08066177368164062, 0.08746528625488281, 0.094268798828125, 0.10107231140136719, 0.10787582397460938, 0.11467933654785156, 0.12148284912109375, 0.12828636169433594, 0.13508987426757812, 0.1418933868408203, 0.1486968994140625, 0.1555004119873047, 0.16230392456054688, 0.16910743713378906, 0.17591094970703125, 0.18271446228027344, 0.18951797485351562, 0.1963214874267578, 0.203125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 8.0, 5.0, 4.0, 3.0, 12.0, 15.0, 34.0, 24.0, 43.0, 72.0, 73.0, 135.0, 175.0, 112.0, 83.0, 64.0, 47.0, 30.0, 19.0, 11.0, 8.0, 8.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1751708984375, -0.17006874084472656, -0.16496658325195312, -0.1598644256591797, -0.15476226806640625, -0.1496601104736328, -0.14455795288085938, -0.13945579528808594, -0.1343536376953125, -0.12925148010253906, -0.12414932250976562, -0.11904716491699219, -0.11394500732421875, -0.10884284973144531, -0.10374069213867188, -0.09863853454589844, -0.093536376953125, -0.08843421936035156, -0.08333206176757812, -0.07822990417480469, -0.07312774658203125, -0.06802558898925781, -0.06292343139648438, -0.05782127380371094, -0.0527191162109375, -0.04761695861816406, -0.042514801025390625, -0.03741264343261719, -0.03231048583984375, -0.027208328247070312, -0.022106170654296875, -0.017004013061523438, -0.01190185546875, -0.0067996978759765625, -0.001697540283203125, 0.0034046173095703125, 0.00850677490234375, 0.013608932495117188, 0.018711090087890625, 0.023813247680664062, 0.0289154052734375, 0.03401756286621094, 0.039119720458984375, 0.04422187805175781, 0.04932403564453125, 0.05442619323730469, 0.059528350830078125, 0.06463050842285156, 0.069732666015625, 0.07483482360839844, 0.07993698120117188, 0.08503913879394531, 0.09014129638671875, 0.09524345397949219, 0.10034561157226562, 0.10544776916503906, 0.1105499267578125, 0.11565208435058594, 0.12075424194335938, 0.1258563995361328, 0.13095855712890625, 0.1360607147216797, 0.14116287231445312, 0.14626502990722656, 0.1513671875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 9.0, 14.0, 38.0, 54.0, 77.0, 115.0, 150.0, 159.0, 131.0, 91.0, 68.0, 43.0, 22.0, 12.0, 11.0, 8.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.583528995513916, -1.5179442167282104, -1.4523593187332153, -1.3867745399475098, -1.3211896419525146, -1.255604863166809, -1.1900200843811035, -1.1244351863861084, -1.0588504076004028, -0.9932655692100525, -0.9276807308197021, -0.8620959520339966, -0.7965111136436462, -0.7309262752532959, -0.6653414964675903, -0.59975665807724, -0.5341718196868896, -0.4685869812965393, -0.40300217270851135, -0.3374173641204834, -0.27183252573013306, -0.20624768733978271, -0.14066287875175476, -0.0750780701637268, -0.009493231773376465, 0.05609159171581268, 0.12167641520500183, 0.18726123869419098, 0.2528460621833801, 0.31843090057373047, 0.3840157091617584, 0.4496005177497864, 0.5151851177215576, 0.580769956111908, 0.6463547945022583, 0.7119395732879639, 0.7775244116783142, 0.8431092500686646, 0.9086940288543701, 0.9742788672447205, 1.0398637056350708, 1.1054484844207764, 1.1710333824157715, 1.236618161201477, 1.3022029399871826, 1.3677878379821777, 1.4333726167678833, 1.4989573955535889, 1.564542293548584, 1.6301270723342896, 1.6957119703292847, 1.7612967491149902, 1.8268816471099854, 1.892466425895691, 1.9580512046813965, 2.0236361026763916, 2.0892210006713867, 2.154805898666382, 2.220390558242798, 2.285975456237793, 2.351560354232788, 2.417145252227783, 2.482729911804199, 2.5483148097991943, 2.6138994693756104]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 5.0, 2.0, 5.0, 11.0, 9.0, 9.0, 11.0, 17.0, 19.0, 17.0, 17.0, 22.0, 30.0, 22.0, 29.0, 31.0, 36.0, 35.0, 31.0, 39.0, 47.0, 53.0, 48.0, 37.0, 49.0, 31.0, 43.0, 39.0, 42.0, 38.0, 28.0, 17.0, 21.0, 19.0, 15.0, 10.0, 15.0, 13.0, 8.0, 7.0, 9.0, 6.0, 3.0, 3.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0], "bins": [-1.1979303359985352, -1.1631454229354858, -1.1283605098724365, -1.0935757160186768, -1.0587908029556274, -1.0240058898925781, -0.9892209768295288, -0.9544361233711243, -0.9196512699127197, -0.8848663568496704, -0.8500815033912659, -0.8152965903282166, -0.780511736869812, -0.7457268238067627, -0.7109419107437134, -0.6761570572853088, -0.6413721442222595, -0.6065872311592102, -0.5718023777008057, -0.5370174646377563, -0.5022326111793518, -0.4674476981163025, -0.43266281485557556, -0.39787793159484863, -0.3630930483341217, -0.3283081650733948, -0.29352328181266785, -0.2587383985519409, -0.2239535003900528, -0.18916861712932587, -0.15438371896743774, -0.11959883570671082, -0.08481395244598389, -0.05002906545996666, -0.015244178473949432, 0.019540712237358093, 0.05432559549808502, 0.08911047875881195, 0.12389537692070007, 0.158680260181427, 0.19346514344215393, 0.22825002670288086, 0.2630349099636078, 0.2978197932243347, 0.33260470628738403, 0.3673895597457886, 0.4021744728088379, 0.4369593560695648, 0.47174423933029175, 0.5065291523933411, 0.5413140058517456, 0.5760989189147949, 0.6108837723731995, 0.6456686854362488, 0.6804535388946533, 0.7152384519577026, 0.750023365020752, 0.7848082780838013, 0.8195931315422058, 0.8543780446052551, 0.8891628980636597, 0.923947811126709, 0.9587327241897583, 0.9935175776481628, 1.0283024311065674]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 1.0, 1.0, 4.0, 3.0, 7.0, 10.0, 10.0, 10.0, 25.0, 30.0, 35.0, 49.0, 96.0, 126.0, 171.0, 280.0, 486.0, 836.0, 1331.0, 2272.0, 4554.0, 8752.0, 18639.0, 43829.0, 125255.0, 669655.0, 2987207.0, 214559.0, 64743.0, 25998.0, 11850.0, 5945.0, 3177.0, 1764.0, 979.0, 583.0, 361.0, 219.0, 142.0, 94.0, 66.0, 42.0, 32.0, 24.0, 16.0, 3.0, 12.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1488037109375, -0.1438770294189453, -0.13895034790039062, -0.13402366638183594, -0.12909698486328125, -0.12417030334472656, -0.11924362182617188, -0.11431694030761719, -0.1093902587890625, -0.10446357727050781, -0.09953689575195312, -0.09461021423339844, -0.08968353271484375, -0.08475685119628906, -0.07983016967773438, -0.07490348815917969, -0.069976806640625, -0.06505012512207031, -0.060123443603515625, -0.05519676208496094, -0.05027008056640625, -0.04534339904785156, -0.040416717529296875, -0.03549003601074219, -0.0305633544921875, -0.025636672973632812, -0.020709991455078125, -0.015783309936523438, -0.01085662841796875, -0.0059299468994140625, -0.001003265380859375, 0.0039234161376953125, 0.00885009765625, 0.013776779174804688, 0.018703460693359375, 0.023630142211914062, 0.02855682373046875, 0.03348350524902344, 0.038410186767578125, 0.04333686828613281, 0.0482635498046875, 0.05319023132324219, 0.058116912841796875, 0.06304359436035156, 0.06797027587890625, 0.07289695739746094, 0.07782363891601562, 0.08275032043457031, 0.087677001953125, 0.09260368347167969, 0.09753036499023438, 0.10245704650878906, 0.10738372802734375, 0.11231040954589844, 0.11723709106445312, 0.12216377258300781, 0.1270904541015625, 0.1320171356201172, 0.13694381713867188, 0.14187049865722656, 0.14679718017578125, 0.15172386169433594, 0.15665054321289062, 0.1615772247314453, 0.16650390625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 9.0, 6.0, 12.0, 8.0, 9.0, 24.0, 21.0, 23.0, 26.0, 27.0, 28.0, 32.0, 40.0, 38.0, 33.0, 57.0, 46.0, 60.0, 46.0, 47.0, 40.0, 39.0, 54.0, 38.0, 31.0, 30.0, 29.0, 30.0, 21.0, 15.0, 19.0, 13.0, 11.0, 8.0, 9.0, 6.0, 5.0, 2.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.047943115234375, -0.04653644561767578, -0.04512977600097656, -0.043723106384277344, -0.042316436767578125, -0.040909767150878906, -0.03950309753417969, -0.03809642791748047, -0.03668975830078125, -0.03528308868408203, -0.03387641906738281, -0.032469749450683594, -0.031063079833984375, -0.029656410217285156, -0.028249740600585938, -0.02684307098388672, -0.0254364013671875, -0.02402973175048828, -0.022623062133789062, -0.021216392517089844, -0.019809722900390625, -0.018403053283691406, -0.016996383666992188, -0.015589714050292969, -0.01418304443359375, -0.012776374816894531, -0.011369705200195312, -0.009963035583496094, -0.008556365966796875, -0.007149696350097656, -0.0057430267333984375, -0.004336357116699219, -0.0029296875, -0.0015230178833007812, -0.0001163482666015625, 0.0012903213500976562, 0.002696990966796875, 0.004103660583496094, 0.0055103302001953125, 0.006916999816894531, 0.00832366943359375, 0.009730339050292969, 0.011137008666992188, 0.012543678283691406, 0.013950347900390625, 0.015357017517089844, 0.016763687133789062, 0.01817035675048828, 0.0195770263671875, 0.02098369598388672, 0.022390365600585938, 0.023797035217285156, 0.025203704833984375, 0.026610374450683594, 0.028017044067382812, 0.02942371368408203, 0.03083038330078125, 0.03223705291748047, 0.03364372253417969, 0.035050392150878906, 0.036457061767578125, 0.037863731384277344, 0.03927040100097656, 0.04067707061767578, 0.042083740234375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 4.0, 6.0, 7.0, 7.0, 8.0, 14.0, 26.0, 35.0, 31.0, 53.0, 79.0, 132.0, 168.0, 224.0, 371.0, 594.0, 1083.0, 2144.0, 5289.0, 15918.0, 64077.0, 463158.0, 3385403.0, 199435.0, 37699.0, 10504.0, 3797.0, 1637.0, 832.0, 483.0, 331.0, 252.0, 137.0, 98.0, 66.0, 57.0, 33.0, 20.0, 21.0, 16.0, 13.0, 8.0, 4.0, 3.0, 3.0, 1.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.27783203125, -0.2672767639160156, -0.25672149658203125, -0.24616622924804688, -0.2356109619140625, -0.22505569458007812, -0.21450042724609375, -0.20394515991210938, -0.193389892578125, -0.18283462524414062, -0.17227935791015625, -0.16172409057617188, -0.1511688232421875, -0.14061355590820312, -0.13005828857421875, -0.11950302124023438, -0.10894775390625, -0.09839248657226562, -0.08783721923828125, -0.07728195190429688, -0.0667266845703125, -0.056171417236328125, -0.04561614990234375, -0.035060882568359375, -0.024505615234375, -0.013950347900390625, -0.00339508056640625, 0.007160186767578125, 0.0177154541015625, 0.028270721435546875, 0.03882598876953125, 0.049381256103515625, 0.0599365234375, 0.07049179077148438, 0.08104705810546875, 0.09160232543945312, 0.1021575927734375, 0.11271286010742188, 0.12326812744140625, 0.13382339477539062, 0.144378662109375, 0.15493392944335938, 0.16548919677734375, 0.17604446411132812, 0.1865997314453125, 0.19715499877929688, 0.20771026611328125, 0.21826553344726562, 0.22882080078125, 0.23937606811523438, 0.24993133544921875, 0.2604866027832031, 0.2710418701171875, 0.2815971374511719, 0.29215240478515625, 0.3027076721191406, 0.313262939453125, 0.3238182067871094, 0.33437347412109375, 0.3449287414550781, 0.3554840087890625, 0.3660392761230469, 0.37659454345703125, 0.3871498107910156, 0.397705078125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 3.0, 9.0, 9.0, 9.0, 20.0, 32.0, 32.0, 75.0, 131.0, 256.0, 1021.0, 1721.0, 310.0, 207.0, 90.0, 53.0, 26.0, 27.0, 15.0, 7.0, 7.0, 4.0, 6.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.27099609375, -0.2645606994628906, -0.25812530517578125, -0.2516899108886719, -0.2452545166015625, -0.23881912231445312, -0.23238372802734375, -0.22594833374023438, -0.219512939453125, -0.21307754516601562, -0.20664215087890625, -0.20020675659179688, -0.1937713623046875, -0.18733596801757812, -0.18090057373046875, -0.17446517944335938, -0.16802978515625, -0.16159439086914062, -0.15515899658203125, -0.14872360229492188, -0.1422882080078125, -0.13585281372070312, -0.12941741943359375, -0.12298202514648438, -0.116546630859375, -0.11011123657226562, -0.10367584228515625, -0.09724044799804688, -0.0908050537109375, -0.08436965942382812, -0.07793426513671875, -0.07149887084960938, -0.0650634765625, -0.058628082275390625, -0.05219268798828125, -0.045757293701171875, -0.0393218994140625, -0.032886505126953125, -0.02645111083984375, -0.020015716552734375, -0.013580322265625, -0.007144927978515625, -0.00070953369140625, 0.005725860595703125, 0.0121612548828125, 0.018596649169921875, 0.02503204345703125, 0.031467437744140625, 0.03790283203125, 0.044338226318359375, 0.05077362060546875, 0.057209014892578125, 0.0636444091796875, 0.07007980346679688, 0.07651519775390625, 0.08295059204101562, 0.089385986328125, 0.09582138061523438, 0.10225677490234375, 0.10869216918945312, 0.1151275634765625, 0.12156295776367188, 0.12799835205078125, 0.13443374633789062, 0.140869140625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 7.0, 13.0, 29.0, 70.0, 204.0, 324.0, 223.0, 101.0, 19.0, 13.0, 4.0, 4.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.812553882598877, -3.7325737476348877, -3.6525933742523193, -3.57261323928833, -3.492633104324341, -3.4126529693603516, -3.332672595977783, -3.252692461013794, -3.1727123260498047, -3.0927321910858154, -3.012751817703247, -2.932771682739258, -2.8527915477752686, -2.7728114128112793, -2.692831039428711, -2.6128509044647217, -2.5328707695007324, -2.452890634536743, -2.372910261154175, -2.2929301261901855, -2.2129499912261963, -2.132969856262207, -2.0529894828796387, -1.9730093479156494, -1.893028974533081, -1.8130487203598022, -1.733068585395813, -1.6530883312225342, -1.573108196258545, -1.4931279420852661, -1.4131476879119873, -1.333167552947998, -1.2531875371932983, -1.1732072830200195, -1.0932271480560303, -1.0132468938827515, -0.9332667589187622, -0.8532865047454834, -0.7733063101768494, -0.6933261156082153, -0.6133459210395813, -0.5333657264709473, -0.45338553190231323, -0.3734053075313568, -0.2934251129627228, -0.21344491839408875, -0.13346469402313232, -0.05348449945449829, 0.026495695114135742, 0.10647589713335037, 0.186456099152565, 0.26643630862236023, 0.34641650319099426, 0.4263966977596283, 0.5063769221305847, 0.5863571166992188, 0.6663373112678528, 0.7463175058364868, 0.8262977004051208, 0.9062778949737549, 0.9862581491470337, 1.066238284111023, 1.1462185382843018, 1.226198673248291, 1.3061789274215698]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 6.0, 6.0, 12.0, 15.0, 13.0, 25.0, 32.0, 28.0, 44.0, 28.0, 39.0, 24.0, 37.0, 45.0, 44.0, 54.0, 56.0, 45.0, 39.0, 50.0, 42.0, 35.0, 46.0, 36.0, 36.0, 33.0, 32.0, 21.0, 13.0, 11.0, 14.0, 8.0, 10.0, 9.0, 10.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5369692444801331, -0.5185194611549377, -0.5000696778297424, -0.4816198945045471, -0.4631701111793518, -0.4447203278541565, -0.4262705147266388, -0.4078207314014435, -0.38937094807624817, -0.37092116475105286, -0.35247138142585754, -0.33402159810066223, -0.31557178497314453, -0.2971220016479492, -0.2786722183227539, -0.2602224349975586, -0.24177265167236328, -0.22332286834716797, -0.20487308502197266, -0.18642328679561615, -0.16797350347042084, -0.14952372014522552, -0.13107392191886902, -0.1126241385936737, -0.0941743552684784, -0.07572457194328308, -0.05727478116750717, -0.03882499411702156, -0.02037520706653595, -0.0019254237413406372, 0.016524367034435272, 0.03497415781021118, 0.05342400074005127, 0.07187378406524658, 0.09032357484102249, 0.1087733656167984, 0.1272231489419937, 0.14567293226718903, 0.16412273049354553, 0.18257251381874084, 0.20102229714393616, 0.21947208046913147, 0.23792186379432678, 0.2563716471195221, 0.2748214602470398, 0.2932712435722351, 0.3117210268974304, 0.33017081022262573, 0.34862059354782104, 0.36707037687301636, 0.38552016019821167, 0.403969943523407, 0.4224197268486023, 0.4408695101737976, 0.4593193233013153, 0.4777691066265106, 0.49621888995170593, 0.5146687030792236, 0.533118486404419, 0.5515682697296143, 0.5700180530548096, 0.5884678363800049, 0.6069176197052002, 0.6253674030303955, 0.6438171863555908]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 4.0, 5.0, 1.0, 7.0, 18.0, 26.0, 29.0, 55.0, 78.0, 131.0, 187.0, 260.0, 438.0, 767.0, 1336.0, 2276.0, 4100.0, 7388.0, 14121.0, 27267.0, 53901.0, 109728.0, 213314.0, 271654.0, 169939.0, 83604.0, 41551.0, 21521.0, 10907.0, 5923.0, 3407.0, 1841.0, 1131.0, 614.0, 382.0, 234.0, 148.0, 92.0, 50.0, 42.0, 29.0, 21.0, 6.0, 12.0, 2.0, 4.0, 3.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1317138671875, -0.1276378631591797, -0.12356185913085938, -0.11948585510253906, -0.11540985107421875, -0.11133384704589844, -0.10725784301757812, -0.10318183898925781, -0.0991058349609375, -0.09502983093261719, -0.09095382690429688, -0.08687782287597656, -0.08280181884765625, -0.07872581481933594, -0.07464981079101562, -0.07057380676269531, -0.066497802734375, -0.06242179870605469, -0.058345794677734375, -0.05426979064941406, -0.05019378662109375, -0.04611778259277344, -0.042041778564453125, -0.03796577453613281, -0.0338897705078125, -0.029813766479492188, -0.025737762451171875, -0.021661758422851562, -0.01758575439453125, -0.013509750366210938, -0.009433746337890625, -0.0053577423095703125, -0.00128173828125, 0.0027942657470703125, 0.006870269775390625, 0.010946273803710938, 0.01502227783203125, 0.019098281860351562, 0.023174285888671875, 0.027250289916992188, 0.0313262939453125, 0.03540229797363281, 0.039478302001953125, 0.04355430603027344, 0.04763031005859375, 0.05170631408691406, 0.055782318115234375, 0.05985832214355469, 0.063934326171875, 0.06801033020019531, 0.07208633422851562, 0.07616233825683594, 0.08023834228515625, 0.08431434631347656, 0.08839035034179688, 0.09246635437011719, 0.0965423583984375, 0.10061836242675781, 0.10469436645507812, 0.10877037048339844, 0.11284637451171875, 0.11692237854003906, 0.12099838256835938, 0.1250743865966797, 0.129150390625]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 4.0, 2.0, 7.0, 4.0, 3.0, 6.0, 8.0, 10.0, 14.0, 23.0, 17.0, 27.0, 11.0, 29.0, 23.0, 36.0, 32.0, 42.0, 43.0, 43.0, 52.0, 42.0, 47.0, 43.0, 41.0, 33.0, 38.0, 40.0, 37.0, 28.0, 29.0, 30.0, 34.0, 21.0, 23.0, 17.0, 12.0, 15.0, 8.0, 8.0, 6.0, 4.0, 6.0, 5.0, 2.0, 3.0, 0.0, 3.0, 1.0, 2.0], "bins": [-0.053375244140625, -0.05192375183105469, -0.050472259521484375, -0.04902076721191406, -0.04756927490234375, -0.04611778259277344, -0.044666290283203125, -0.04321479797363281, -0.0417633056640625, -0.04031181335449219, -0.038860321044921875, -0.03740882873535156, -0.03595733642578125, -0.03450584411621094, -0.033054351806640625, -0.03160285949707031, -0.0301513671875, -0.028699874877929688, -0.027248382568359375, -0.025796890258789062, -0.02434539794921875, -0.022893905639648438, -0.021442413330078125, -0.019990921020507812, -0.0185394287109375, -0.017087936401367188, -0.015636444091796875, -0.014184951782226562, -0.01273345947265625, -0.011281967163085938, -0.009830474853515625, -0.008378982543945312, -0.006927490234375, -0.0054759979248046875, -0.004024505615234375, -0.0025730133056640625, -0.00112152099609375, 0.0003299713134765625, 0.001781463623046875, 0.0032329559326171875, 0.0046844482421875, 0.0061359405517578125, 0.007587432861328125, 0.009038925170898438, 0.01049041748046875, 0.011941909790039062, 0.013393402099609375, 0.014844894409179688, 0.01629638671875, 0.017747879028320312, 0.019199371337890625, 0.020650863647460938, 0.02210235595703125, 0.023553848266601562, 0.025005340576171875, 0.026456832885742188, 0.0279083251953125, 0.029359817504882812, 0.030811309814453125, 0.03226280212402344, 0.03371429443359375, 0.03516578674316406, 0.036617279052734375, 0.03806877136230469, 0.039520263671875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 6.0, 5.0, 6.0, 6.0, 13.0, 10.0, 23.0, 30.0, 35.0, 46.0, 65.0, 97.0, 141.0, 224.0, 377.0, 571.0, 1283.0, 2760.0, 7724.0, 28573.0, 148352.0, 596558.0, 207935.0, 37562.0, 9483.0, 3300.0, 1400.0, 697.0, 430.0, 262.0, 183.0, 139.0, 79.0, 44.0, 38.0, 36.0, 22.0, 12.0, 9.0, 12.0, 4.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.38037109375, -0.3699760437011719, -0.35958099365234375, -0.3491859436035156, -0.3387908935546875, -0.3283958435058594, -0.31800079345703125, -0.3076057434082031, -0.297210693359375, -0.2868156433105469, -0.27642059326171875, -0.2660255432128906, -0.2556304931640625, -0.24523544311523438, -0.23484039306640625, -0.22444534301757812, -0.21405029296875, -0.20365524291992188, -0.19326019287109375, -0.18286514282226562, -0.1724700927734375, -0.16207504272460938, -0.15167999267578125, -0.14128494262695312, -0.130889892578125, -0.12049484252929688, -0.11009979248046875, -0.09970474243164062, -0.0893096923828125, -0.07891464233398438, -0.06851959228515625, -0.058124542236328125, -0.0477294921875, -0.037334442138671875, -0.02693939208984375, -0.016544342041015625, -0.0061492919921875, 0.004245758056640625, 0.01464080810546875, 0.025035858154296875, 0.035430908203125, 0.045825958251953125, 0.05622100830078125, 0.06661605834960938, 0.0770111083984375, 0.08740615844726562, 0.09780120849609375, 0.10819625854492188, 0.11859130859375, 0.12898635864257812, 0.13938140869140625, 0.14977645874023438, 0.1601715087890625, 0.17056655883789062, 0.18096160888671875, 0.19135665893554688, 0.201751708984375, 0.21214675903320312, 0.22254180908203125, 0.23293685913085938, 0.2433319091796875, 0.2537269592285156, 0.26412200927734375, 0.2745170593261719, 0.284912109375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 6.0, 3.0, 3.0, 5.0, 5.0, 8.0, 18.0, 12.0, 12.0, 23.0, 20.0, 20.0, 17.0, 33.0, 45.0, 36.0, 37.0, 39.0, 49.0, 55.0, 55.0, 58.0, 52.0, 51.0, 46.0, 41.0, 34.0, 28.0, 33.0, 38.0, 30.0, 19.0, 17.0, 12.0, 12.0, 7.0, 13.0, 4.0, 3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.36083984375, -0.3508110046386719, -0.34078216552734375, -0.3307533264160156, -0.3207244873046875, -0.3106956481933594, -0.30066680908203125, -0.2906379699707031, -0.280609130859375, -0.2705802917480469, -0.26055145263671875, -0.2505226135253906, -0.2404937744140625, -0.23046493530273438, -0.22043609619140625, -0.21040725708007812, -0.20037841796875, -0.19034957885742188, -0.18032073974609375, -0.17029190063476562, -0.1602630615234375, -0.15023422241210938, -0.14020538330078125, -0.13017654418945312, -0.120147705078125, -0.11011886596679688, -0.10009002685546875, -0.09006118774414062, -0.0800323486328125, -0.07000350952148438, -0.05997467041015625, -0.049945831298828125, -0.0399169921875, -0.029888153076171875, -0.01985931396484375, -0.009830474853515625, 0.0001983642578125, 0.010227203369140625, 0.02025604248046875, 0.030284881591796875, 0.040313720703125, 0.050342559814453125, 0.06037139892578125, 0.07040023803710938, 0.0804290771484375, 0.09045791625976562, 0.10048675537109375, 0.11051559448242188, 0.12054443359375, 0.13057327270507812, 0.14060211181640625, 0.15063095092773438, 0.1606597900390625, 0.17068862915039062, 0.18071746826171875, 0.19074630737304688, 0.200775146484375, 0.21080398559570312, 0.22083282470703125, 0.23086166381835938, 0.2408905029296875, 0.2509193420410156, 0.26094818115234375, 0.2709770202636719, 0.281005859375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 8.0, 2.0, 2.0, 3.0, 7.0, 16.0, 13.0, 22.0, 26.0, 34.0, 64.0, 105.0, 176.0, 339.0, 678.0, 1296.0, 2838.0, 7585.0, 22981.0, 98642.0, 461058.0, 354430.0, 70156.0, 17373.0, 5919.0, 2413.0, 1111.0, 556.0, 265.0, 161.0, 106.0, 55.0, 34.0, 25.0, 21.0, 9.0, 10.0, 5.0, 3.0, 4.0, 1.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1549072265625, -0.14972496032714844, -0.14454269409179688, -0.1393604278564453, -0.13417816162109375, -0.1289958953857422, -0.12381362915039062, -0.11863136291503906, -0.1134490966796875, -0.10826683044433594, -0.10308456420898438, -0.09790229797363281, -0.09272003173828125, -0.08753776550292969, -0.08235549926757812, -0.07717323303222656, -0.071990966796875, -0.06680870056152344, -0.061626434326171875, -0.05644416809082031, -0.05126190185546875, -0.04607963562011719, -0.040897369384765625, -0.03571510314941406, -0.0305328369140625, -0.025350570678710938, -0.020168304443359375, -0.014986038208007812, -0.00980377197265625, -0.0046215057373046875, 0.000560760498046875, 0.0057430267333984375, 0.01092529296875, 0.016107559204101562, 0.021289825439453125, 0.026472091674804688, 0.03165435791015625, 0.03683662414550781, 0.042018890380859375, 0.04720115661621094, 0.0523834228515625, 0.05756568908691406, 0.06274795532226562, 0.06793022155761719, 0.07311248779296875, 0.07829475402832031, 0.08347702026367188, 0.08865928649902344, 0.093841552734375, 0.09902381896972656, 0.10420608520507812, 0.10938835144042969, 0.11457061767578125, 0.11975288391113281, 0.12493515014648438, 0.13011741638183594, 0.1352996826171875, 0.14048194885253906, 0.14566421508789062, 0.1508464813232422, 0.15602874755859375, 0.1612110137939453, 0.16639328002929688, 0.17157554626464844, 0.1767578125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 3.0, 6.0, 5.0, 6.0, 7.0, 6.0, 17.0, 12.0, 13.0, 24.0, 33.0, 41.0, 34.0, 47.0, 50.0, 61.0, 59.0, 36.0, 63.0, 60.0, 52.0, 57.0, 44.0, 39.0, 35.0, 33.0, 38.0, 25.0, 17.0, 18.0, 11.0, 11.0, 10.0, 11.0, 4.0, 4.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.6372413635253906e-05, -4.494283348321915e-05, -4.351325333118439e-05, -4.208367317914963e-05, -4.065409302711487e-05, -3.922451287508011e-05, -3.779493272304535e-05, -3.636535257101059e-05, -3.493577241897583e-05, -3.350619226694107e-05, -3.207661211490631e-05, -3.064703196287155e-05, -2.9217451810836792e-05, -2.7787871658802032e-05, -2.6358291506767273e-05, -2.4928711354732513e-05, -2.3499131202697754e-05, -2.2069551050662994e-05, -2.0639970898628235e-05, -1.9210390746593475e-05, -1.7780810594558716e-05, -1.6351230442523956e-05, -1.4921650290489197e-05, -1.3492070138454437e-05, -1.2062489986419678e-05, -1.0632909834384918e-05, -9.203329682350159e-06, -7.7737495303154e-06, -6.34416937828064e-06, -4.91458922624588e-06, -3.4850090742111206e-06, -2.055428922176361e-06, -6.258487701416016e-07, 8.03731381893158e-07, 2.2333115339279175e-06, 3.662891685962677e-06, 5.0924718379974365e-06, 6.522051990032196e-06, 7.951632142066956e-06, 9.381212294101715e-06, 1.0810792446136475e-05, 1.2240372598171234e-05, 1.3669952750205994e-05, 1.5099532902240753e-05, 1.6529113054275513e-05, 1.7958693206310272e-05, 1.9388273358345032e-05, 2.081785351037979e-05, 2.224743366241455e-05, 2.367701381444931e-05, 2.510659396648407e-05, 2.653617411851883e-05, 2.796575427055359e-05, 2.939533442258835e-05, 3.082491457462311e-05, 3.225449472665787e-05, 3.368407487869263e-05, 3.5113655030727386e-05, 3.6543235182762146e-05, 3.7972815334796906e-05, 3.9402395486831665e-05, 4.0831975638866425e-05, 4.2261555790901184e-05, 4.3691135942935944e-05, 4.51207160949707e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 5.0, 4.0, 0.0, 3.0, 5.0, 6.0, 8.0, 13.0, 17.0, 36.0, 47.0, 70.0, 92.0, 129.0, 216.0, 414.0, 701.0, 1491.0, 3304.0, 8924.0, 30162.0, 142562.0, 547033.0, 244950.0, 47254.0, 12742.0, 4496.0, 1767.0, 860.0, 486.0, 284.0, 174.0, 102.0, 46.0, 55.0, 22.0, 17.0, 14.0, 10.0, 10.0, 7.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.1761474609375, -0.1709136962890625, -0.165679931640625, -0.1604461669921875, -0.15521240234375, -0.1499786376953125, -0.144744873046875, -0.1395111083984375, -0.13427734375, -0.1290435791015625, -0.123809814453125, -0.1185760498046875, -0.11334228515625, -0.1081085205078125, -0.102874755859375, -0.0976409912109375, -0.0924072265625, -0.0871734619140625, -0.081939697265625, -0.0767059326171875, -0.07147216796875, -0.0662384033203125, -0.061004638671875, -0.0557708740234375, -0.050537109375, -0.0453033447265625, -0.040069580078125, -0.0348358154296875, -0.02960205078125, -0.0243682861328125, -0.019134521484375, -0.0139007568359375, -0.0086669921875, -0.0034332275390625, 0.001800537109375, 0.0070343017578125, 0.01226806640625, 0.0175018310546875, 0.022735595703125, 0.0279693603515625, 0.033203125, 0.0384368896484375, 0.043670654296875, 0.0489044189453125, 0.05413818359375, 0.0593719482421875, 0.064605712890625, 0.0698394775390625, 0.0750732421875, 0.0803070068359375, 0.085540771484375, 0.0907745361328125, 0.09600830078125, 0.1012420654296875, 0.106475830078125, 0.1117095947265625, 0.116943359375, 0.1221771240234375, 0.127410888671875, 0.1326446533203125, 0.13787841796875, 0.1431121826171875, 0.148345947265625, 0.1535797119140625, 0.1588134765625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 1.0, 5.0, 5.0, 5.0, 8.0, 17.0, 10.0, 21.0, 32.0, 49.0, 62.0, 73.0, 98.0, 88.0, 110.0, 100.0, 93.0, 62.0, 31.0, 27.0, 29.0, 17.0, 14.0, 15.0, 5.0, 6.0, 5.0, 3.0, 2.0, 3.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.1875, -0.18230819702148438, -0.17711639404296875, -0.17192459106445312, -0.1667327880859375, -0.16154098510742188, -0.15634918212890625, -0.15115737915039062, -0.145965576171875, -0.14077377319335938, -0.13558197021484375, -0.13039016723632812, -0.1251983642578125, -0.12000656127929688, -0.11481475830078125, -0.10962295532226562, -0.10443115234375, -0.09923934936523438, -0.09404754638671875, -0.08885574340820312, -0.0836639404296875, -0.07847213745117188, -0.07328033447265625, -0.06808853149414062, -0.062896728515625, -0.057704925537109375, -0.05251312255859375, -0.047321319580078125, -0.0421295166015625, -0.036937713623046875, -0.03174591064453125, -0.026554107666015625, -0.0213623046875, -0.016170501708984375, -0.01097869873046875, -0.005786895751953125, -0.0005950927734375, 0.004596710205078125, 0.00978851318359375, 0.014980316162109375, 0.020172119140625, 0.025363922119140625, 0.03055572509765625, 0.035747528076171875, 0.0409393310546875, 0.046131134033203125, 0.05132293701171875, 0.056514739990234375, 0.06170654296875, 0.06689834594726562, 0.07209014892578125, 0.07728195190429688, 0.0824737548828125, 0.08766555786132812, 0.09285736083984375, 0.09804916381835938, 0.103240966796875, 0.10843276977539062, 0.11362457275390625, 0.11881637573242188, 0.1240081787109375, 0.12919998168945312, 0.13439178466796875, 0.13958358764648438, 0.144775390625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 16.0, 63.0, 181.0, 290.0, 263.0, 153.0, 27.0, 11.0, 7.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2634855508804321, -1.082746982574463, -0.9020082950592041, -0.7212697267532349, -0.5405310988426208, -0.35979247093200684, -0.1790539026260376, 0.0016847848892211914, 0.18242335319519043, 0.36316198110580444, 0.5439006090164185, 0.7246391773223877, 0.9053778052330017, 1.0861164331436157, 1.266855001449585, 1.4475936889648438, 1.628332257270813, 1.8090708255767822, 1.989809513092041, 2.1705479621887207, 2.3512866497039795, 2.5320253372192383, 2.712763786315918, 2.893502712249756, 3.0742411613464355, 3.2549798488616943, 3.435718297958374, 3.616456985473633, 3.7971956729888916, 3.9779343605041504, 4.15867280960083, 4.339411735534668, 4.5201497077941895, 4.700888156890869, 4.881627082824707, 5.062365531921387, 5.243103981018066, 5.423842906951904, 5.604581356048584, 5.785320281982422, 5.966058731079102, 6.146797180175781, 6.327536106109619, 6.508274555206299, 6.6890130043029785, 6.869751930236816, 7.050490379333496, 7.231228828430176, 7.4119672775268555, 7.592705726623535, 7.773444652557373, 7.954183101654053, 8.13492202758789, 8.31566047668457, 8.49639892578125, 8.67713737487793, 8.857876777648926, 9.038615226745605, 9.219353675842285, 9.400093078613281, 9.580831527709961, 9.76156997680664, 9.94230842590332, 10.123046875, 10.30378532409668]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 5.0, 6.0, 6.0, 11.0, 7.0, 13.0, 6.0, 24.0, 15.0, 23.0, 17.0, 32.0, 32.0, 32.0, 44.0, 62.0, 45.0, 46.0, 48.0, 47.0, 41.0, 47.0, 43.0, 47.0, 41.0, 39.0, 51.0, 34.0, 29.0, 11.0, 19.0, 16.0, 14.0, 12.0, 9.0, 4.0, 10.0, 6.0, 7.0, 4.0, 5.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.7388379573822021, -1.6875922679901123, -1.636346459388733, -1.585100769996643, -1.5338549613952637, -1.4826092720031738, -1.431363582611084, -1.3801178932189941, -1.3288720846176147, -1.277626395225525, -1.2263805866241455, -1.1751348972320557, -1.1238892078399658, -1.0726433992385864, -1.0213977098464966, -0.970151960849762, -0.9189062118530273, -0.8676604628562927, -0.8164147138595581, -0.7651690244674683, -0.7139232754707336, -0.662677526473999, -0.6114318370819092, -0.5601860880851746, -0.5089403390884399, -0.4576945900917053, -0.4064488708972931, -0.35520315170288086, -0.30395740270614624, -0.2527116537094116, -0.2014659345149994, -0.15022021532058716, -0.09897446632385254, -0.047728732228279114, 0.0035170018672943115, 0.05476273596286774, 0.10600847005844116, 0.15725421905517578, 0.208499938249588, 0.25974565744400024, 0.31099140644073486, 0.3622371554374695, 0.4134828746318817, 0.46472859382629395, 0.5159743428230286, 0.5672200918197632, 0.618465781211853, 0.6697115302085876, 0.7209572792053223, 0.7722030282020569, 0.8234487771987915, 0.8746944665908813, 0.925940215587616, 0.9771859645843506, 1.0284316539764404, 1.0796773433685303, 1.1309231519699097, 1.1821688413619995, 1.233414649963379, 1.2846603393554688, 1.3359060287475586, 1.387151837348938, 1.4383975267410278, 1.4896433353424072, 1.540889024734497]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 7.0, 3.0, 4.0, 12.0, 9.0, 19.0, 20.0, 36.0, 57.0, 69.0, 85.0, 152.0, 222.0, 366.0, 669.0, 1152.0, 2123.0, 4441.0, 10911.0, 39514.0, 3783656.0, 304383.0, 28948.0, 8917.0, 3840.0, 1998.0, 1020.0, 581.0, 380.0, 232.0, 137.0, 109.0, 56.0, 61.0, 25.0, 23.0, 18.0, 7.0, 8.0, 8.0, 3.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.36962890625, -0.3593330383300781, -0.34903717041015625, -0.3387413024902344, -0.3284454345703125, -0.3181495666503906, -0.30785369873046875, -0.2975578308105469, -0.287261962890625, -0.2769660949707031, -0.26667022705078125, -0.2563743591308594, -0.2460784912109375, -0.23578262329101562, -0.22548675537109375, -0.21519088745117188, -0.20489501953125, -0.19459915161132812, -0.18430328369140625, -0.17400741577148438, -0.1637115478515625, -0.15341567993164062, -0.14311981201171875, -0.13282394409179688, -0.122528076171875, -0.11223220825195312, -0.10193634033203125, -0.09164047241210938, -0.0813446044921875, -0.07104873657226562, -0.06075286865234375, -0.050457000732421875, -0.0401611328125, -0.029865264892578125, -0.01956939697265625, -0.009273529052734375, 0.0010223388671875, 0.011318206787109375, 0.02161407470703125, 0.031909942626953125, 0.042205810546875, 0.052501678466796875, 0.06279754638671875, 0.07309341430664062, 0.0833892822265625, 0.09368515014648438, 0.10398101806640625, 0.11427688598632812, 0.12457275390625, 0.13486862182617188, 0.14516448974609375, 0.15546035766601562, 0.1657562255859375, 0.17605209350585938, 0.18634796142578125, 0.19664382934570312, 0.206939697265625, 0.21723556518554688, 0.22753143310546875, 0.23782730102539062, 0.2481231689453125, 0.2584190368652344, 0.26871490478515625, 0.2790107727050781, 0.289306640625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 6.0, 3.0, 6.0, 5.0, 16.0, 14.0, 9.0, 20.0, 25.0, 20.0, 30.0, 20.0, 32.0, 25.0, 40.0, 39.0, 48.0, 51.0, 46.0, 46.0, 47.0, 50.0, 34.0, 43.0, 47.0, 42.0, 41.0, 25.0, 26.0, 25.0, 22.0, 20.0, 18.0, 17.0, 11.0, 6.0, 2.0, 9.0, 1.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.056915283203125, -0.055274009704589844, -0.05363273620605469, -0.05199146270751953, -0.050350189208984375, -0.04870891571044922, -0.04706764221191406, -0.045426368713378906, -0.04378509521484375, -0.042143821716308594, -0.04050254821777344, -0.03886127471923828, -0.037220001220703125, -0.03557872772216797, -0.03393745422363281, -0.032296180725097656, -0.0306549072265625, -0.029013633728027344, -0.027372360229492188, -0.02573108673095703, -0.024089813232421875, -0.02244853973388672, -0.020807266235351562, -0.019165992736816406, -0.01752471923828125, -0.015883445739746094, -0.014242172241210938, -0.012600898742675781, -0.010959625244140625, -0.009318351745605469, -0.0076770782470703125, -0.006035804748535156, -0.00439453125, -0.0027532577514648438, -0.0011119842529296875, 0.0005292892456054688, 0.002170562744140625, 0.0038118362426757812, 0.0054531097412109375, 0.007094383239746094, 0.00873565673828125, 0.010376930236816406, 0.012018203735351562, 0.013659477233886719, 0.015300750732421875, 0.01694202423095703, 0.018583297729492188, 0.020224571228027344, 0.0218658447265625, 0.023507118225097656, 0.025148391723632812, 0.02678966522216797, 0.028430938720703125, 0.03007221221923828, 0.03171348571777344, 0.033354759216308594, 0.03499603271484375, 0.036637306213378906, 0.03827857971191406, 0.03991985321044922, 0.041561126708984375, 0.04320240020751953, 0.04484367370605469, 0.046484947204589844, 0.048126220703125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 1.0, 8.0, 9.0, 11.0, 15.0, 30.0, 25.0, 43.0, 81.0, 94.0, 184.0, 282.0, 516.0, 1263.0, 4570.0, 51646.0, 4103893.0, 25922.0, 3428.0, 1070.0, 509.0, 248.0, 175.0, 77.0, 64.0, 35.0, 31.0, 19.0, 8.0, 11.0, 3.0, 4.0, 6.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2119140625, -1.17449951171875, -1.1370849609375, -1.09967041015625, -1.062255859375, -1.02484130859375, -0.9874267578125, -0.95001220703125, -0.91259765625, -0.87518310546875, -0.8377685546875, -0.80035400390625, -0.762939453125, -0.72552490234375, -0.6881103515625, -0.65069580078125, -0.61328125, -0.57586669921875, -0.5384521484375, -0.50103759765625, -0.463623046875, -0.42620849609375, -0.3887939453125, -0.35137939453125, -0.31396484375, -0.27655029296875, -0.2391357421875, -0.20172119140625, -0.164306640625, -0.12689208984375, -0.0894775390625, -0.05206298828125, -0.0146484375, 0.02276611328125, 0.0601806640625, 0.09759521484375, 0.135009765625, 0.17242431640625, 0.2098388671875, 0.24725341796875, 0.28466796875, 0.32208251953125, 0.3594970703125, 0.39691162109375, 0.434326171875, 0.47174072265625, 0.5091552734375, 0.54656982421875, 0.583984375, 0.62139892578125, 0.6588134765625, 0.69622802734375, 0.733642578125, 0.77105712890625, 0.8084716796875, 0.84588623046875, 0.88330078125, 0.92071533203125, 0.9581298828125, 0.99554443359375, 1.032958984375, 1.07037353515625, 1.1077880859375, 1.14520263671875, 1.1826171875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 9.0, 22.0, 58.0, 114.0, 3468.0, 251.0, 76.0, 24.0, 21.0, 15.0, 4.0, 6.0, 5.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.228759765625, -0.2231426239013672, -0.21752548217773438, -0.21190834045410156, -0.20629119873046875, -0.20067405700683594, -0.19505691528320312, -0.1894397735595703, -0.1838226318359375, -0.1782054901123047, -0.17258834838867188, -0.16697120666503906, -0.16135406494140625, -0.15573692321777344, -0.15011978149414062, -0.1445026397705078, -0.138885498046875, -0.1332683563232422, -0.12765121459960938, -0.12203407287597656, -0.11641693115234375, -0.11079978942871094, -0.10518264770507812, -0.09956550598144531, -0.0939483642578125, -0.08833122253417969, -0.08271408081054688, -0.07709693908691406, -0.07147979736328125, -0.06586265563964844, -0.060245513916015625, -0.05462837219238281, -0.04901123046875, -0.04339408874511719, -0.037776947021484375, -0.03215980529785156, -0.02654266357421875, -0.020925521850585938, -0.015308380126953125, -0.009691238403320312, -0.0040740966796875, 0.0015430450439453125, 0.007160186767578125, 0.012777328491210938, 0.01839447021484375, 0.024011611938476562, 0.029628753662109375, 0.03524589538574219, 0.040863037109375, 0.04648017883300781, 0.052097320556640625, 0.05771446228027344, 0.06333160400390625, 0.06894874572753906, 0.07456588745117188, 0.08018302917480469, 0.0858001708984375, 0.09141731262207031, 0.09703445434570312, 0.10265159606933594, 0.10826873779296875, 0.11388587951660156, 0.11950302124023438, 0.1251201629638672, 0.1307373046875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 8.0, 3.0, 5.0, 5.0, 10.0, 19.0, 28.0, 50.0, 70.0, 100.0, 137.0, 144.0, 124.0, 115.0, 64.0, 45.0, 38.0, 20.0, 13.0, 8.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3986055850982666, -0.38072556257247925, -0.3628455400466919, -0.34496551752090454, -0.3270854949951172, -0.30920547246932983, -0.2913254201412201, -0.27344539761543274, -0.2555653750896454, -0.23768535256385803, -0.21980533003807068, -0.20192529261112213, -0.18404527008533478, -0.16616524755954742, -0.14828521013259888, -0.13040518760681152, -0.11252516508102417, -0.09464514255523682, -0.07676511257886887, -0.058885086327791214, -0.04100506007671356, -0.02312503755092621, -0.005245007574558258, 0.012635022401809692, 0.030515044927597046, 0.0483950711786747, 0.06627509742975235, 0.0841551274061203, 0.10203514993190765, 0.11991517245769501, 0.13779520988464355, 0.1556752324104309, 0.17355531454086304, 0.1914353370666504, 0.20931535959243774, 0.2271953970193863, 0.24507541954517365, 0.2629554271697998, 0.28083547949790955, 0.2987155020236969, 0.31659552454948425, 0.3344755470752716, 0.35235556960105896, 0.3702355921268463, 0.38811564445495605, 0.4059956669807434, 0.42387568950653076, 0.4417557120323181, 0.45963573455810547, 0.4775157570838928, 0.4953957796096802, 0.5132758021354675, 0.5311558246612549, 0.5490358471870422, 0.5669158697128296, 0.5847959518432617, 0.6026759147644043, 0.6205559372901917, 0.638435959815979, 0.6563159823417664, 0.6741960048675537, 0.6920760273933411, 0.7099560499191284, 0.7278361320495605, 0.7457161545753479]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 4.0, 2.0, 7.0, 5.0, 8.0, 12.0, 8.0, 16.0, 16.0, 24.0, 25.0, 24.0, 27.0, 32.0, 38.0, 41.0, 33.0, 34.0, 47.0, 41.0, 48.0, 48.0, 45.0, 54.0, 49.0, 49.0, 36.0, 33.0, 25.0, 27.0, 26.0, 27.0, 14.0, 24.0, 18.0, 13.0, 9.0, 10.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.24449318647384644, -0.23632627725601196, -0.2281593531370163, -0.21999244391918182, -0.21182551980018616, -0.20365861058235168, -0.1954917013645172, -0.18732477724552155, -0.17915785312652588, -0.1709909439086914, -0.16282401978969574, -0.15465711057186127, -0.1464901864528656, -0.13832327723503113, -0.13015636801719666, -0.12198944389820099, -0.11382253468036652, -0.10565561801195145, -0.09748870134353638, -0.0893217921257019, -0.08115486800670624, -0.07298795878887177, -0.0648210421204567, -0.056654125452041626, -0.048487208783626556, -0.04032029211521149, -0.03215337544679642, -0.023986462503671646, -0.015819545835256577, -0.007652629166841507, 0.0005142837762832642, 0.008681200444698334, 0.016848117113113403, 0.025015033781528473, 0.03318195044994354, 0.041348863393068314, 0.04951578006148338, 0.05768269672989845, 0.06584960967302322, 0.0740165263414383, 0.08218344300985336, 0.09035035967826843, 0.0985172763466835, 0.10668419301509857, 0.11485110223293304, 0.12301802635192871, 0.13118493556976318, 0.13935184478759766, 0.14751876890659332, 0.1556856781244278, 0.16385260224342346, 0.17201951146125793, 0.1801864355802536, 0.18835334479808807, 0.19652026891708374, 0.2046871781349182, 0.21285408735275269, 0.22102099657058716, 0.22918792068958282, 0.2373548299074173, 0.24552175402641296, 0.25368866324424744, 0.2618555724620819, 0.27002251148223877, 0.27818942070007324]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 9.0, 10.0, 20.0, 18.0, 30.0, 45.0, 71.0, 116.0, 201.0, 284.0, 471.0, 897.0, 1483.0, 2951.0, 6036.0, 12721.0, 28624.0, 64834.0, 139165.0, 246519.0, 257969.0, 154013.0, 71669.0, 31886.0, 14397.0, 6790.0, 3235.0, 1777.0, 946.0, 512.0, 282.0, 210.0, 129.0, 90.0, 46.0, 40.0, 20.0, 15.0, 10.0, 7.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.18896484375, -0.1835765838623047, -0.17818832397460938, -0.17280006408691406, -0.16741180419921875, -0.16202354431152344, -0.15663528442382812, -0.1512470245361328, -0.1458587646484375, -0.1404705047607422, -0.13508224487304688, -0.12969398498535156, -0.12430572509765625, -0.11891746520996094, -0.11352920532226562, -0.10814094543457031, -0.102752685546875, -0.09736442565917969, -0.09197616577148438, -0.08658790588378906, -0.08119964599609375, -0.07581138610839844, -0.07042312622070312, -0.06503486633300781, -0.0596466064453125, -0.05425834655761719, -0.048870086669921875, -0.04348182678222656, -0.03809356689453125, -0.03270530700683594, -0.027317047119140625, -0.021928787231445312, -0.01654052734375, -0.011152267456054688, -0.005764007568359375, -0.0003757476806640625, 0.00501251220703125, 0.010400772094726562, 0.015789031982421875, 0.021177291870117188, 0.0265655517578125, 0.03195381164550781, 0.037342071533203125, 0.04273033142089844, 0.04811859130859375, 0.05350685119628906, 0.058895111083984375, 0.06428337097167969, 0.069671630859375, 0.07505989074707031, 0.08044815063476562, 0.08583641052246094, 0.09122467041015625, 0.09661293029785156, 0.10200119018554688, 0.10738945007324219, 0.1127777099609375, 0.11816596984863281, 0.12355422973632812, 0.12894248962402344, 0.13433074951171875, 0.13971900939941406, 0.14510726928710938, 0.1504955291748047, 0.1558837890625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 5.0, 5.0, 10.0, 8.0, 12.0, 14.0, 20.0, 19.0, 32.0, 34.0, 34.0, 31.0, 44.0, 35.0, 59.0, 53.0, 55.0, 63.0, 56.0, 56.0, 42.0, 45.0, 47.0, 43.0, 44.0, 27.0, 32.0, 17.0, 17.0, 12.0, 11.0, 2.0, 5.0, 7.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08160400390625, -0.0791482925415039, -0.07669258117675781, -0.07423686981201172, -0.07178115844726562, -0.06932544708251953, -0.06686973571777344, -0.06441402435302734, -0.06195831298828125, -0.059502601623535156, -0.05704689025878906, -0.05459117889404297, -0.052135467529296875, -0.04967975616455078, -0.04722404479980469, -0.044768333435058594, -0.0423126220703125, -0.039856910705566406, -0.03740119934082031, -0.03494548797607422, -0.032489776611328125, -0.03003406524658203, -0.027578353881835938, -0.025122642517089844, -0.02266693115234375, -0.020211219787597656, -0.017755508422851562, -0.015299797058105469, -0.012844085693359375, -0.010388374328613281, -0.007932662963867188, -0.005476951599121094, -0.003021240234375, -0.0005655288696289062, 0.0018901824951171875, 0.004345893859863281, 0.006801605224609375, 0.009257316589355469, 0.011713027954101562, 0.014168739318847656, 0.01662445068359375, 0.019080162048339844, 0.021535873413085938, 0.02399158477783203, 0.026447296142578125, 0.02890300750732422, 0.03135871887207031, 0.033814430236816406, 0.0362701416015625, 0.038725852966308594, 0.04118156433105469, 0.04363727569580078, 0.046092987060546875, 0.04854869842529297, 0.05100440979003906, 0.053460121154785156, 0.05591583251953125, 0.058371543884277344, 0.06082725524902344, 0.06328296661376953, 0.06573867797851562, 0.06819438934326172, 0.07065010070800781, 0.0731058120727539, 0.0755615234375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 7.0, 8.0, 16.0, 14.0, 17.0, 26.0, 42.0, 58.0, 76.0, 125.0, 156.0, 220.0, 356.0, 590.0, 1095.0, 2266.0, 6164.0, 24554.0, 139184.0, 574057.0, 243029.0, 41159.0, 9096.0, 2872.0, 1306.0, 724.0, 422.0, 288.0, 177.0, 130.0, 82.0, 66.0, 47.0, 33.0, 20.0, 20.0, 16.0, 8.0, 9.0, 8.0, 2.0, 4.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.39697265625, -0.3851776123046875, -0.373382568359375, -0.3615875244140625, -0.34979248046875, -0.3379974365234375, -0.326202392578125, -0.3144073486328125, -0.3026123046875, -0.2908172607421875, -0.279022216796875, -0.2672271728515625, -0.25543212890625, -0.2436370849609375, -0.231842041015625, -0.2200469970703125, -0.208251953125, -0.1964569091796875, -0.184661865234375, -0.1728668212890625, -0.16107177734375, -0.1492767333984375, -0.137481689453125, -0.1256866455078125, -0.1138916015625, -0.1020965576171875, -0.090301513671875, -0.0785064697265625, -0.06671142578125, -0.0549163818359375, -0.043121337890625, -0.0313262939453125, -0.01953125, -0.0077362060546875, 0.004058837890625, 0.0158538818359375, 0.02764892578125, 0.0394439697265625, 0.051239013671875, 0.0630340576171875, 0.0748291015625, 0.0866241455078125, 0.098419189453125, 0.1102142333984375, 0.12200927734375, 0.1338043212890625, 0.145599365234375, 0.1573944091796875, 0.169189453125, 0.1809844970703125, 0.192779541015625, 0.2045745849609375, 0.21636962890625, 0.2281646728515625, 0.239959716796875, 0.2517547607421875, 0.2635498046875, 0.2753448486328125, 0.287139892578125, 0.2989349365234375, 0.31072998046875, 0.3225250244140625, 0.334320068359375, 0.3461151123046875, 0.35791015625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 7.0, 8.0, 6.0, 17.0, 13.0, 16.0, 14.0, 20.0, 22.0, 22.0, 31.0, 24.0, 35.0, 37.0, 46.0, 38.0, 45.0, 41.0, 43.0, 38.0, 43.0, 32.0, 43.0, 47.0, 37.0, 30.0, 24.0, 26.0, 31.0, 21.0, 23.0, 23.0, 22.0, 13.0, 11.0, 15.0, 9.0, 10.0, 7.0, 0.0, 1.0, 6.0, 3.0, 2.0, 5.0, 0.0, 1.0], "bins": [-0.427978515625, -0.416259765625, -0.404541015625, -0.392822265625, -0.381103515625, -0.369384765625, -0.357666015625, -0.345947265625, -0.334228515625, -0.322509765625, -0.310791015625, -0.299072265625, -0.287353515625, -0.275634765625, -0.263916015625, -0.252197265625, -0.240478515625, -0.228759765625, -0.217041015625, -0.205322265625, -0.193603515625, -0.181884765625, -0.170166015625, -0.158447265625, -0.146728515625, -0.135009765625, -0.123291015625, -0.111572265625, -0.099853515625, -0.088134765625, -0.076416015625, -0.064697265625, -0.052978515625, -0.041259765625, -0.029541015625, -0.017822265625, -0.006103515625, 0.005615234375, 0.017333984375, 0.029052734375, 0.040771484375, 0.052490234375, 0.064208984375, 0.075927734375, 0.087646484375, 0.099365234375, 0.111083984375, 0.122802734375, 0.134521484375, 0.146240234375, 0.157958984375, 0.169677734375, 0.181396484375, 0.193115234375, 0.204833984375, 0.216552734375, 0.228271484375, 0.239990234375, 0.251708984375, 0.263427734375, 0.275146484375, 0.286865234375, 0.298583984375, 0.310302734375, 0.322021484375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 5.0, 8.0, 9.0, 15.0, 11.0, 32.0, 49.0, 75.0, 99.0, 170.0, 262.0, 430.0, 792.0, 1485.0, 3002.0, 7105.0, 19581.0, 69625.0, 310408.0, 473215.0, 114843.0, 29439.0, 9710.0, 4014.0, 1868.0, 970.0, 528.0, 288.0, 153.0, 124.0, 80.0, 54.0, 31.0, 22.0, 17.0, 2.0, 7.0, 9.0, 12.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.192138671875, -0.18696975708007812, -0.18180084228515625, -0.17663192749023438, -0.1714630126953125, -0.16629409790039062, -0.16112518310546875, -0.15595626831054688, -0.150787353515625, -0.14561843872070312, -0.14044952392578125, -0.13528060913085938, -0.1301116943359375, -0.12494277954101562, -0.11977386474609375, -0.11460494995117188, -0.10943603515625, -0.10426712036132812, -0.09909820556640625, -0.09392929077148438, -0.0887603759765625, -0.08359146118164062, -0.07842254638671875, -0.07325363159179688, -0.068084716796875, -0.06291580200195312, -0.05774688720703125, -0.052577972412109375, -0.0474090576171875, -0.042240142822265625, -0.03707122802734375, -0.031902313232421875, -0.0267333984375, -0.021564483642578125, -0.01639556884765625, -0.011226654052734375, -0.0060577392578125, -0.000888824462890625, 0.00428009033203125, 0.009449005126953125, 0.014617919921875, 0.019786834716796875, 0.02495574951171875, 0.030124664306640625, 0.0352935791015625, 0.040462493896484375, 0.04563140869140625, 0.050800323486328125, 0.05596923828125, 0.061138153076171875, 0.06630706787109375, 0.07147598266601562, 0.0766448974609375, 0.08181381225585938, 0.08698272705078125, 0.09215164184570312, 0.097320556640625, 0.10248947143554688, 0.10765838623046875, 0.11282730102539062, 0.1179962158203125, 0.12316513061523438, 0.12833404541015625, 0.13350296020507812, 0.138671875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 7.0, 7.0, 9.0, 21.0, 15.0, 28.0, 43.0, 50.0, 48.0, 66.0, 79.0, 72.0, 72.0, 76.0, 77.0, 70.0, 50.0, 59.0, 41.0, 21.0, 26.0, 13.0, 13.0, 15.0, 3.0, 7.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.458427429199219e-05, -4.2698346078395844e-05, -4.08124178647995e-05, -3.8926489651203156e-05, -3.704056143760681e-05, -3.515463322401047e-05, -3.3268705010414124e-05, -3.138277679681778e-05, -2.9496848583221436e-05, -2.761092036962509e-05, -2.5724992156028748e-05, -2.3839063942432404e-05, -2.195313572883606e-05, -2.0067207515239716e-05, -1.818127930164337e-05, -1.6295351088047028e-05, -1.4409422874450684e-05, -1.252349466085434e-05, -1.0637566447257996e-05, -8.751638233661652e-06, -6.865710020065308e-06, -4.979781806468964e-06, -3.0938535928726196e-06, -1.2079253792762756e-06, 6.780028343200684e-07, 2.5639310479164124e-06, 4.449859261512756e-06, 6.3357874751091e-06, 8.221715688705444e-06, 1.0107643902301788e-05, 1.1993572115898132e-05, 1.3879500329494476e-05, 1.576542854309082e-05, 1.7651356756687164e-05, 1.9537284970283508e-05, 2.1423213183879852e-05, 2.3309141397476196e-05, 2.519506961107254e-05, 2.7080997824668884e-05, 2.8966926038265228e-05, 3.085285425186157e-05, 3.2738782465457916e-05, 3.462471067905426e-05, 3.6510638892650604e-05, 3.839656710624695e-05, 4.028249531984329e-05, 4.2168423533439636e-05, 4.405435174703598e-05, 4.5940279960632324e-05, 4.782620817422867e-05, 4.971213638782501e-05, 5.1598064601421356e-05, 5.34839928150177e-05, 5.5369921028614044e-05, 5.725584924221039e-05, 5.914177745580673e-05, 6.1027705669403076e-05, 6.291363388299942e-05, 6.479956209659576e-05, 6.668549031019211e-05, 6.857141852378845e-05, 7.04573467373848e-05, 7.234327495098114e-05, 7.422920316457748e-05, 7.611513137817383e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 3.0, 5.0, 5.0, 14.0, 18.0, 32.0, 50.0, 78.0, 145.0, 227.0, 484.0, 1203.0, 3606.0, 16141.0, 146322.0, 730744.0, 128888.0, 15009.0, 3399.0, 1181.0, 451.0, 242.0, 128.0, 61.0, 49.0, 24.0, 26.0, 10.0, 5.0, 1.0, 0.0, 6.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.356689453125, -0.34808921813964844, -0.3394889831542969, -0.3308887481689453, -0.32228851318359375, -0.3136882781982422, -0.3050880432128906, -0.29648780822753906, -0.2878875732421875, -0.27928733825683594, -0.2706871032714844, -0.2620868682861328, -0.25348663330078125, -0.2448863983154297, -0.23628616333007812, -0.22768592834472656, -0.219085693359375, -0.21048545837402344, -0.20188522338867188, -0.1932849884033203, -0.18468475341796875, -0.1760845184326172, -0.16748428344726562, -0.15888404846191406, -0.1502838134765625, -0.14168357849121094, -0.13308334350585938, -0.12448310852050781, -0.11588287353515625, -0.10728263854980469, -0.09868240356445312, -0.09008216857910156, -0.08148193359375, -0.07288169860839844, -0.06428146362304688, -0.05568122863769531, -0.04708099365234375, -0.03848075866699219, -0.029880523681640625, -0.021280288696289062, -0.0126800537109375, -0.0040798187255859375, 0.004520416259765625, 0.013120651245117188, 0.02172088623046875, 0.030321121215820312, 0.038921356201171875, 0.04752159118652344, 0.056121826171875, 0.06472206115722656, 0.07332229614257812, 0.08192253112792969, 0.09052276611328125, 0.09912300109863281, 0.10772323608398438, 0.11632347106933594, 0.1249237060546875, 0.13352394104003906, 0.14212417602539062, 0.1507244110107422, 0.15932464599609375, 0.1679248809814453, 0.17652511596679688, 0.18512535095214844, 0.1937255859375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 8.0, 2.0, 3.0, 6.0, 11.0, 16.0, 26.0, 46.0, 40.0, 57.0, 70.0, 113.0, 103.0, 105.0, 95.0, 77.0, 66.0, 52.0, 39.0, 28.0, 14.0, 9.0, 10.0, 5.0, 5.0, 3.0, 1.0, 0.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.314453125, -0.3070049285888672, -0.2995567321777344, -0.29210853576660156, -0.28466033935546875, -0.27721214294433594, -0.2697639465332031, -0.2623157501220703, -0.2548675537109375, -0.2474193572998047, -0.23997116088867188, -0.23252296447753906, -0.22507476806640625, -0.21762657165527344, -0.21017837524414062, -0.2027301788330078, -0.195281982421875, -0.1878337860107422, -0.18038558959960938, -0.17293739318847656, -0.16548919677734375, -0.15804100036621094, -0.15059280395507812, -0.1431446075439453, -0.1356964111328125, -0.1282482147216797, -0.12080001831054688, -0.11335182189941406, -0.10590362548828125, -0.09845542907714844, -0.09100723266601562, -0.08355903625488281, -0.07611083984375, -0.06866264343261719, -0.061214447021484375, -0.05376625061035156, -0.04631805419921875, -0.03886985778808594, -0.031421661376953125, -0.023973464965820312, -0.0165252685546875, -0.009077072143554688, -0.001628875732421875, 0.0058193206787109375, 0.01326751708984375, 0.020715713500976562, 0.028163909912109375, 0.03561210632324219, 0.043060302734375, 0.05050849914550781, 0.057956695556640625, 0.06540489196777344, 0.07285308837890625, 0.08030128479003906, 0.08774948120117188, 0.09519767761230469, 0.1026458740234375, 0.11009407043457031, 0.11754226684570312, 0.12499046325683594, 0.13243865966796875, 0.13988685607910156, 0.14733505249023438, 0.1547832489013672, 0.1622314453125]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 10.0, 20.0, 28.0, 48.0, 101.0, 150.0, 168.0, 144.0, 132.0, 77.0, 63.0, 28.0, 15.0, 9.0, 5.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.422314167022705, -3.3121464252471924, -3.2019784450531006, -3.091810703277588, -2.981642961502075, -2.8714752197265625, -2.7613072395324707, -2.651139497756958, -2.5409717559814453, -2.4308040142059326, -2.320636034011841, -2.210468292236328, -2.1003005504608154, -1.9901326894760132, -1.879964828491211, -1.7697970867156982, -1.6596291065216064, -1.5494612455368042, -1.4392935037612915, -1.3291256427764893, -1.2189579010009766, -1.1087900400161743, -0.9986221790313721, -0.8884543776512146, -0.7782865762710571, -0.6681187748908997, -0.5579509735107422, -0.44778311252593994, -0.33761531114578247, -0.227447509765625, -0.11727964878082275, -0.007111847400665283, 0.10305595397949219, 0.21322377026081085, 0.3233915865421295, 0.4335594177246094, 0.5437272191047668, 0.6538950204849243, 0.7640628814697266, 0.874230682849884, 0.9843984842300415, 1.0945663452148438, 1.2047340869903564, 1.3149019479751587, 1.425069808959961, 1.5352375507354736, 1.6454054117202759, 1.7555732727050781, 1.8657410144805908, 1.975908875465393, 2.0860767364501953, 2.196244478225708, 2.3064122200012207, 2.4165802001953125, 2.526747941970825, 2.636915683746338, 2.7470836639404297, 2.8572514057159424, 2.967419385910034, 3.077587127685547, 3.1877548694610596, 3.2979226112365723, 3.408090591430664, 3.5182583332061768, 3.6284260749816895]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 0.0, 4.0, 1.0, 4.0, 10.0, 7.0, 9.0, 11.0, 17.0, 17.0, 15.0, 17.0, 18.0, 26.0, 43.0, 36.0, 36.0, 41.0, 48.0, 37.0, 42.0, 57.0, 63.0, 68.0, 63.0, 40.0, 38.0, 28.0, 21.0, 26.0, 34.0, 25.0, 17.0, 21.0, 16.0, 11.0, 5.0, 8.0, 6.0, 2.0, 4.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.2215898036956787, -2.1516826152801514, -2.081775426864624, -2.0118682384490967, -1.9419611692428589, -1.8720539808273315, -1.8021469116210938, -1.7322397232055664, -1.662332534790039, -1.5924253463745117, -1.5225181579589844, -1.4526110887527466, -1.3827039003372192, -1.312796711921692, -1.242889642715454, -1.1729824542999268, -1.1030752658843994, -1.033168077468872, -0.9632609486579895, -0.8933538198471069, -0.8234466314315796, -0.7535394430160522, -0.6836323142051697, -0.6137251853942871, -0.5438179969787598, -0.4739108383655548, -0.40400367975234985, -0.3340965211391449, -0.26418936252593994, -0.19428220391273499, -0.12437504529953003, -0.05446788668632507, 0.015439033508300781, 0.08534619212150574, 0.1552533507347107, 0.22516050934791565, 0.2950676679611206, 0.36497482657432556, 0.4348819851875305, 0.5047891139984131, 0.5746963024139404, 0.6446034908294678, 0.7145106196403503, 0.7844177484512329, 0.8543249368667603, 0.9242321252822876, 0.9941392540931702, 1.0640463829040527, 1.13395357131958, 1.2038607597351074, 1.2737679481506348, 1.3436750173568726, 1.4135822057724, 1.4834893941879272, 1.553396463394165, 1.6233036518096924, 1.6932108402252197, 1.763118028640747, 1.8330252170562744, 1.9029322862625122, 1.9728394746780396, 2.0427465438842773, 2.1126537322998047, 2.182560920715332, 2.2524681091308594]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 10.0, 16.0, 14.0, 17.0, 19.0, 34.0, 36.0, 54.0, 91.0, 115.0, 152.0, 171.0, 295.0, 441.0, 657.0, 1004.0, 1652.0, 2742.0, 5049.0, 10061.0, 23905.0, 93171.0, 3890199.0, 114323.0, 26172.0, 10616.0, 5372.0, 2937.0, 1732.0, 1036.0, 683.0, 410.0, 346.0, 200.0, 140.0, 105.0, 78.0, 61.0, 49.0, 23.0, 27.0, 16.0, 13.0, 6.0, 8.0, 8.0, 12.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 4.0], "bins": [-0.275390625, -0.26692962646484375, -0.2584686279296875, -0.25000762939453125, -0.241546630859375, -0.23308563232421875, -0.2246246337890625, -0.21616363525390625, -0.20770263671875, -0.19924163818359375, -0.1907806396484375, -0.18231964111328125, -0.173858642578125, -0.16539764404296875, -0.1569366455078125, -0.14847564697265625, -0.1400146484375, -0.13155364990234375, -0.1230926513671875, -0.11463165283203125, -0.106170654296875, -0.09770965576171875, -0.0892486572265625, -0.08078765869140625, -0.07232666015625, -0.06386566162109375, -0.0554046630859375, -0.04694366455078125, -0.038482666015625, -0.03002166748046875, -0.0215606689453125, -0.01309967041015625, -0.004638671875, 0.00382232666015625, 0.0122833251953125, 0.02074432373046875, 0.029205322265625, 0.03766632080078125, 0.0461273193359375, 0.05458831787109375, 0.06304931640625, 0.07151031494140625, 0.0799713134765625, 0.08843231201171875, 0.096893310546875, 0.10535430908203125, 0.1138153076171875, 0.12227630615234375, 0.1307373046875, 0.13919830322265625, 0.1476593017578125, 0.15612030029296875, 0.164581298828125, 0.17304229736328125, 0.1815032958984375, 0.18996429443359375, 0.19842529296875, 0.20688629150390625, 0.2153472900390625, 0.22380828857421875, 0.232269287109375, 0.24073028564453125, 0.2491912841796875, 0.25765228271484375, 0.26611328125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 2.0, 3.0, 2.0, 8.0, 4.0, 5.0, 11.0, 13.0, 16.0, 21.0, 20.0, 24.0, 28.0, 32.0, 45.0, 49.0, 47.0, 49.0, 65.0, 57.0, 74.0, 45.0, 50.0, 39.0, 34.0, 43.0, 44.0, 38.0, 29.0, 20.0, 19.0, 7.0, 14.0, 9.0, 9.0, 6.0, 3.0, 5.0, 7.0, 0.0, 4.0, 6.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.0899658203125, -0.08747100830078125, -0.0849761962890625, -0.08248138427734375, -0.079986572265625, -0.07749176025390625, -0.0749969482421875, -0.07250213623046875, -0.07000732421875, -0.06751251220703125, -0.0650177001953125, -0.06252288818359375, -0.060028076171875, -0.05753326416015625, -0.0550384521484375, -0.05254364013671875, -0.050048828125, -0.04755401611328125, -0.0450592041015625, -0.04256439208984375, -0.040069580078125, -0.03757476806640625, -0.0350799560546875, -0.03258514404296875, -0.03009033203125, -0.02759552001953125, -0.0251007080078125, -0.02260589599609375, -0.020111083984375, -0.01761627197265625, -0.0151214599609375, -0.01262664794921875, -0.0101318359375, -0.00763702392578125, -0.0051422119140625, -0.00264739990234375, -0.000152587890625, 0.00234222412109375, 0.0048370361328125, 0.00733184814453125, 0.00982666015625, 0.01232147216796875, 0.0148162841796875, 0.01731109619140625, 0.019805908203125, 0.02230072021484375, 0.0247955322265625, 0.02729034423828125, 0.02978515625, 0.03227996826171875, 0.0347747802734375, 0.03726959228515625, 0.039764404296875, 0.04225921630859375, 0.0447540283203125, 0.04724884033203125, 0.04974365234375, 0.05223846435546875, 0.0547332763671875, 0.05722808837890625, 0.059722900390625, 0.06221771240234375, 0.0647125244140625, 0.06720733642578125, 0.0697021484375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 8.0, 8.0, 10.0, 13.0, 14.0, 10.0, 27.0, 34.0, 50.0, 66.0, 70.0, 95.0, 124.0, 184.0, 235.0, 340.0, 487.0, 688.0, 1090.0, 1788.0, 3130.0, 6214.0, 14423.0, 42087.0, 277286.0, 3728689.0, 76521.0, 21432.0, 8687.0, 4117.0, 2203.0, 1237.0, 851.0, 589.0, 371.0, 309.0, 222.0, 144.0, 98.0, 97.0, 52.0, 38.0, 36.0, 31.0, 27.0, 19.0, 7.0, 9.0, 5.0, 8.0, 5.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.393798828125, -0.38228607177734375, -0.3707733154296875, -0.35926055908203125, -0.347747802734375, -0.33623504638671875, -0.3247222900390625, -0.31320953369140625, -0.30169677734375, -0.29018402099609375, -0.2786712646484375, -0.26715850830078125, -0.255645751953125, -0.24413299560546875, -0.2326202392578125, -0.22110748291015625, -0.2095947265625, -0.19808197021484375, -0.1865692138671875, -0.17505645751953125, -0.163543701171875, -0.15203094482421875, -0.1405181884765625, -0.12900543212890625, -0.11749267578125, -0.10597991943359375, -0.0944671630859375, -0.08295440673828125, -0.071441650390625, -0.05992889404296875, -0.0484161376953125, -0.03690338134765625, -0.025390625, -0.01387786865234375, -0.0023651123046875, 0.00914764404296875, 0.020660400390625, 0.03217315673828125, 0.0436859130859375, 0.05519866943359375, 0.06671142578125, 0.07822418212890625, 0.0897369384765625, 0.10124969482421875, 0.112762451171875, 0.12427520751953125, 0.1357879638671875, 0.14730072021484375, 0.1588134765625, 0.17032623291015625, 0.1818389892578125, 0.19335174560546875, 0.204864501953125, 0.21637725830078125, 0.2278900146484375, 0.23940277099609375, 0.25091552734375, 0.26242828369140625, 0.2739410400390625, 0.28545379638671875, 0.296966552734375, 0.30847930908203125, 0.3199920654296875, 0.33150482177734375, 0.343017578125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 6.0, 6.0, 6.0, 6.0, 6.0, 8.0, 16.0, 47.0, 68.0, 148.0, 2850.0, 600.0, 130.0, 56.0, 38.0, 14.0, 19.0, 15.0, 8.0, 13.0, 4.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.1231689453125, -0.1195383071899414, -0.11590766906738281, -0.11227703094482422, -0.10864639282226562, -0.10501575469970703, -0.10138511657714844, -0.09775447845458984, -0.09412384033203125, -0.09049320220947266, -0.08686256408691406, -0.08323192596435547, -0.07960128784179688, -0.07597064971923828, -0.07234001159667969, -0.0687093734741211, -0.0650787353515625, -0.061448097229003906, -0.05781745910644531, -0.05418682098388672, -0.050556182861328125, -0.04692554473876953, -0.04329490661621094, -0.039664268493652344, -0.03603363037109375, -0.032402992248535156, -0.028772354125976562, -0.02514171600341797, -0.021511077880859375, -0.01788043975830078, -0.014249801635742188, -0.010619163513183594, -0.006988525390625, -0.0033578872680664062, 0.0002727508544921875, 0.0039033889770507812, 0.007534027099609375, 0.011164665222167969, 0.014795303344726562, 0.018425941467285156, 0.02205657958984375, 0.025687217712402344, 0.029317855834960938, 0.03294849395751953, 0.036579132080078125, 0.04020977020263672, 0.04384040832519531, 0.047471046447753906, 0.0511016845703125, 0.054732322692871094, 0.05836296081542969, 0.06199359893798828, 0.06562423706054688, 0.06925487518310547, 0.07288551330566406, 0.07651615142822266, 0.08014678955078125, 0.08377742767333984, 0.08740806579589844, 0.09103870391845703, 0.09466934204101562, 0.09829998016357422, 0.10193061828613281, 0.1055612564086914, 0.10919189453125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 7.0, 2.0, 11.0, 14.0, 22.0, 48.0, 87.0, 118.0, 132.0, 143.0, 151.0, 86.0, 74.0, 47.0, 24.0, 14.0, 13.0, 8.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.664283275604248, -0.6442078351974487, -0.6241323947906494, -0.6040569543838501, -0.5839815139770508, -0.5639060735702515, -0.5438306331634521, -0.5237551927566528, -0.5036797523498535, -0.4836043119430542, -0.4635288715362549, -0.44345343112945557, -0.42337799072265625, -0.40330255031585693, -0.38322708010673523, -0.3631516396999359, -0.3430761694908142, -0.3230007290840149, -0.3029252886772156, -0.28284984827041626, -0.26277440786361694, -0.24269895255565643, -0.22262349724769592, -0.2025480568408966, -0.1824726164340973, -0.16239717602729797, -0.14232173562049866, -0.12224628031253815, -0.10217083990573883, -0.08209539949893951, -0.0620199516415596, -0.04194450378417969, -0.02186906337738037, -0.0017936192452907562, 0.01828182488679886, 0.038357269018888474, 0.05843271315097809, 0.0785081535577774, 0.09858360141515732, 0.11865904927253723, 0.13873448967933655, 0.15880993008613586, 0.17888537049293518, 0.1989608258008957, 0.219036266207695, 0.23911170661449432, 0.25918716192245483, 0.27926260232925415, 0.29933804273605347, 0.3194134831428528, 0.3394889235496521, 0.3595643639564514, 0.37963980436325073, 0.39971524477005005, 0.41979071497917175, 0.43986615538597107, 0.4599415957927704, 0.4800170361995697, 0.5000925064086914, 0.5201679468154907, 0.54024338722229, 0.5603188276290894, 0.5803942680358887, 0.600469708442688, 0.6205451488494873]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 1.0, 2.0, 6.0, 2.0, 6.0, 6.0, 11.0, 7.0, 10.0, 18.0, 6.0, 17.0, 16.0, 17.0, 30.0, 30.0, 28.0, 30.0, 53.0, 46.0, 41.0, 45.0, 53.0, 40.0, 51.0, 54.0, 40.0, 34.0, 37.0, 36.0, 30.0, 36.0, 24.0, 21.0, 23.0, 19.0, 20.0, 15.0, 16.0, 8.0, 6.0, 4.0, 4.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.24712252616882324, -0.23897069692611694, -0.23081886768341064, -0.22266703844070435, -0.21451520919799805, -0.20636337995529175, -0.19821156561374664, -0.19005973637104034, -0.18190790712833405, -0.17375607788562775, -0.16560424864292145, -0.15745241940021515, -0.14930060505867004, -0.14114877581596375, -0.13299694657325745, -0.12484511733055115, -0.11669328808784485, -0.10854145884513855, -0.10038962960243225, -0.09223780781030655, -0.08408597856760025, -0.07593414932489395, -0.06778232753276825, -0.05963049829006195, -0.05147866904735565, -0.04332683980464935, -0.03517501428723335, -0.027023186907172203, -0.018871359527111053, -0.010719530284404755, -0.0025677047669887543, 0.005584120750427246, 0.013735949993133545, 0.021887777373194695, 0.030039604753255844, 0.038191430270671844, 0.04634325951337814, 0.05449508875608444, 0.06264691054821014, 0.07079873979091644, 0.07895056903362274, 0.08710239827632904, 0.09525422751903534, 0.10340604931116104, 0.11155787855386734, 0.11970970779657364, 0.12786152958869934, 0.13601335883140564, 0.14416518807411194, 0.15231701731681824, 0.16046884655952454, 0.16862067580223083, 0.17677250504493713, 0.18492433428764343, 0.19307614862918854, 0.20122797787189484, 0.20937980711460114, 0.21753163635730743, 0.22568346560001373, 0.23383529484272003, 0.24198710918426514, 0.25013893842697144, 0.25829076766967773, 0.26644259691238403, 0.27459442615509033]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 7.0, 6.0, 5.0, 11.0, 7.0, 23.0, 33.0, 45.0, 56.0, 109.0, 131.0, 215.0, 352.0, 594.0, 985.0, 1821.0, 3743.0, 7604.0, 16482.0, 38018.0, 87788.0, 197588.0, 308220.0, 211601.0, 96561.0, 41579.0, 17920.0, 8363.0, 3890.0, 2053.0, 1128.0, 612.0, 369.0, 240.0, 149.0, 85.0, 52.0, 37.0, 33.0, 21.0, 6.0, 10.0, 3.0, 3.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1407470703125, -0.13544654846191406, -0.13014602661132812, -0.12484550476074219, -0.11954498291015625, -0.11424446105957031, -0.10894393920898438, -0.10364341735839844, -0.0983428955078125, -0.09304237365722656, -0.08774185180664062, -0.08244132995605469, -0.07714080810546875, -0.07184028625488281, -0.06653976440429688, -0.06123924255371094, -0.055938720703125, -0.05063819885253906, -0.045337677001953125, -0.04003715515136719, -0.03473663330078125, -0.029436111450195312, -0.024135589599609375, -0.018835067749023438, -0.0135345458984375, -0.008234024047851562, -0.002933502197265625, 0.0023670196533203125, 0.00766754150390625, 0.012968063354492188, 0.018268585205078125, 0.023569107055664062, 0.02886962890625, 0.03417015075683594, 0.039470672607421875, 0.04477119445800781, 0.05007171630859375, 0.05537223815917969, 0.060672760009765625, 0.06597328186035156, 0.0712738037109375, 0.07657432556152344, 0.08187484741210938, 0.08717536926269531, 0.09247589111328125, 0.09777641296386719, 0.10307693481445312, 0.10837745666503906, 0.113677978515625, 0.11897850036621094, 0.12427902221679688, 0.1295795440673828, 0.13488006591796875, 0.1401805877685547, 0.14548110961914062, 0.15078163146972656, 0.1560821533203125, 0.16138267517089844, 0.16668319702148438, 0.1719837188720703, 0.17728424072265625, 0.1825847625732422, 0.18788528442382812, 0.19318580627441406, 0.198486328125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 2.0, 5.0, 4.0, 9.0, 11.0, 22.0, 14.0, 26.0, 24.0, 36.0, 33.0, 42.0, 37.0, 56.0, 52.0, 60.0, 48.0, 66.0, 54.0, 55.0, 58.0, 47.0, 49.0, 37.0, 35.0, 24.0, 28.0, 14.0, 15.0, 8.0, 5.0, 4.0, 8.0, 2.0, 2.0, 3.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.1072998046875, -0.10440826416015625, -0.1015167236328125, -0.09862518310546875, -0.095733642578125, -0.09284210205078125, -0.0899505615234375, -0.08705902099609375, -0.08416748046875, -0.08127593994140625, -0.0783843994140625, -0.07549285888671875, -0.072601318359375, -0.06970977783203125, -0.0668182373046875, -0.06392669677734375, -0.06103515625, -0.05814361572265625, -0.0552520751953125, -0.05236053466796875, -0.049468994140625, -0.04657745361328125, -0.0436859130859375, -0.04079437255859375, -0.03790283203125, -0.03501129150390625, -0.0321197509765625, -0.02922821044921875, -0.026336669921875, -0.02344512939453125, -0.0205535888671875, -0.01766204833984375, -0.0147705078125, -0.01187896728515625, -0.0089874267578125, -0.00609588623046875, -0.003204345703125, -0.00031280517578125, 0.0025787353515625, 0.00547027587890625, 0.00836181640625, 0.01125335693359375, 0.0141448974609375, 0.01703643798828125, 0.019927978515625, 0.02281951904296875, 0.0257110595703125, 0.02860260009765625, 0.031494140625, 0.03438568115234375, 0.0372772216796875, 0.04016876220703125, 0.043060302734375, 0.04595184326171875, 0.0488433837890625, 0.05173492431640625, 0.05462646484375, 0.05751800537109375, 0.0604095458984375, 0.06330108642578125, 0.066192626953125, 0.06908416748046875, 0.0719757080078125, 0.07486724853515625, 0.0777587890625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 4.0, 4.0, 6.0, 18.0, 19.0, 18.0, 30.0, 34.0, 81.0, 108.0, 154.0, 233.0, 378.0, 619.0, 1224.0, 2945.0, 10044.0, 59200.0, 529415.0, 388520.0, 42346.0, 7963.0, 2539.0, 1062.0, 561.0, 362.0, 215.0, 137.0, 109.0, 63.0, 47.0, 23.0, 19.0, 19.0, 11.0, 7.0, 7.0, 5.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.4365234375, -0.42436981201171875, -0.4122161865234375, -0.40006256103515625, -0.387908935546875, -0.37575531005859375, -0.3636016845703125, -0.35144805908203125, -0.33929443359375, -0.32714080810546875, -0.3149871826171875, -0.30283355712890625, -0.290679931640625, -0.27852630615234375, -0.2663726806640625, -0.25421905517578125, -0.2420654296875, -0.22991180419921875, -0.2177581787109375, -0.20560455322265625, -0.193450927734375, -0.18129730224609375, -0.1691436767578125, -0.15699005126953125, -0.14483642578125, -0.13268280029296875, -0.1205291748046875, -0.10837554931640625, -0.096221923828125, -0.08406829833984375, -0.0719146728515625, -0.05976104736328125, -0.047607421875, -0.03545379638671875, -0.0233001708984375, -0.01114654541015625, 0.001007080078125, 0.01316070556640625, 0.0253143310546875, 0.03746795654296875, 0.04962158203125, 0.06177520751953125, 0.0739288330078125, 0.08608245849609375, 0.098236083984375, 0.11038970947265625, 0.1225433349609375, 0.13469696044921875, 0.1468505859375, 0.15900421142578125, 0.1711578369140625, 0.18331146240234375, 0.195465087890625, 0.20761871337890625, 0.2197723388671875, 0.23192596435546875, 0.24407958984375, 0.25623321533203125, 0.2683868408203125, 0.28054046630859375, 0.292694091796875, 0.30484771728515625, 0.3170013427734375, 0.32915496826171875, 0.34130859375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 6.0, 1.0, 2.0, 0.0, 6.0, 6.0, 5.0, 9.0, 8.0, 9.0, 16.0, 22.0, 25.0, 29.0, 24.0, 38.0, 37.0, 38.0, 48.0, 45.0, 45.0, 69.0, 58.0, 50.0, 57.0, 44.0, 43.0, 46.0, 44.0, 43.0, 30.0, 24.0, 15.0, 21.0, 6.0, 7.0, 11.0, 6.0, 4.0, 3.0, 5.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.373046875, -0.3598518371582031, -0.34665679931640625, -0.3334617614746094, -0.3202667236328125, -0.3070716857910156, -0.29387664794921875, -0.2806816101074219, -0.267486572265625, -0.2542915344238281, -0.24109649658203125, -0.22790145874023438, -0.2147064208984375, -0.20151138305664062, -0.18831634521484375, -0.17512130737304688, -0.16192626953125, -0.14873123168945312, -0.13553619384765625, -0.12234115600585938, -0.1091461181640625, -0.09595108032226562, -0.08275604248046875, -0.06956100463867188, -0.056365966796875, -0.043170928955078125, -0.02997589111328125, -0.016780853271484375, -0.0035858154296875, 0.009609222412109375, 0.02280426025390625, 0.035999298095703125, 0.0491943359375, 0.062389373779296875, 0.07558441162109375, 0.08877944946289062, 0.1019744873046875, 0.11516952514648438, 0.12836456298828125, 0.14155960083007812, 0.154754638671875, 0.16794967651367188, 0.18114471435546875, 0.19433975219726562, 0.2075347900390625, 0.22072982788085938, 0.23392486572265625, 0.24711990356445312, 0.26031494140625, 0.2735099792480469, 0.28670501708984375, 0.2999000549316406, 0.3130950927734375, 0.3262901306152344, 0.33948516845703125, 0.3526802062988281, 0.365875244140625, 0.3790702819824219, 0.39226531982421875, 0.4054603576660156, 0.4186553955078125, 0.4318504333496094, 0.44504547119140625, 0.4582405090332031, 0.471435546875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 6.0, 8.0, 15.0, 21.0, 47.0, 75.0, 198.0, 540.0, 2009.0, 14450.0, 642892.0, 376146.0, 9828.0, 1518.0, 471.0, 178.0, 85.0, 36.0, 15.0, 12.0, 6.0, 8.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4404296875, -0.4274482727050781, -0.41446685791015625, -0.4014854431152344, -0.3885040283203125, -0.3755226135253906, -0.36254119873046875, -0.3495597839355469, -0.336578369140625, -0.3235969543457031, -0.31061553955078125, -0.2976341247558594, -0.2846527099609375, -0.2716712951660156, -0.25868988037109375, -0.24570846557617188, -0.23272705078125, -0.21974563598632812, -0.20676422119140625, -0.19378280639648438, -0.1808013916015625, -0.16781997680664062, -0.15483856201171875, -0.14185714721679688, -0.128875732421875, -0.11589431762695312, -0.10291290283203125, -0.08993148803710938, -0.0769500732421875, -0.06396865844726562, -0.05098724365234375, -0.038005828857421875, -0.0250244140625, -0.012042999267578125, 0.00093841552734375, 0.013919830322265625, 0.0269012451171875, 0.039882659912109375, 0.05286407470703125, 0.06584548950195312, 0.078826904296875, 0.09180831909179688, 0.10478973388671875, 0.11777114868164062, 0.1307525634765625, 0.14373397827148438, 0.15671539306640625, 0.16969680786132812, 0.18267822265625, 0.19565963745117188, 0.20864105224609375, 0.22162246704101562, 0.2346038818359375, 0.24758529663085938, 0.26056671142578125, 0.2735481262207031, 0.286529541015625, 0.2995109558105469, 0.31249237060546875, 0.3254737854003906, 0.3384552001953125, 0.3514366149902344, 0.36441802978515625, 0.3773994445800781, 0.390380859375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 7.0, 5.0, 15.0, 11.0, 16.0, 16.0, 40.0, 39.0, 52.0, 68.0, 92.0, 83.0, 91.0, 86.0, 80.0, 70.0, 51.0, 55.0, 43.0, 25.0, 13.0, 15.0, 9.0, 6.0, 5.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7147274017333984e-05, -4.5076943933963776e-05, -4.300661385059357e-05, -4.093628376722336e-05, -3.886595368385315e-05, -3.679562360048294e-05, -3.472529351711273e-05, -3.265496343374252e-05, -3.0584633350372314e-05, -2.8514303267002106e-05, -2.6443973183631897e-05, -2.4373643100261688e-05, -2.230331301689148e-05, -2.023298293352127e-05, -1.8162652850151062e-05, -1.6092322766780853e-05, -1.4021992683410645e-05, -1.1951662600040436e-05, -9.881332516670227e-06, -7.811002433300018e-06, -5.7406723499298096e-06, -3.670342266559601e-06, -1.600012183189392e-06, 4.7031790018081665e-07, 2.5406479835510254e-06, 4.610978066921234e-06, 6.681308150291443e-06, 8.751638233661652e-06, 1.082196831703186e-05, 1.2892298400402069e-05, 1.4962628483772278e-05, 1.7032958567142487e-05, 1.9103288650512695e-05, 2.1173618733882904e-05, 2.3243948817253113e-05, 2.531427890062332e-05, 2.738460898399353e-05, 2.945493906736374e-05, 3.152526915073395e-05, 3.3595599234104156e-05, 3.5665929317474365e-05, 3.7736259400844574e-05, 3.980658948421478e-05, 4.187691956758499e-05, 4.39472496509552e-05, 4.601757973432541e-05, 4.808790981769562e-05, 5.0158239901065826e-05, 5.2228569984436035e-05, 5.4298900067806244e-05, 5.636923015117645e-05, 5.843956023454666e-05, 6.050989031791687e-05, 6.258022040128708e-05, 6.465055048465729e-05, 6.67208805680275e-05, 6.87912106513977e-05, 7.086154073476791e-05, 7.293187081813812e-05, 7.500220090150833e-05, 7.707253098487854e-05, 7.914286106824875e-05, 8.121319115161896e-05, 8.328352123498917e-05, 8.535385131835938e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 8.0, 11.0, 12.0, 14.0, 36.0, 53.0, 101.0, 165.0, 338.0, 678.0, 1579.0, 4947.0, 23800.0, 269719.0, 667135.0, 66208.0, 9217.0, 2594.0, 984.0, 424.0, 236.0, 123.0, 66.0, 39.0, 17.0, 13.0, 8.0, 11.0, 9.0, 3.0, 6.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.218505859375, -0.21076583862304688, -0.20302581787109375, -0.19528579711914062, -0.1875457763671875, -0.17980575561523438, -0.17206573486328125, -0.16432571411132812, -0.156585693359375, -0.14884567260742188, -0.14110565185546875, -0.13336563110351562, -0.1256256103515625, -0.11788558959960938, -0.11014556884765625, -0.10240554809570312, -0.09466552734375, -0.08692550659179688, -0.07918548583984375, -0.07144546508789062, -0.0637054443359375, -0.055965423583984375, -0.04822540283203125, -0.040485382080078125, -0.032745361328125, -0.025005340576171875, -0.01726531982421875, -0.009525299072265625, -0.0017852783203125, 0.005954742431640625, 0.01369476318359375, 0.021434783935546875, 0.0291748046875, 0.036914825439453125, 0.04465484619140625, 0.052394866943359375, 0.0601348876953125, 0.06787490844726562, 0.07561492919921875, 0.08335494995117188, 0.091094970703125, 0.09883499145507812, 0.10657501220703125, 0.11431503295898438, 0.1220550537109375, 0.12979507446289062, 0.13753509521484375, 0.14527511596679688, 0.15301513671875, 0.16075515747070312, 0.16849517822265625, 0.17623519897460938, 0.1839752197265625, 0.19171524047851562, 0.19945526123046875, 0.20719528198242188, 0.214935302734375, 0.22267532348632812, 0.23041534423828125, 0.23815536499023438, 0.2458953857421875, 0.2536354064941406, 0.26137542724609375, 0.2691154479980469, 0.27685546875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 2.0, 0.0, 3.0, 3.0, 9.0, 7.0, 7.0, 14.0, 19.0, 30.0, 38.0, 46.0, 58.0, 72.0, 85.0, 62.0, 85.0, 91.0, 72.0, 69.0, 51.0, 44.0, 32.0, 35.0, 26.0, 14.0, 8.0, 9.0, 0.0, 3.0, 2.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1573486328125, -0.151947021484375, -0.14654541015625, -0.141143798828125, -0.1357421875, -0.130340576171875, -0.12493896484375, -0.119537353515625, -0.1141357421875, -0.108734130859375, -0.10333251953125, -0.097930908203125, -0.092529296875, -0.087127685546875, -0.08172607421875, -0.076324462890625, -0.0709228515625, -0.065521240234375, -0.06011962890625, -0.054718017578125, -0.04931640625, -0.043914794921875, -0.03851318359375, -0.033111572265625, -0.0277099609375, -0.022308349609375, -0.01690673828125, -0.011505126953125, -0.006103515625, -0.000701904296875, 0.00469970703125, 0.010101318359375, 0.0155029296875, 0.020904541015625, 0.02630615234375, 0.031707763671875, 0.037109375, 0.042510986328125, 0.04791259765625, 0.053314208984375, 0.0587158203125, 0.064117431640625, 0.06951904296875, 0.074920654296875, 0.080322265625, 0.085723876953125, 0.09112548828125, 0.096527099609375, 0.1019287109375, 0.107330322265625, 0.11273193359375, 0.118133544921875, 0.12353515625, 0.128936767578125, 0.13433837890625, 0.139739990234375, 0.1451416015625, 0.150543212890625, 0.15594482421875, 0.161346435546875, 0.166748046875, 0.172149658203125, 0.17755126953125, 0.182952880859375, 0.1883544921875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 8.0, 15.0, 39.0, 124.0, 237.0, 274.0, 190.0, 79.0, 29.0, 9.0, 1.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.918266534805298, -2.739671468734741, -2.5610766410827637, -2.382481575012207, -2.2038865089416504, -2.025291681289673, -1.8466966152191162, -1.6681016683578491, -1.489506721496582, -1.310911774635315, -1.1323168277740479, -0.9537217617034912, -0.7751268148422241, -0.596531867980957, -0.4179368019104004, -0.2393418550491333, -0.06074690818786621, 0.11784806847572327, 0.29644304513931274, 0.4750380516052246, 0.6536329984664917, 0.8322279453277588, 1.0108230113983154, 1.1894179582595825, 1.3680129051208496, 1.5466078519821167, 1.7252027988433838, 1.9037978649139404, 2.082392692565918, 2.2609877586364746, 2.4395828247070312, 2.618177890777588, 2.7967729568481445, 2.975368022918701, 3.1539628505706787, 3.3325579166412354, 3.511152744293213, 3.6897478103637695, 3.868342876434326, 4.046937942504883, 4.225532531738281, 4.404127597808838, 4.5827226638793945, 4.761317253112793, 4.93991231918335, 5.118507385253906, 5.297102451324463, 5.4756975173950195, 5.654292583465576, 5.832887649536133, 6.0114827156066895, 6.190077781677246, 6.3686723709106445, 6.547267436981201, 6.725862503051758, 6.9044575691223145, 7.083052635192871, 7.261647701263428, 7.440242767333984, 7.618837356567383, 7.7974324226379395, 7.976027488708496, 8.154623031616211, 8.33321762084961, 8.511812210083008]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 3.0, 7.0, 1.0, 9.0, 3.0, 8.0, 1.0, 12.0, 17.0, 11.0, 13.0, 11.0, 16.0, 24.0, 39.0, 25.0, 39.0, 46.0, 60.0, 55.0, 68.0, 45.0, 47.0, 59.0, 57.0, 60.0, 44.0, 30.0, 25.0, 25.0, 24.0, 25.0, 25.0, 18.0, 14.0, 12.0, 12.0, 4.0, 6.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0916075706481934, -2.0315911769866943, -1.9715749025344849, -1.9115585088729858, -1.8515422344207764, -1.7915258407592773, -1.7315094470977783, -1.6714931726455688, -1.6114768981933594, -1.5514605045318604, -1.4914442300796509, -1.4314278364181519, -1.3714115619659424, -1.3113951683044434, -1.2513787746429443, -1.1913625001907349, -1.1313461065292358, -1.0713297128677368, -1.0113134384155273, -0.9512970447540283, -0.8912807703018188, -0.8312643766403198, -0.7712480425834656, -0.7112317085266113, -0.6512153744697571, -0.5911990404129028, -0.5311827063560486, -0.47116634249687195, -0.4111500084400177, -0.35113367438316345, -0.2911173105239868, -0.23110097646713257, -0.17108476161956787, -0.11106842011213303, -0.05105207860469818, 0.00896427035331726, 0.06898060441017151, 0.12899693846702576, 0.1890133023262024, 0.24902963638305664, 0.3090459704399109, 0.36906230449676514, 0.4290786385536194, 0.489095002412796, 0.5491113662719727, 0.6091276407241821, 0.6691440343856812, 0.7291603684425354, 0.7891767024993896, 0.8491930365562439, 0.9092093706130981, 0.9692257642745972, 1.0292420387268066, 1.0892584323883057, 1.1492748260498047, 1.2092911005020142, 1.2693073749542236, 1.3293237686157227, 1.3893400430679321, 1.4493564367294312, 1.5093727111816406, 1.5693891048431396, 1.6294054985046387, 1.6894217729568481, 1.7494381666183472]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 6.0, 9.0, 7.0, 9.0, 10.0, 16.0, 29.0, 30.0, 49.0, 103.0, 143.0, 158.0, 274.0, 462.0, 736.0, 1091.0, 1945.0, 3624.0, 7609.0, 20463.0, 202115.0, 3909827.0, 26883.0, 8878.0, 4129.0, 2178.0, 1303.0, 826.0, 476.0, 278.0, 189.0, 135.0, 91.0, 50.0, 53.0, 37.0, 19.0, 20.0, 10.0, 5.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.355712890625, -0.3446311950683594, -0.33354949951171875, -0.3224678039550781, -0.3113861083984375, -0.3003044128417969, -0.28922271728515625, -0.2781410217285156, -0.267059326171875, -0.2559776306152344, -0.24489593505859375, -0.23381423950195312, -0.2227325439453125, -0.21165084838867188, -0.20056915283203125, -0.18948745727539062, -0.17840576171875, -0.16732406616210938, -0.15624237060546875, -0.14516067504882812, -0.1340789794921875, -0.12299728393554688, -0.11191558837890625, -0.10083389282226562, -0.089752197265625, -0.07867050170898438, -0.06758880615234375, -0.056507110595703125, -0.0454254150390625, -0.034343719482421875, -0.02326202392578125, -0.012180328369140625, -0.0010986328125, 0.009983062744140625, 0.02106475830078125, 0.032146453857421875, 0.0432281494140625, 0.054309844970703125, 0.06539154052734375, 0.07647323608398438, 0.087554931640625, 0.09863662719726562, 0.10971832275390625, 0.12080001831054688, 0.1318817138671875, 0.14296340942382812, 0.15404510498046875, 0.16512680053710938, 0.17620849609375, 0.18729019165039062, 0.19837188720703125, 0.20945358276367188, 0.2205352783203125, 0.23161697387695312, 0.24269866943359375, 0.2537803649902344, 0.264862060546875, 0.2759437561035156, 0.28702545166015625, 0.2981071472167969, 0.3091888427734375, 0.3202705383300781, 0.33135223388671875, 0.3424339294433594, 0.353515625]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 8.0, 1.0, 9.0, 16.0, 9.0, 22.0, 22.0, 24.0, 40.0, 58.0, 51.0, 69.0, 56.0, 64.0, 83.0, 71.0, 70.0, 71.0, 63.0, 51.0, 41.0, 29.0, 22.0, 13.0, 13.0, 6.0, 4.0, 5.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1357421875, -0.13199329376220703, -0.12824440002441406, -0.1244955062866211, -0.12074661254882812, -0.11699771881103516, -0.11324882507324219, -0.10949993133544922, -0.10575103759765625, -0.10200214385986328, -0.09825325012207031, -0.09450435638427734, -0.09075546264648438, -0.0870065689086914, -0.08325767517089844, -0.07950878143310547, -0.0757598876953125, -0.07201099395751953, -0.06826210021972656, -0.0645132064819336, -0.060764312744140625, -0.057015419006347656, -0.05326652526855469, -0.04951763153076172, -0.04576873779296875, -0.04201984405517578, -0.03827095031738281, -0.034522056579589844, -0.030773162841796875, -0.027024269104003906, -0.023275375366210938, -0.01952648162841797, -0.015777587890625, -0.012028694152832031, -0.008279800415039062, -0.004530906677246094, -0.000782012939453125, 0.0029668807983398438, 0.0067157745361328125, 0.010464668273925781, 0.01421356201171875, 0.01796245574951172, 0.021711349487304688, 0.025460243225097656, 0.029209136962890625, 0.032958030700683594, 0.03670692443847656, 0.04045581817626953, 0.0442047119140625, 0.04795360565185547, 0.05170249938964844, 0.055451393127441406, 0.059200286865234375, 0.06294918060302734, 0.06669807434082031, 0.07044696807861328, 0.07419586181640625, 0.07794475555419922, 0.08169364929199219, 0.08544254302978516, 0.08919143676757812, 0.0929403305053711, 0.09668922424316406, 0.10043811798095703, 0.10418701171875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 6.0, 5.0, 4.0, 10.0, 14.0, 16.0, 10.0, 14.0, 27.0, 34.0, 47.0, 63.0, 99.0, 203.0, 308.0, 623.0, 1210.0, 2920.0, 8810.0, 44650.0, 4049976.0, 67641.0, 11191.0, 3428.0, 1445.0, 644.0, 339.0, 182.0, 108.0, 69.0, 58.0, 30.0, 23.0, 15.0, 17.0, 14.0, 13.0, 8.0, 11.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50830078125, -0.48987579345703125, -0.4714508056640625, -0.45302581787109375, -0.434600830078125, -0.41617584228515625, -0.3977508544921875, -0.37932586669921875, -0.36090087890625, -0.34247589111328125, -0.3240509033203125, -0.30562591552734375, -0.287200927734375, -0.26877593994140625, -0.2503509521484375, -0.23192596435546875, -0.2135009765625, -0.19507598876953125, -0.1766510009765625, -0.15822601318359375, -0.139801025390625, -0.12137603759765625, -0.1029510498046875, -0.08452606201171875, -0.06610107421875, -0.04767608642578125, -0.0292510986328125, -0.01082611083984375, 0.007598876953125, 0.02602386474609375, 0.0444488525390625, 0.06287384033203125, 0.081298828125, 0.09972381591796875, 0.1181488037109375, 0.13657379150390625, 0.154998779296875, 0.17342376708984375, 0.1918487548828125, 0.21027374267578125, 0.22869873046875, 0.24712371826171875, 0.2655487060546875, 0.28397369384765625, 0.302398681640625, 0.32082366943359375, 0.3392486572265625, 0.35767364501953125, 0.3760986328125, 0.39452362060546875, 0.4129486083984375, 0.43137359619140625, 0.449798583984375, 0.46822357177734375, 0.4866485595703125, 0.5050735473632812, 0.52349853515625, 0.5419235229492188, 0.5603485107421875, 0.5787734985351562, 0.597198486328125, 0.6156234741210938, 0.6340484619140625, 0.6524734497070312, 0.6708984375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 2.0, 7.0, 7.0, 9.0, 11.0, 14.0, 27.0, 54.0, 151.0, 3472.0, 193.0, 60.0, 20.0, 18.0, 10.0, 7.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08172607421875, -0.07776165008544922, -0.07379722595214844, -0.06983280181884766, -0.06586837768554688, -0.061903953552246094, -0.05793952941894531, -0.05397510528564453, -0.05001068115234375, -0.04604625701904297, -0.04208183288574219, -0.038117408752441406, -0.034152984619140625, -0.030188560485839844, -0.026224136352539062, -0.02225971221923828, -0.0182952880859375, -0.014330863952636719, -0.010366439819335938, -0.006402015686035156, -0.002437591552734375, 0.0015268325805664062, 0.0054912567138671875, 0.009455680847167969, 0.01342010498046875, 0.01738452911376953, 0.021348953247070312, 0.025313377380371094, 0.029277801513671875, 0.033242225646972656, 0.03720664978027344, 0.04117107391357422, 0.045135498046875, 0.04909992218017578, 0.05306434631347656, 0.057028770446777344, 0.060993194580078125, 0.0649576187133789, 0.06892204284667969, 0.07288646697998047, 0.07685089111328125, 0.08081531524658203, 0.08477973937988281, 0.0887441635131836, 0.09270858764648438, 0.09667301177978516, 0.10063743591308594, 0.10460186004638672, 0.1085662841796875, 0.11253070831298828, 0.11649513244628906, 0.12045955657958984, 0.12442398071289062, 0.1283884048461914, 0.1323528289794922, 0.13631725311279297, 0.14028167724609375, 0.14424610137939453, 0.1482105255126953, 0.1521749496459961, 0.15613937377929688, 0.16010379791259766, 0.16406822204589844, 0.16803264617919922, 0.1719970703125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 4.0, 9.0, 15.0, 27.0, 47.0, 73.0, 103.0, 128.0, 145.0, 133.0, 117.0, 74.0, 53.0, 33.0, 19.0, 6.0, 7.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5267080664634705, -0.5120776891708374, -0.49744731187820435, -0.4828169345855713, -0.4681865870952606, -0.45355620980262756, -0.4389258325099945, -0.42429545521736145, -0.4096651077270508, -0.3950347304344177, -0.38040435314178467, -0.3657739758491516, -0.35114362835884094, -0.3365132510662079, -0.32188287377357483, -0.3072524964809418, -0.2926221191883087, -0.27799174189567566, -0.2633613646030426, -0.24873100221157074, -0.23410063982009888, -0.21947026252746582, -0.20483988523483276, -0.1902095079421997, -0.17557914555072784, -0.1609487682580948, -0.14631840586662292, -0.13168802857398987, -0.11705765873193741, -0.10242728888988495, -0.08779691159725189, -0.07316654175519943, -0.05853617191314697, -0.04390580207109451, -0.029275428503751755, -0.014645054936408997, -1.4685094356536865e-05, 0.014615684747695923, 0.02924606204032898, 0.04387643188238144, 0.0585068017244339, 0.07313717156648636, 0.08776754140853882, 0.10239791870117188, 0.11702828854322433, 0.1316586583852768, 0.14628903567790985, 0.1609193980693817, 0.17554977536201477, 0.19018015265464783, 0.2048105150461197, 0.21944089233875275, 0.2340712547302246, 0.24870163202285767, 0.2633320093154907, 0.2779623866081238, 0.29259276390075684, 0.3072231411933899, 0.32185351848602295, 0.336483895778656, 0.3511142432689667, 0.36574462056159973, 0.3803749978542328, 0.39500537514686584, 0.4096357226371765]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 3.0, 8.0, 5.0, 6.0, 7.0, 7.0, 19.0, 9.0, 22.0, 20.0, 14.0, 30.0, 34.0, 31.0, 30.0, 41.0, 38.0, 35.0, 51.0, 48.0, 38.0, 40.0, 41.0, 29.0, 39.0, 41.0, 29.0, 37.0, 32.0, 30.0, 27.0, 22.0, 22.0, 20.0, 14.0, 15.0, 18.0, 13.0, 11.0, 8.0, 5.0, 2.0, 4.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.17311352491378784, -0.16769325733184814, -0.16227300465106964, -0.15685273706912994, -0.15143248438835144, -0.14601221680641174, -0.14059194922447205, -0.13517168164253235, -0.12975142896175385, -0.12433116883039474, -0.11891090869903564, -0.11349064111709595, -0.10807038098573685, -0.10265012085437775, -0.09722985327243805, -0.09180959314107895, -0.08638933300971985, -0.08096907287836075, -0.07554881274700165, -0.07012854516506195, -0.06470828503370285, -0.05928802490234375, -0.05386776104569435, -0.04844749718904495, -0.04302723705768585, -0.03760697692632675, -0.03218671306967735, -0.026766451075673103, -0.021346189081668854, -0.015925927087664604, -0.010505665093660355, -0.005085401237010956, 0.00033485889434814453, 0.005755120888352394, 0.011175382882356644, 0.016595644876360893, 0.022015906870365143, 0.027436168864369392, 0.03285643085837364, 0.03827669471502304, 0.04369695484638214, 0.04911721497774124, 0.05453747883439064, 0.05995774269104004, 0.06537800282239914, 0.07079826295375824, 0.07621853053569794, 0.08163879066705704, 0.08705905079841614, 0.09247931092977524, 0.09789957106113434, 0.10331983864307404, 0.10874009877443314, 0.11416035890579224, 0.11958062648773193, 0.12500089406967163, 0.13042114675045013, 0.13584141433238983, 0.14126166701316833, 0.14668193459510803, 0.15210220217704773, 0.15752245485782623, 0.16294272243976593, 0.16836297512054443, 0.17378324270248413]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 9.0, 7.0, 4.0, 16.0, 21.0, 38.0, 40.0, 47.0, 69.0, 100.0, 175.0, 267.0, 451.0, 734.0, 1372.0, 2626.0, 4945.0, 9900.0, 20527.0, 42985.0, 93802.0, 210456.0, 319126.0, 184503.0, 81910.0, 37977.0, 17813.0, 8854.0, 4378.0, 2205.0, 1268.0, 736.0, 437.0, 243.0, 176.0, 106.0, 77.0, 49.0, 32.0, 17.0, 17.0, 12.0, 8.0, 4.0, 10.0, 5.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1474609375, -0.14276695251464844, -0.13807296752929688, -0.1333789825439453, -0.12868499755859375, -0.12399101257324219, -0.11929702758789062, -0.11460304260253906, -0.1099090576171875, -0.10521507263183594, -0.10052108764648438, -0.09582710266113281, -0.09113311767578125, -0.08643913269042969, -0.08174514770507812, -0.07705116271972656, -0.072357177734375, -0.06766319274902344, -0.06296920776367188, -0.05827522277832031, -0.05358123779296875, -0.04888725280761719, -0.044193267822265625, -0.03949928283691406, -0.0348052978515625, -0.030111312866210938, -0.025417327880859375, -0.020723342895507812, -0.01602935791015625, -0.011335372924804688, -0.006641387939453125, -0.0019474029541015625, 0.00274658203125, 0.0074405670166015625, 0.012134552001953125, 0.016828536987304688, 0.02152252197265625, 0.026216506958007812, 0.030910491943359375, 0.03560447692871094, 0.0402984619140625, 0.04499244689941406, 0.049686431884765625, 0.05438041687011719, 0.05907440185546875, 0.06376838684082031, 0.06846237182617188, 0.07315635681152344, 0.077850341796875, 0.08254432678222656, 0.08723831176757812, 0.09193229675292969, 0.09662628173828125, 0.10132026672363281, 0.10601425170898438, 0.11070823669433594, 0.1154022216796875, 0.12009620666503906, 0.12479019165039062, 0.1294841766357422, 0.13417816162109375, 0.1388721466064453, 0.14356613159179688, 0.14826011657714844, 0.1529541015625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 10.0, 10.0, 14.0, 14.0, 20.0, 27.0, 24.0, 36.0, 52.0, 62.0, 59.0, 86.0, 83.0, 80.0, 91.0, 58.0, 55.0, 44.0, 45.0, 42.0, 30.0, 23.0, 10.0, 11.0, 8.0, 0.0, 5.0, 0.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.152587890625, -0.14844894409179688, -0.14430999755859375, -0.14017105102539062, -0.1360321044921875, -0.13189315795898438, -0.12775421142578125, -0.12361526489257812, -0.119476318359375, -0.11533737182617188, -0.11119842529296875, -0.10705947875976562, -0.1029205322265625, -0.09878158569335938, -0.09464263916015625, -0.09050369262695312, -0.08636474609375, -0.08222579956054688, -0.07808685302734375, -0.07394790649414062, -0.0698089599609375, -0.06567001342773438, -0.06153106689453125, -0.057392120361328125, -0.053253173828125, -0.049114227294921875, -0.04497528076171875, -0.040836334228515625, -0.0366973876953125, -0.032558441162109375, -0.02841949462890625, -0.024280548095703125, -0.0201416015625, -0.016002655029296875, -0.01186370849609375, -0.007724761962890625, -0.0035858154296875, 0.000553131103515625, 0.00469207763671875, 0.008831024169921875, 0.012969970703125, 0.017108917236328125, 0.02124786376953125, 0.025386810302734375, 0.0295257568359375, 0.033664703369140625, 0.03780364990234375, 0.041942596435546875, 0.04608154296875, 0.050220489501953125, 0.05435943603515625, 0.058498382568359375, 0.0626373291015625, 0.06677627563476562, 0.07091522216796875, 0.07505416870117188, 0.079193115234375, 0.08333206176757812, 0.08747100830078125, 0.09160995483398438, 0.0957489013671875, 0.09988784790039062, 0.10402679443359375, 0.10816574096679688, 0.1123046875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 1.0, 4.0, 0.0, 9.0, 6.0, 5.0, 13.0, 22.0, 29.0, 40.0, 39.0, 55.0, 70.0, 107.0, 111.0, 181.0, 300.0, 422.0, 732.0, 1401.0, 3207.0, 10739.0, 52878.0, 454774.0, 453938.0, 52171.0, 10516.0, 3237.0, 1369.0, 723.0, 434.0, 294.0, 203.0, 123.0, 92.0, 86.0, 51.0, 40.0, 32.0, 33.0, 20.0, 14.0, 11.0, 6.0, 5.0, 7.0, 4.0, 1.0, 4.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.32177734375, -0.3123130798339844, -0.30284881591796875, -0.2933845520019531, -0.2839202880859375, -0.2744560241699219, -0.26499176025390625, -0.2555274963378906, -0.246063232421875, -0.23659896850585938, -0.22713470458984375, -0.21767044067382812, -0.2082061767578125, -0.19874191284179688, -0.18927764892578125, -0.17981338500976562, -0.17034912109375, -0.16088485717773438, -0.15142059326171875, -0.14195632934570312, -0.1324920654296875, -0.12302780151367188, -0.11356353759765625, -0.10409927368164062, -0.094635009765625, -0.08517074584960938, -0.07570648193359375, -0.06624221801757812, -0.0567779541015625, -0.047313690185546875, -0.03784942626953125, -0.028385162353515625, -0.0189208984375, -0.009456634521484375, 7.62939453125e-06, 0.009471893310546875, 0.0189361572265625, 0.028400421142578125, 0.03786468505859375, 0.047328948974609375, 0.056793212890625, 0.06625747680664062, 0.07572174072265625, 0.08518600463867188, 0.0946502685546875, 0.10411453247070312, 0.11357879638671875, 0.12304306030273438, 0.13250732421875, 0.14197158813476562, 0.15143585205078125, 0.16090011596679688, 0.1703643798828125, 0.17982864379882812, 0.18929290771484375, 0.19875717163085938, 0.208221435546875, 0.21768569946289062, 0.22714996337890625, 0.23661422729492188, 0.2460784912109375, 0.2555427551269531, 0.26500701904296875, 0.2744712829589844, 0.283935546875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 6.0, 3.0, 5.0, 4.0, 11.0, 10.0, 20.0, 27.0, 25.0, 34.0, 33.0, 44.0, 39.0, 50.0, 47.0, 54.0, 51.0, 49.0, 54.0, 50.0, 39.0, 41.0, 43.0, 45.0, 36.0, 32.0, 38.0, 25.0, 13.0, 9.0, 23.0, 10.0, 10.0, 6.0, 4.0, 5.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4873046875, -0.4737281799316406, -0.46015167236328125, -0.4465751647949219, -0.4329986572265625, -0.4194221496582031, -0.40584564208984375, -0.3922691345214844, -0.378692626953125, -0.3651161193847656, -0.35153961181640625, -0.3379631042480469, -0.3243865966796875, -0.3108100891113281, -0.29723358154296875, -0.2836570739746094, -0.27008056640625, -0.2565040588378906, -0.24292755126953125, -0.22935104370117188, -0.2157745361328125, -0.20219802856445312, -0.18862152099609375, -0.17504501342773438, -0.161468505859375, -0.14789199829101562, -0.13431549072265625, -0.12073898315429688, -0.1071624755859375, -0.09358596801757812, -0.08000946044921875, -0.06643295288085938, -0.0528564453125, -0.039279937744140625, -0.02570343017578125, -0.012126922607421875, 0.0014495849609375, 0.015026092529296875, 0.02860260009765625, 0.042179107666015625, 0.055755615234375, 0.06933212280273438, 0.08290863037109375, 0.09648513793945312, 0.1100616455078125, 0.12363815307617188, 0.13721466064453125, 0.15079116821289062, 0.16436767578125, 0.17794418334960938, 0.19152069091796875, 0.20509719848632812, 0.2186737060546875, 0.23225021362304688, 0.24582672119140625, 0.2594032287597656, 0.272979736328125, 0.2865562438964844, 0.30013275146484375, 0.3137092590332031, 0.3272857666015625, 0.3408622741699219, 0.35443878173828125, 0.3680152893066406, 0.381591796875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 5.0, 11.0, 10.0, 23.0, 71.0, 141.0, 385.0, 1476.0, 12118.0, 702824.0, 322432.0, 7437.0, 1098.0, 319.0, 101.0, 48.0, 20.0, 17.0, 8.0, 2.0, 4.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.489990234375, -0.4780120849609375, -0.466033935546875, -0.4540557861328125, -0.44207763671875, -0.4300994873046875, -0.418121337890625, -0.4061431884765625, -0.3941650390625, -0.3821868896484375, -0.370208740234375, -0.3582305908203125, -0.34625244140625, -0.3342742919921875, -0.322296142578125, -0.3103179931640625, -0.29833984375, -0.2863616943359375, -0.274383544921875, -0.2624053955078125, -0.25042724609375, -0.2384490966796875, -0.226470947265625, -0.2144927978515625, -0.2025146484375, -0.1905364990234375, -0.178558349609375, -0.1665802001953125, -0.15460205078125, -0.1426239013671875, -0.130645751953125, -0.1186676025390625, -0.106689453125, -0.0947113037109375, -0.082733154296875, -0.0707550048828125, -0.05877685546875, -0.0467987060546875, -0.034820556640625, -0.0228424072265625, -0.0108642578125, 0.0011138916015625, 0.013092041015625, 0.0250701904296875, 0.03704833984375, 0.0490264892578125, 0.061004638671875, 0.0729827880859375, 0.0849609375, 0.0969390869140625, 0.108917236328125, 0.1208953857421875, 0.13287353515625, 0.1448516845703125, 0.156829833984375, 0.1688079833984375, 0.1807861328125, 0.1927642822265625, 0.204742431640625, 0.2167205810546875, 0.22869873046875, 0.2406768798828125, 0.252655029296875, 0.2646331787109375, 0.276611328125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 0.0, 6.0, 4.0, 9.0, 5.0, 4.0, 6.0, 9.0, 11.0, 17.0, 13.0, 18.0, 33.0, 30.0, 60.0, 63.0, 58.0, 67.0, 97.0, 76.0, 77.0, 65.0, 57.0, 52.0, 35.0, 35.0, 20.0, 14.0, 17.0, 15.0, 10.0, 7.0, 2.0, 6.0, 5.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.115436553955078e-05, -5.970802158117294e-05, -5.8261677622795105e-05, -5.681533366441727e-05, -5.536898970603943e-05, -5.392264574766159e-05, -5.247630178928375e-05, -5.1029957830905914e-05, -4.9583613872528076e-05, -4.813726991415024e-05, -4.66909259557724e-05, -4.524458199739456e-05, -4.3798238039016724e-05, -4.2351894080638885e-05, -4.090555012226105e-05, -3.945920616388321e-05, -3.801286220550537e-05, -3.656651824712753e-05, -3.5120174288749695e-05, -3.367383033037186e-05, -3.222748637199402e-05, -3.078114241361618e-05, -2.9334798455238342e-05, -2.7888454496860504e-05, -2.6442110538482666e-05, -2.4995766580104828e-05, -2.354942262172699e-05, -2.210307866334915e-05, -2.0656734704971313e-05, -1.9210390746593475e-05, -1.7764046788215637e-05, -1.63177028298378e-05, -1.4871358871459961e-05, -1.3425014913082123e-05, -1.1978670954704285e-05, -1.0532326996326447e-05, -9.085983037948608e-06, -7.63963907957077e-06, -6.193295121192932e-06, -4.746951162815094e-06, -3.300607204437256e-06, -1.8542632460594177e-06, -4.079192876815796e-07, 1.0384246706962585e-06, 2.4847686290740967e-06, 3.931112587451935e-06, 5.377456545829773e-06, 6.823800504207611e-06, 8.27014446258545e-06, 9.716488420963287e-06, 1.1162832379341125e-05, 1.2609176337718964e-05, 1.4055520296096802e-05, 1.550186425447464e-05, 1.6948208212852478e-05, 1.8394552171230316e-05, 1.9840896129608154e-05, 2.1287240087985992e-05, 2.273358404636383e-05, 2.417992800474167e-05, 2.5626271963119507e-05, 2.7072615921497345e-05, 2.8518959879875183e-05, 2.996530383825302e-05, 3.141164779663086e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 8.0, 5.0, 6.0, 12.0, 14.0, 38.0, 53.0, 78.0, 154.0, 261.0, 487.0, 1056.0, 2895.0, 10818.0, 78367.0, 701611.0, 222894.0, 22061.0, 4731.0, 1645.0, 646.0, 317.0, 176.0, 86.0, 45.0, 33.0, 18.0, 12.0, 6.0, 7.0, 6.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2093505859375, -0.20294952392578125, -0.1965484619140625, -0.19014739990234375, -0.183746337890625, -0.17734527587890625, -0.1709442138671875, -0.16454315185546875, -0.15814208984375, -0.15174102783203125, -0.1453399658203125, -0.13893890380859375, -0.132537841796875, -0.12613677978515625, -0.1197357177734375, -0.11333465576171875, -0.10693359375, -0.10053253173828125, -0.0941314697265625, -0.08773040771484375, -0.081329345703125, -0.07492828369140625, -0.0685272216796875, -0.06212615966796875, -0.05572509765625, -0.04932403564453125, -0.0429229736328125, -0.03652191162109375, -0.030120849609375, -0.02371978759765625, -0.0173187255859375, -0.01091766357421875, -0.0045166015625, 0.00188446044921875, 0.0082855224609375, 0.01468658447265625, 0.021087646484375, 0.02748870849609375, 0.0338897705078125, 0.04029083251953125, 0.04669189453125, 0.05309295654296875, 0.0594940185546875, 0.06589508056640625, 0.072296142578125, 0.07869720458984375, 0.0850982666015625, 0.09149932861328125, 0.097900390625, 0.10430145263671875, 0.1107025146484375, 0.11710357666015625, 0.123504638671875, 0.12990570068359375, 0.1363067626953125, 0.14270782470703125, 0.14910888671875, 0.15550994873046875, 0.1619110107421875, 0.16831207275390625, 0.174713134765625, 0.18111419677734375, 0.1875152587890625, 0.19391632080078125, 0.2003173828125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 4.0, 5.0, 9.0, 7.0, 15.0, 6.0, 18.0, 27.0, 26.0, 24.0, 56.0, 46.0, 57.0, 63.0, 76.0, 75.0, 77.0, 59.0, 58.0, 59.0, 39.0, 40.0, 23.0, 23.0, 20.0, 28.0, 14.0, 9.0, 8.0, 11.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1240234375, -0.12037944793701172, -0.11673545837402344, -0.11309146881103516, -0.10944747924804688, -0.1058034896850586, -0.10215950012207031, -0.09851551055908203, -0.09487152099609375, -0.09122753143310547, -0.08758354187011719, -0.0839395523071289, -0.08029556274414062, -0.07665157318115234, -0.07300758361816406, -0.06936359405517578, -0.0657196044921875, -0.06207561492919922, -0.05843162536621094, -0.054787635803222656, -0.051143646240234375, -0.047499656677246094, -0.04385566711425781, -0.04021167755126953, -0.03656768798828125, -0.03292369842529297, -0.029279708862304688, -0.025635719299316406, -0.021991729736328125, -0.018347740173339844, -0.014703750610351562, -0.011059761047363281, -0.007415771484375, -0.0037717819213867188, -0.0001277923583984375, 0.0035161972045898438, 0.007160186767578125, 0.010804176330566406, 0.014448165893554688, 0.01809215545654297, 0.02173614501953125, 0.02538013458251953, 0.029024124145507812, 0.032668113708496094, 0.036312103271484375, 0.039956092834472656, 0.04360008239746094, 0.04724407196044922, 0.0508880615234375, 0.05453205108642578, 0.05817604064941406, 0.061820030212402344, 0.06546401977539062, 0.0691080093383789, 0.07275199890136719, 0.07639598846435547, 0.08003997802734375, 0.08368396759033203, 0.08732795715332031, 0.0909719467163086, 0.09461593627929688, 0.09825992584228516, 0.10190391540527344, 0.10554790496826172, 0.10919189453125]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 5.0, 1.0, 6.0, 1.0, 18.0, 27.0, 66.0, 164.0, 193.0, 235.0, 154.0, 83.0, 34.0, 15.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6376831531524658, -1.5120912790298462, -1.3864994049072266, -1.2609076499938965, -1.1353156566619873, -1.0097239017486572, -0.8841320276260376, -0.758540153503418, -0.6329482793807983, -0.5073564052581787, -0.38176456093788147, -0.25617271661758423, -0.1305808424949646, -0.004988968372344971, 0.12060284614562988, 0.2461947202682495, 0.37178659439086914, 0.49737846851348877, 0.6229703426361084, 0.7485621571540833, 0.8741540312767029, 0.9997459053993225, 1.1253377199172974, 1.250929594039917, 1.3765214681625366, 1.5021133422851562, 1.6277052164077759, 1.7532970905303955, 1.8788888454437256, 2.0044808387756348, 2.130072593688965, 2.255664348602295, 2.381256580352783, 2.5068483352661133, 2.6324403285980225, 2.7580320835113525, 2.8836240768432617, 3.009215831756592, 3.134807586669922, 3.260399580001831, 3.3859915733337402, 3.5115833282470703, 3.6371753215789795, 3.7627670764923096, 3.8883590698242188, 4.013950824737549, 4.139542579650879, 4.265134811401367, 4.390726089477539, 4.516317844390869, 4.641909599304199, 4.7675018310546875, 4.893093585968018, 5.018685340881348, 5.144277095794678, 5.269868850708008, 5.395461082458496, 5.521052837371826, 5.646644592285156, 5.7722368240356445, 5.897828578948975, 6.023420333862305, 6.149012088775635, 6.274603843688965, 6.400196075439453]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 7.0, 6.0, 3.0, 5.0, 13.0, 13.0, 11.0, 12.0, 24.0, 22.0, 32.0, 23.0, 27.0, 26.0, 39.0, 31.0, 43.0, 41.0, 61.0, 66.0, 57.0, 50.0, 59.0, 36.0, 51.0, 33.0, 33.0, 28.0, 25.0, 20.0, 25.0, 24.0, 13.0, 5.0, 7.0, 6.0, 5.0, 3.0, 3.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.9483669996261597, -1.8918190002441406, -1.8352710008621216, -1.7787230014801025, -1.722175121307373, -1.665627121925354, -1.609079122543335, -1.552531123161316, -1.4959831237792969, -1.4394351243972778, -1.3828871250152588, -1.3263392448425293, -1.2697912454605103, -1.2132432460784912, -1.1566952466964722, -1.1001472473144531, -1.0435993671417236, -0.9870513677597046, -0.9305034279823303, -0.8739554286003113, -0.8174074292182922, -0.760859489440918, -0.7043114900588989, -0.6477634906768799, -0.5912154912948608, -0.5346674919128418, -0.47811952233314514, -0.4215715527534485, -0.36502355337142944, -0.3084755837917328, -0.25192761421203613, -0.1953796148300171, -0.13883161544799805, -0.0822836309671402, -0.025735653936862946, 0.030812323093414307, 0.08736030757427216, 0.14390829205513, 0.20045626163482666, 0.2570042610168457, 0.31355223059654236, 0.370100200176239, 0.42664819955825806, 0.4831961691379547, 0.5397441387176514, 0.5962921380996704, 0.6528401374816895, 0.7093881368637085, 0.7659360766410828, 0.8224840760231018, 0.8790320158004761, 0.9355800151824951, 0.9921280145645142, 1.0486760139465332, 1.1052238941192627, 1.1617720127105713, 1.2183198928833008, 1.2748678922653198, 1.3314158916473389, 1.3879637718200684, 1.4445117712020874, 1.5010597705841064, 1.5576077699661255, 1.6141557693481445, 1.6707037687301636]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 8.0, 12.0, 16.0, 19.0, 26.0, 38.0, 66.0, 111.0, 164.0, 253.0, 423.0, 756.0, 1319.0, 2513.0, 4931.0, 11363.0, 33761.0, 200696.0, 3822723.0, 78982.0, 20385.0, 7817.0, 3567.0, 1786.0, 957.0, 594.0, 345.0, 211.0, 165.0, 104.0, 67.0, 42.0, 21.0, 15.0, 10.0, 7.0, 6.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27685546875, -0.2677154541015625, -0.258575439453125, -0.2494354248046875, -0.24029541015625, -0.2311553955078125, -0.222015380859375, -0.2128753662109375, -0.2037353515625, -0.1945953369140625, -0.185455322265625, -0.1763153076171875, -0.16717529296875, -0.1580352783203125, -0.148895263671875, -0.1397552490234375, -0.130615234375, -0.1214752197265625, -0.112335205078125, -0.1031951904296875, -0.09405517578125, -0.0849151611328125, -0.075775146484375, -0.0666351318359375, -0.0574951171875, -0.0483551025390625, -0.039215087890625, -0.0300750732421875, -0.02093505859375, -0.0117950439453125, -0.002655029296875, 0.0064849853515625, 0.015625, 0.0247650146484375, 0.033905029296875, 0.0430450439453125, 0.05218505859375, 0.0613250732421875, 0.070465087890625, 0.0796051025390625, 0.0887451171875, 0.0978851318359375, 0.107025146484375, 0.1161651611328125, 0.12530517578125, 0.1344451904296875, 0.143585205078125, 0.1527252197265625, 0.161865234375, 0.1710052490234375, 0.180145263671875, 0.1892852783203125, 0.19842529296875, 0.2075653076171875, 0.216705322265625, 0.2258453369140625, 0.2349853515625, 0.2441253662109375, 0.253265380859375, 0.2624053955078125, 0.27154541015625, 0.2806854248046875, 0.289825439453125, 0.2989654541015625, 0.30810546875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 2.0, 4.0, 6.0, 7.0, 3.0, 7.0, 14.0, 12.0, 15.0, 21.0, 19.0, 38.0, 56.0, 48.0, 48.0, 64.0, 62.0, 80.0, 66.0, 49.0, 45.0, 50.0, 44.0, 47.0, 40.0, 37.0, 34.0, 23.0, 14.0, 6.0, 11.0, 5.0, 6.0, 6.0, 4.0, 6.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10357666015625, -0.10055828094482422, -0.09753990173339844, -0.09452152252197266, -0.09150314331054688, -0.0884847640991211, -0.08546638488769531, -0.08244800567626953, -0.07942962646484375, -0.07641124725341797, -0.07339286804199219, -0.0703744888305664, -0.06735610961914062, -0.06433773040771484, -0.06131935119628906, -0.05830097198486328, -0.0552825927734375, -0.05226421356201172, -0.04924583435058594, -0.046227455139160156, -0.043209075927734375, -0.040190696716308594, -0.03717231750488281, -0.03415393829345703, -0.03113555908203125, -0.02811717987060547, -0.025098800659179688, -0.022080421447753906, -0.019062042236328125, -0.016043663024902344, -0.013025283813476562, -0.010006904602050781, -0.006988525390625, -0.003970146179199219, -0.0009517669677734375, 0.0020666122436523438, 0.005084991455078125, 0.008103370666503906, 0.011121749877929688, 0.014140129089355469, 0.01715850830078125, 0.02017688751220703, 0.023195266723632812, 0.026213645935058594, 0.029232025146484375, 0.032250404357910156, 0.03526878356933594, 0.03828716278076172, 0.0413055419921875, 0.04432392120361328, 0.04734230041503906, 0.050360679626464844, 0.053379058837890625, 0.056397438049316406, 0.05941581726074219, 0.06243419647216797, 0.06545257568359375, 0.06847095489501953, 0.07148933410644531, 0.0745077133178711, 0.07752609252929688, 0.08054447174072266, 0.08356285095214844, 0.08658123016357422, 0.089599609375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 7.0, 14.0, 14.0, 22.0, 28.0, 48.0, 81.0, 107.0, 150.0, 245.0, 442.0, 747.0, 1464.0, 3269.0, 8044.0, 26090.0, 154271.0, 3818326.0, 141843.0, 24830.0, 7796.0, 3115.0, 1463.0, 719.0, 406.0, 255.0, 154.0, 107.0, 78.0, 46.0, 33.0, 15.0, 19.0, 15.0, 3.0, 6.0, 4.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.37353515625, -0.3632965087890625, -0.353057861328125, -0.3428192138671875, -0.33258056640625, -0.3223419189453125, -0.312103271484375, -0.3018646240234375, -0.2916259765625, -0.2813873291015625, -0.271148681640625, -0.2609100341796875, -0.25067138671875, -0.2404327392578125, -0.230194091796875, -0.2199554443359375, -0.209716796875, -0.1994781494140625, -0.189239501953125, -0.1790008544921875, -0.16876220703125, -0.1585235595703125, -0.148284912109375, -0.1380462646484375, -0.1278076171875, -0.1175689697265625, -0.107330322265625, -0.0970916748046875, -0.08685302734375, -0.0766143798828125, -0.066375732421875, -0.0561370849609375, -0.0458984375, -0.0356597900390625, -0.025421142578125, -0.0151824951171875, -0.00494384765625, 0.0052947998046875, 0.015533447265625, 0.0257720947265625, 0.0360107421875, 0.0462493896484375, 0.056488037109375, 0.0667266845703125, 0.07696533203125, 0.0872039794921875, 0.097442626953125, 0.1076812744140625, 0.117919921875, 0.1281585693359375, 0.138397216796875, 0.1486358642578125, 0.15887451171875, 0.1691131591796875, 0.179351806640625, 0.1895904541015625, 0.1998291015625, 0.2100677490234375, 0.220306396484375, 0.2305450439453125, 0.24078369140625, 0.2510223388671875, 0.261260986328125, 0.2714996337890625, 0.28173828125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 5.0, 5.0, 3.0, 11.0, 6.0, 10.0, 9.0, 25.0, 39.0, 47.0, 100.0, 219.0, 1693.0, 1439.0, 187.0, 105.0, 44.0, 42.0, 23.0, 15.0, 17.0, 9.0, 4.0, 6.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.15771484375, -0.15345191955566406, -0.14918899536132812, -0.1449260711669922, -0.14066314697265625, -0.1364002227783203, -0.13213729858398438, -0.12787437438964844, -0.1236114501953125, -0.11934852600097656, -0.11508560180664062, -0.11082267761230469, -0.10655975341796875, -0.10229682922363281, -0.09803390502929688, -0.09377098083496094, -0.089508056640625, -0.08524513244628906, -0.08098220825195312, -0.07671928405761719, -0.07245635986328125, -0.06819343566894531, -0.06393051147460938, -0.05966758728027344, -0.0554046630859375, -0.05114173889160156, -0.046878814697265625, -0.04261589050292969, -0.03835296630859375, -0.03409004211425781, -0.029827117919921875, -0.025564193725585938, -0.02130126953125, -0.017038345336914062, -0.012775421142578125, -0.008512496948242188, -0.00424957275390625, 1.33514404296875e-05, 0.004276275634765625, 0.008539199829101562, 0.0128021240234375, 0.017065048217773438, 0.021327972412109375, 0.025590896606445312, 0.02985382080078125, 0.03411674499511719, 0.038379669189453125, 0.04264259338378906, 0.046905517578125, 0.05116844177246094, 0.055431365966796875, 0.05969429016113281, 0.06395721435546875, 0.06822013854980469, 0.07248306274414062, 0.07674598693847656, 0.0810089111328125, 0.08527183532714844, 0.08953475952148438, 0.09379768371582031, 0.09806060791015625, 0.10232353210449219, 0.10658645629882812, 0.11084938049316406, 0.1151123046875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 4.0, 9.0, 13.0, 22.0, 39.0, 81.0, 134.0, 171.0, 189.0, 135.0, 82.0, 53.0, 28.0, 21.0, 8.0, 3.0, 7.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8752933740615845, -0.8462796211242676, -0.8172658085823059, -0.788252055644989, -0.7592383027076721, -0.7302244901657104, -0.7012107372283936, -0.6721969842910767, -0.6431832313537598, -0.6141694784164429, -0.5851556658744812, -0.5561419129371643, -0.5271281599998474, -0.49811437726020813, -0.46910059452056885, -0.44008684158325195, -0.4110730290412903, -0.382059246301651, -0.3530454933643341, -0.3240317106246948, -0.29501795768737793, -0.26600417494773865, -0.23699039220809937, -0.20797662436962128, -0.1789628565311432, -0.1499490886926651, -0.12093531340360641, -0.09192153811454773, -0.06290777027606964, -0.03389400243759155, -0.0048802196979522705, 0.024133548140525818, 0.05314725637435913, 0.08216102421283722, 0.1111747995018959, 0.1401885747909546, 0.16920234262943268, 0.19821611046791077, 0.22722989320755005, 0.25624364614486694, 0.2852574288845062, 0.3142712116241455, 0.3432849645614624, 0.3722987473011017, 0.40131253004074097, 0.43032628297805786, 0.45934006571769714, 0.4883538484573364, 0.5173676013946533, 0.5463813543319702, 0.5753951668739319, 0.6044089198112488, 0.6334226727485657, 0.6624364852905273, 0.6914502382278442, 0.7204639911651611, 0.749477744102478, 0.7784914970397949, 0.8075053095817566, 0.8365190625190735, 0.8655328154563904, 0.894546627998352, 0.923560380935669, 0.9525741338729858, 0.9815879464149475]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 6.0, 1.0, 6.0, 7.0, 10.0, 8.0, 15.0, 7.0, 16.0, 18.0, 22.0, 23.0, 25.0, 23.0, 31.0, 37.0, 50.0, 37.0, 38.0, 50.0, 48.0, 33.0, 56.0, 32.0, 38.0, 33.0, 42.0, 33.0, 34.0, 34.0, 31.0, 22.0, 16.0, 20.0, 18.0, 14.0, 13.0, 8.0, 7.0, 8.0, 8.0, 5.0, 5.0, 3.0, 2.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2980915307998657, -0.2880476415157318, -0.2780037522315979, -0.267959862947464, -0.2579159736633301, -0.24787208437919617, -0.23782820999622345, -0.22778432071208954, -0.21774043142795563, -0.20769654214382172, -0.1976526528596878, -0.1876087635755539, -0.17756488919258118, -0.16752099990844727, -0.15747711062431335, -0.14743322134017944, -0.13738933205604553, -0.12734544277191162, -0.11730155348777771, -0.1072576716542244, -0.09721378237009048, -0.08716989308595657, -0.07712601125240326, -0.06708212196826935, -0.05703823268413544, -0.046994343400001526, -0.03695045784115791, -0.02690657041966915, -0.01686268299818039, -0.006818793714046478, 0.0032250918447971344, 0.013268977403640747, 0.023312866687774658, 0.03335675597190857, 0.04340064153075218, 0.053444527089595795, 0.0634884163737297, 0.07353230565786362, 0.08357618749141693, 0.09362007677555084, 0.10366396605968475, 0.11370785534381866, 0.12375174462795258, 0.1337956339120865, 0.1438395082950592, 0.15388339757919312, 0.16392728686332703, 0.17397117614746094, 0.18401506543159485, 0.19405895471572876, 0.20410284399986267, 0.21414673328399658, 0.2241906225681305, 0.2342345118522644, 0.24427838623523712, 0.2543222904205322, 0.26436614990234375, 0.27441003918647766, 0.2844539284706116, 0.2944978177547455, 0.3045417070388794, 0.3145855963230133, 0.3246294856071472, 0.33467334508895874, 0.34471726417541504]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 4.0, 6.0, 8.0, 16.0, 12.0, 15.0, 39.0, 45.0, 70.0, 122.0, 184.0, 309.0, 483.0, 878.0, 1368.0, 2508.0, 4486.0, 8517.0, 16076.0, 31159.0, 60061.0, 118426.0, 260561.0, 280306.0, 127671.0, 64308.0, 33176.0, 17360.0, 9053.0, 4754.0, 2757.0, 1527.0, 886.0, 503.0, 319.0, 196.0, 147.0, 99.0, 44.0, 30.0, 25.0, 13.0, 10.0, 9.0, 5.0, 2.0, 2.0, 3.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1517333984375, -0.1466846466064453, -0.14163589477539062, -0.13658714294433594, -0.13153839111328125, -0.12648963928222656, -0.12144088745117188, -0.11639213562011719, -0.1113433837890625, -0.10629463195800781, -0.10124588012695312, -0.09619712829589844, -0.09114837646484375, -0.08609962463378906, -0.08105087280273438, -0.07600212097167969, -0.070953369140625, -0.06590461730957031, -0.060855865478515625, -0.05580711364746094, -0.05075836181640625, -0.04570960998535156, -0.040660858154296875, -0.03561210632324219, -0.0305633544921875, -0.025514602661132812, -0.020465850830078125, -0.015417098999023438, -0.01036834716796875, -0.0053195953369140625, -0.000270843505859375, 0.0047779083251953125, 0.00982666015625, 0.014875411987304688, 0.019924163818359375, 0.024972915649414062, 0.03002166748046875, 0.03507041931152344, 0.040119171142578125, 0.04516792297363281, 0.0502166748046875, 0.05526542663574219, 0.060314178466796875, 0.06536293029785156, 0.07041168212890625, 0.07546043395996094, 0.08050918579101562, 0.08555793762207031, 0.090606689453125, 0.09565544128417969, 0.10070419311523438, 0.10575294494628906, 0.11080169677734375, 0.11585044860839844, 0.12089920043945312, 0.1259479522705078, 0.1309967041015625, 0.1360454559326172, 0.14109420776367188, 0.14614295959472656, 0.15119171142578125, 0.15624046325683594, 0.16128921508789062, 0.1663379669189453, 0.17138671875]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 6.0, 9.0, 5.0, 8.0, 6.0, 9.0, 11.0, 18.0, 17.0, 23.0, 41.0, 44.0, 40.0, 42.0, 59.0, 55.0, 61.0, 53.0, 54.0, 54.0, 45.0, 57.0, 55.0, 41.0, 41.0, 37.0, 32.0, 23.0, 10.0, 6.0, 11.0, 8.0, 6.0, 4.0, 7.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.1025390625, -0.0994110107421875, -0.096282958984375, -0.0931549072265625, -0.09002685546875, -0.0868988037109375, -0.083770751953125, -0.0806427001953125, -0.0775146484375, -0.0743865966796875, -0.071258544921875, -0.0681304931640625, -0.06500244140625, -0.0618743896484375, -0.058746337890625, -0.0556182861328125, -0.052490234375, -0.0493621826171875, -0.046234130859375, -0.0431060791015625, -0.03997802734375, -0.0368499755859375, -0.033721923828125, -0.0305938720703125, -0.0274658203125, -0.0243377685546875, -0.021209716796875, -0.0180816650390625, -0.01495361328125, -0.0118255615234375, -0.008697509765625, -0.0055694580078125, -0.00244140625, 0.0006866455078125, 0.003814697265625, 0.0069427490234375, 0.01007080078125, 0.0131988525390625, 0.016326904296875, 0.0194549560546875, 0.0225830078125, 0.0257110595703125, 0.028839111328125, 0.0319671630859375, 0.03509521484375, 0.0382232666015625, 0.041351318359375, 0.0444793701171875, 0.047607421875, 0.0507354736328125, 0.053863525390625, 0.0569915771484375, 0.06011962890625, 0.0632476806640625, 0.066375732421875, 0.0695037841796875, 0.0726318359375, 0.0757598876953125, 0.078887939453125, 0.0820159912109375, 0.08514404296875, 0.0882720947265625, 0.091400146484375, 0.0945281982421875, 0.09765625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 7.0, 13.0, 17.0, 23.0, 39.0, 40.0, 59.0, 85.0, 119.0, 176.0, 245.0, 341.0, 578.0, 1024.0, 2045.0, 5511.0, 21816.0, 144577.0, 697602.0, 142365.0, 21538.0, 5594.0, 2016.0, 1026.0, 564.0, 343.0, 227.0, 169.0, 106.0, 86.0, 55.0, 52.0, 20.0, 22.0, 12.0, 10.0, 9.0, 10.0, 4.0, 2.0, 2.0, 0.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.3662109375, -0.35527801513671875, -0.3443450927734375, -0.33341217041015625, -0.322479248046875, -0.31154632568359375, -0.3006134033203125, -0.28968048095703125, -0.27874755859375, -0.26781463623046875, -0.2568817138671875, -0.24594879150390625, -0.235015869140625, -0.22408294677734375, -0.2131500244140625, -0.20221710205078125, -0.1912841796875, -0.18035125732421875, -0.1694183349609375, -0.15848541259765625, -0.147552490234375, -0.13661956787109375, -0.1256866455078125, -0.11475372314453125, -0.10382080078125, -0.09288787841796875, -0.0819549560546875, -0.07102203369140625, -0.060089111328125, -0.04915618896484375, -0.0382232666015625, -0.02729034423828125, -0.016357421875, -0.00542449951171875, 0.0055084228515625, 0.01644134521484375, 0.027374267578125, 0.03830718994140625, 0.0492401123046875, 0.06017303466796875, 0.07110595703125, 0.08203887939453125, 0.0929718017578125, 0.10390472412109375, 0.114837646484375, 0.12577056884765625, 0.1367034912109375, 0.14763641357421875, 0.1585693359375, 0.16950225830078125, 0.1804351806640625, 0.19136810302734375, 0.202301025390625, 0.21323394775390625, 0.2241668701171875, 0.23509979248046875, 0.24603271484375, 0.25696563720703125, 0.2678985595703125, 0.27883148193359375, 0.289764404296875, 0.30069732666015625, 0.3116302490234375, 0.32256317138671875, 0.33349609375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 1.0, 8.0, 3.0, 8.0, 4.0, 10.0, 5.0, 14.0, 15.0, 17.0, 22.0, 18.0, 35.0, 23.0, 23.0, 27.0, 33.0, 46.0, 38.0, 48.0, 49.0, 50.0, 36.0, 51.0, 45.0, 38.0, 37.0, 33.0, 37.0, 30.0, 31.0, 16.0, 23.0, 19.0, 16.0, 20.0, 12.0, 11.0, 8.0, 6.0, 7.0, 6.0, 10.0, 5.0, 4.0, 4.0, 1.0, 4.0, 2.0], "bins": [-0.353759765625, -0.3442115783691406, -0.33466339111328125, -0.3251152038574219, -0.3155670166015625, -0.3060188293457031, -0.29647064208984375, -0.2869224548339844, -0.277374267578125, -0.2678260803222656, -0.25827789306640625, -0.24872970581054688, -0.2391815185546875, -0.22963333129882812, -0.22008514404296875, -0.21053695678710938, -0.20098876953125, -0.19144058227539062, -0.18189239501953125, -0.17234420776367188, -0.1627960205078125, -0.15324783325195312, -0.14369964599609375, -0.13415145874023438, -0.124603271484375, -0.11505508422851562, -0.10550689697265625, -0.09595870971679688, -0.0864105224609375, -0.07686233520507812, -0.06731414794921875, -0.057765960693359375, -0.0482177734375, -0.038669586181640625, -0.02912139892578125, -0.019573211669921875, -0.0100250244140625, -0.000476837158203125, 0.00907135009765625, 0.018619537353515625, 0.028167724609375, 0.037715911865234375, 0.04726409912109375, 0.056812286376953125, 0.0663604736328125, 0.07590866088867188, 0.08545684814453125, 0.09500503540039062, 0.10455322265625, 0.11410140991210938, 0.12364959716796875, 0.13319778442382812, 0.1427459716796875, 0.15229415893554688, 0.16184234619140625, 0.17139053344726562, 0.180938720703125, 0.19048690795898438, 0.20003509521484375, 0.20958328247070312, 0.2191314697265625, 0.22867965698242188, 0.23822784423828125, 0.24777603149414062, 0.25732421875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 5.0, 2.0, 2.0, 4.0, 7.0, 10.0, 5.0, 11.0, 16.0, 27.0, 54.0, 69.0, 99.0, 183.0, 353.0, 607.0, 1377.0, 3453.0, 10586.0, 44298.0, 245307.0, 583104.0, 123507.0, 24281.0, 6621.0, 2413.0, 1029.0, 491.0, 257.0, 134.0, 94.0, 55.0, 28.0, 24.0, 11.0, 10.0, 7.0, 3.0, 7.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09912109375, -0.09561920166015625, -0.0921173095703125, -0.08861541748046875, -0.085113525390625, -0.08161163330078125, -0.0781097412109375, -0.07460784912109375, -0.07110595703125, -0.06760406494140625, -0.0641021728515625, -0.06060028076171875, -0.057098388671875, -0.05359649658203125, -0.0500946044921875, -0.04659271240234375, -0.0430908203125, -0.03958892822265625, -0.0360870361328125, -0.03258514404296875, -0.029083251953125, -0.02558135986328125, -0.0220794677734375, -0.01857757568359375, -0.01507568359375, -0.01157379150390625, -0.0080718994140625, -0.00457000732421875, -0.001068115234375, 0.00243377685546875, 0.0059356689453125, 0.00943756103515625, 0.012939453125, 0.01644134521484375, 0.0199432373046875, 0.02344512939453125, 0.026947021484375, 0.03044891357421875, 0.0339508056640625, 0.03745269775390625, 0.04095458984375, 0.04445648193359375, 0.0479583740234375, 0.05146026611328125, 0.054962158203125, 0.05846405029296875, 0.0619659423828125, 0.06546783447265625, 0.0689697265625, 0.07247161865234375, 0.0759735107421875, 0.07947540283203125, 0.082977294921875, 0.08647918701171875, 0.0899810791015625, 0.09348297119140625, 0.09698486328125, 0.10048675537109375, 0.1039886474609375, 0.10749053955078125, 0.110992431640625, 0.11449432373046875, 0.1179962158203125, 0.12149810791015625, 0.125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 1.0, 12.0, 10.0, 14.0, 19.0, 21.0, 24.0, 30.0, 42.0, 32.0, 49.0, 54.0, 81.0, 92.0, 106.0, 88.0, 77.0, 38.0, 38.0, 29.0, 28.0, 26.0, 14.0, 11.0, 13.0, 9.0, 6.0, 10.0, 11.0, 2.0, 6.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.172325134277344e-05, -4.011392593383789e-05, -3.8504600524902344e-05, -3.68952751159668e-05, -3.528594970703125e-05, -3.36766242980957e-05, -3.2067298889160156e-05, -3.045797348022461e-05, -2.8848648071289062e-05, -2.7239322662353516e-05, -2.562999725341797e-05, -2.4020671844482422e-05, -2.2411346435546875e-05, -2.0802021026611328e-05, -1.919269561767578e-05, -1.7583370208740234e-05, -1.5974044799804688e-05, -1.436471939086914e-05, -1.2755393981933594e-05, -1.1146068572998047e-05, -9.5367431640625e-06, -7.927417755126953e-06, -6.318092346191406e-06, -4.708766937255859e-06, -3.0994415283203125e-06, -1.4901161193847656e-06, 1.1920928955078125e-07, 1.7285346984863281e-06, 3.337860107421875e-06, 4.947185516357422e-06, 6.556510925292969e-06, 8.165836334228516e-06, 9.775161743164062e-06, 1.138448715209961e-05, 1.2993812561035156e-05, 1.4603137969970703e-05, 1.621246337890625e-05, 1.7821788787841797e-05, 1.9431114196777344e-05, 2.104043960571289e-05, 2.2649765014648438e-05, 2.4259090423583984e-05, 2.586841583251953e-05, 2.7477741241455078e-05, 2.9087066650390625e-05, 3.069639205932617e-05, 3.230571746826172e-05, 3.3915042877197266e-05, 3.552436828613281e-05, 3.713369369506836e-05, 3.8743019104003906e-05, 4.035234451293945e-05, 4.1961669921875e-05, 4.357099533081055e-05, 4.5180320739746094e-05, 4.678964614868164e-05, 4.839897155761719e-05, 5.0008296966552734e-05, 5.161762237548828e-05, 5.322694778442383e-05, 5.4836273193359375e-05, 5.644559860229492e-05, 5.805492401123047e-05, 5.9664249420166016e-05, 6.127357482910156e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 6.0, 6.0, 5.0, 12.0, 11.0, 21.0, 24.0, 27.0, 38.0, 60.0, 92.0, 129.0, 246.0, 351.0, 591.0, 1218.0, 2578.0, 6460.0, 22617.0, 114802.0, 552775.0, 279469.0, 47639.0, 11485.0, 3987.0, 1745.0, 871.0, 481.0, 287.0, 179.0, 100.0, 71.0, 55.0, 34.0, 25.0, 17.0, 10.0, 12.0, 6.0, 5.0, 4.0, 4.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.10760498046875, -0.10421562194824219, -0.10082626342773438, -0.09743690490722656, -0.09404754638671875, -0.09065818786621094, -0.08726882934570312, -0.08387947082519531, -0.0804901123046875, -0.07710075378417969, -0.07371139526367188, -0.07032203674316406, -0.06693267822265625, -0.06354331970214844, -0.060153961181640625, -0.05676460266113281, -0.053375244140625, -0.04998588562011719, -0.046596527099609375, -0.04320716857910156, -0.03981781005859375, -0.03642845153808594, -0.033039093017578125, -0.029649734497070312, -0.0262603759765625, -0.022871017456054688, -0.019481658935546875, -0.016092300415039062, -0.01270294189453125, -0.009313583374023438, -0.005924224853515625, -0.0025348663330078125, 0.0008544921875, 0.0042438507080078125, 0.007633209228515625, 0.011022567749023438, 0.01441192626953125, 0.017801284790039062, 0.021190643310546875, 0.024580001831054688, 0.0279693603515625, 0.03135871887207031, 0.034748077392578125, 0.03813743591308594, 0.04152679443359375, 0.04491615295410156, 0.048305511474609375, 0.05169486999511719, 0.055084228515625, 0.05847358703613281, 0.061862945556640625, 0.06525230407714844, 0.06864166259765625, 0.07203102111816406, 0.07542037963867188, 0.07880973815917969, 0.0821990966796875, 0.08558845520019531, 0.08897781372070312, 0.09236717224121094, 0.09575653076171875, 0.09914588928222656, 0.10253524780273438, 0.10592460632324219, 0.10931396484375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 6.0, 1.0, 1.0, 7.0, 7.0, 13.0, 14.0, 11.0, 15.0, 22.0, 25.0, 27.0, 29.0, 38.0, 47.0, 59.0, 46.0, 64.0, 72.0, 58.0, 55.0, 69.0, 46.0, 42.0, 43.0, 26.0, 28.0, 15.0, 18.0, 10.0, 14.0, 14.0, 7.0, 7.0, 13.0, 7.0, 1.0, 6.0, 4.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08648681640625, -0.08392047882080078, -0.08135414123535156, -0.07878780364990234, -0.07622146606445312, -0.0736551284790039, -0.07108879089355469, -0.06852245330810547, -0.06595611572265625, -0.06338977813720703, -0.06082344055175781, -0.058257102966308594, -0.055690765380859375, -0.053124427795410156, -0.05055809020996094, -0.04799175262451172, -0.0454254150390625, -0.04285907745361328, -0.04029273986816406, -0.037726402282714844, -0.035160064697265625, -0.032593727111816406, -0.030027389526367188, -0.02746105194091797, -0.02489471435546875, -0.02232837677001953, -0.019762039184570312, -0.017195701599121094, -0.014629364013671875, -0.012063026428222656, -0.009496688842773438, -0.006930351257324219, -0.004364013671875, -0.0017976760864257812, 0.0007686614990234375, 0.0033349990844726562, 0.005901336669921875, 0.008467674255371094, 0.011034011840820312, 0.013600349426269531, 0.01616668701171875, 0.01873302459716797, 0.021299362182617188, 0.023865699768066406, 0.026432037353515625, 0.028998374938964844, 0.03156471252441406, 0.03413105010986328, 0.0366973876953125, 0.03926372528076172, 0.04183006286621094, 0.044396400451660156, 0.046962738037109375, 0.049529075622558594, 0.05209541320800781, 0.05466175079345703, 0.05722808837890625, 0.05979442596435547, 0.06236076354980469, 0.0649271011352539, 0.06749343872070312, 0.07005977630615234, 0.07262611389160156, 0.07519245147705078, 0.0777587890625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 6.0, 1.0, 8.0, 23.0, 27.0, 46.0, 70.0, 89.0, 101.0, 112.0, 122.0, 113.0, 73.0, 66.0, 59.0, 36.0, 13.0, 15.0, 8.0, 4.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.1587326526641846, -2.1010186672210693, -2.043304920196533, -1.985590934753418, -1.9278769493103027, -1.870163083076477, -1.8124492168426514, -1.7547352313995361, -1.6970213651657104, -1.6393074989318848, -1.5815935134887695, -1.5238796472549438, -1.4661657810211182, -1.408451795578003, -1.3507379293441772, -1.2930240631103516, -1.2353100776672363, -1.1775962114334106, -1.1198822259902954, -1.0621683597564697, -1.0044543743133545, -0.9467405080795288, -0.8890266418457031, -0.8313127160072327, -0.7735987901687622, -0.7158848643302917, -0.6581709384918213, -0.6004570722579956, -0.5427431464195251, -0.4850292205810547, -0.4273153245449066, -0.36960142850875854, -0.3118875026702881, -0.2541735768318176, -0.19645968079566956, -0.1387457698583603, -0.08103185892105103, -0.023317933082580566, 0.034395962953567505, 0.09210985898971558, 0.14982378482818604, 0.2075376957654953, 0.26525160670280457, 0.32296550273895264, 0.3806794285774231, 0.43839335441589355, 0.4961072504520416, 0.5538211464881897, 0.6115350723266602, 0.6692489981651306, 0.7269629240036011, 0.7846767902374268, 0.8423907160758972, 0.9001046419143677, 0.9578185081481934, 1.0155324935913086, 1.0732463598251343, 1.13096022605896, 1.1886742115020752, 1.2463880777359009, 1.3041019439697266, 1.3618159294128418, 1.4195297956466675, 1.4772436618804932, 1.5349576473236084]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 4.0, 6.0, 9.0, 15.0, 17.0, 7.0, 28.0, 17.0, 14.0, 22.0, 20.0, 33.0, 35.0, 39.0, 26.0, 39.0, 39.0, 38.0, 44.0, 50.0, 63.0, 52.0, 47.0, 52.0, 34.0, 31.0, 27.0, 34.0, 26.0, 18.0, 24.0, 13.0, 13.0, 13.0, 9.0, 9.0, 5.0, 5.0, 3.0, 4.0, 0.0, 4.0, 0.0, 4.0, 1.0, 3.0, 3.0, 1.0], "bins": [-1.6132254600524902, -1.5671130418777466, -1.521000623703003, -1.4748882055282593, -1.4287757873535156, -1.382663369178772, -1.3365509510040283, -1.2904385328292847, -1.244326114654541, -1.1982136964797974, -1.1521012783050537, -1.10598886013031, -1.0598764419555664, -1.0137640237808228, -0.9676516056060791, -0.9215391874313354, -0.875426709651947, -0.8293142914772034, -0.7832018733024597, -0.7370894551277161, -0.6909770369529724, -0.6448646187782288, -0.5987521409988403, -0.5526397228240967, -0.506527304649353, -0.4604148864746094, -0.4143024682998657, -0.36819005012512207, -0.3220776319503784, -0.27596521377563477, -0.22985276579856873, -0.18374034762382507, -0.1376279592514038, -0.09151554107666016, -0.04540311545133591, 0.0007093101739883423, 0.046821728348731995, 0.09293414652347565, 0.1390465795993805, 0.18515899777412415, 0.2312714159488678, 0.27738383412361145, 0.3234962522983551, 0.36960870027542114, 0.4157211184501648, 0.46183353662490845, 0.5079459547996521, 0.5540583729743958, 0.6001707911491394, 0.6462832093238831, 0.6923956274986267, 0.7385080456733704, 0.784620463848114, 0.8307328820228577, 0.8768453598022461, 0.9229577779769897, 0.9690701961517334, 1.015182614326477, 1.0612950325012207, 1.1074074506759644, 1.153519868850708, 1.1996322870254517, 1.2457447052001953, 1.291857123374939, 1.3379695415496826]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0, 5.0, 5.0, 6.0, 19.0, 15.0, 31.0, 31.0, 51.0, 84.0, 134.0, 171.0, 278.0, 441.0, 699.0, 1093.0, 1910.0, 3375.0, 6021.0, 11704.0, 24240.0, 57194.0, 169165.0, 870389.0, 2393611.0, 457601.0, 112879.0, 42571.0, 19292.0, 9385.0, 4877.0, 2824.0, 1565.0, 947.0, 571.0, 415.0, 228.0, 153.0, 114.0, 60.0, 49.0, 20.0, 21.0, 17.0, 12.0, 7.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.1444091796875, -0.14043426513671875, -0.1364593505859375, -0.13248443603515625, -0.128509521484375, -0.12453460693359375, -0.1205596923828125, -0.11658477783203125, -0.11260986328125, -0.10863494873046875, -0.1046600341796875, -0.10068511962890625, -0.096710205078125, -0.09273529052734375, -0.0887603759765625, -0.08478546142578125, -0.080810546875, -0.07683563232421875, -0.0728607177734375, -0.06888580322265625, -0.064910888671875, -0.06093597412109375, -0.0569610595703125, -0.05298614501953125, -0.04901123046875, -0.04503631591796875, -0.0410614013671875, -0.03708648681640625, -0.033111572265625, -0.02913665771484375, -0.0251617431640625, -0.02118682861328125, -0.0172119140625, -0.01323699951171875, -0.0092620849609375, -0.00528717041015625, -0.001312255859375, 0.00266265869140625, 0.0066375732421875, 0.01061248779296875, 0.01458740234375, 0.01856231689453125, 0.0225372314453125, 0.02651214599609375, 0.030487060546875, 0.03446197509765625, 0.0384368896484375, 0.04241180419921875, 0.04638671875, 0.05036163330078125, 0.0543365478515625, 0.05831146240234375, 0.062286376953125, 0.06626129150390625, 0.0702362060546875, 0.07421112060546875, 0.07818603515625, 0.08216094970703125, 0.0861358642578125, 0.09011077880859375, 0.094085693359375, 0.09806060791015625, 0.1020355224609375, 0.10601043701171875, 0.1099853515625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 6.0, 5.0, 11.0, 11.0, 10.0, 11.0, 21.0, 23.0, 25.0, 27.0, 33.0, 33.0, 36.0, 52.0, 44.0, 53.0, 34.0, 55.0, 59.0, 48.0, 49.0, 45.0, 50.0, 34.0, 41.0, 42.0, 24.0, 27.0, 21.0, 20.0, 10.0, 8.0, 10.0, 8.0, 3.0, 6.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.08941650390625, -0.08683586120605469, -0.08425521850585938, -0.08167457580566406, -0.07909393310546875, -0.07651329040527344, -0.07393264770507812, -0.07135200500488281, -0.0687713623046875, -0.06619071960449219, -0.06361007690429688, -0.06102943420410156, -0.05844879150390625, -0.05586814880371094, -0.053287506103515625, -0.05070686340332031, -0.048126220703125, -0.04554557800292969, -0.042964935302734375, -0.04038429260253906, -0.03780364990234375, -0.03522300720214844, -0.032642364501953125, -0.030061721801757812, -0.0274810791015625, -0.024900436401367188, -0.022319793701171875, -0.019739151000976562, -0.01715850830078125, -0.014577865600585938, -0.011997222900390625, -0.009416580200195312, -0.0068359375, -0.0042552947998046875, -0.001674652099609375, 0.0009059906005859375, 0.00348663330078125, 0.0060672760009765625, 0.008647918701171875, 0.011228561401367188, 0.0138092041015625, 0.016389846801757812, 0.018970489501953125, 0.021551132202148438, 0.02413177490234375, 0.026712417602539062, 0.029293060302734375, 0.03187370300292969, 0.034454345703125, 0.03703498840332031, 0.039615631103515625, 0.04219627380371094, 0.04477691650390625, 0.04735755920410156, 0.049938201904296875, 0.05251884460449219, 0.0550994873046875, 0.05768013000488281, 0.060260772705078125, 0.06284141540527344, 0.06542205810546875, 0.06800270080566406, 0.07058334350585938, 0.07316398620605469, 0.07574462890625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 10.0, 7.0, 11.0, 18.0, 32.0, 68.0, 106.0, 235.0, 465.0, 1210.0, 3830.0, 14412.0, 82426.0, 1843647.0, 2137188.0, 89002.0, 15426.0, 3944.0, 1287.0, 491.0, 244.0, 100.0, 61.0, 21.0, 20.0, 11.0, 4.0, 6.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.253662109375, -0.24352264404296875, -0.2333831787109375, -0.22324371337890625, -0.213104248046875, -0.20296478271484375, -0.1928253173828125, -0.18268585205078125, -0.17254638671875, -0.16240692138671875, -0.1522674560546875, -0.14212799072265625, -0.131988525390625, -0.12184906005859375, -0.1117095947265625, -0.10157012939453125, -0.0914306640625, -0.08129119873046875, -0.0711517333984375, -0.06101226806640625, -0.050872802734375, -0.04073333740234375, -0.0305938720703125, -0.02045440673828125, -0.01031494140625, -0.00017547607421875, 0.0099639892578125, 0.02010345458984375, 0.030242919921875, 0.04038238525390625, 0.0505218505859375, 0.06066131591796875, 0.07080078125, 0.08094024658203125, 0.0910797119140625, 0.10121917724609375, 0.111358642578125, 0.12149810791015625, 0.1316375732421875, 0.14177703857421875, 0.15191650390625, 0.16205596923828125, 0.1721954345703125, 0.18233489990234375, 0.192474365234375, 0.20261383056640625, 0.2127532958984375, 0.22289276123046875, 0.2330322265625, 0.24317169189453125, 0.2533111572265625, 0.26345062255859375, 0.273590087890625, 0.28372955322265625, 0.2938690185546875, 0.30400848388671875, 0.31414794921875, 0.32428741455078125, 0.3344268798828125, 0.34456634521484375, 0.354705810546875, 0.36484527587890625, 0.3749847412109375, 0.38512420654296875, 0.395263671875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 5.0, 4.0, 0.0, 8.0, 9.0, 13.0, 16.0, 18.0, 31.0, 51.0, 55.0, 84.0, 124.0, 237.0, 414.0, 753.0, 916.0, 525.0, 287.0, 160.0, 100.0, 65.0, 60.0, 40.0, 22.0, 17.0, 12.0, 10.0, 11.0, 9.0, 8.0, 4.0, 4.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.31787109375, -0.3095550537109375, -0.301239013671875, -0.2929229736328125, -0.28460693359375, -0.2762908935546875, -0.267974853515625, -0.2596588134765625, -0.2513427734375, -0.2430267333984375, -0.234710693359375, -0.2263946533203125, -0.21807861328125, -0.2097625732421875, -0.201446533203125, -0.1931304931640625, -0.184814453125, -0.1764984130859375, -0.168182373046875, -0.1598663330078125, -0.15155029296875, -0.1432342529296875, -0.134918212890625, -0.1266021728515625, -0.1182861328125, -0.1099700927734375, -0.101654052734375, -0.0933380126953125, -0.08502197265625, -0.0767059326171875, -0.068389892578125, -0.0600738525390625, -0.0517578125, -0.0434417724609375, -0.035125732421875, -0.0268096923828125, -0.01849365234375, -0.0101776123046875, -0.001861572265625, 0.0064544677734375, 0.0147705078125, 0.0230865478515625, 0.031402587890625, 0.0397186279296875, 0.04803466796875, 0.0563507080078125, 0.064666748046875, 0.0729827880859375, 0.081298828125, 0.0896148681640625, 0.097930908203125, 0.1062469482421875, 0.11456298828125, 0.1228790283203125, 0.131195068359375, 0.1395111083984375, 0.1478271484375, 0.1561431884765625, 0.164459228515625, 0.1727752685546875, 0.18109130859375, 0.1894073486328125, 0.197723388671875, 0.2060394287109375, 0.21435546875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 5.0, 4.0, 1.0, 2.0, 10.0, 22.0, 41.0, 91.0, 153.0, 227.0, 204.0, 123.0, 64.0, 30.0, 11.0, 5.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.057502746582031, -3.955089569091797, -3.8526766300201416, -3.7502634525299072, -3.647850513458252, -3.5454373359680176, -3.443024158477783, -3.340611219406128, -3.2381982803344727, -3.1357851028442383, -3.033372163772583, -2.9309589862823486, -2.8285460472106934, -2.726132869720459, -2.6237196922302246, -2.5213067531585693, -2.418893575668335, -2.3164803981781006, -2.2140674591064453, -2.111654281616211, -2.0092413425445557, -1.9068281650543213, -1.8044151067733765, -1.7020020484924316, -1.5995889902114868, -1.497175931930542, -1.3947628736495972, -1.2923498153686523, -1.189936637878418, -1.0875236988067627, -0.9851105213165283, -0.8826974630355835, -0.7802846431732178, -0.677871584892273, -0.5754585266113281, -0.4730454087257385, -0.3706323504447937, -0.2682192921638489, -0.16580617427825928, -0.06339311599731445, 0.03901994228363037, 0.1414330154657364, 0.2438460886478424, 0.3462591767311096, 0.44867223501205444, 0.5510852932929993, 0.6534984111785889, 0.7559114694595337, 0.8583245277404785, 0.9607375860214233, 1.0631506443023682, 1.1655638217926025, 1.2679767608642578, 1.3703899383544922, 1.472802996635437, 1.5752160549163818, 1.6776291131973267, 1.7800421714782715, 1.8824552297592163, 1.9848682880401611, 2.0872814655303955, 2.189694404602051, 2.292107582092285, 2.3945207595825195, 2.496933698654175]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 6.0, 5.0, 5.0, 9.0, 7.0, 11.0, 12.0, 19.0, 19.0, 24.0, 31.0, 30.0, 36.0, 40.0, 53.0, 43.0, 41.0, 62.0, 49.0, 47.0, 44.0, 44.0, 51.0, 49.0, 40.0, 42.0, 26.0, 21.0, 25.0, 15.0, 21.0, 16.0, 13.0, 12.0, 10.0, 5.0, 5.0, 8.0, 2.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0209617614746094, -0.9830405712127686, -0.9451194405555725, -0.9071983098983765, -0.8692771196365356, -0.8313559293746948, -0.7934347987174988, -0.7555136680603027, -0.7175924777984619, -0.6796712875366211, -0.641750156879425, -0.603829026222229, -0.5659078359603882, -0.5279866456985474, -0.4900655150413513, -0.4521443545818329, -0.41422319412231445, -0.376302033662796, -0.3383808732032776, -0.30045971274375916, -0.2625385522842407, -0.2246173918247223, -0.18669623136520386, -0.14877507090568542, -0.11085391044616699, -0.07293274998664856, -0.03501158952713013, 0.0029095709323883057, 0.04083073139190674, 0.07875189185142517, 0.1166730523109436, 0.15459421277046204, 0.19251549243927002, 0.23043665289878845, 0.2683578133583069, 0.3062789738178253, 0.34420013427734375, 0.3821212947368622, 0.4200424551963806, 0.45796361565589905, 0.4958847761154175, 0.5338059663772583, 0.5717270970344543, 0.6096482276916504, 0.6475694179534912, 0.685490608215332, 0.7234117388725281, 0.7613328695297241, 0.7992540597915649, 0.8371752500534058, 0.8750963807106018, 0.9130175113677979, 0.9509387016296387, 0.9888598918914795, 1.0267810821533203, 1.0647021532058716, 1.1026233434677124, 1.1405445337295532, 1.1784656047821045, 1.2163867950439453, 1.2543079853057861, 1.292229175567627, 1.3301503658294678, 1.368071436882019, 1.4059926271438599]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 6.0, 8.0, 15.0, 19.0, 43.0, 55.0, 63.0, 106.0, 166.0, 310.0, 464.0, 828.0, 1421.0, 2354.0, 4300.0, 8438.0, 16758.0, 36360.0, 89450.0, 340543.0, 372984.0, 97999.0, 38450.0, 17802.0, 8952.0, 4591.0, 2545.0, 1381.0, 824.0, 487.0, 301.0, 181.0, 130.0, 74.0, 49.0, 37.0, 27.0, 16.0, 7.0, 7.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.185791015625, -0.17916488647460938, -0.17253875732421875, -0.16591262817382812, -0.1592864990234375, -0.15266036987304688, -0.14603424072265625, -0.13940811157226562, -0.132781982421875, -0.12615585327148438, -0.11952972412109375, -0.11290359497070312, -0.1062774658203125, -0.09965133666992188, -0.09302520751953125, -0.08639907836914062, -0.07977294921875, -0.07314682006835938, -0.06652069091796875, -0.059894561767578125, -0.0532684326171875, -0.046642303466796875, -0.04001617431640625, -0.033390045166015625, -0.026763916015625, -0.020137786865234375, -0.01351165771484375, -0.006885528564453125, -0.0002593994140625, 0.006366729736328125, 0.01299285888671875, 0.019618988037109375, 0.0262451171875, 0.032871246337890625, 0.03949737548828125, 0.046123504638671875, 0.0527496337890625, 0.059375762939453125, 0.06600189208984375, 0.07262802124023438, 0.079254150390625, 0.08588027954101562, 0.09250640869140625, 0.09913253784179688, 0.1057586669921875, 0.11238479614257812, 0.11901092529296875, 0.12563705444335938, 0.13226318359375, 0.13888931274414062, 0.14551544189453125, 0.15214157104492188, 0.1587677001953125, 0.16539382934570312, 0.17201995849609375, 0.17864608764648438, 0.185272216796875, 0.19189834594726562, 0.19852447509765625, 0.20515060424804688, 0.2117767333984375, 0.21840286254882812, 0.22502899169921875, 0.23165512084960938, 0.23828125]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 5.0, 6.0, 5.0, 8.0, 10.0, 18.0, 16.0, 19.0, 31.0, 45.0, 43.0, 48.0, 48.0, 60.0, 63.0, 65.0, 55.0, 48.0, 54.0, 51.0, 52.0, 46.0, 41.0, 35.0, 31.0, 29.0, 23.0, 13.0, 8.0, 9.0, 7.0, 1.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.078857421875, -0.07561111450195312, -0.07236480712890625, -0.06911849975585938, -0.0658721923828125, -0.06262588500976562, -0.05937957763671875, -0.056133270263671875, -0.052886962890625, -0.049640655517578125, -0.04639434814453125, -0.043148040771484375, -0.0399017333984375, -0.036655426025390625, -0.03340911865234375, -0.030162811279296875, -0.02691650390625, -0.023670196533203125, -0.02042388916015625, -0.017177581787109375, -0.0139312744140625, -0.010684967041015625, -0.00743865966796875, -0.004192352294921875, -0.000946044921875, 0.002300262451171875, 0.00554656982421875, 0.008792877197265625, 0.0120391845703125, 0.015285491943359375, 0.01853179931640625, 0.021778106689453125, 0.0250244140625, 0.028270721435546875, 0.03151702880859375, 0.034763336181640625, 0.0380096435546875, 0.041255950927734375, 0.04450225830078125, 0.047748565673828125, 0.050994873046875, 0.054241180419921875, 0.05748748779296875, 0.060733795166015625, 0.0639801025390625, 0.06722640991210938, 0.07047271728515625, 0.07371902465820312, 0.07696533203125, 0.08021163940429688, 0.08345794677734375, 0.08670425415039062, 0.0899505615234375, 0.09319686889648438, 0.09644317626953125, 0.09968948364257812, 0.102935791015625, 0.10618209838867188, 0.10942840576171875, 0.11267471313476562, 0.1159210205078125, 0.11916732788085938, 0.12241363525390625, 0.12565994262695312, 0.12890625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 6.0, 5.0, 5.0, 3.0, 5.0, 8.0, 20.0, 20.0, 42.0, 40.0, 72.0, 102.0, 135.0, 227.0, 390.0, 734.0, 1486.0, 4025.0, 15862.0, 128579.0, 822866.0, 58631.0, 9690.0, 2849.0, 1238.0, 608.0, 329.0, 215.0, 109.0, 77.0, 57.0, 38.0, 25.0, 13.0, 19.0, 12.0, 4.0, 9.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.362060546875, -0.3471870422363281, -0.33231353759765625, -0.3174400329589844, -0.3025665283203125, -0.2876930236816406, -0.27281951904296875, -0.2579460144042969, -0.243072509765625, -0.22819900512695312, -0.21332550048828125, -0.19845199584960938, -0.1835784912109375, -0.16870498657226562, -0.15383148193359375, -0.13895797729492188, -0.12408447265625, -0.10921096801757812, -0.09433746337890625, -0.07946395874023438, -0.0645904541015625, -0.049716949462890625, -0.03484344482421875, -0.019969940185546875, -0.005096435546875, 0.009777069091796875, 0.02465057373046875, 0.039524078369140625, 0.0543975830078125, 0.06927108764648438, 0.08414459228515625, 0.09901809692382812, 0.1138916015625, 0.12876510620117188, 0.14363861083984375, 0.15851211547851562, 0.1733856201171875, 0.18825912475585938, 0.20313262939453125, 0.21800613403320312, 0.232879638671875, 0.24775314331054688, 0.26262664794921875, 0.2775001525878906, 0.2923736572265625, 0.3072471618652344, 0.32212066650390625, 0.3369941711425781, 0.35186767578125, 0.3667411804199219, 0.38161468505859375, 0.3964881896972656, 0.4113616943359375, 0.4262351989746094, 0.44110870361328125, 0.4559822082519531, 0.470855712890625, 0.4857292175292969, 0.5006027221679688, 0.5154762268066406, 0.5303497314453125, 0.5452232360839844, 0.5600967407226562, 0.5749702453613281, 0.58984375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 6.0, 4.0, 4.0, 2.0, 4.0, 12.0, 12.0, 14.0, 21.0, 33.0, 28.0, 34.0, 36.0, 53.0, 52.0, 55.0, 63.0, 63.0, 71.0, 51.0, 59.0, 63.0, 64.0, 43.0, 31.0, 35.0, 20.0, 16.0, 13.0, 10.0, 8.0, 7.0, 4.0, 5.0, 5.0, 1.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.385498046875, -0.3700599670410156, -0.35462188720703125, -0.3391838073730469, -0.3237457275390625, -0.3083076477050781, -0.29286956787109375, -0.2774314880371094, -0.261993408203125, -0.24655532836914062, -0.23111724853515625, -0.21567916870117188, -0.2002410888671875, -0.18480300903320312, -0.16936492919921875, -0.15392684936523438, -0.13848876953125, -0.12305068969726562, -0.10761260986328125, -0.09217453002929688, -0.0767364501953125, -0.061298370361328125, -0.04586029052734375, -0.030422210693359375, -0.014984130859375, 0.000453948974609375, 0.01589202880859375, 0.031330108642578125, 0.0467681884765625, 0.062206268310546875, 0.07764434814453125, 0.09308242797851562, 0.1085205078125, 0.12395858764648438, 0.13939666748046875, 0.15483474731445312, 0.1702728271484375, 0.18571090698242188, 0.20114898681640625, 0.21658706665039062, 0.232025146484375, 0.24746322631835938, 0.26290130615234375, 0.2783393859863281, 0.2937774658203125, 0.3092155456542969, 0.32465362548828125, 0.3400917053222656, 0.35552978515625, 0.3709678649902344, 0.38640594482421875, 0.4018440246582031, 0.4172821044921875, 0.4327201843261719, 0.44815826416015625, 0.4635963439941406, 0.479034423828125, 0.4944725036621094, 0.5099105834960938, 0.5253486633300781, 0.5407867431640625, 0.5562248229980469, 0.5716629028320312, 0.5871009826660156, 0.6025390625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 4.0, 2.0, 3.0, 11.0, 4.0, 15.0, 19.0, 44.0, 79.0, 113.0, 262.0, 680.0, 1761.0, 7357.0, 48873.0, 796162.0, 170779.0, 17231.0, 3375.0, 999.0, 353.0, 199.0, 87.0, 56.0, 32.0, 21.0, 15.0, 7.0, 7.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2158203125, -0.2087993621826172, -0.20177841186523438, -0.19475746154785156, -0.18773651123046875, -0.18071556091308594, -0.17369461059570312, -0.1666736602783203, -0.1596527099609375, -0.1526317596435547, -0.14561080932617188, -0.13858985900878906, -0.13156890869140625, -0.12454795837402344, -0.11752700805664062, -0.11050605773925781, -0.103485107421875, -0.09646415710449219, -0.08944320678710938, -0.08242225646972656, -0.07540130615234375, -0.06838035583496094, -0.061359405517578125, -0.05433845520019531, -0.0473175048828125, -0.04029655456542969, -0.033275604248046875, -0.026254653930664062, -0.01923370361328125, -0.012212753295898438, -0.005191802978515625, 0.0018291473388671875, 0.00885009765625, 0.015871047973632812, 0.022891998291015625, 0.029912948608398438, 0.03693389892578125, 0.04395484924316406, 0.050975799560546875, 0.05799674987792969, 0.0650177001953125, 0.07203865051269531, 0.07905960083007812, 0.08608055114746094, 0.09310150146484375, 0.10012245178222656, 0.10714340209960938, 0.11416435241699219, 0.121185302734375, 0.1282062530517578, 0.13522720336914062, 0.14224815368652344, 0.14926910400390625, 0.15629005432128906, 0.16331100463867188, 0.1703319549560547, 0.1773529052734375, 0.1843738555908203, 0.19139480590820312, 0.19841575622558594, 0.20543670654296875, 0.21245765686035156, 0.21947860717773438, 0.2264995574951172, 0.2335205078125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 8.0, 1.0, 5.0, 4.0, 9.0, 11.0, 9.0, 11.0, 17.0, 29.0, 44.0, 37.0, 68.0, 103.0, 135.0, 115.0, 106.0, 76.0, 63.0, 38.0, 27.0, 20.0, 15.0, 10.0, 9.0, 10.0, 6.0, 7.0, 6.0, 4.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.349252700805664e-05, -7.15227797627449e-05, -6.955303251743317e-05, -6.758328527212143e-05, -6.561353802680969e-05, -6.364379078149796e-05, -6.167404353618622e-05, -5.970429629087448e-05, -5.7734549045562744e-05, -5.576480180025101e-05, -5.379505455493927e-05, -5.182530730962753e-05, -4.9855560064315796e-05, -4.788581281900406e-05, -4.591606557369232e-05, -4.3946318328380585e-05, -4.197657108306885e-05, -4.000682383775711e-05, -3.8037076592445374e-05, -3.6067329347133636e-05, -3.40975821018219e-05, -3.212783485651016e-05, -3.0158087611198425e-05, -2.8188340365886688e-05, -2.621859312057495e-05, -2.4248845875263214e-05, -2.2279098629951477e-05, -2.030935138463974e-05, -1.8339604139328003e-05, -1.6369856894016266e-05, -1.4400109648704529e-05, -1.2430362403392792e-05, -1.0460615158081055e-05, -8.490867912769318e-06, -6.5211206674575806e-06, -4.5513734221458435e-06, -2.5816261768341064e-06, -6.118789315223694e-07, 1.3578683137893677e-06, 3.3276155591011047e-06, 5.297362804412842e-06, 7.267110049724579e-06, 9.236857295036316e-06, 1.1206604540348053e-05, 1.317635178565979e-05, 1.5146099030971527e-05, 1.7115846276283264e-05, 1.9085593521595e-05, 2.1055340766906738e-05, 2.3025088012218475e-05, 2.4994835257530212e-05, 2.696458250284195e-05, 2.8934329748153687e-05, 3.0904076993465424e-05, 3.287382423877716e-05, 3.48435714840889e-05, 3.6813318729400635e-05, 3.878306597471237e-05, 4.075281322002411e-05, 4.2722560465335846e-05, 4.469230771064758e-05, 4.666205495595932e-05, 4.863180220127106e-05, 5.0601549446582794e-05, 5.257129669189453e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 0.0, 2.0, 4.0, 4.0, 4.0, 2.0, 8.0, 6.0, 12.0, 14.0, 18.0, 33.0, 34.0, 52.0, 86.0, 115.0, 176.0, 279.0, 542.0, 1003.0, 2214.0, 5789.0, 21296.0, 139227.0, 743651.0, 106656.0, 18010.0, 5080.0, 1985.0, 928.0, 480.0, 288.0, 192.0, 120.0, 79.0, 52.0, 38.0, 23.0, 14.0, 13.0, 8.0, 9.0, 7.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.164306640625, -0.159393310546875, -0.15447998046875, -0.149566650390625, -0.1446533203125, -0.139739990234375, -0.13482666015625, -0.129913330078125, -0.125, -0.120086669921875, -0.11517333984375, -0.110260009765625, -0.1053466796875, -0.100433349609375, -0.09552001953125, -0.090606689453125, -0.085693359375, -0.080780029296875, -0.07586669921875, -0.070953369140625, -0.0660400390625, -0.061126708984375, -0.05621337890625, -0.051300048828125, -0.04638671875, -0.041473388671875, -0.03656005859375, -0.031646728515625, -0.0267333984375, -0.021820068359375, -0.01690673828125, -0.011993408203125, -0.007080078125, -0.002166748046875, 0.00274658203125, 0.007659912109375, 0.0125732421875, 0.017486572265625, 0.02239990234375, 0.027313232421875, 0.0322265625, 0.037139892578125, 0.04205322265625, 0.046966552734375, 0.0518798828125, 0.056793212890625, 0.06170654296875, 0.066619873046875, 0.071533203125, 0.076446533203125, 0.08135986328125, 0.086273193359375, 0.0911865234375, 0.096099853515625, 0.10101318359375, 0.105926513671875, 0.11083984375, 0.115753173828125, 0.12066650390625, 0.125579833984375, 0.1304931640625, 0.135406494140625, 0.14031982421875, 0.145233154296875, 0.150146484375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 3.0, 2.0, 6.0, 3.0, 10.0, 14.0, 12.0, 17.0, 24.0, 30.0, 47.0, 52.0, 63.0, 97.0, 105.0, 93.0, 78.0, 70.0, 53.0, 46.0, 47.0, 25.0, 20.0, 19.0, 12.0, 8.0, 6.0, 8.0, 8.0, 9.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.14013671875, -0.1360340118408203, -0.13193130493164062, -0.12782859802246094, -0.12372589111328125, -0.11962318420410156, -0.11552047729492188, -0.11141777038574219, -0.1073150634765625, -0.10321235656738281, -0.09910964965820312, -0.09500694274902344, -0.09090423583984375, -0.08680152893066406, -0.08269882202148438, -0.07859611511230469, -0.074493408203125, -0.07039070129394531, -0.06628799438476562, -0.06218528747558594, -0.05808258056640625, -0.05397987365722656, -0.049877166748046875, -0.04577445983886719, -0.0416717529296875, -0.03756904602050781, -0.033466339111328125, -0.029363632202148438, -0.02526092529296875, -0.021158218383789062, -0.017055511474609375, -0.012952804565429688, -0.00885009765625, -0.0047473907470703125, -0.000644683837890625, 0.0034580230712890625, 0.00756072998046875, 0.011663436889648438, 0.015766143798828125, 0.019868850708007812, 0.0239715576171875, 0.028074264526367188, 0.032176971435546875, 0.03627967834472656, 0.04038238525390625, 0.04448509216308594, 0.048587799072265625, 0.05269050598144531, 0.056793212890625, 0.06089591979980469, 0.06499862670898438, 0.06910133361816406, 0.07320404052734375, 0.07730674743652344, 0.08140945434570312, 0.08551216125488281, 0.0896148681640625, 0.09371757507324219, 0.09782028198242188, 0.10192298889160156, 0.10602569580078125, 0.11012840270996094, 0.11423110961914062, 0.11833381652832031, 0.1224365234375]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 7.0, 10.0, 41.0, 164.0, 335.0, 262.0, 123.0, 29.0, 17.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.136778831481934, -3.963371753692627, -3.7899646759033203, -3.6165573596954346, -3.443150281906128, -3.2697432041168213, -3.0963358879089355, -2.922928810119629, -2.7495217323303223, -2.5761146545410156, -2.402707576751709, -2.2293002605438232, -2.0558931827545166, -1.88248610496521, -1.7090789079666138, -1.5356717109680176, -1.362264633178711, -1.1888575553894043, -1.015450358390808, -0.8420432209968567, -0.6686360836029053, -0.49522894620895386, -0.32182180881500244, -0.14841461181640625, 0.02499246597290039, 0.1983996033668518, 0.3718067407608032, 0.5452138781547546, 0.718621015548706, 0.8920281529426575, 1.0654352903366089, 1.238842487335205, 1.4122495651245117, 1.5856566429138184, 1.7590638399124146, 1.9324710369110107, 2.1058781147003174, 2.279285192489624, 2.4526925086975098, 2.6260995864868164, 2.799506664276123, 2.9729137420654297, 3.1463208198547363, 3.319728136062622, 3.4931352138519287, 3.6665422916412354, 3.839949607849121, 4.013356685638428, 4.186763763427734, 4.360170841217041, 4.533577919006348, 4.706984996795654, 4.880392074584961, 5.053799629211426, 5.227206707000732, 5.400613784790039, 5.574020862579346, 5.747427940368652, 5.920835018157959, 6.094242095947266, 6.2676496505737305, 6.441056728363037, 6.614463806152344, 6.78787088394165, 6.961277961730957]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 3.0, 17.0, 21.0, 21.0, 39.0, 48.0, 51.0, 65.0, 70.0, 81.0, 104.0, 113.0, 89.0, 61.0, 60.0, 44.0, 35.0, 44.0, 15.0, 7.0, 9.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6194236278533936, -3.528352737426758, -3.437281608581543, -3.3462107181549072, -3.2551395893096924, -3.1640686988830566, -3.072997570037842, -2.981926679611206, -2.8908557891845703, -2.7997848987579346, -2.7087137699127197, -2.617642879486084, -2.526571750640869, -2.4355008602142334, -2.3444299697875977, -2.253358840942383, -2.162287712097168, -2.0712168216705322, -1.9801456928253174, -1.8890748023986816, -1.7980036735534668, -1.706932783126831, -1.6158617734909058, -1.5247907638549805, -1.4337197542190552, -1.3426487445831299, -1.2515777349472046, -1.1605067253112793, -1.0694358348846436, -0.9783647656440735, -0.887293815612793, -0.7962228059768677, -0.7051515579223633, -0.614080548286438, -0.5230095386505127, -0.4319385886192322, -0.3408675789833069, -0.2497965693473816, -0.15872561931610107, -0.06765460968017578, 0.02341639995574951, 0.11448739469051361, 0.2055583894252777, 0.2966293692588806, 0.3877003788948059, 0.4787713885307312, 0.5698423385620117, 0.660913348197937, 0.7519843578338623, 0.8430553674697876, 0.9341263771057129, 1.0251972675323486, 1.1162683963775635, 1.2073392868041992, 1.2984102964401245, 1.3894813060760498, 1.480552315711975, 1.5716233253479004, 1.6626943349838257, 1.753765344619751, 1.8448362350463867, 1.9359073638916016, 2.0269782543182373, 2.118049144744873, 2.209120273590088]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 6.0, 3.0, 2.0, 9.0, 6.0, 8.0, 9.0, 16.0, 25.0, 29.0, 31.0, 36.0, 62.0, 98.0, 138.0, 339.0, 1109.0, 9359.0, 325397.0, 3809270.0, 43986.0, 3117.0, 575.0, 220.0, 124.0, 77.0, 59.0, 27.0, 33.0, 24.0, 20.0, 16.0, 10.0, 16.0, 4.0, 5.0, 3.0, 4.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.611328125, -0.5953521728515625, -0.579376220703125, -0.5634002685546875, -0.54742431640625, -0.5314483642578125, -0.515472412109375, -0.4994964599609375, -0.4835205078125, -0.4675445556640625, -0.451568603515625, -0.4355926513671875, -0.41961669921875, -0.4036407470703125, -0.387664794921875, -0.3716888427734375, -0.355712890625, -0.3397369384765625, -0.323760986328125, -0.3077850341796875, -0.29180908203125, -0.2758331298828125, -0.259857177734375, -0.2438812255859375, -0.2279052734375, -0.2119293212890625, -0.195953369140625, -0.1799774169921875, -0.16400146484375, -0.1480255126953125, -0.132049560546875, -0.1160736083984375, -0.10009765625, -0.0841217041015625, -0.068145751953125, -0.0521697998046875, -0.03619384765625, -0.0202178955078125, -0.004241943359375, 0.0117340087890625, 0.0277099609375, 0.0436859130859375, 0.059661865234375, 0.0756378173828125, 0.09161376953125, 0.1075897216796875, 0.123565673828125, 0.1395416259765625, 0.155517578125, 0.1714935302734375, 0.187469482421875, 0.2034454345703125, 0.21942138671875, 0.2353973388671875, 0.251373291015625, 0.2673492431640625, 0.2833251953125, 0.2993011474609375, 0.315277099609375, 0.3312530517578125, 0.34722900390625, 0.3632049560546875, 0.379180908203125, 0.3951568603515625, 0.4111328125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 8.0, 5.0, 9.0, 21.0, 29.0, 36.0, 49.0, 57.0, 80.0, 79.0, 73.0, 89.0, 81.0, 67.0, 74.0, 74.0, 50.0, 35.0, 32.0, 27.0, 13.0, 4.0, 3.0, 6.0, 3.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1337890625, -0.129425048828125, -0.12506103515625, -0.120697021484375, -0.1163330078125, -0.111968994140625, -0.10760498046875, -0.103240966796875, -0.098876953125, -0.094512939453125, -0.09014892578125, -0.085784912109375, -0.0814208984375, -0.077056884765625, -0.07269287109375, -0.068328857421875, -0.06396484375, -0.059600830078125, -0.05523681640625, -0.050872802734375, -0.0465087890625, -0.042144775390625, -0.03778076171875, -0.033416748046875, -0.029052734375, -0.024688720703125, -0.02032470703125, -0.015960693359375, -0.0115966796875, -0.007232666015625, -0.00286865234375, 0.001495361328125, 0.005859375, 0.010223388671875, 0.01458740234375, 0.018951416015625, 0.0233154296875, 0.027679443359375, 0.03204345703125, 0.036407470703125, 0.040771484375, 0.045135498046875, 0.04949951171875, 0.053863525390625, 0.0582275390625, 0.062591552734375, 0.06695556640625, 0.071319580078125, 0.07568359375, 0.080047607421875, 0.08441162109375, 0.088775634765625, 0.0931396484375, 0.097503662109375, 0.10186767578125, 0.106231689453125, 0.110595703125, 0.114959716796875, 0.11932373046875, 0.123687744140625, 0.1280517578125, 0.132415771484375, 0.13677978515625, 0.141143798828125, 0.1455078125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 5.0, 6.0, 6.0, 13.0, 16.0, 37.0, 43.0, 66.0, 112.0, 167.0, 278.0, 505.0, 931.0, 1610.0, 3202.0, 6636.0, 15095.0, 36881.0, 108313.0, 494897.0, 2557393.0, 746880.0, 141752.0, 45020.0, 18327.0, 8134.0, 3726.0, 1904.0, 998.0, 557.0, 273.0, 186.0, 100.0, 82.0, 49.0, 30.0, 16.0, 9.0, 13.0, 7.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1683349609375, -0.16317176818847656, -0.15800857543945312, -0.1528453826904297, -0.14768218994140625, -0.1425189971923828, -0.13735580444335938, -0.13219261169433594, -0.1270294189453125, -0.12186622619628906, -0.11670303344726562, -0.11153984069824219, -0.10637664794921875, -0.10121345520019531, -0.09605026245117188, -0.09088706970214844, -0.085723876953125, -0.08056068420410156, -0.07539749145507812, -0.07023429870605469, -0.06507110595703125, -0.05990791320800781, -0.054744720458984375, -0.04958152770996094, -0.0444183349609375, -0.03925514221191406, -0.034091949462890625, -0.028928756713867188, -0.02376556396484375, -0.018602371215820312, -0.013439178466796875, -0.008275985717773438, -0.00311279296875, 0.0020503997802734375, 0.007213592529296875, 0.012376785278320312, 0.01753997802734375, 0.022703170776367188, 0.027866363525390625, 0.03302955627441406, 0.0381927490234375, 0.04335594177246094, 0.048519134521484375, 0.05368232727050781, 0.05884552001953125, 0.06400871276855469, 0.06917190551757812, 0.07433509826660156, 0.079498291015625, 0.08466148376464844, 0.08982467651367188, 0.09498786926269531, 0.10015106201171875, 0.10531425476074219, 0.11047744750976562, 0.11564064025878906, 0.1208038330078125, 0.12596702575683594, 0.13113021850585938, 0.1362934112548828, 0.14145660400390625, 0.1466197967529297, 0.15178298950195312, 0.15694618225097656, 0.162109375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 0.0, 1.0, 7.0, 6.0, 2.0, 13.0, 13.0, 17.0, 30.0, 41.0, 44.0, 62.0, 90.0, 147.0, 281.0, 464.0, 830.0, 806.0, 434.0, 291.0, 167.0, 97.0, 86.0, 34.0, 22.0, 27.0, 18.0, 8.0, 13.0, 6.0, 12.0, 2.0, 4.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.314208984375, -0.3057117462158203, -0.2972145080566406, -0.28871726989746094, -0.28022003173828125, -0.27172279357910156, -0.2632255554199219, -0.2547283172607422, -0.2462310791015625, -0.2377338409423828, -0.22923660278320312, -0.22073936462402344, -0.21224212646484375, -0.20374488830566406, -0.19524765014648438, -0.1867504119873047, -0.178253173828125, -0.1697559356689453, -0.16125869750976562, -0.15276145935058594, -0.14426422119140625, -0.13576698303222656, -0.12726974487304688, -0.11877250671386719, -0.1102752685546875, -0.10177803039550781, -0.09328079223632812, -0.08478355407714844, -0.07628631591796875, -0.06778907775878906, -0.059291839599609375, -0.05079460144042969, -0.04229736328125, -0.03380012512207031, -0.025302886962890625, -0.016805648803710938, -0.00830841064453125, 0.0001888275146484375, 0.008686065673828125, 0.017183303833007812, 0.0256805419921875, 0.03417778015136719, 0.042675018310546875, 0.05117225646972656, 0.05966949462890625, 0.06816673278808594, 0.07666397094726562, 0.08516120910644531, 0.093658447265625, 0.10215568542480469, 0.11065292358398438, 0.11915016174316406, 0.12764739990234375, 0.13614463806152344, 0.14464187622070312, 0.1531391143798828, 0.1616363525390625, 0.1701335906982422, 0.17863082885742188, 0.18712806701660156, 0.19562530517578125, 0.20412254333496094, 0.21261978149414062, 0.2211170196533203, 0.2296142578125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 6.0, 3.0, 7.0, 17.0, 51.0, 117.0, 229.0, 268.0, 168.0, 66.0, 37.0, 12.0, 7.0, 6.0, 4.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4222029447555542, -1.3133485317230225, -1.2044942378997803, -1.0956398248672485, -0.9867854118347168, -0.8779309988021851, -0.7690766453742981, -0.6602222919464111, -0.5513678789138794, -0.44251349568367004, -0.3336591124534607, -0.22480472922325134, -0.11595034599304199, -0.007095932960510254, 0.10175842046737671, 0.21061277389526367, 0.3194671869277954, 0.42832157015800476, 0.5371759533882141, 0.6460303068161011, 0.7548847198486328, 0.8637391328811646, 0.9725934863090515, 1.0814478397369385, 1.1903022527694702, 1.299156665802002, 1.4080109596252441, 1.5168653726577759, 1.6257197856903076, 1.7345741987228394, 1.843428611755371, 1.9522829055786133, 2.0611371994018555, 2.1699914932250977, 2.278846025466919, 2.387700319290161, 2.4965548515319824, 2.6054091453552246, 2.714263439178467, 2.823117733001709, 2.9319722652435303, 3.0408265590667725, 3.1496810913085938, 3.258535385131836, 3.367389678955078, 3.4762442111968994, 3.5850985050201416, 3.693953037261963, 3.802807331085205, 3.9116616249084473, 4.0205159187316895, 4.12937068939209, 4.238224983215332, 4.347079277038574, 4.455933570861816, 4.564787864685059, 4.673642158508301, 4.782496452331543, 4.891350746154785, 5.0002055168151855, 5.109059810638428, 5.21791410446167, 5.326768398284912, 5.435622692108154, 5.544477462768555]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 7.0, 6.0, 10.0, 14.0, 13.0, 28.0, 26.0, 23.0, 42.0, 42.0, 35.0, 37.0, 45.0, 62.0, 42.0, 53.0, 54.0, 59.0, 52.0, 45.0, 45.0, 34.0, 38.0, 31.0, 35.0, 21.0, 24.0, 17.0, 13.0, 14.0, 11.0, 7.0, 7.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9469990730285645, -0.9092732667922974, -0.8715474009513855, -0.8338215351104736, -0.7960957288742065, -0.7583699226379395, -0.7206440567970276, -0.6829181909561157, -0.6451923847198486, -0.6074665784835815, -0.5697407126426697, -0.5320148468017578, -0.4942890405654907, -0.45656320452690125, -0.41883736848831177, -0.3811115324497223, -0.3433856964111328, -0.30565986037254333, -0.26793402433395386, -0.23020818829536438, -0.1924823522567749, -0.15475651621818542, -0.11703068017959595, -0.07930484414100647, -0.04157900810241699, -0.0038531720638275146, 0.03387266397476196, 0.07159850001335144, 0.10932433605194092, 0.1470501720905304, 0.18477600812911987, 0.22250184416770935, 0.2602275609970093, 0.29795339703559875, 0.33567923307418823, 0.3734050691127777, 0.4111309051513672, 0.44885674118995667, 0.48658257722854614, 0.524308443069458, 0.5620342493057251, 0.5997600555419922, 0.637485921382904, 0.6752117872238159, 0.712937593460083, 0.7506633996963501, 0.788389265537262, 0.8261151313781738, 0.8638409376144409, 0.901566743850708, 0.9392926096916199, 0.9770184755325317, 1.0147442817687988, 1.052470088005066, 1.090195894241333, 1.1279218196868896, 1.1656476259231567, 1.2033734321594238, 1.2410993576049805, 1.2788251638412476, 1.3165509700775146, 1.3542767763137817, 1.3920025825500488, 1.4297285079956055, 1.4674543142318726]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 8.0, 3.0, 9.0, 13.0, 20.0, 28.0, 26.0, 49.0, 72.0, 112.0, 144.0, 193.0, 253.0, 397.0, 576.0, 800.0, 1336.0, 2035.0, 3374.0, 5562.0, 9557.0, 17194.0, 33672.0, 77692.0, 219479.0, 377279.0, 170936.0, 62596.0, 28404.0, 14864.0, 8407.0, 4967.0, 2925.0, 1857.0, 1155.0, 805.0, 572.0, 325.0, 244.0, 176.0, 123.0, 99.0, 70.0, 42.0, 28.0, 23.0, 23.0, 12.0, 9.0, 7.0, 1.0, 0.0, 6.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.14599609375, -0.1413440704345703, -0.13669204711914062, -0.13204002380371094, -0.12738800048828125, -0.12273597717285156, -0.11808395385742188, -0.11343193054199219, -0.1087799072265625, -0.10412788391113281, -0.09947586059570312, -0.09482383728027344, -0.09017181396484375, -0.08551979064941406, -0.08086776733398438, -0.07621574401855469, -0.071563720703125, -0.06691169738769531, -0.062259674072265625, -0.05760765075683594, -0.05295562744140625, -0.04830360412597656, -0.043651580810546875, -0.03899955749511719, -0.0343475341796875, -0.029695510864257812, -0.025043487548828125, -0.020391464233398438, -0.01573944091796875, -0.011087417602539062, -0.006435394287109375, -0.0017833709716796875, 0.00286865234375, 0.0075206756591796875, 0.012172698974609375, 0.016824722290039062, 0.02147674560546875, 0.026128768920898438, 0.030780792236328125, 0.03543281555175781, 0.0400848388671875, 0.04473686218261719, 0.049388885498046875, 0.05404090881347656, 0.05869293212890625, 0.06334495544433594, 0.06799697875976562, 0.07264900207519531, 0.077301025390625, 0.08195304870605469, 0.08660507202148438, 0.09125709533691406, 0.09590911865234375, 0.10056114196777344, 0.10521316528320312, 0.10986518859863281, 0.1145172119140625, 0.11916923522949219, 0.12382125854492188, 0.12847328186035156, 0.13312530517578125, 0.13777732849121094, 0.14242935180664062, 0.1470813751220703, 0.1517333984375]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 4.0, 2.0, 10.0, 9.0, 14.0, 5.0, 6.0, 23.0, 22.0, 21.0, 31.0, 20.0, 27.0, 34.0, 42.0, 28.0, 38.0, 33.0, 43.0, 48.0, 33.0, 44.0, 39.0, 39.0, 33.0, 42.0, 42.0, 41.0, 22.0, 31.0, 32.0, 19.0, 18.0, 16.0, 24.0, 13.0, 9.0, 9.0, 5.0, 8.0, 9.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.07855224609375, -0.07616043090820312, -0.07376861572265625, -0.07137680053710938, -0.0689849853515625, -0.06659317016601562, -0.06420135498046875, -0.061809539794921875, -0.059417724609375, -0.057025909423828125, -0.05463409423828125, -0.052242279052734375, -0.0498504638671875, -0.047458648681640625, -0.04506683349609375, -0.042675018310546875, -0.040283203125, -0.037891387939453125, -0.03549957275390625, -0.033107757568359375, -0.0307159423828125, -0.028324127197265625, -0.02593231201171875, -0.023540496826171875, -0.021148681640625, -0.018756866455078125, -0.01636505126953125, -0.013973236083984375, -0.0115814208984375, -0.009189605712890625, -0.00679779052734375, -0.004405975341796875, -0.00201416015625, 0.000377655029296875, 0.00276947021484375, 0.005161285400390625, 0.0075531005859375, 0.009944915771484375, 0.01233673095703125, 0.014728546142578125, 0.017120361328125, 0.019512176513671875, 0.02190399169921875, 0.024295806884765625, 0.0266876220703125, 0.029079437255859375, 0.03147125244140625, 0.033863067626953125, 0.0362548828125, 0.038646697998046875, 0.04103851318359375, 0.043430328369140625, 0.0458221435546875, 0.048213958740234375, 0.05060577392578125, 0.052997589111328125, 0.055389404296875, 0.057781219482421875, 0.06017303466796875, 0.06256484985351562, 0.0649566650390625, 0.06734848022460938, 0.06974029541015625, 0.07213211059570312, 0.07452392578125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 10.0, 12.0, 12.0, 17.0, 24.0, 39.0, 75.0, 84.0, 183.0, 268.0, 582.0, 1233.0, 3071.0, 10459.0, 54765.0, 738060.0, 206203.0, 23930.0, 5775.0, 1953.0, 790.0, 425.0, 197.0, 127.0, 84.0, 55.0, 40.0, 20.0, 16.0, 18.0, 8.0, 12.0, 4.0, 0.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.276123046875, -0.2634391784667969, -0.25075531005859375, -0.23807144165039062, -0.2253875732421875, -0.21270370483398438, -0.20001983642578125, -0.18733596801757812, -0.174652099609375, -0.16196823120117188, -0.14928436279296875, -0.13660049438476562, -0.1239166259765625, -0.11123275756835938, -0.09854888916015625, -0.08586502075195312, -0.07318115234375, -0.060497283935546875, -0.04781341552734375, -0.035129547119140625, -0.0224456787109375, -0.009761810302734375, 0.00292205810546875, 0.015605926513671875, 0.028289794921875, 0.040973663330078125, 0.05365753173828125, 0.06634140014648438, 0.0790252685546875, 0.09170913696289062, 0.10439300537109375, 0.11707687377929688, 0.1297607421875, 0.14244461059570312, 0.15512847900390625, 0.16781234741210938, 0.1804962158203125, 0.19318008422851562, 0.20586395263671875, 0.21854782104492188, 0.231231689453125, 0.24391555786132812, 0.25659942626953125, 0.2692832946777344, 0.2819671630859375, 0.2946510314941406, 0.30733489990234375, 0.3200187683105469, 0.33270263671875, 0.3453865051269531, 0.35807037353515625, 0.3707542419433594, 0.3834381103515625, 0.3961219787597656, 0.40880584716796875, 0.4214897155761719, 0.434173583984375, 0.4468574523925781, 0.45954132080078125, 0.4722251892089844, 0.4849090576171875, 0.4975929260253906, 0.5102767944335938, 0.5229606628417969, 0.53564453125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 3.0, 11.0, 6.0, 9.0, 15.0, 18.0, 36.0, 54.0, 66.0, 82.0, 99.0, 88.0, 90.0, 98.0, 97.0, 59.0, 53.0, 37.0, 33.0, 19.0, 12.0, 6.0, 9.0, 2.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.67626953125, -0.6538238525390625, -0.631378173828125, -0.6089324951171875, -0.58648681640625, -0.5640411376953125, -0.541595458984375, -0.5191497802734375, -0.4967041015625, -0.4742584228515625, -0.451812744140625, -0.4293670654296875, -0.40692138671875, -0.3844757080078125, -0.362030029296875, -0.3395843505859375, -0.317138671875, -0.2946929931640625, -0.272247314453125, -0.2498016357421875, -0.22735595703125, -0.2049102783203125, -0.182464599609375, -0.1600189208984375, -0.1375732421875, -0.1151275634765625, -0.092681884765625, -0.0702362060546875, -0.04779052734375, -0.0253448486328125, -0.002899169921875, 0.0195465087890625, 0.0419921875, 0.0644378662109375, 0.086883544921875, 0.1093292236328125, 0.13177490234375, 0.1542205810546875, 0.176666259765625, 0.1991119384765625, 0.2215576171875, 0.2440032958984375, 0.266448974609375, 0.2888946533203125, 0.31134033203125, 0.3337860107421875, 0.356231689453125, 0.3786773681640625, 0.401123046875, 0.4235687255859375, 0.446014404296875, 0.4684600830078125, 0.49090576171875, 0.5133514404296875, 0.535797119140625, 0.5582427978515625, 0.5806884765625, 0.6031341552734375, 0.625579833984375, 0.6480255126953125, 0.67047119140625, 0.6929168701171875, 0.715362548828125, 0.7378082275390625, 0.76025390625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 11.0, 11.0, 33.0, 59.0, 185.0, 851.0, 7793.0, 598194.0, 433227.0, 7016.0, 828.0, 205.0, 66.0, 33.0, 16.0, 9.0, 3.0, 3.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.59765625, -0.5843696594238281, -0.5710830688476562, -0.5577964782714844, -0.5445098876953125, -0.5312232971191406, -0.5179367065429688, -0.5046501159667969, -0.491363525390625, -0.4780769348144531, -0.46479034423828125, -0.4515037536621094, -0.4382171630859375, -0.4249305725097656, -0.41164398193359375, -0.3983573913574219, -0.38507080078125, -0.3717842102050781, -0.35849761962890625, -0.3452110290527344, -0.3319244384765625, -0.3186378479003906, -0.30535125732421875, -0.2920646667480469, -0.278778076171875, -0.2654914855957031, -0.25220489501953125, -0.23891830444335938, -0.2256317138671875, -0.21234512329101562, -0.19905853271484375, -0.18577194213867188, -0.1724853515625, -0.15919876098632812, -0.14591217041015625, -0.13262557983398438, -0.1193389892578125, -0.10605239868164062, -0.09276580810546875, -0.07947921752929688, -0.066192626953125, -0.052906036376953125, -0.03961944580078125, -0.026332855224609375, -0.0130462646484375, 0.000240325927734375, 0.01352691650390625, 0.026813507080078125, 0.04010009765625, 0.053386688232421875, 0.06667327880859375, 0.07995986938476562, 0.0932464599609375, 0.10653305053710938, 0.11981964111328125, 0.13310623168945312, 0.146392822265625, 0.15967941284179688, 0.17296600341796875, 0.18625259399414062, 0.1995391845703125, 0.21282577514648438, 0.22611236572265625, 0.23939895629882812, 0.252685546875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 0.0, 5.0, 3.0, 5.0, 5.0, 7.0, 5.0, 12.0, 12.0, 14.0, 26.0, 26.0, 53.0, 56.0, 68.0, 86.0, 80.0, 111.0, 83.0, 78.0, 57.0, 53.0, 46.0, 26.0, 20.0, 16.0, 12.0, 7.0, 8.0, 7.0, 4.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5239925384521484e-05, -4.3752603232860565e-05, -4.2265281081199646e-05, -4.077795892953873e-05, -3.929063677787781e-05, -3.780331462621689e-05, -3.631599247455597e-05, -3.482867032289505e-05, -3.334134817123413e-05, -3.185402601957321e-05, -3.0366703867912292e-05, -2.8879381716251373e-05, -2.7392059564590454e-05, -2.5904737412929535e-05, -2.4417415261268616e-05, -2.2930093109607697e-05, -2.1442770957946777e-05, -1.9955448806285858e-05, -1.846812665462494e-05, -1.698080450296402e-05, -1.54934823513031e-05, -1.4006160199642181e-05, -1.2518838047981262e-05, -1.1031515896320343e-05, -9.544193744659424e-06, -8.056871592998505e-06, -6.5695494413375854e-06, -5.082227289676666e-06, -3.594905138015747e-06, -2.107582986354828e-06, -6.202608346939087e-07, 8.670613169670105e-07, 2.3543834686279297e-06, 3.841705620288849e-06, 5.329027771949768e-06, 6.816349923610687e-06, 8.303672075271606e-06, 9.790994226932526e-06, 1.1278316378593445e-05, 1.2765638530254364e-05, 1.4252960681915283e-05, 1.5740282833576202e-05, 1.722760498523712e-05, 1.871492713689804e-05, 2.020224928855896e-05, 2.168957144021988e-05, 2.31768935918808e-05, 2.4664215743541718e-05, 2.6151537895202637e-05, 2.7638860046863556e-05, 2.9126182198524475e-05, 3.0613504350185394e-05, 3.2100826501846313e-05, 3.358814865350723e-05, 3.507547080516815e-05, 3.656279295682907e-05, 3.805011510848999e-05, 3.953743726015091e-05, 4.102475941181183e-05, 4.251208156347275e-05, 4.399940371513367e-05, 4.5486725866794586e-05, 4.6974048018455505e-05, 4.8461370170116425e-05, 4.9948692321777344e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 5.0, 2.0, 5.0, 3.0, 8.0, 15.0, 24.0, 38.0, 74.0, 151.0, 397.0, 1116.0, 4217.0, 32495.0, 750465.0, 242114.0, 13730.0, 2386.0, 768.0, 269.0, 115.0, 77.0, 39.0, 20.0, 7.0, 6.0, 6.0, 0.0, 4.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.320068359375, -0.3122272491455078, -0.3043861389160156, -0.29654502868652344, -0.28870391845703125, -0.28086280822753906, -0.2730216979980469, -0.2651805877685547, -0.2573394775390625, -0.2494983673095703, -0.24165725708007812, -0.23381614685058594, -0.22597503662109375, -0.21813392639160156, -0.21029281616210938, -0.2024517059326172, -0.194610595703125, -0.1867694854736328, -0.17892837524414062, -0.17108726501464844, -0.16324615478515625, -0.15540504455566406, -0.14756393432617188, -0.1397228240966797, -0.1318817138671875, -0.12404060363769531, -0.11619949340820312, -0.10835838317871094, -0.10051727294921875, -0.09267616271972656, -0.08483505249023438, -0.07699394226074219, -0.06915283203125, -0.06131172180175781, -0.053470611572265625, -0.04562950134277344, -0.03778839111328125, -0.029947280883789062, -0.022106170654296875, -0.014265060424804688, -0.0064239501953125, 0.0014171600341796875, 0.009258270263671875, 0.017099380493164062, 0.02494049072265625, 0.03278160095214844, 0.040622711181640625, 0.04846382141113281, 0.056304931640625, 0.06414604187011719, 0.07198715209960938, 0.07982826232910156, 0.08766937255859375, 0.09551048278808594, 0.10335159301757812, 0.11119270324707031, 0.1190338134765625, 0.1268749237060547, 0.13471603393554688, 0.14255714416503906, 0.15039825439453125, 0.15823936462402344, 0.16608047485351562, 0.1739215850830078, 0.1817626953125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 2.0, 11.0, 19.0, 32.0, 44.0, 49.0, 98.0, 158.0, 165.0, 144.0, 104.0, 69.0, 51.0, 20.0, 15.0, 11.0, 10.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.364990234375, -0.35746288299560547, -0.34993553161621094, -0.3424081802368164, -0.3348808288574219, -0.32735347747802734, -0.3198261260986328, -0.3122987747192383, -0.30477142333984375, -0.2972440719604492, -0.2897167205810547, -0.28218936920166016, -0.2746620178222656, -0.2671346664428711, -0.25960731506347656, -0.25207996368408203, -0.2445526123046875, -0.23702526092529297, -0.22949790954589844, -0.2219705581665039, -0.21444320678710938, -0.20691585540771484, -0.1993885040283203, -0.19186115264892578, -0.18433380126953125, -0.17680644989013672, -0.1692790985107422, -0.16175174713134766, -0.15422439575195312, -0.1466970443725586, -0.13916969299316406, -0.13164234161376953, -0.124114990234375, -0.11658763885498047, -0.10906028747558594, -0.1015329360961914, -0.09400558471679688, -0.08647823333740234, -0.07895088195800781, -0.07142353057861328, -0.06389617919921875, -0.05636882781982422, -0.04884147644042969, -0.041314125061035156, -0.033786773681640625, -0.026259422302246094, -0.018732070922851562, -0.011204719543457031, -0.0036773681640625, 0.0038499832153320312, 0.011377334594726562, 0.018904685974121094, 0.026432037353515625, 0.033959388732910156, 0.04148674011230469, 0.04901409149169922, 0.05654144287109375, 0.06406879425048828, 0.07159614562988281, 0.07912349700927734, 0.08665084838867188, 0.0941781997680664, 0.10170555114746094, 0.10923290252685547, 0.11676025390625]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 7.0, 13.0, 35.0, 93.0, 210.0, 304.0, 192.0, 92.0, 27.0, 8.0, 8.0, 7.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.023674011230469, -3.8949646949768066, -3.7662553787231445, -3.6375458240509033, -3.508836507797241, -3.380127191543579, -3.251417636871338, -3.122708320617676, -2.9939990043640137, -2.8652896881103516, -2.7365803718566895, -2.6078708171844482, -2.479161500930786, -2.350452184677124, -2.221742630004883, -2.0930333137512207, -1.9643239974975586, -1.8356146812438965, -1.7069052457809448, -1.5781958103179932, -1.449486494064331, -1.320777177810669, -1.1920677423477173, -1.0633583068847656, -0.9346489906311035, -0.8059396147727966, -0.6772302389144897, -0.5485208630561829, -0.419811487197876, -0.2911021113395691, -0.1623927354812622, -0.03368335962295532, 0.09502649307250977, 0.22373586893081665, 0.35244524478912354, 0.4811546206474304, 0.6098639965057373, 0.7385733723640442, 0.8672827482223511, 0.995992124080658, 1.1247014999389648, 1.253410816192627, 1.3821202516555786, 1.5108296871185303, 1.6395390033721924, 1.7682483196258545, 1.8969577550888062, 2.025667190551758, 2.15437650680542, 2.283085823059082, 2.411795139312744, 2.5405046939849854, 2.6692140102386475, 2.7979233264923096, 2.926632881164551, 3.055342197418213, 3.184051513671875, 3.312760829925537, 3.441470146179199, 3.5701797008514404, 3.6988890171051025, 3.8275983333587646, 3.956307888031006, 4.085017204284668, 4.21372652053833]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 15.0, 11.0, 17.0, 41.0, 50.0, 63.0, 72.0, 99.0, 130.0, 131.0, 83.0, 73.0, 61.0, 55.0, 47.0, 23.0, 16.0, 10.0, 5.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6359992027282715, -4.5257887840271, -4.415578365325928, -4.305367946624756, -4.195158004760742, -4.08494758605957, -3.9747371673583984, -3.8645267486572266, -3.7543163299560547, -3.644105911254883, -3.53389573097229, -3.423685312271118, -3.3134748935699463, -3.2032647132873535, -3.0930542945861816, -2.9828438758850098, -2.872633457183838, -2.762423038482666, -2.6522128582000732, -2.5420024394989014, -2.4317920207977295, -2.3215818405151367, -2.211371421813965, -2.101161003112793, -1.9909508228302002, -1.8807405233383179, -1.770530104637146, -1.6603198051452637, -1.5501093864440918, -1.4398990869522095, -1.3296887874603271, -1.2194783687591553, -1.1092679500579834, -0.9990575909614563, -0.8888472318649292, -0.7786369323730469, -0.668426513671875, -0.5582162141799927, -0.4480058550834656, -0.3377954959869385, -0.22758513689041138, -0.11737478524446487, -0.007164433598518372, 0.10304591059684753, 0.21325626969337463, 0.32346659898757935, 0.43367695808410645, 0.5438873171806335, 0.6540976762771606, 0.7643080353736877, 0.8745183944702148, 0.9847286939620972, 1.094939112663269, 1.2051494121551514, 1.3153598308563232, 1.4255701303482056, 1.535780429840088, 1.6459907293319702, 1.756201148033142, 1.8664114475250244, 1.9766218662261963, 2.086832046508789, 2.197042465209961, 2.307252883911133, 2.4174633026123047]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 2.0, 3.0, 8.0, 2.0, 11.0, 8.0, 6.0, 6.0, 11.0, 11.0, 24.0, 33.0, 24.0, 58.0, 113.0, 190.0, 431.0, 1113.0, 3272.0, 11563.0, 51879.0, 378248.0, 2759825.0, 863088.0, 96486.0, 19437.0, 5417.0, 1812.0, 672.0, 307.0, 123.0, 57.0, 19.0, 12.0, 6.0, 3.0, 2.0], "bins": [-0.32177734375, -0.31529903411865234, -0.3088207244873047, -0.30234241485595703, -0.2958641052246094, -0.2893857955932617, -0.28290748596191406, -0.2764291763305664, -0.26995086669921875, -0.2634725570678711, -0.25699424743652344, -0.2505159378051758, -0.24403762817382812, -0.23755931854248047, -0.2310810089111328, -0.22460269927978516, -0.2181243896484375, -0.21164608001708984, -0.2051677703857422, -0.19868946075439453, -0.19221115112304688, -0.18573284149169922, -0.17925453186035156, -0.1727762222290039, -0.16629791259765625, -0.1598196029663086, -0.15334129333496094, -0.14686298370361328, -0.14038467407226562, -0.13390636444091797, -0.1274280548095703, -0.12094974517822266, -0.114471435546875, -0.10799312591552734, -0.10151481628417969, -0.09503650665283203, -0.08855819702148438, -0.08207988739013672, -0.07560157775878906, -0.0691232681274414, -0.06264495849609375, -0.056166648864746094, -0.04968833923339844, -0.04321002960205078, -0.036731719970703125, -0.03025341033935547, -0.023775100708007812, -0.017296791076660156, -0.0108184814453125, -0.004340171813964844, 0.0021381378173828125, 0.008616447448730469, 0.015094757080078125, 0.02157306671142578, 0.028051376342773438, 0.034529685974121094, 0.04100799560546875, 0.047486305236816406, 0.05396461486816406, 0.06044292449951172, 0.06692123413085938, 0.07339954376220703, 0.07987785339355469, 0.08635616302490234, 0.09283447265625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 11.0, 18.0, 40.0, 69.0, 108.0, 153.0, 153.0, 142.0, 118.0, 101.0, 47.0, 38.0, 9.0, 5.0, 3.0], "bins": [-0.47119140625, -0.46272754669189453, -0.45426368713378906, -0.4457998275756836, -0.4373359680175781, -0.42887210845947266, -0.4204082489013672, -0.4119443893432617, -0.40348052978515625, -0.3950166702270508, -0.3865528106689453, -0.37808895111083984, -0.3696250915527344, -0.3611612319946289, -0.35269737243652344, -0.34423351287841797, -0.3357696533203125, -0.32730579376220703, -0.31884193420410156, -0.3103780746459961, -0.3019142150878906, -0.29345035552978516, -0.2849864959716797, -0.2765226364135742, -0.26805877685546875, -0.2595949172973633, -0.2511310577392578, -0.24266719818115234, -0.23420333862304688, -0.2257394790649414, -0.21727561950683594, -0.20881175994873047, -0.200347900390625, -0.19188404083251953, -0.18342018127441406, -0.1749563217163086, -0.16649246215820312, -0.15802860260009766, -0.1495647430419922, -0.14110088348388672, -0.13263702392578125, -0.12417316436767578, -0.11570930480957031, -0.10724544525146484, -0.09878158569335938, -0.0903177261352539, -0.08185386657714844, -0.07339000701904297, -0.0649261474609375, -0.05646228790283203, -0.04799842834472656, -0.039534568786621094, -0.031070709228515625, -0.022606849670410156, -0.014142990112304688, -0.005679130554199219, 0.00278472900390625, 0.011248588562011719, 0.019712448120117188, 0.028176307678222656, 0.036640167236328125, 0.045104026794433594, 0.05356788635253906, 0.06203174591064453, 0.07049560546875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 5.0, 6.0, 4.0, 5.0, 6.0, 17.0, 13.0, 24.0, 29.0, 43.0, 55.0, 96.0, 161.0, 235.0, 414.0, 766.0, 1653.0, 3659.0, 9039.0, 24612.0, 77224.0, 302937.0, 1847317.0, 1559236.0, 260281.0, 68791.0, 22217.0, 8402.0, 3320.0, 1601.0, 830.0, 469.0, 252.0, 173.0, 129.0, 80.0, 46.0, 45.0, 26.0, 26.0, 12.0, 6.0, 5.0, 4.0, 7.0, 3.0, 5.0, 1.0, 1.0, 2.0, 3.0, 1.0], "bins": [-0.19482421875, -0.18924903869628906, -0.18367385864257812, -0.1780986785888672, -0.17252349853515625, -0.1669483184814453, -0.16137313842773438, -0.15579795837402344, -0.1502227783203125, -0.14464759826660156, -0.13907241821289062, -0.1334972381591797, -0.12792205810546875, -0.12234687805175781, -0.11677169799804688, -0.11119651794433594, -0.105621337890625, -0.10004615783691406, -0.09447097778320312, -0.08889579772949219, -0.08332061767578125, -0.07774543762207031, -0.07217025756835938, -0.06659507751464844, -0.0610198974609375, -0.05544471740722656, -0.049869537353515625, -0.04429435729980469, -0.03871917724609375, -0.03314399719238281, -0.027568817138671875, -0.021993637084960938, -0.01641845703125, -0.010843276977539062, -0.005268096923828125, 0.0003070831298828125, 0.00588226318359375, 0.011457443237304688, 0.017032623291015625, 0.022607803344726562, 0.0281829833984375, 0.03375816345214844, 0.039333343505859375, 0.04490852355957031, 0.05048370361328125, 0.05605888366699219, 0.061634063720703125, 0.06720924377441406, 0.072784423828125, 0.07835960388183594, 0.08393478393554688, 0.08950996398925781, 0.09508514404296875, 0.10066032409667969, 0.10623550415039062, 0.11181068420410156, 0.1173858642578125, 0.12296104431152344, 0.12853622436523438, 0.1341114044189453, 0.13968658447265625, 0.1452617645263672, 0.15083694458007812, 0.15641212463378906, 0.1619873046875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 4.0, 5.0, 8.0, 19.0, 16.0, 26.0, 29.0, 43.0, 49.0, 70.0, 102.0, 135.0, 185.0, 298.0, 434.0, 505.0, 563.0, 476.0, 322.0, 198.0, 172.0, 98.0, 89.0, 55.0, 39.0, 35.0, 30.0, 18.0, 12.0, 8.0, 10.0, 10.0, 5.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2325439453125, -0.22426414489746094, -0.21598434448242188, -0.2077045440673828, -0.19942474365234375, -0.1911449432373047, -0.18286514282226562, -0.17458534240722656, -0.1663055419921875, -0.15802574157714844, -0.14974594116210938, -0.1414661407470703, -0.13318634033203125, -0.12490653991699219, -0.11662673950195312, -0.10834693908691406, -0.100067138671875, -0.09178733825683594, -0.08350753784179688, -0.07522773742675781, -0.06694793701171875, -0.05866813659667969, -0.050388336181640625, -0.04210853576660156, -0.0338287353515625, -0.025548934936523438, -0.017269134521484375, -0.008989334106445312, -0.00070953369140625, 0.0075702667236328125, 0.015850067138671875, 0.024129867553710938, 0.03240966796875, 0.04068946838378906, 0.048969268798828125, 0.05724906921386719, 0.06552886962890625, 0.07380867004394531, 0.08208847045898438, 0.09036827087402344, 0.0986480712890625, 0.10692787170410156, 0.11520767211914062, 0.12348747253417969, 0.13176727294921875, 0.1400470733642578, 0.14832687377929688, 0.15660667419433594, 0.164886474609375, 0.17316627502441406, 0.18144607543945312, 0.1897258758544922, 0.19800567626953125, 0.2062854766845703, 0.21456527709960938, 0.22284507751464844, 0.2311248779296875, 0.23940467834472656, 0.24768447875976562, 0.2559642791748047, 0.26424407958984375, 0.2725238800048828, 0.2808036804199219, 0.28908348083496094, 0.29736328125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 7.0, 20.0, 40.0, 181.0, 302.0, 241.0, 120.0, 40.0, 21.0, 6.0, 7.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.394401788711548, -2.241150379180908, -2.0878992080688477, -1.934647798538208, -1.781396508216858, -1.6281452178955078, -1.4748938083648682, -1.321642518043518, -1.168391227722168, -1.0151399374008179, -0.861888587474823, -0.7086372375488281, -0.555385947227478, -0.40213465690612793, -0.24888330698013306, -0.09563195705413818, 0.057619333267211914, 0.2108706533908844, 0.3641219735145569, 0.5173733234405518, 0.6706246137619019, 0.823875904083252, 0.9771272540092468, 1.1303786039352417, 1.2836298942565918, 1.436881184577942, 1.590132474899292, 1.7433838844299316, 1.8966351747512817, 2.049886465072632, 2.2031378746032715, 2.356389045715332, 2.509640693664551, 2.6628921031951904, 2.816143274307251, 2.9693946838378906, 3.122645854949951, 3.275897264480591, 3.4291486740112305, 3.582399845123291, 3.7356512546539307, 3.8889026641845703, 4.042153835296631, 4.195405006408691, 4.34865665435791, 4.501907825469971, 4.655158996582031, 4.80841064453125, 4.9616618156433105, 5.114912986755371, 5.26816463470459, 5.42141580581665, 5.574666976928711, 5.72791862487793, 5.88116979598999, 6.034420967102051, 6.1876726150512695, 6.34092378616333, 6.494175434112549, 6.647426605224609, 6.80067777633667, 6.9539289474487305, 7.107180595397949, 7.26043176651001, 7.41368293762207]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 3.0, 3.0, 13.0, 10.0, 16.0, 27.0, 42.0, 53.0, 65.0, 73.0, 76.0, 98.0, 94.0, 97.0, 70.0, 64.0, 54.0, 48.0, 39.0, 20.0, 14.0, 14.0, 9.0, 3.0, 6.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4143567085266113, -1.3306742906570435, -1.2469918727874756, -1.1633094549179077, -1.0796270370483398, -0.995944619178772, -0.9122622013092041, -0.8285797834396362, -0.7448973655700684, -0.6612149477005005, -0.5775325298309326, -0.49385011196136475, -0.4101676940917969, -0.326485276222229, -0.24280285835266113, -0.15912044048309326, -0.07543802261352539, 0.00824439525604248, 0.09192681312561035, 0.17560923099517822, 0.2592916488647461, 0.34297406673431396, 0.42665648460388184, 0.5103389024734497, 0.5940213203430176, 0.6777037382125854, 0.7613861560821533, 0.8450685739517212, 0.9287509918212891, 1.012433409690857, 1.0961158275604248, 1.1797982454299927, 1.2634809017181396, 1.3471633195877075, 1.4308457374572754, 1.5145281553268433, 1.5982105731964111, 1.681892991065979, 1.7655754089355469, 1.8492578268051147, 1.9329402446746826, 2.016622543334961, 2.1003050804138184, 2.183987617492676, 2.267669916152954, 2.3513522148132324, 2.43503475189209, 2.5187172889709473, 2.6023995876312256, 2.686081886291504, 2.7697644233703613, 2.8534469604492188, 2.937129259109497, 3.0208115577697754, 3.104494094848633, 3.1881766319274902, 3.2718589305877686, 3.355541229248047, 3.4392237663269043, 3.5229063034057617, 3.60658860206604, 3.6902709007263184, 3.773953437805176, 3.857635974884033, 3.9413182735443115]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 4.0, 12.0, 10.0, 22.0, 30.0, 39.0, 57.0, 106.0, 181.0, 243.0, 389.0, 549.0, 837.0, 1346.0, 2054.0, 3260.0, 5057.0, 8182.0, 13241.0, 21684.0, 36856.0, 64947.0, 128402.0, 264975.0, 239516.0, 111804.0, 58508.0, 33747.0, 19904.0, 11959.0, 7610.0, 4655.0, 2942.0, 1968.0, 1201.0, 792.0, 483.0, 369.0, 210.0, 128.0, 109.0, 52.0, 42.0, 29.0, 15.0, 8.0, 7.0, 7.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.1435546875, -0.1391925811767578, -0.13483047485351562, -0.13046836853027344, -0.12610626220703125, -0.12174415588378906, -0.11738204956054688, -0.11301994323730469, -0.1086578369140625, -0.10429573059082031, -0.09993362426757812, -0.09557151794433594, -0.09120941162109375, -0.08684730529785156, -0.08248519897460938, -0.07812309265136719, -0.073760986328125, -0.06939888000488281, -0.06503677368164062, -0.06067466735839844, -0.05631256103515625, -0.05195045471191406, -0.047588348388671875, -0.04322624206542969, -0.0388641357421875, -0.03450202941894531, -0.030139923095703125, -0.025777816772460938, -0.02141571044921875, -0.017053604125976562, -0.012691497802734375, -0.008329391479492188, -0.00396728515625, 0.0003948211669921875, 0.004756927490234375, 0.009119033813476562, 0.01348114013671875, 0.017843246459960938, 0.022205352783203125, 0.026567459106445312, 0.0309295654296875, 0.03529167175292969, 0.039653778076171875, 0.04401588439941406, 0.04837799072265625, 0.05274009704589844, 0.057102203369140625, 0.06146430969238281, 0.065826416015625, 0.07018852233886719, 0.07455062866210938, 0.07891273498535156, 0.08327484130859375, 0.08763694763183594, 0.09199905395507812, 0.09636116027832031, 0.1007232666015625, 0.10508537292480469, 0.10944747924804688, 0.11380958557128906, 0.11817169189453125, 0.12253379821777344, 0.12689590454101562, 0.1312580108642578, 0.1356201171875]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 6.0, 1.0, 5.0, 9.0, 11.0, 12.0, 16.0, 23.0, 33.0, 45.0, 45.0, 57.0, 62.0, 59.0, 68.0, 71.0, 68.0, 61.0, 60.0, 45.0, 55.0, 47.0, 41.0, 27.0, 26.0, 22.0, 16.0, 12.0, 3.0, 6.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15576171875, -0.15185260772705078, -0.14794349670410156, -0.14403438568115234, -0.14012527465820312, -0.1362161636352539, -0.1323070526123047, -0.12839794158935547, -0.12448883056640625, -0.12057971954345703, -0.11667060852050781, -0.1127614974975586, -0.10885238647460938, -0.10494327545166016, -0.10103416442871094, -0.09712505340576172, -0.0932159423828125, -0.08930683135986328, -0.08539772033691406, -0.08148860931396484, -0.07757949829101562, -0.0736703872680664, -0.06976127624511719, -0.06585216522216797, -0.06194305419921875, -0.05803394317626953, -0.05412483215332031, -0.050215721130371094, -0.046306610107421875, -0.042397499084472656, -0.03848838806152344, -0.03457927703857422, -0.030670166015625, -0.02676105499267578, -0.022851943969726562, -0.018942832946777344, -0.015033721923828125, -0.011124610900878906, -0.0072154998779296875, -0.0033063888549804688, 0.00060272216796875, 0.004511833190917969, 0.008420944213867188, 0.012330055236816406, 0.016239166259765625, 0.020148277282714844, 0.024057388305664062, 0.02796649932861328, 0.0318756103515625, 0.03578472137451172, 0.03969383239746094, 0.043602943420410156, 0.047512054443359375, 0.051421165466308594, 0.05533027648925781, 0.05923938751220703, 0.06314849853515625, 0.06705760955810547, 0.07096672058105469, 0.0748758316040039, 0.07878494262695312, 0.08269405364990234, 0.08660316467285156, 0.09051227569580078, 0.09442138671875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 7.0, 8.0, 10.0, 14.0, 17.0, 16.0, 18.0, 29.0, 48.0, 59.0, 83.0, 96.0, 140.0, 228.0, 374.0, 558.0, 950.0, 1706.0, 3625.0, 9569.0, 34355.0, 210116.0, 687107.0, 71763.0, 16416.0, 5414.0, 2414.0, 1234.0, 765.0, 448.0, 251.0, 189.0, 161.0, 95.0, 77.0, 56.0, 49.0, 24.0, 26.0, 12.0, 12.0, 8.0, 3.0, 6.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.45166015625, -0.4380683898925781, -0.42447662353515625, -0.4108848571777344, -0.3972930908203125, -0.3837013244628906, -0.37010955810546875, -0.3565177917480469, -0.342926025390625, -0.3293342590332031, -0.31574249267578125, -0.3021507263183594, -0.2885589599609375, -0.2749671936035156, -0.26137542724609375, -0.24778366088867188, -0.23419189453125, -0.22060012817382812, -0.20700836181640625, -0.19341659545898438, -0.1798248291015625, -0.16623306274414062, -0.15264129638671875, -0.13904953002929688, -0.125457763671875, -0.11186599731445312, -0.09827423095703125, -0.08468246459960938, -0.0710906982421875, -0.057498931884765625, -0.04390716552734375, -0.030315399169921875, -0.0167236328125, -0.003131866455078125, 0.01045989990234375, 0.024051666259765625, 0.0376434326171875, 0.051235198974609375, 0.06482696533203125, 0.07841873168945312, 0.092010498046875, 0.10560226440429688, 0.11919403076171875, 0.13278579711914062, 0.1463775634765625, 0.15996932983398438, 0.17356109619140625, 0.18715286254882812, 0.20074462890625, 0.21433639526367188, 0.22792816162109375, 0.24151992797851562, 0.2551116943359375, 0.2687034606933594, 0.28229522705078125, 0.2958869934082031, 0.309478759765625, 0.3230705261230469, 0.33666229248046875, 0.3502540588378906, 0.3638458251953125, 0.3774375915527344, 0.39102935791015625, 0.4046211242675781, 0.418212890625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 2.0, 4.0, 1.0, 6.0, 6.0, 5.0, 9.0, 10.0, 16.0, 19.0, 21.0, 28.0, 37.0, 39.0, 35.0, 39.0, 38.0, 44.0, 57.0, 45.0, 51.0, 66.0, 54.0, 51.0, 50.0, 38.0, 33.0, 32.0, 29.0, 22.0, 23.0, 13.0, 26.0, 18.0, 10.0, 5.0, 8.0, 9.0, 2.0, 1.0, 6.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.53515625, -0.5210113525390625, -0.506866455078125, -0.4927215576171875, -0.47857666015625, -0.4644317626953125, -0.450286865234375, -0.4361419677734375, -0.4219970703125, -0.4078521728515625, -0.393707275390625, -0.3795623779296875, -0.36541748046875, -0.3512725830078125, -0.337127685546875, -0.3229827880859375, -0.308837890625, -0.2946929931640625, -0.280548095703125, -0.2664031982421875, -0.25225830078125, -0.2381134033203125, -0.223968505859375, -0.2098236083984375, -0.1956787109375, -0.1815338134765625, -0.167388916015625, -0.1532440185546875, -0.13909912109375, -0.1249542236328125, -0.110809326171875, -0.0966644287109375, -0.08251953125, -0.0683746337890625, -0.054229736328125, -0.0400848388671875, -0.02593994140625, -0.0117950439453125, 0.002349853515625, 0.0164947509765625, 0.0306396484375, 0.0447845458984375, 0.058929443359375, 0.0730743408203125, 0.08721923828125, 0.1013641357421875, 0.115509033203125, 0.1296539306640625, 0.143798828125, 0.1579437255859375, 0.172088623046875, 0.1862335205078125, 0.20037841796875, 0.2145233154296875, 0.228668212890625, 0.2428131103515625, 0.2569580078125, 0.2711029052734375, 0.285247802734375, 0.2993927001953125, 0.31353759765625, 0.3276824951171875, 0.341827392578125, 0.3559722900390625, 0.3701171875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 3.0, 5.0, 5.0, 10.0, 20.0, 33.0, 48.0, 62.0, 137.0, 283.0, 570.0, 1442.0, 4207.0, 16318.0, 96492.0, 742118.0, 154433.0, 23484.0, 5589.0, 1825.0, 764.0, 336.0, 163.0, 86.0, 46.0, 30.0, 20.0, 7.0, 9.0, 8.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.254638671875, -0.24821090698242188, -0.24178314208984375, -0.23535537719726562, -0.2289276123046875, -0.22249984741210938, -0.21607208251953125, -0.20964431762695312, -0.203216552734375, -0.19678878784179688, -0.19036102294921875, -0.18393325805664062, -0.1775054931640625, -0.17107772827148438, -0.16464996337890625, -0.15822219848632812, -0.15179443359375, -0.14536666870117188, -0.13893890380859375, -0.13251113891601562, -0.1260833740234375, -0.11965560913085938, -0.11322784423828125, -0.10680007934570312, -0.100372314453125, -0.09394454956054688, -0.08751678466796875, -0.08108901977539062, -0.0746612548828125, -0.06823348999023438, -0.06180572509765625, -0.055377960205078125, -0.0489501953125, -0.042522430419921875, -0.03609466552734375, -0.029666900634765625, -0.0232391357421875, -0.016811370849609375, -0.01038360595703125, -0.003955841064453125, 0.002471923828125, 0.008899688720703125, 0.01532745361328125, 0.021755218505859375, 0.0281829833984375, 0.034610748291015625, 0.04103851318359375, 0.047466278076171875, 0.05389404296875, 0.060321807861328125, 0.06674957275390625, 0.07317733764648438, 0.0796051025390625, 0.08603286743164062, 0.09246063232421875, 0.09888839721679688, 0.105316162109375, 0.11174392700195312, 0.11817169189453125, 0.12459945678710938, 0.1310272216796875, 0.13745498657226562, 0.14388275146484375, 0.15031051635742188, 0.15673828125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 5.0, 5.0, 3.0, 5.0, 9.0, 11.0, 12.0, 15.0, 16.0, 14.0, 17.0, 22.0, 30.0, 37.0, 33.0, 59.0, 70.0, 75.0, 86.0, 75.0, 84.0, 53.0, 54.0, 43.0, 26.0, 30.0, 20.0, 19.0, 13.0, 8.0, 9.0, 8.0, 7.0, 6.0, 6.0, 5.0, 4.0, 1.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8683414459228516e-05, -3.7243589758872986e-05, -3.5803765058517456e-05, -3.4363940358161926e-05, -3.2924115657806396e-05, -3.148429095745087e-05, -3.0044466257095337e-05, -2.8604641556739807e-05, -2.7164816856384277e-05, -2.5724992156028748e-05, -2.4285167455673218e-05, -2.2845342755317688e-05, -2.1405518054962158e-05, -1.996569335460663e-05, -1.85258686542511e-05, -1.708604395389557e-05, -1.564621925354004e-05, -1.420639455318451e-05, -1.276656985282898e-05, -1.132674515247345e-05, -9.88692045211792e-06, -8.44709575176239e-06, -7.00727105140686e-06, -5.5674463510513306e-06, -4.127621650695801e-06, -2.687796950340271e-06, -1.2479722499847412e-06, 1.9185245037078857e-07, 1.6316771507263184e-06, 3.071501851081848e-06, 4.511326551437378e-06, 5.951151251792908e-06, 7.3909759521484375e-06, 8.830800652503967e-06, 1.0270625352859497e-05, 1.1710450053215027e-05, 1.3150274753570557e-05, 1.4590099453926086e-05, 1.6029924154281616e-05, 1.7469748854637146e-05, 1.8909573554992676e-05, 2.0349398255348206e-05, 2.1789222955703735e-05, 2.3229047656059265e-05, 2.4668872356414795e-05, 2.6108697056770325e-05, 2.7548521757125854e-05, 2.8988346457481384e-05, 3.0428171157836914e-05, 3.1867995858192444e-05, 3.3307820558547974e-05, 3.4747645258903503e-05, 3.618746995925903e-05, 3.762729465961456e-05, 3.906711935997009e-05, 4.050694406032562e-05, 4.194676876068115e-05, 4.338659346103668e-05, 4.482641816139221e-05, 4.626624286174774e-05, 4.770606756210327e-05, 4.91458922624588e-05, 5.058571696281433e-05, 5.202554166316986e-05, 5.346536636352539e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 7.0, 10.0, 13.0, 14.0, 13.0, 27.0, 29.0, 40.0, 59.0, 87.0, 129.0, 198.0, 310.0, 499.0, 864.0, 1625.0, 3577.0, 9314.0, 35639.0, 205126.0, 663780.0, 95898.0, 19752.0, 5879.0, 2490.0, 1211.0, 749.0, 425.0, 253.0, 172.0, 101.0, 78.0, 57.0, 38.0, 20.0, 19.0, 12.0, 12.0, 9.0, 8.0, 4.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.14892578125, -0.1441669464111328, -0.13940811157226562, -0.13464927673339844, -0.12989044189453125, -0.12513160705566406, -0.12037277221679688, -0.11561393737792969, -0.1108551025390625, -0.10609626770019531, -0.10133743286132812, -0.09657859802246094, -0.09181976318359375, -0.08706092834472656, -0.08230209350585938, -0.07754325866699219, -0.072784423828125, -0.06802558898925781, -0.06326675415039062, -0.05850791931152344, -0.05374908447265625, -0.04899024963378906, -0.044231414794921875, -0.03947257995605469, -0.0347137451171875, -0.029954910278320312, -0.025196075439453125, -0.020437240600585938, -0.01567840576171875, -0.010919570922851562, -0.006160736083984375, -0.0014019012451171875, 0.00335693359375, 0.008115768432617188, 0.012874603271484375, 0.017633438110351562, 0.02239227294921875, 0.027151107788085938, 0.031909942626953125, 0.03666877746582031, 0.0414276123046875, 0.04618644714355469, 0.050945281982421875, 0.05570411682128906, 0.06046295166015625, 0.06522178649902344, 0.06998062133789062, 0.07473945617675781, 0.079498291015625, 0.08425712585449219, 0.08901596069335938, 0.09377479553222656, 0.09853363037109375, 0.10329246520996094, 0.10805130004882812, 0.11281013488769531, 0.1175689697265625, 0.12232780456542969, 0.12708663940429688, 0.13184547424316406, 0.13660430908203125, 0.14136314392089844, 0.14612197875976562, 0.1508808135986328, 0.1556396484375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 4.0, 2.0, 1.0, 2.0, 4.0, 5.0, 5.0, 8.0, 15.0, 16.0, 20.0, 16.0, 15.0, 38.0, 31.0, 37.0, 59.0, 45.0, 64.0, 75.0, 71.0, 66.0, 69.0, 57.0, 57.0, 38.0, 42.0, 31.0, 17.0, 20.0, 15.0, 17.0, 8.0, 6.0, 8.0, 3.0, 3.0, 9.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12548828125, -0.12138748168945312, -0.11728668212890625, -0.11318588256835938, -0.1090850830078125, -0.10498428344726562, -0.10088348388671875, -0.09678268432617188, -0.092681884765625, -0.08858108520507812, -0.08448028564453125, -0.08037948608398438, -0.0762786865234375, -0.07217788696289062, -0.06807708740234375, -0.06397628784179688, -0.05987548828125, -0.055774688720703125, -0.05167388916015625, -0.047573089599609375, -0.0434722900390625, -0.039371490478515625, -0.03527069091796875, -0.031169891357421875, -0.027069091796875, -0.022968292236328125, -0.01886749267578125, -0.014766693115234375, -0.0106658935546875, -0.006565093994140625, -0.00246429443359375, 0.001636505126953125, 0.0057373046875, 0.009838104248046875, 0.01393890380859375, 0.018039703369140625, 0.0221405029296875, 0.026241302490234375, 0.03034210205078125, 0.034442901611328125, 0.038543701171875, 0.042644500732421875, 0.04674530029296875, 0.050846099853515625, 0.0549468994140625, 0.059047698974609375, 0.06314849853515625, 0.06724929809570312, 0.07135009765625, 0.07545089721679688, 0.07955169677734375, 0.08365249633789062, 0.0877532958984375, 0.09185409545898438, 0.09595489501953125, 0.10005569458007812, 0.104156494140625, 0.10825729370117188, 0.11235809326171875, 0.11645889282226562, 0.1205596923828125, 0.12466049194335938, 0.12876129150390625, 0.13286209106445312, 0.136962890625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 7.0, 2.0, 6.0, 17.0, 40.0, 78.0, 124.0, 279.0, 205.0, 109.0, 64.0, 27.0, 18.0, 12.0, 7.0, 5.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.352621555328369, -3.210792303085327, -3.068963050842285, -2.927133798599243, -2.785304546356201, -2.643475294113159, -2.501646041870117, -2.359816789627075, -2.217987537384033, -2.076158285140991, -1.9343290328979492, -1.7924997806549072, -1.6506705284118652, -1.5088412761688232, -1.3670120239257812, -1.2251827716827393, -1.0833535194396973, -0.9415242671966553, -0.7996950149536133, -0.6578657627105713, -0.5160365104675293, -0.3742072582244873, -0.2323780059814453, -0.09054875373840332, 0.05128049850463867, 0.19310975074768066, 0.33493900299072266, 0.47676825523376465, 0.6185975074768066, 0.7604267597198486, 0.9022560119628906, 1.0440852642059326, 1.1859140396118164, 1.3277432918548584, 1.4695725440979004, 1.6114017963409424, 1.7532310485839844, 1.8950603008270264, 2.0368895530700684, 2.1787188053131104, 2.3205480575561523, 2.4623773097991943, 2.6042065620422363, 2.7460358142852783, 2.8878650665283203, 3.0296943187713623, 3.1715235710144043, 3.3133528232574463, 3.4551820755004883, 3.5970113277435303, 3.7388405799865723, 3.8806698322296143, 4.022499084472656, 4.164328575134277, 4.30615758895874, 4.447986602783203, 4.589816093444824, 4.731645584106445, 4.873474597930908, 5.015303611755371, 5.157133102416992, 5.298962593078613, 5.440791606903076, 5.582620620727539, 5.72445011138916]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 6.0, 2.0, 2.0, 6.0, 7.0, 8.0, 1.0, 18.0, 12.0, 12.0, 21.0, 19.0, 24.0, 26.0, 22.0, 23.0, 30.0, 39.0, 38.0, 52.0, 53.0, 63.0, 50.0, 62.0, 46.0, 45.0, 32.0, 37.0, 38.0, 28.0, 23.0, 27.0, 24.0, 14.0, 22.0, 13.0, 22.0, 4.0, 3.0, 6.0, 7.0, 5.0, 3.0, 8.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.6170198917388916, -1.5671344995498657, -1.5172491073608398, -1.4673638343811035, -1.4174784421920776, -1.3675930500030518, -1.3177076578140259, -1.267822265625, -1.2179369926452637, -1.1680516004562378, -1.118166208267212, -1.0682809352874756, -1.0183955430984497, -0.9685101509094238, -0.918624758720398, -0.8687393665313721, -0.8188539743423462, -0.7689685821533203, -0.7190832495689392, -0.6691978573799133, -0.6193125247955322, -0.5694271326065063, -0.5195417404174805, -0.469656378030777, -0.4197710156440735, -0.36988565325737, -0.3200002908706665, -0.2701148986816406, -0.22022953629493713, -0.17034417390823364, -0.12045878171920776, -0.07057341933250427, -0.02068793773651123, 0.029197432100772858, 0.07908280193805695, 0.12896817922592163, 0.17885354161262512, 0.2287389039993286, 0.2786242961883545, 0.328509658575058, 0.3783950209617615, 0.42828038334846497, 0.47816574573516846, 0.5280511379241943, 0.5779365301132202, 0.6278218626976013, 0.6777072548866272, 0.7275925874710083, 0.7774779796600342, 0.8273633718490601, 0.8772487044334412, 0.927134096622467, 0.9770194292068481, 1.026904821395874, 1.0767902135849, 1.1266756057739258, 1.176560878753662, 1.226446270942688, 1.2763316631317139, 1.3262169361114502, 1.376102328300476, 1.425987720489502, 1.4758731126785278, 1.5257585048675537, 1.5756438970565796]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 8.0, 4.0, 6.0, 7.0, 16.0, 18.0, 13.0, 43.0, 54.0, 78.0, 110.0, 178.0, 274.0, 448.0, 767.0, 1300.0, 2189.0, 3901.0, 7173.0, 13792.0, 28199.0, 61542.0, 157710.0, 478225.0, 1372458.0, 1336529.0, 457310.0, 153234.0, 60513.0, 27780.0, 13703.0, 7208.0, 3969.0, 2220.0, 1279.0, 723.0, 471.0, 285.0, 204.0, 116.0, 83.0, 47.0, 31.0, 26.0, 16.0, 19.0, 5.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0897216796875, -0.08682632446289062, -0.08393096923828125, -0.08103561401367188, -0.0781402587890625, -0.07524490356445312, -0.07234954833984375, -0.06945419311523438, -0.066558837890625, -0.06366348266601562, -0.06076812744140625, -0.057872772216796875, -0.0549774169921875, -0.052082061767578125, -0.04918670654296875, -0.046291351318359375, -0.04339599609375, -0.040500640869140625, -0.03760528564453125, -0.034709930419921875, -0.0318145751953125, -0.028919219970703125, -0.02602386474609375, -0.023128509521484375, -0.020233154296875, -0.017337799072265625, -0.01444244384765625, -0.011547088623046875, -0.0086517333984375, -0.005756378173828125, -0.00286102294921875, 3.4332275390625e-05, 0.0029296875, 0.005825042724609375, 0.00872039794921875, 0.011615753173828125, 0.0145111083984375, 0.017406463623046875, 0.02030181884765625, 0.023197174072265625, 0.026092529296875, 0.028987884521484375, 0.03188323974609375, 0.034778594970703125, 0.0376739501953125, 0.040569305419921875, 0.04346466064453125, 0.046360015869140625, 0.04925537109375, 0.052150726318359375, 0.05504608154296875, 0.057941436767578125, 0.0608367919921875, 0.06373214721679688, 0.06662750244140625, 0.06952285766601562, 0.072418212890625, 0.07531356811523438, 0.07820892333984375, 0.08110427856445312, 0.0839996337890625, 0.08689498901367188, 0.08979034423828125, 0.09268569946289062, 0.0955810546875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 7.0, 8.0, 10.0, 9.0, 8.0, 10.0, 9.0, 14.0, 17.0, 19.0, 26.0, 30.0, 37.0, 37.0, 37.0, 41.0, 52.0, 40.0, 51.0, 40.0, 45.0, 38.0, 49.0, 48.0, 50.0, 34.0, 35.0, 35.0, 24.0, 18.0, 21.0, 16.0, 16.0, 16.0, 11.0, 5.0, 9.0, 7.0, 7.0, 3.0, 2.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0731201171875, -0.07046890258789062, -0.06781768798828125, -0.06516647338867188, -0.0625152587890625, -0.059864044189453125, -0.05721282958984375, -0.054561614990234375, -0.051910400390625, -0.049259185791015625, -0.04660797119140625, -0.043956756591796875, -0.0413055419921875, -0.038654327392578125, -0.03600311279296875, -0.033351898193359375, -0.03070068359375, -0.028049468994140625, -0.02539825439453125, -0.022747039794921875, -0.0200958251953125, -0.017444610595703125, -0.01479339599609375, -0.012142181396484375, -0.009490966796875, -0.006839752197265625, -0.00418853759765625, -0.001537322998046875, 0.0011138916015625, 0.003765106201171875, 0.00641632080078125, 0.009067535400390625, 0.01171875, 0.014369964599609375, 0.01702117919921875, 0.019672393798828125, 0.0223236083984375, 0.024974822998046875, 0.02762603759765625, 0.030277252197265625, 0.032928466796875, 0.035579681396484375, 0.03823089599609375, 0.040882110595703125, 0.0435333251953125, 0.046184539794921875, 0.04883575439453125, 0.051486968994140625, 0.05413818359375, 0.056789398193359375, 0.05944061279296875, 0.062091827392578125, 0.0647430419921875, 0.06739425659179688, 0.07004547119140625, 0.07269668579101562, 0.075347900390625, 0.07799911499023438, 0.08065032958984375, 0.08330154418945312, 0.0859527587890625, 0.08860397338867188, 0.09125518798828125, 0.09390640258789062, 0.0965576171875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 7.0, 6.0, 6.0, 10.0, 21.0, 27.0, 46.0, 71.0, 109.0, 207.0, 457.0, 1202.0, 3765.0, 15801.0, 99486.0, 1393468.0, 2477906.0, 167879.0, 24936.0, 5796.0, 1823.0, 621.0, 265.0, 156.0, 90.0, 54.0, 32.0, 12.0, 7.0, 8.0, 4.0, 7.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2763671875, -0.26617431640625, -0.2559814453125, -0.24578857421875, -0.235595703125, -0.22540283203125, -0.2152099609375, -0.20501708984375, -0.19482421875, -0.18463134765625, -0.1744384765625, -0.16424560546875, -0.154052734375, -0.14385986328125, -0.1336669921875, -0.12347412109375, -0.11328125, -0.10308837890625, -0.0928955078125, -0.08270263671875, -0.072509765625, -0.06231689453125, -0.0521240234375, -0.04193115234375, -0.03173828125, -0.02154541015625, -0.0113525390625, -0.00115966796875, 0.009033203125, 0.01922607421875, 0.0294189453125, 0.03961181640625, 0.0498046875, 0.05999755859375, 0.0701904296875, 0.08038330078125, 0.090576171875, 0.10076904296875, 0.1109619140625, 0.12115478515625, 0.13134765625, 0.14154052734375, 0.1517333984375, 0.16192626953125, 0.172119140625, 0.18231201171875, 0.1925048828125, 0.20269775390625, 0.212890625, 0.22308349609375, 0.2332763671875, 0.24346923828125, 0.253662109375, 0.26385498046875, 0.2740478515625, 0.28424072265625, 0.29443359375, 0.30462646484375, 0.3148193359375, 0.32501220703125, 0.335205078125, 0.34539794921875, 0.3555908203125, 0.36578369140625, 0.3759765625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 10.0, 13.0, 3.0, 11.0, 20.0, 20.0, 23.0, 37.0, 60.0, 60.0, 109.0, 148.0, 251.0, 325.0, 421.0, 504.0, 588.0, 409.0, 294.0, 213.0, 142.0, 98.0, 79.0, 58.0, 45.0, 40.0, 22.0, 15.0, 23.0, 9.0, 5.0, 5.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.284423828125, -0.27581024169921875, -0.2671966552734375, -0.25858306884765625, -0.249969482421875, -0.24135589599609375, -0.2327423095703125, -0.22412872314453125, -0.21551513671875, -0.20690155029296875, -0.1982879638671875, -0.18967437744140625, -0.181060791015625, -0.17244720458984375, -0.1638336181640625, -0.15522003173828125, -0.1466064453125, -0.13799285888671875, -0.1293792724609375, -0.12076568603515625, -0.112152099609375, -0.10353851318359375, -0.0949249267578125, -0.08631134033203125, -0.07769775390625, -0.06908416748046875, -0.0604705810546875, -0.05185699462890625, -0.043243408203125, -0.03462982177734375, -0.0260162353515625, -0.01740264892578125, -0.0087890625, -0.00017547607421875, 0.0084381103515625, 0.01705169677734375, 0.025665283203125, 0.03427886962890625, 0.0428924560546875, 0.05150604248046875, 0.06011962890625, 0.06873321533203125, 0.0773468017578125, 0.08596038818359375, 0.094573974609375, 0.10318756103515625, 0.1118011474609375, 0.12041473388671875, 0.1290283203125, 0.13764190673828125, 0.1462554931640625, 0.15486907958984375, 0.163482666015625, 0.17209625244140625, 0.1807098388671875, 0.18932342529296875, 0.19793701171875, 0.20655059814453125, 0.2151641845703125, 0.22377777099609375, 0.232391357421875, 0.24100494384765625, 0.2496185302734375, 0.25823211669921875, 0.266845703125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 11.0, 33.0, 119.0, 305.0, 334.0, 141.0, 37.0, 8.0, 9.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.593810081481934, -4.385926246643066, -4.178042411804199, -3.970158576965332, -3.762274742126465, -3.5543909072875977, -3.3465073108673096, -3.1386234760284424, -2.930739641189575, -2.722855806350708, -2.514971971511841, -2.3070883750915527, -2.0992045402526855, -1.8913205862045288, -1.6834368705749512, -1.475553035736084, -1.2676692008972168, -1.0597853660583496, -0.8519015908241272, -0.6440178155899048, -0.4361339807510376, -0.2282501459121704, -0.020366430282592773, 0.18751740455627441, 0.3954012393951416, 0.6032850742340088, 0.8111688494682312, 1.0190526247024536, 1.2269364595413208, 1.434820294380188, 1.6427040100097656, 1.8505878448486328, 2.0584716796875, 2.266355514526367, 2.4742393493652344, 2.6821231842041016, 2.8900070190429688, 3.097890853881836, 3.305774450302124, 3.513658285140991, 3.7215421199798584, 3.9294259548187256, 4.137309551239014, 4.345193386077881, 4.553077220916748, 4.760961055755615, 4.968844890594482, 5.17672872543335, 5.384612560272217, 5.592496395111084, 5.800380229949951, 6.008264064788818, 6.2161478996276855, 6.424031734466553, 6.631915092468262, 6.839798927307129, 7.047682762145996, 7.255566596984863, 7.4634504318237305, 7.671334266662598, 7.879218101501465, 8.087101936340332, 8.2949857711792, 8.502869606018066, 8.710753440856934]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 5.0, 6.0, 7.0, 5.0, 18.0, 11.0, 9.0, 18.0, 21.0, 27.0, 37.0, 26.0, 30.0, 50.0, 47.0, 50.0, 54.0, 58.0, 52.0, 65.0, 50.0, 44.0, 37.0, 42.0, 32.0, 37.0, 34.0, 28.0, 27.0, 18.0, 15.0, 14.0, 4.0, 9.0, 10.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.7327477931976318, -1.6812776327133179, -1.6298075914382935, -1.5783374309539795, -1.526867389678955, -1.4753972291946411, -1.4239270687103271, -1.3724570274353027, -1.3209868669509888, -1.2695167064666748, -1.2180466651916504, -1.1665765047073364, -1.1151063442230225, -1.063636302947998, -1.012166142463684, -0.9606960415840149, -0.9092259407043457, -0.8577558398246765, -0.8062857389450073, -0.7548155784606934, -0.7033454775810242, -0.651875376701355, -0.600405216217041, -0.5489351153373718, -0.49746501445770264, -0.44599491357803345, -0.39452478289604187, -0.3430546522140503, -0.2915845513343811, -0.24011445045471191, -0.18864431977272034, -0.13717418909072876, -0.08570408821105957, -0.03423397243022919, 0.017236143350601196, 0.06870625913143158, 0.12017637491226196, 0.17164647579193115, 0.22311660647392273, 0.2745867371559143, 0.3260568380355835, 0.3775269389152527, 0.42899706959724426, 0.48046720027923584, 0.531937301158905, 0.5834074020385742, 0.6348775625228882, 0.6863476634025574, 0.7378177642822266, 0.7892878651618958, 0.8407579660415649, 0.8922281265258789, 0.9436982274055481, 0.9951683282852173, 1.0466384887695312, 1.0981085300445557, 1.1495786905288696, 1.2010488510131836, 1.252518892288208, 1.303989052772522, 1.355459213256836, 1.4069292545318604, 1.4583994150161743, 1.5098695755004883, 1.5613396167755127]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 10.0, 6.0, 15.0, 19.0, 24.0, 37.0, 58.0, 72.0, 132.0, 197.0, 304.0, 417.0, 660.0, 1026.0, 1609.0, 2544.0, 4038.0, 6968.0, 12157.0, 22698.0, 47008.0, 116031.0, 306390.0, 308740.0, 116705.0, 47094.0, 23078.0, 12225.0, 7058.0, 4092.0, 2550.0, 1583.0, 1022.0, 680.0, 428.0, 295.0, 199.0, 123.0, 97.0, 59.0, 37.0, 31.0, 14.0, 10.0, 8.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1729736328125, -0.16788673400878906, -0.16279983520507812, -0.1577129364013672, -0.15262603759765625, -0.1475391387939453, -0.14245223999023438, -0.13736534118652344, -0.1322784423828125, -0.12719154357910156, -0.12210464477539062, -0.11701774597167969, -0.11193084716796875, -0.10684394836425781, -0.10175704956054688, -0.09667015075683594, -0.091583251953125, -0.08649635314941406, -0.08140945434570312, -0.07632255554199219, -0.07123565673828125, -0.06614875793457031, -0.061061859130859375, -0.05597496032714844, -0.0508880615234375, -0.04580116271972656, -0.040714263916015625, -0.03562736511230469, -0.03054046630859375, -0.025453567504882812, -0.020366668701171875, -0.015279769897460938, -0.01019287109375, -0.0051059722900390625, -1.9073486328125e-05, 0.0050678253173828125, 0.01015472412109375, 0.015241622924804688, 0.020328521728515625, 0.025415420532226562, 0.0305023193359375, 0.03558921813964844, 0.040676116943359375, 0.04576301574707031, 0.05084991455078125, 0.05593681335449219, 0.061023712158203125, 0.06611061096191406, 0.071197509765625, 0.07628440856933594, 0.08137130737304688, 0.08645820617675781, 0.09154510498046875, 0.09663200378417969, 0.10171890258789062, 0.10680580139160156, 0.1118927001953125, 0.11697959899902344, 0.12206649780273438, 0.1271533966064453, 0.13224029541015625, 0.1373271942138672, 0.14241409301757812, 0.14750099182128906, 0.152587890625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 3.0, 8.0, 11.0, 9.0, 12.0, 11.0, 30.0, 16.0, 22.0, 21.0, 31.0, 36.0, 35.0, 37.0, 35.0, 49.0, 46.0, 56.0, 39.0, 37.0, 50.0, 45.0, 41.0, 39.0, 40.0, 28.0, 39.0, 18.0, 19.0, 18.0, 20.0, 14.0, 16.0, 19.0, 8.0, 9.0, 14.0, 8.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0985107421875, -0.09566974639892578, -0.09282875061035156, -0.08998775482177734, -0.08714675903320312, -0.0843057632446289, -0.08146476745605469, -0.07862377166748047, -0.07578277587890625, -0.07294178009033203, -0.07010078430175781, -0.0672597885131836, -0.06441879272460938, -0.061577796936035156, -0.05873680114746094, -0.05589580535888672, -0.0530548095703125, -0.05021381378173828, -0.04737281799316406, -0.044531822204589844, -0.041690826416015625, -0.038849830627441406, -0.03600883483886719, -0.03316783905029297, -0.03032684326171875, -0.02748584747314453, -0.024644851684570312, -0.021803855895996094, -0.018962860107421875, -0.016121864318847656, -0.013280868530273438, -0.010439872741699219, -0.007598876953125, -0.004757881164550781, -0.0019168853759765625, 0.0009241104125976562, 0.003765106201171875, 0.006606101989746094, 0.009447097778320312, 0.012288093566894531, 0.01512908935546875, 0.01797008514404297, 0.020811080932617188, 0.023652076721191406, 0.026493072509765625, 0.029334068298339844, 0.03217506408691406, 0.03501605987548828, 0.0378570556640625, 0.04069805145263672, 0.04353904724121094, 0.046380043029785156, 0.049221038818359375, 0.052062034606933594, 0.05490303039550781, 0.05774402618408203, 0.06058502197265625, 0.06342601776123047, 0.06626701354980469, 0.0691080093383789, 0.07194900512695312, 0.07479000091552734, 0.07763099670410156, 0.08047199249267578, 0.08331298828125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 5.0, 8.0, 7.0, 9.0, 9.0, 15.0, 25.0, 29.0, 30.0, 50.0, 66.0, 99.0, 138.0, 200.0, 375.0, 582.0, 1079.0, 2474.0, 7259.0, 28125.0, 225900.0, 707806.0, 55352.0, 11777.0, 3585.0, 1484.0, 746.0, 428.0, 258.0, 188.0, 112.0, 76.0, 69.0, 56.0, 34.0, 38.0, 22.0, 4.0, 17.0, 5.0, 6.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.475341796875, -0.4618377685546875, -0.448333740234375, -0.4348297119140625, -0.42132568359375, -0.4078216552734375, -0.394317626953125, -0.3808135986328125, -0.3673095703125, -0.3538055419921875, -0.340301513671875, -0.3267974853515625, -0.31329345703125, -0.2997894287109375, -0.286285400390625, -0.2727813720703125, -0.25927734375, -0.2457733154296875, -0.232269287109375, -0.2187652587890625, -0.20526123046875, -0.1917572021484375, -0.178253173828125, -0.1647491455078125, -0.1512451171875, -0.1377410888671875, -0.124237060546875, -0.1107330322265625, -0.09722900390625, -0.0837249755859375, -0.070220947265625, -0.0567169189453125, -0.043212890625, -0.0297088623046875, -0.016204833984375, -0.0027008056640625, 0.01080322265625, 0.0243072509765625, 0.037811279296875, 0.0513153076171875, 0.0648193359375, 0.0783233642578125, 0.091827392578125, 0.1053314208984375, 0.11883544921875, 0.1323394775390625, 0.145843505859375, 0.1593475341796875, 0.1728515625, 0.1863555908203125, 0.199859619140625, 0.2133636474609375, 0.22686767578125, 0.2403717041015625, 0.253875732421875, 0.2673797607421875, 0.2808837890625, 0.2943878173828125, 0.307891845703125, 0.3213958740234375, 0.33489990234375, 0.3484039306640625, 0.361907958984375, 0.3754119873046875, 0.388916015625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 9.0, 3.0, 9.0, 7.0, 8.0, 22.0, 18.0, 30.0, 22.0, 33.0, 29.0, 38.0, 54.0, 40.0, 52.0, 44.0, 59.0, 55.0, 45.0, 59.0, 44.0, 45.0, 40.0, 39.0, 33.0, 21.0, 24.0, 22.0, 18.0, 17.0, 18.0, 7.0, 4.0, 5.0, 8.0, 7.0, 5.0, 5.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.5087890625, -0.49488067626953125, -0.4809722900390625, -0.46706390380859375, -0.453155517578125, -0.43924713134765625, -0.4253387451171875, -0.41143035888671875, -0.39752197265625, -0.38361358642578125, -0.3697052001953125, -0.35579681396484375, -0.341888427734375, -0.32798004150390625, -0.3140716552734375, -0.30016326904296875, -0.2862548828125, -0.27234649658203125, -0.2584381103515625, -0.24452972412109375, -0.230621337890625, -0.21671295166015625, -0.2028045654296875, -0.18889617919921875, -0.17498779296875, -0.16107940673828125, -0.1471710205078125, -0.13326263427734375, -0.119354248046875, -0.10544586181640625, -0.0915374755859375, -0.07762908935546875, -0.063720703125, -0.04981231689453125, -0.0359039306640625, -0.02199554443359375, -0.008087158203125, 0.00582122802734375, 0.0197296142578125, 0.03363800048828125, 0.04754638671875, 0.06145477294921875, 0.0753631591796875, 0.08927154541015625, 0.103179931640625, 0.11708831787109375, 0.1309967041015625, 0.14490509033203125, 0.1588134765625, 0.17272186279296875, 0.1866302490234375, 0.20053863525390625, 0.214447021484375, 0.22835540771484375, 0.2422637939453125, 0.25617218017578125, 0.27008056640625, 0.28398895263671875, 0.2978973388671875, 0.31180572509765625, 0.325714111328125, 0.33962249755859375, 0.3535308837890625, 0.36743927001953125, 0.38134765625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 2.0, 6.0, 12.0, 13.0, 19.0, 20.0, 45.0, 72.0, 145.0, 261.0, 502.0, 1068.0, 2956.0, 9259.0, 39906.0, 248455.0, 646810.0, 76062.0, 15581.0, 4404.0, 1571.0, 691.0, 304.0, 162.0, 96.0, 47.0, 39.0, 14.0, 9.0, 6.0, 6.0, 4.0, 6.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.178466796875, -0.17308998107910156, -0.16771316528320312, -0.1623363494873047, -0.15695953369140625, -0.1515827178955078, -0.14620590209960938, -0.14082908630371094, -0.1354522705078125, -0.13007545471191406, -0.12469863891601562, -0.11932182312011719, -0.11394500732421875, -0.10856819152832031, -0.10319137573242188, -0.09781455993652344, -0.092437744140625, -0.08706092834472656, -0.08168411254882812, -0.07630729675292969, -0.07093048095703125, -0.06555366516113281, -0.060176849365234375, -0.05480003356933594, -0.0494232177734375, -0.04404640197753906, -0.038669586181640625, -0.03329277038574219, -0.02791595458984375, -0.022539138793945312, -0.017162322998046875, -0.011785507202148438, -0.00640869140625, -0.0010318756103515625, 0.004344940185546875, 0.009721755981445312, 0.01509857177734375, 0.020475387573242188, 0.025852203369140625, 0.031229019165039062, 0.0366058349609375, 0.04198265075683594, 0.047359466552734375, 0.05273628234863281, 0.05811309814453125, 0.06348991394042969, 0.06886672973632812, 0.07424354553222656, 0.079620361328125, 0.08499717712402344, 0.09037399291992188, 0.09575080871582031, 0.10112762451171875, 0.10650444030761719, 0.11188125610351562, 0.11725807189941406, 0.1226348876953125, 0.12801170349121094, 0.13338851928710938, 0.1387653350830078, 0.14414215087890625, 0.1495189666748047, 0.15489578247070312, 0.16027259826660156, 0.1656494140625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 5.0, 10.0, 7.0, 13.0, 22.0, 24.0, 30.0, 45.0, 88.0, 125.0, 157.0, 141.0, 111.0, 74.0, 58.0, 26.0, 26.0, 15.0, 12.0, 6.0, 7.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.204843521118164e-05, -5.934573709964752e-05, -5.66430389881134e-05, -5.3940340876579285e-05, -5.1237642765045166e-05, -4.853494465351105e-05, -4.583224654197693e-05, -4.312954843044281e-05, -4.042685031890869e-05, -3.772415220737457e-05, -3.5021454095840454e-05, -3.2318755984306335e-05, -2.9616057872772217e-05, -2.6913359761238098e-05, -2.421066164970398e-05, -2.150796353816986e-05, -1.8805265426635742e-05, -1.6102567315101624e-05, -1.3399869203567505e-05, -1.0697171092033386e-05, -7.994472980499268e-06, -5.291774868965149e-06, -2.5890767574310303e-06, 1.1362135410308838e-07, 2.816319465637207e-06, 5.519017577171326e-06, 8.221715688705444e-06, 1.0924413800239563e-05, 1.3627111911773682e-05, 1.63298100233078e-05, 1.903250813484192e-05, 2.1735206246376038e-05, 2.4437904357910156e-05, 2.7140602469444275e-05, 2.9843300580978394e-05, 3.254599869251251e-05, 3.524869680404663e-05, 3.795139491558075e-05, 4.065409302711487e-05, 4.335679113864899e-05, 4.6059489250183105e-05, 4.8762187361717224e-05, 5.146488547325134e-05, 5.416758358478546e-05, 5.687028169631958e-05, 5.95729798078537e-05, 6.227567791938782e-05, 6.497837603092194e-05, 6.768107414245605e-05, 7.038377225399017e-05, 7.308647036552429e-05, 7.578916847705841e-05, 7.849186658859253e-05, 8.119456470012665e-05, 8.389726281166077e-05, 8.659996092319489e-05, 8.9302659034729e-05, 9.200535714626312e-05, 9.470805525779724e-05, 9.741075336933136e-05, 0.00010011345148086548, 0.0001028161495923996, 0.00010551884770393372, 0.00010822154581546783, 0.00011092424392700195]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 5.0, 3.0, 5.0, 9.0, 11.0, 29.0, 37.0, 47.0, 93.0, 168.0, 369.0, 817.0, 1988.0, 7156.0, 50365.0, 723657.0, 235686.0, 21466.0, 4035.0, 1367.0, 615.0, 268.0, 164.0, 77.0, 44.0, 36.0, 13.0, 12.0, 2.0, 10.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1622314453125, -0.15541648864746094, -0.14860153198242188, -0.1417865753173828, -0.13497161865234375, -0.1281566619873047, -0.12134170532226562, -0.11452674865722656, -0.1077117919921875, -0.10089683532714844, -0.09408187866210938, -0.08726692199707031, -0.08045196533203125, -0.07363700866699219, -0.06682205200195312, -0.06000709533691406, -0.053192138671875, -0.04637718200683594, -0.039562225341796875, -0.03274726867675781, -0.02593231201171875, -0.019117355346679688, -0.012302398681640625, -0.0054874420166015625, 0.0013275146484375, 0.008142471313476562, 0.014957427978515625, 0.021772384643554688, 0.02858734130859375, 0.03540229797363281, 0.042217254638671875, 0.04903221130371094, 0.05584716796875, 0.06266212463378906, 0.06947708129882812, 0.07629203796386719, 0.08310699462890625, 0.08992195129394531, 0.09673690795898438, 0.10355186462402344, 0.1103668212890625, 0.11718177795410156, 0.12399673461914062, 0.1308116912841797, 0.13762664794921875, 0.1444416046142578, 0.15125656127929688, 0.15807151794433594, 0.164886474609375, 0.17170143127441406, 0.17851638793945312, 0.1853313446044922, 0.19214630126953125, 0.1989612579345703, 0.20577621459960938, 0.21259117126464844, 0.2194061279296875, 0.22622108459472656, 0.23303604125976562, 0.2398509979248047, 0.24666595458984375, 0.2534809112548828, 0.2602958679199219, 0.26711082458496094, 0.27392578125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 7.0, 5.0, 16.0, 8.0, 16.0, 18.0, 36.0, 43.0, 44.0, 47.0, 77.0, 85.0, 101.0, 101.0, 76.0, 70.0, 48.0, 41.0, 38.0, 28.0, 20.0, 21.0, 11.0, 8.0, 7.0, 5.0, 4.0, 4.0, 4.0, 4.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1610107421875, -0.15641403198242188, -0.15181732177734375, -0.14722061157226562, -0.1426239013671875, -0.13802719116210938, -0.13343048095703125, -0.12883377075195312, -0.124237060546875, -0.11964035034179688, -0.11504364013671875, -0.11044692993164062, -0.1058502197265625, -0.10125350952148438, -0.09665679931640625, -0.09206008911132812, -0.08746337890625, -0.08286666870117188, -0.07826995849609375, -0.07367324829101562, -0.0690765380859375, -0.06447982788085938, -0.05988311767578125, -0.055286407470703125, -0.050689697265625, -0.046092987060546875, -0.04149627685546875, -0.036899566650390625, -0.0323028564453125, -0.027706146240234375, -0.02310943603515625, -0.018512725830078125, -0.013916015625, -0.009319305419921875, -0.00472259521484375, -0.000125885009765625, 0.0044708251953125, 0.009067535400390625, 0.01366424560546875, 0.018260955810546875, 0.022857666015625, 0.027454376220703125, 0.03205108642578125, 0.036647796630859375, 0.0412445068359375, 0.045841217041015625, 0.05043792724609375, 0.055034637451171875, 0.05963134765625, 0.06422805786132812, 0.06882476806640625, 0.07342147827148438, 0.0780181884765625, 0.08261489868164062, 0.08721160888671875, 0.09180831909179688, 0.096405029296875, 0.10100173950195312, 0.10559844970703125, 0.11019515991210938, 0.1147918701171875, 0.11938858032226562, 0.12398529052734375, 0.12858200073242188, 0.1331787109375]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 2.0, 6.0, 7.0, 6.0, 15.0, 38.0, 45.0, 63.0, 96.0, 157.0, 211.0, 123.0, 81.0, 58.0, 34.0, 17.0, 8.0, 11.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.716684103012085, -2.6395390033721924, -2.5623936653137207, -2.485248565673828, -2.4081032276153564, -2.330958127975464, -2.253812789916992, -2.1766676902770996, -2.099522590637207, -2.0223774909973145, -1.9452321529388428, -1.8680869340896606, -1.7909417152404785, -1.713796615600586, -1.6366513967514038, -1.5595061779022217, -1.48236083984375, -1.4052156209945679, -1.3280704021453857, -1.2509251832962036, -1.1737799644470215, -1.096634864807129, -1.0194896459579468, -0.9423444271087646, -0.8651992082595825, -0.7880539894104004, -0.7109087705612183, -0.6337636113166809, -0.5566183924674988, -0.47947317361831665, -0.4023279845714569, -0.32518279552459717, -0.24803781509399414, -0.1708926111459732, -0.09374740719795227, -0.016602203249931335, 0.0605430006980896, 0.13768821954727173, 0.21483340859413147, 0.2919785976409912, 0.36912381649017334, 0.44626903533935547, 0.5234142541885376, 0.600559413433075, 0.6777046322822571, 0.7548498511314392, 0.8319950103759766, 0.9091402292251587, 0.9862854480743408, 1.063430666923523, 1.140575885772705, 1.2177211046218872, 1.2948663234710693, 1.372011423110962, 1.449156641960144, 1.5263018608093262, 1.6034470796585083, 1.6805922985076904, 1.7577375173568726, 1.8348827362060547, 1.9120278358459473, 1.989173173904419, 2.0663182735443115, 2.143463611602783, 2.220608711242676]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 3.0, 4.0, 5.0, 3.0, 7.0, 8.0, 11.0, 17.0, 13.0, 2.0, 15.0, 13.0, 26.0, 17.0, 26.0, 32.0, 29.0, 32.0, 35.0, 36.0, 42.0, 54.0, 72.0, 53.0, 51.0, 44.0, 40.0, 37.0, 32.0, 21.0, 21.0, 28.0, 23.0, 18.0, 20.0, 26.0, 17.0, 14.0, 13.0, 8.0, 10.0, 6.0, 7.0, 7.0, 3.0, 1.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2956559658050537, -1.248177170753479, -1.2006983757019043, -1.1532195806503296, -1.1057407855987549, -1.0582619905471802, -1.0107831954956055, -0.963304340839386, -0.9158255457878113, -0.8683467507362366, -0.8208679556846619, -0.7733891010284424, -0.7259103059768677, -0.678431510925293, -0.6309527158737183, -0.5834739208221436, -0.5359951257705688, -0.48851633071899414, -0.44103753566741943, -0.39355871081352234, -0.34607991576194763, -0.2986011207103729, -0.25112229585647583, -0.20364350080490112, -0.15616470575332642, -0.10868590325117111, -0.06120710074901581, -0.013728290796279907, 0.0337505042552948, 0.0812292993068695, 0.1287081241607666, 0.1761869192123413, 0.22366571426391602, 0.2711445093154907, 0.31862330436706543, 0.3661021292209625, 0.41358092427253723, 0.46105971932411194, 0.508538544178009, 0.5560173392295837, 0.6034961342811584, 0.6509749293327332, 0.6984537243843079, 0.7459325790405273, 0.793411374092102, 0.8408901691436768, 0.8883689641952515, 0.9358477592468262, 0.9833265542984009, 1.0308053493499756, 1.0782841444015503, 1.125762939453125, 1.1732417345046997, 1.2207205295562744, 1.2681994438171387, 1.3156781196594238, 1.363157033920288, 1.4106358289718628, 1.4581146240234375, 1.5055934190750122, 1.553072214126587, 1.6005510091781616, 1.6480298042297363, 1.6955087184906006, 1.7429873943328857]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 7.0, 10.0, 26.0, 33.0, 51.0, 81.0, 167.0, 298.0, 516.0, 1131.0, 2391.0, 5129.0, 11971.0, 32381.0, 113191.0, 602930.0, 2389046.0, 826910.0, 142349.0, 39660.0, 14466.0, 6090.0, 2794.0, 1267.0, 645.0, 324.0, 194.0, 93.0, 59.0, 29.0, 20.0, 14.0, 2.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.115478515625, -0.11113548278808594, -0.10679244995117188, -0.10244941711425781, -0.09810638427734375, -0.09376335144042969, -0.08942031860351562, -0.08507728576660156, -0.0807342529296875, -0.07639122009277344, -0.07204818725585938, -0.06770515441894531, -0.06336212158203125, -0.05901908874511719, -0.054676055908203125, -0.05033302307128906, -0.045989990234375, -0.04164695739746094, -0.037303924560546875, -0.03296089172363281, -0.02861785888671875, -0.024274826049804688, -0.019931793212890625, -0.015588760375976562, -0.0112457275390625, -0.0069026947021484375, -0.002559661865234375, 0.0017833709716796875, 0.00612640380859375, 0.010469436645507812, 0.014812469482421875, 0.019155502319335938, 0.02349853515625, 0.027841567993164062, 0.032184600830078125, 0.03652763366699219, 0.04087066650390625, 0.04521369934082031, 0.049556732177734375, 0.05389976501464844, 0.0582427978515625, 0.06258583068847656, 0.06692886352539062, 0.07127189636230469, 0.07561492919921875, 0.07995796203613281, 0.08430099487304688, 0.08864402770996094, 0.092987060546875, 0.09733009338378906, 0.10167312622070312, 0.10601615905761719, 0.11035919189453125, 0.11470222473144531, 0.11904525756835938, 0.12338829040527344, 0.1277313232421875, 0.13207435607910156, 0.13641738891601562, 0.1407604217529297, 0.14510345458984375, 0.1494464874267578, 0.15378952026367188, 0.15813255310058594, 0.1624755859375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 5.0, 4.0, 8.0, 12.0, 10.0, 12.0, 25.0, 25.0, 22.0, 18.0, 36.0, 18.0, 23.0, 43.0, 37.0, 41.0, 51.0, 44.0, 33.0, 47.0, 32.0, 49.0, 43.0, 37.0, 43.0, 30.0, 37.0, 31.0, 31.0, 24.0, 26.0, 15.0, 16.0, 10.0, 15.0, 10.0, 12.0, 5.0, 4.0, 12.0, 2.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.09185791015625, -0.08912944793701172, -0.08640098571777344, -0.08367252349853516, -0.08094406127929688, -0.0782155990600586, -0.07548713684082031, -0.07275867462158203, -0.07003021240234375, -0.06730175018310547, -0.06457328796386719, -0.061844825744628906, -0.059116363525390625, -0.056387901306152344, -0.05365943908691406, -0.05093097686767578, -0.0482025146484375, -0.04547405242919922, -0.04274559020996094, -0.040017127990722656, -0.037288665771484375, -0.034560203552246094, -0.03183174133300781, -0.02910327911376953, -0.02637481689453125, -0.02364635467529297, -0.020917892456054688, -0.018189430236816406, -0.015460968017578125, -0.012732505798339844, -0.010004043579101562, -0.007275581359863281, -0.004547119140625, -0.0018186569213867188, 0.0009098052978515625, 0.0036382675170898438, 0.006366729736328125, 0.009095191955566406, 0.011823654174804688, 0.014552116394042969, 0.01728057861328125, 0.02000904083251953, 0.022737503051757812, 0.025465965270996094, 0.028194427490234375, 0.030922889709472656, 0.03365135192871094, 0.03637981414794922, 0.0391082763671875, 0.04183673858642578, 0.04456520080566406, 0.047293663024902344, 0.050022125244140625, 0.052750587463378906, 0.05547904968261719, 0.05820751190185547, 0.06093597412109375, 0.06366443634033203, 0.06639289855957031, 0.0691213607788086, 0.07184982299804688, 0.07457828521728516, 0.07730674743652344, 0.08003520965576172, 0.082763671875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 5.0, 7.0, 5.0, 11.0, 15.0, 18.0, 30.0, 25.0, 48.0, 76.0, 146.0, 289.0, 649.0, 1697.0, 6374.0, 29110.0, 235719.0, 3274532.0, 581802.0, 50274.0, 9452.0, 2420.0, 780.0, 323.0, 169.0, 107.0, 67.0, 39.0, 26.0, 13.0, 25.0, 8.0, 5.0, 10.0, 2.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31982421875, -0.3093910217285156, -0.29895782470703125, -0.2885246276855469, -0.2780914306640625, -0.2676582336425781, -0.25722503662109375, -0.24679183959960938, -0.236358642578125, -0.22592544555664062, -0.21549224853515625, -0.20505905151367188, -0.1946258544921875, -0.18419265747070312, -0.17375946044921875, -0.16332626342773438, -0.15289306640625, -0.14245986938476562, -0.13202667236328125, -0.12159347534179688, -0.1111602783203125, -0.10072708129882812, -0.09029388427734375, -0.07986068725585938, -0.069427490234375, -0.058994293212890625, -0.04856109619140625, -0.038127899169921875, -0.0276947021484375, -0.017261505126953125, -0.00682830810546875, 0.003604888916015625, 0.0140380859375, 0.024471282958984375, 0.03490447998046875, 0.045337677001953125, 0.0557708740234375, 0.06620407104492188, 0.07663726806640625, 0.08707046508789062, 0.097503662109375, 0.10793685913085938, 0.11837005615234375, 0.12880325317382812, 0.1392364501953125, 0.14966964721679688, 0.16010284423828125, 0.17053604125976562, 0.18096923828125, 0.19140243530273438, 0.20183563232421875, 0.21226882934570312, 0.2227020263671875, 0.23313522338867188, 0.24356842041015625, 0.2540016174316406, 0.264434814453125, 0.2748680114746094, 0.28530120849609375, 0.2957344055175781, 0.3061676025390625, 0.3166007995605469, 0.32703399658203125, 0.3374671936035156, 0.347900390625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 6.0, 5.0, 7.0, 4.0, 6.0, 10.0, 10.0, 9.0, 12.0, 16.0, 17.0, 30.0, 39.0, 48.0, 64.0, 94.0, 108.0, 138.0, 209.0, 265.0, 387.0, 471.0, 447.0, 426.0, 318.0, 233.0, 173.0, 130.0, 95.0, 59.0, 49.0, 35.0, 31.0, 32.0, 19.0, 10.0, 14.0, 13.0, 16.0, 2.0, 6.0, 6.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.208740234375, -0.20246315002441406, -0.19618606567382812, -0.1899089813232422, -0.18363189697265625, -0.1773548126220703, -0.17107772827148438, -0.16480064392089844, -0.1585235595703125, -0.15224647521972656, -0.14596939086914062, -0.1396923065185547, -0.13341522216796875, -0.1271381378173828, -0.12086105346679688, -0.11458396911621094, -0.108306884765625, -0.10202980041503906, -0.09575271606445312, -0.08947563171386719, -0.08319854736328125, -0.07692146301269531, -0.07064437866210938, -0.06436729431152344, -0.0580902099609375, -0.05181312561035156, -0.045536041259765625, -0.03925895690917969, -0.03298187255859375, -0.026704788208007812, -0.020427703857421875, -0.014150619506835938, -0.00787353515625, -0.0015964508056640625, 0.004680633544921875, 0.010957717895507812, 0.01723480224609375, 0.023511886596679688, 0.029788970947265625, 0.03606605529785156, 0.0423431396484375, 0.04862022399902344, 0.054897308349609375, 0.06117439270019531, 0.06745147705078125, 0.07372856140136719, 0.08000564575195312, 0.08628273010253906, 0.092559814453125, 0.09883689880371094, 0.10511398315429688, 0.11139106750488281, 0.11766815185546875, 0.12394523620605469, 0.13022232055664062, 0.13649940490722656, 0.1427764892578125, 0.14905357360839844, 0.15533065795898438, 0.1616077423095703, 0.16788482666015625, 0.1741619110107422, 0.18043899536132812, 0.18671607971191406, 0.1929931640625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 1.0, 4.0, 3.0, 11.0, 21.0, 50.0, 128.0, 189.0, 222.0, 190.0, 98.0, 33.0, 30.0, 10.0, 3.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.001578330993652, -3.8913233280181885, -3.7810683250427246, -3.67081356048584, -3.560558557510376, -3.450303554534912, -3.3400485515594482, -3.2297935485839844, -3.1195385456085205, -3.0092835426330566, -2.8990285396575928, -2.788773536682129, -2.678518772125244, -2.5682637691497803, -2.4580087661743164, -2.3477537631988525, -2.2374987602233887, -2.127243757247925, -2.016988754272461, -1.9067338705062866, -1.7964788675308228, -1.6862239837646484, -1.5759689807891846, -1.4657139778137207, -1.355459213256836, -1.245204210281372, -1.1349493265151978, -1.0246943235397339, -0.91443932056427, -0.8041843771934509, -0.6939294338226318, -0.583674430847168, -0.4734194278717041, -0.3631644546985626, -0.25290948152542114, -0.14265453815460205, -0.03239956498146057, 0.07785540819168091, 0.1881103515625, 0.29836535453796387, 0.40862029790878296, 0.518875241279602, 0.6291302442550659, 0.739385187625885, 0.8496401309967041, 0.959895133972168, 1.0701501369476318, 1.1804051399230957, 1.29066002368927, 1.4009150266647339, 1.5111699104309082, 1.621424913406372, 1.731679916381836, 1.8419349193572998, 1.9521898031234741, 2.0624446868896484, 2.1726996898651123, 2.282954692840576, 2.39320969581604, 2.503464698791504, 2.6137194633483887, 2.7239744663238525, 2.8342294692993164, 2.9444844722747803, 3.054739475250244]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 2.0, 1.0, 7.0, 1.0, 3.0, 6.0, 3.0, 4.0, 9.0, 3.0, 6.0, 21.0, 9.0, 13.0, 15.0, 10.0, 15.0, 27.0, 17.0, 27.0, 17.0, 30.0, 26.0, 24.0, 32.0, 40.0, 49.0, 50.0, 41.0, 48.0, 34.0, 28.0, 25.0, 43.0, 27.0, 36.0, 30.0, 27.0, 19.0, 20.0, 27.0, 25.0, 19.0, 19.0, 19.0, 12.0, 4.0, 8.0, 11.0, 5.0, 4.0, 2.0, 4.0, 4.0, 0.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.9727334380149841, -0.9419143795967102, -0.911095380783081, -0.8802763223648071, -0.8494572639465332, -0.8186382055282593, -0.7878191471099854, -0.7570001482963562, -0.7261810898780823, -0.6953620314598083, -0.6645430326461792, -0.6337239742279053, -0.6029049158096313, -0.5720858573913574, -0.5412667989730835, -0.5104478001594543, -0.4796287417411804, -0.4488096833229065, -0.41799065470695496, -0.3871716260910034, -0.3563525676727295, -0.32553350925445557, -0.29471448063850403, -0.2638954520225525, -0.23307639360427856, -0.20225735008716583, -0.1714383065700531, -0.14061926305294037, -0.10980021953582764, -0.0789811760187149, -0.04816213250160217, -0.01734308898448944, 0.013475894927978516, 0.04429493844509125, 0.07511398196220398, 0.10593302547931671, 0.13675206899642944, 0.16757111251354218, 0.1983901560306549, 0.22920919954776764, 0.26002824306488037, 0.2908473014831543, 0.32166633009910583, 0.3524853587150574, 0.3833044171333313, 0.4141234755516052, 0.44494250416755676, 0.4757615327835083, 0.5065805912017822, 0.5373996496200562, 0.5682187080383301, 0.5990377068519592, 0.6298567652702332, 0.6606758236885071, 0.6914948225021362, 0.7223138809204102, 0.7531329393386841, 0.783951997756958, 0.8147710561752319, 0.8455900549888611, 0.876409113407135, 0.9072281718254089, 0.9380471706390381, 0.968866229057312, 0.9996852874755859]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 5.0, 7.0, 8.0, 7.0, 18.0, 19.0, 28.0, 49.0, 67.0, 80.0, 113.0, 154.0, 240.0, 386.0, 500.0, 780.0, 1275.0, 2041.0, 3319.0, 5835.0, 11634.0, 27507.0, 75728.0, 208970.0, 356553.0, 218206.0, 78832.0, 28612.0, 12245.0, 5960.0, 3436.0, 1982.0, 1324.0, 846.0, 562.0, 376.0, 284.0, 188.0, 112.0, 69.0, 56.0, 38.0, 37.0, 33.0, 10.0, 9.0, 2.0, 7.0, 1.0, 3.0, 3.0, 4.0, 4.0, 0.0, 2.0], "bins": [-0.1357421875, -0.13169288635253906, -0.12764358520507812, -0.12359428405761719, -0.11954498291015625, -0.11549568176269531, -0.11144638061523438, -0.10739707946777344, -0.1033477783203125, -0.09929847717285156, -0.09524917602539062, -0.09119987487792969, -0.08715057373046875, -0.08310127258300781, -0.07905197143554688, -0.07500267028808594, -0.070953369140625, -0.06690406799316406, -0.06285476684570312, -0.05880546569824219, -0.05475616455078125, -0.05070686340332031, -0.046657562255859375, -0.04260826110839844, -0.0385589599609375, -0.03450965881347656, -0.030460357666015625, -0.026411056518554688, -0.02236175537109375, -0.018312454223632812, -0.014263153076171875, -0.010213851928710938, -0.00616455078125, -0.0021152496337890625, 0.001934051513671875, 0.0059833526611328125, 0.01003265380859375, 0.014081954956054688, 0.018131256103515625, 0.022180557250976562, 0.0262298583984375, 0.030279159545898438, 0.034328460693359375, 0.03837776184082031, 0.04242706298828125, 0.04647636413574219, 0.050525665283203125, 0.05457496643066406, 0.058624267578125, 0.06267356872558594, 0.06672286987304688, 0.07077217102050781, 0.07482147216796875, 0.07887077331542969, 0.08292007446289062, 0.08696937561035156, 0.0910186767578125, 0.09506797790527344, 0.09911727905273438, 0.10316658020019531, 0.10721588134765625, 0.11126518249511719, 0.11531448364257812, 0.11936378479003906, 0.1234130859375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 7.0, 5.0, 6.0, 3.0, 8.0, 7.0, 8.0, 12.0, 26.0, 20.0, 30.0, 29.0, 29.0, 35.0, 50.0, 46.0, 52.0, 49.0, 61.0, 43.0, 44.0, 42.0, 58.0, 42.0, 36.0, 37.0, 35.0, 34.0, 30.0, 20.0, 15.0, 24.0, 13.0, 14.0, 9.0, 10.0, 9.0, 2.0, 4.0, 0.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1160888671875, -0.11265277862548828, -0.10921669006347656, -0.10578060150146484, -0.10234451293945312, -0.0989084243774414, -0.09547233581542969, -0.09203624725341797, -0.08860015869140625, -0.08516407012939453, -0.08172798156738281, -0.0782918930053711, -0.07485580444335938, -0.07141971588134766, -0.06798362731933594, -0.06454753875732422, -0.0611114501953125, -0.05767536163330078, -0.05423927307128906, -0.050803184509277344, -0.047367095947265625, -0.043931007385253906, -0.04049491882324219, -0.03705883026123047, -0.03362274169921875, -0.03018665313720703, -0.026750564575195312, -0.023314476013183594, -0.019878387451171875, -0.016442298889160156, -0.013006210327148438, -0.009570121765136719, -0.006134033203125, -0.0026979446411132812, 0.0007381439208984375, 0.004174232482910156, 0.007610321044921875, 0.011046409606933594, 0.014482498168945312, 0.01791858673095703, 0.02135467529296875, 0.02479076385498047, 0.028226852416992188, 0.031662940979003906, 0.035099029541015625, 0.038535118103027344, 0.04197120666503906, 0.04540729522705078, 0.0488433837890625, 0.05227947235107422, 0.05571556091308594, 0.059151649475097656, 0.06258773803710938, 0.0660238265991211, 0.06945991516113281, 0.07289600372314453, 0.07633209228515625, 0.07976818084716797, 0.08320426940917969, 0.0866403579711914, 0.09007644653320312, 0.09351253509521484, 0.09694862365722656, 0.10038471221923828, 0.10382080078125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 6.0, 2.0, 3.0, 3.0, 10.0, 12.0, 9.0, 15.0, 27.0, 33.0, 53.0, 84.0, 132.0, 264.0, 495.0, 1064.0, 2671.0, 8138.0, 47748.0, 664711.0, 287364.0, 26294.0, 5546.0, 2041.0, 835.0, 380.0, 217.0, 124.0, 74.0, 58.0, 38.0, 24.0, 16.0, 13.0, 13.0, 8.0, 10.0, 5.0, 6.0, 0.0, 0.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.336669921875, -0.32642364501953125, -0.3161773681640625, -0.30593109130859375, -0.295684814453125, -0.28543853759765625, -0.2751922607421875, -0.26494598388671875, -0.25469970703125, -0.24445343017578125, -0.2342071533203125, -0.22396087646484375, -0.213714599609375, -0.20346832275390625, -0.1932220458984375, -0.18297576904296875, -0.1727294921875, -0.16248321533203125, -0.1522369384765625, -0.14199066162109375, -0.131744384765625, -0.12149810791015625, -0.1112518310546875, -0.10100555419921875, -0.09075927734375, -0.08051300048828125, -0.0702667236328125, -0.06002044677734375, -0.049774169921875, -0.03952789306640625, -0.0292816162109375, -0.01903533935546875, -0.0087890625, 0.00145721435546875, 0.0117034912109375, 0.02194976806640625, 0.032196044921875, 0.04244232177734375, 0.0526885986328125, 0.06293487548828125, 0.07318115234375, 0.08342742919921875, 0.0936737060546875, 0.10391998291015625, 0.114166259765625, 0.12441253662109375, 0.1346588134765625, 0.14490509033203125, 0.1551513671875, 0.16539764404296875, 0.1756439208984375, 0.18589019775390625, 0.196136474609375, 0.20638275146484375, 0.2166290283203125, 0.22687530517578125, 0.23712158203125, 0.24736785888671875, 0.2576141357421875, 0.26786041259765625, 0.278106689453125, 0.28835296630859375, 0.2985992431640625, 0.30884552001953125, 0.319091796875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 6.0, 9.0, 7.0, 14.0, 13.0, 22.0, 13.0, 19.0, 27.0, 34.0, 32.0, 45.0, 60.0, 47.0, 61.0, 86.0, 59.0, 62.0, 59.0, 69.0, 42.0, 35.0, 38.0, 35.0, 23.0, 16.0, 9.0, 9.0, 12.0, 4.0, 11.0, 9.0, 4.0, 2.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.51416015625, -0.49811553955078125, -0.4820709228515625, -0.46602630615234375, -0.449981689453125, -0.43393707275390625, -0.4178924560546875, -0.40184783935546875, -0.38580322265625, -0.36975860595703125, -0.3537139892578125, -0.33766937255859375, -0.321624755859375, -0.30558013916015625, -0.2895355224609375, -0.27349090576171875, -0.2574462890625, -0.24140167236328125, -0.2253570556640625, -0.20931243896484375, -0.193267822265625, -0.17722320556640625, -0.1611785888671875, -0.14513397216796875, -0.12908935546875, -0.11304473876953125, -0.0970001220703125, -0.08095550537109375, -0.064910888671875, -0.04886627197265625, -0.0328216552734375, -0.01677703857421875, -0.000732421875, 0.01531219482421875, 0.0313568115234375, 0.04740142822265625, 0.063446044921875, 0.07949066162109375, 0.0955352783203125, 0.11157989501953125, 0.12762451171875, 0.14366912841796875, 0.1597137451171875, 0.17575836181640625, 0.191802978515625, 0.20784759521484375, 0.2238922119140625, 0.23993682861328125, 0.2559814453125, 0.27202606201171875, 0.2880706787109375, 0.30411529541015625, 0.320159912109375, 0.33620452880859375, 0.3522491455078125, 0.36829376220703125, 0.38433837890625, 0.40038299560546875, 0.4164276123046875, 0.43247222900390625, 0.448516845703125, 0.46456146240234375, 0.4806060791015625, 0.49665069580078125, 0.5126953125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 6.0, 12.0, 14.0, 26.0, 35.0, 60.0, 127.0, 252.0, 554.0, 1418.0, 4677.0, 20803.0, 142456.0, 745483.0, 109505.0, 16982.0, 3862.0, 1275.0, 526.0, 214.0, 101.0, 69.0, 39.0, 25.0, 12.0, 8.0, 9.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.124267578125, -0.11918258666992188, -0.11409759521484375, -0.10901260375976562, -0.1039276123046875, -0.09884262084960938, -0.09375762939453125, -0.08867263793945312, -0.083587646484375, -0.07850265502929688, -0.07341766357421875, -0.06833267211914062, -0.0632476806640625, -0.058162689208984375, -0.05307769775390625, -0.047992706298828125, -0.04290771484375, -0.037822723388671875, -0.03273773193359375, -0.027652740478515625, -0.0225677490234375, -0.017482757568359375, -0.01239776611328125, -0.007312774658203125, -0.002227783203125, 0.002857208251953125, 0.00794219970703125, 0.013027191162109375, 0.0181121826171875, 0.023197174072265625, 0.02828216552734375, 0.033367156982421875, 0.0384521484375, 0.043537139892578125, 0.04862213134765625, 0.053707122802734375, 0.0587921142578125, 0.06387710571289062, 0.06896209716796875, 0.07404708862304688, 0.079132080078125, 0.08421707153320312, 0.08930206298828125, 0.09438705444335938, 0.0994720458984375, 0.10455703735351562, 0.10964202880859375, 0.11472702026367188, 0.11981201171875, 0.12489700317382812, 0.12998199462890625, 0.13506698608398438, 0.1401519775390625, 0.14523696899414062, 0.15032196044921875, 0.15540695190429688, 0.160491943359375, 0.16557693481445312, 0.17066192626953125, 0.17574691772460938, 0.1808319091796875, 0.18591690063476562, 0.19100189208984375, 0.19608688354492188, 0.201171875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 6.0, 1.0, 7.0, 11.0, 18.0, 18.0, 35.0, 32.0, 28.0, 71.0, 74.0, 82.0, 101.0, 85.0, 98.0, 77.0, 70.0, 36.0, 28.0, 32.0, 29.0, 24.0, 7.0, 8.0, 7.0, 6.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.607439041137695e-05, -4.481431096792221e-05, -4.355423152446747e-05, -4.2294152081012726e-05, -4.1034072637557983e-05, -3.977399319410324e-05, -3.85139137506485e-05, -3.7253834307193756e-05, -3.5993754863739014e-05, -3.473367542028427e-05, -3.347359597682953e-05, -3.2213516533374786e-05, -3.0953437089920044e-05, -2.96933576464653e-05, -2.843327820301056e-05, -2.7173198759555817e-05, -2.5913119316101074e-05, -2.4653039872646332e-05, -2.339296042919159e-05, -2.2132880985736847e-05, -2.0872801542282104e-05, -1.9612722098827362e-05, -1.835264265537262e-05, -1.7092563211917877e-05, -1.5832483768463135e-05, -1.4572404325008392e-05, -1.331232488155365e-05, -1.2052245438098907e-05, -1.0792165994644165e-05, -9.532086551189423e-06, -8.27200710773468e-06, -7.011927664279938e-06, -5.751848220825195e-06, -4.491768777370453e-06, -3.2316893339157104e-06, -1.971609890460968e-06, -7.115304470062256e-07, 5.485489964485168e-07, 1.8086284399032593e-06, 3.0687078833580017e-06, 4.328787326812744e-06, 5.5888667702674866e-06, 6.848946213722229e-06, 8.109025657176971e-06, 9.369105100631714e-06, 1.0629184544086456e-05, 1.1889263987541199e-05, 1.3149343430995941e-05, 1.4409422874450684e-05, 1.5669502317905426e-05, 1.692958176136017e-05, 1.818966120481491e-05, 1.9449740648269653e-05, 2.0709820091724396e-05, 2.1969899535179138e-05, 2.322997897863388e-05, 2.4490058422088623e-05, 2.5750137865543365e-05, 2.7010217308998108e-05, 2.827029675245285e-05, 2.9530376195907593e-05, 3.0790455639362335e-05, 3.205053508281708e-05, 3.331061452627182e-05, 3.457069396972656e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 4.0, 2.0, 3.0, 3.0, 12.0, 13.0, 21.0, 24.0, 51.0, 56.0, 87.0, 170.0, 355.0, 649.0, 1452.0, 3589.0, 11813.0, 49752.0, 288272.0, 590288.0, 77347.0, 16300.0, 4789.0, 1754.0, 819.0, 389.0, 195.0, 117.0, 82.0, 41.0, 29.0, 20.0, 15.0, 16.0, 12.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.160400390625, -0.15619373321533203, -0.15198707580566406, -0.1477804183959961, -0.14357376098632812, -0.13936710357666016, -0.1351604461669922, -0.13095378875732422, -0.12674713134765625, -0.12254047393798828, -0.11833381652832031, -0.11412715911865234, -0.10992050170898438, -0.1057138442993164, -0.10150718688964844, -0.09730052947998047, -0.0930938720703125, -0.08888721466064453, -0.08468055725097656, -0.0804738998413086, -0.07626724243164062, -0.07206058502197266, -0.06785392761230469, -0.06364727020263672, -0.05944061279296875, -0.05523395538330078, -0.05102729797363281, -0.046820640563964844, -0.042613983154296875, -0.038407325744628906, -0.03420066833496094, -0.02999401092529297, -0.025787353515625, -0.02158069610595703, -0.017374038696289062, -0.013167381286621094, -0.008960723876953125, -0.004754066467285156, -0.0005474090576171875, 0.0036592483520507812, 0.00786590576171875, 0.012072563171386719, 0.016279220581054688, 0.020485877990722656, 0.024692535400390625, 0.028899192810058594, 0.03310585021972656, 0.03731250762939453, 0.0415191650390625, 0.04572582244873047, 0.04993247985839844, 0.054139137268066406, 0.058345794677734375, 0.06255245208740234, 0.06675910949707031, 0.07096576690673828, 0.07517242431640625, 0.07937908172607422, 0.08358573913574219, 0.08779239654541016, 0.09199905395507812, 0.0962057113647461, 0.10041236877441406, 0.10461902618408203, 0.10882568359375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0, 3.0, 6.0, 7.0, 8.0, 10.0, 11.0, 16.0, 26.0, 39.0, 52.0, 65.0, 71.0, 95.0, 104.0, 90.0, 91.0, 67.0, 54.0, 58.0, 38.0, 23.0, 13.0, 19.0, 7.0, 6.0, 8.0, 1.0, 4.0, 5.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1497802734375, -0.14571762084960938, -0.14165496826171875, -0.13759231567382812, -0.1335296630859375, -0.12946701049804688, -0.12540435791015625, -0.12134170532226562, -0.117279052734375, -0.11321640014648438, -0.10915374755859375, -0.10509109497070312, -0.1010284423828125, -0.09696578979492188, -0.09290313720703125, -0.08884048461914062, -0.08477783203125, -0.08071517944335938, -0.07665252685546875, -0.07258987426757812, -0.0685272216796875, -0.06446456909179688, -0.06040191650390625, -0.056339263916015625, -0.052276611328125, -0.048213958740234375, -0.04415130615234375, -0.040088653564453125, -0.0360260009765625, -0.031963348388671875, -0.02790069580078125, -0.023838043212890625, -0.019775390625, -0.015712738037109375, -0.01165008544921875, -0.007587432861328125, -0.0035247802734375, 0.000537872314453125, 0.00460052490234375, 0.008663177490234375, 0.012725830078125, 0.016788482666015625, 0.02085113525390625, 0.024913787841796875, 0.0289764404296875, 0.033039093017578125, 0.03710174560546875, 0.041164398193359375, 0.04522705078125, 0.049289703369140625, 0.05335235595703125, 0.057415008544921875, 0.0614776611328125, 0.06554031372070312, 0.06960296630859375, 0.07366561889648438, 0.077728271484375, 0.08179092407226562, 0.08585357666015625, 0.08991622924804688, 0.0939788818359375, 0.09804153442382812, 0.10210418701171875, 0.10616683959960938, 0.1102294921875]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 4.0, 11.0, 14.0, 25.0, 52.0, 95.0, 136.0, 265.0, 177.0, 97.0, 58.0, 32.0, 8.0, 6.0, 9.0, 3.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-3.548521041870117, -3.4740092754364014, -3.3994977474212646, -3.324985980987549, -3.250474214553833, -3.175962448120117, -3.1014509201049805, -3.0269391536712646, -2.952427387237549, -2.877915620803833, -2.8034040927886963, -2.7288923263549805, -2.6543805599212646, -2.579868793487549, -2.505357265472412, -2.4308454990386963, -2.3563339710235596, -2.2818222045898438, -2.207310676574707, -2.132798910140991, -2.0582871437072754, -1.9837754964828491, -1.9092638492584229, -1.834752082824707, -1.7602404356002808, -1.6857287883758545, -1.6112170219421387, -1.5367053747177124, -1.4621937274932861, -1.3876819610595703, -1.313170313835144, -1.2386586666107178, -1.1641470193862915, -1.0896353721618652, -1.0151236057281494, -0.9406119585037231, -0.8661002516746521, -0.791588544845581, -0.7170768976211548, -0.6425651907920837, -0.5680534839630127, -0.49354177713394165, -0.419030100107193, -0.34451842308044434, -0.2700067162513733, -0.19549500942230225, -0.12098333239555359, -0.04647165536880493, 0.028040051460266113, 0.10255174338817596, 0.17706343531608582, 0.2515751123428345, 0.3260868191719055, 0.40059852600097656, 0.4751102030277252, 0.5496218800544739, 0.6241335868835449, 0.698645293712616, 0.773157000541687, 0.8476686477661133, 0.9221803545951843, 0.9966920614242554, 1.0712037086486816, 1.1457154750823975, 1.2202271223068237]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 3.0, 4.0, 5.0, 9.0, 7.0, 15.0, 17.0, 19.0, 20.0, 17.0, 30.0, 31.0, 56.0, 41.0, 60.0, 93.0, 86.0, 73.0, 82.0, 62.0, 48.0, 31.0, 28.0, 24.0, 25.0, 15.0, 15.0, 14.0, 12.0, 15.0, 9.0, 9.0, 8.0, 5.0, 5.0, 4.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.151763916015625, -2.0883803367614746, -2.024996757507324, -1.9616132974624634, -1.8982298374176025, -1.8348462581634521, -1.7714626789093018, -1.7080790996551514, -1.6446956396102905, -1.5813120603561401, -1.5179286003112793, -1.454545021057129, -1.3911614418029785, -1.3277779817581177, -1.2643944025039673, -1.2010109424591064, -1.137627363204956, -1.0742437839508057, -1.0108603239059448, -0.9474767446517944, -0.8840932250022888, -0.8207097053527832, -0.7573261260986328, -0.6939426064491272, -0.6305590867996216, -0.567175567150116, -0.5037920475006104, -0.44040846824645996, -0.37702494859695435, -0.31364142894744873, -0.2502578794956207, -0.18687433004379272, -0.12349069118499756, -0.06010715663433075, 0.0032763779163360596, 0.06665991246700287, 0.13004344701766968, 0.1934269666671753, 0.2568105161190033, 0.3201940655708313, 0.3835775852203369, 0.44696110486984253, 0.5103446245193481, 0.5737282037734985, 0.6371117234230042, 0.7004952430725098, 0.7638788223266602, 0.8272623419761658, 0.8906458616256714, 0.954029381275177, 1.0174129009246826, 1.080796480178833, 1.1441800594329834, 1.2075635194778442, 1.2709470987319946, 1.3343305587768555, 1.3977141380310059, 1.4610977172851562, 1.524481177330017, 1.5878647565841675, 1.6512482166290283, 1.7146317958831787, 1.778015375137329, 1.8413989543914795, 1.9047824144363403]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 5.0, 8.0, 7.0, 12.0, 27.0, 23.0, 43.0, 73.0, 113.0, 173.0, 313.0, 478.0, 824.0, 1417.0, 2629.0, 4741.0, 9433.0, 20248.0, 48136.0, 140285.0, 530389.0, 1851855.0, 1155840.0, 281993.0, 83610.0, 31713.0, 14273.0, 6908.0, 3727.0, 2065.0, 1109.0, 668.0, 436.0, 233.0, 185.0, 112.0, 69.0, 33.0, 35.0, 15.0, 8.0, 7.0, 6.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.1180419921875, -0.11474227905273438, -0.11144256591796875, -0.10814285278320312, -0.1048431396484375, -0.10154342651367188, -0.09824371337890625, -0.09494400024414062, -0.091644287109375, -0.08834457397460938, -0.08504486083984375, -0.08174514770507812, -0.0784454345703125, -0.07514572143554688, -0.07184600830078125, -0.06854629516601562, -0.06524658203125, -0.061946868896484375, -0.05864715576171875, -0.055347442626953125, -0.0520477294921875, -0.048748016357421875, -0.04544830322265625, -0.042148590087890625, -0.038848876953125, -0.035549163818359375, -0.03224945068359375, -0.028949737548828125, -0.0256500244140625, -0.022350311279296875, -0.01905059814453125, -0.015750885009765625, -0.012451171875, -0.009151458740234375, -0.00585174560546875, -0.002552032470703125, 0.0007476806640625, 0.004047393798828125, 0.00734710693359375, 0.010646820068359375, 0.013946533203125, 0.017246246337890625, 0.02054595947265625, 0.023845672607421875, 0.0271453857421875, 0.030445098876953125, 0.03374481201171875, 0.037044525146484375, 0.04034423828125, 0.043643951416015625, 0.04694366455078125, 0.050243377685546875, 0.0535430908203125, 0.056842803955078125, 0.06014251708984375, 0.06344223022460938, 0.066741943359375, 0.07004165649414062, 0.07334136962890625, 0.07664108276367188, 0.0799407958984375, 0.08324050903320312, 0.08654022216796875, 0.08983993530273438, 0.0931396484375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 8.0, 5.0, 8.0, 10.0, 10.0, 11.0, 19.0, 13.0, 26.0, 27.0, 35.0, 35.0, 37.0, 48.0, 52.0, 46.0, 52.0, 47.0, 59.0, 45.0, 51.0, 55.0, 39.0, 45.0, 37.0, 33.0, 17.0, 24.0, 26.0, 17.0, 8.0, 18.0, 9.0, 14.0, 6.0, 7.0, 3.0, 6.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.10247802734375, -0.09899139404296875, -0.0955047607421875, -0.09201812744140625, -0.088531494140625, -0.08504486083984375, -0.0815582275390625, -0.07807159423828125, -0.0745849609375, -0.07109832763671875, -0.0676116943359375, -0.06412506103515625, -0.060638427734375, -0.05715179443359375, -0.0536651611328125, -0.05017852783203125, -0.04669189453125, -0.04320526123046875, -0.0397186279296875, -0.03623199462890625, -0.032745361328125, -0.02925872802734375, -0.0257720947265625, -0.02228546142578125, -0.018798828125, -0.01531219482421875, -0.0118255615234375, -0.00833892822265625, -0.004852294921875, -0.00136566162109375, 0.0021209716796875, 0.00560760498046875, 0.00909423828125, 0.01258087158203125, 0.0160675048828125, 0.01955413818359375, 0.023040771484375, 0.02652740478515625, 0.0300140380859375, 0.03350067138671875, 0.0369873046875, 0.04047393798828125, 0.0439605712890625, 0.04744720458984375, 0.050933837890625, 0.05442047119140625, 0.0579071044921875, 0.06139373779296875, 0.06488037109375, 0.06836700439453125, 0.0718536376953125, 0.07534027099609375, 0.078826904296875, 0.08231353759765625, 0.0858001708984375, 0.08928680419921875, 0.0927734375, 0.09626007080078125, 0.0997467041015625, 0.10323333740234375, 0.106719970703125, 0.11020660400390625, 0.1136932373046875, 0.11717987060546875, 0.12066650390625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 8.0, 6.0, 9.0, 15.0, 24.0, 40.0, 77.0, 192.0, 479.0, 2534.0, 30734.0, 3126536.0, 1014953.0, 16496.0, 1540.0, 373.0, 105.0, 67.0, 37.0, 21.0, 16.0, 7.0, 8.0, 0.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.65625, -0.6374435424804688, -0.6186370849609375, -0.5998306274414062, -0.581024169921875, -0.5622177124023438, -0.5434112548828125, -0.5246047973632812, -0.50579833984375, -0.48699188232421875, -0.4681854248046875, -0.44937896728515625, -0.430572509765625, -0.41176605224609375, -0.3929595947265625, -0.37415313720703125, -0.3553466796875, -0.33654022216796875, -0.3177337646484375, -0.29892730712890625, -0.280120849609375, -0.26131439208984375, -0.2425079345703125, -0.22370147705078125, -0.20489501953125, -0.18608856201171875, -0.1672821044921875, -0.14847564697265625, -0.129669189453125, -0.11086273193359375, -0.0920562744140625, -0.07324981689453125, -0.054443359375, -0.03563690185546875, -0.0168304443359375, 0.00197601318359375, 0.020782470703125, 0.03958892822265625, 0.0583953857421875, 0.07720184326171875, 0.09600830078125, 0.11481475830078125, 0.1336212158203125, 0.15242767333984375, 0.171234130859375, 0.19004058837890625, 0.2088470458984375, 0.22765350341796875, 0.2464599609375, 0.26526641845703125, 0.2840728759765625, 0.30287933349609375, 0.321685791015625, 0.34049224853515625, 0.3592987060546875, 0.37810516357421875, 0.39691162109375, 0.41571807861328125, 0.4345245361328125, 0.45333099365234375, 0.472137451171875, 0.49094390869140625, 0.5097503662109375, 0.5285568237304688, 0.54736328125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 5.0, 3.0, 6.0, 6.0, 4.0, 4.0, 12.0, 11.0, 18.0, 23.0, 26.0, 40.0, 49.0, 92.0, 102.0, 147.0, 195.0, 360.0, 509.0, 575.0, 610.0, 379.0, 272.0, 165.0, 118.0, 92.0, 74.0, 38.0, 27.0, 29.0, 18.0, 17.0, 13.0, 9.0, 9.0, 6.0, 8.0, 0.0, 3.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2666015625, -0.25914764404296875, -0.2516937255859375, -0.24423980712890625, -0.236785888671875, -0.22933197021484375, -0.2218780517578125, -0.21442413330078125, -0.20697021484375, -0.19951629638671875, -0.1920623779296875, -0.18460845947265625, -0.177154541015625, -0.16970062255859375, -0.1622467041015625, -0.15479278564453125, -0.1473388671875, -0.13988494873046875, -0.1324310302734375, -0.12497711181640625, -0.117523193359375, -0.11006927490234375, -0.1026153564453125, -0.09516143798828125, -0.08770751953125, -0.08025360107421875, -0.0727996826171875, -0.06534576416015625, -0.057891845703125, -0.05043792724609375, -0.0429840087890625, -0.03553009033203125, -0.028076171875, -0.02062225341796875, -0.0131683349609375, -0.00571441650390625, 0.001739501953125, 0.00919342041015625, 0.0166473388671875, 0.02410125732421875, 0.03155517578125, 0.03900909423828125, 0.0464630126953125, 0.05391693115234375, 0.061370849609375, 0.06882476806640625, 0.0762786865234375, 0.08373260498046875, 0.0911865234375, 0.09864044189453125, 0.1060943603515625, 0.11354827880859375, 0.121002197265625, 0.12845611572265625, 0.1359100341796875, 0.14336395263671875, 0.15081787109375, 0.15827178955078125, 0.1657257080078125, 0.17317962646484375, 0.180633544921875, 0.18808746337890625, 0.1955413818359375, 0.20299530029296875, 0.21044921875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 9.0, 5.0, 12.0, 30.0, 71.0, 178.0, 270.0, 217.0, 127.0, 57.0, 16.0, 10.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.443475246429443, -4.325896739959717, -4.20831823348999, -4.090740203857422, -3.9731616973876953, -3.8555831909179688, -3.738004684448242, -3.6204264163970947, -3.5028481483459473, -3.3852696418762207, -3.2676913738250732, -3.1501128673553467, -3.032534599304199, -2.9149560928344727, -2.797377586364746, -2.6797993183135986, -2.562220811843872, -2.4446423053741455, -2.327064037322998, -2.2094855308532715, -2.091907262802124, -1.9743287563323975, -1.8567503690719604, -1.7391719818115234, -1.6215935945510864, -1.5040152072906494, -1.3864368200302124, -1.2688584327697754, -1.1512799263000488, -1.0337016582489014, -0.9161231517791748, -0.7985447645187378, -0.6809661388397217, -0.5633877515792847, -0.44580933451652527, -0.32823091745376587, -0.21065253019332886, -0.09307414293289185, 0.02450430393218994, 0.14208269119262695, 0.25966107845306396, 0.377239465713501, 0.4948178827762604, 0.6123962998390198, 0.7299746870994568, 0.8475530743598938, 0.9651315212249756, 1.0827099084854126, 1.2002882957458496, 1.3178666830062866, 1.4354450702667236, 1.5530235767364502, 1.6706018447875977, 1.7881803512573242, 1.9057587385177612, 2.0233371257781982, 2.1409153938293457, 2.2584939002990723, 2.3760721683502197, 2.4936506748199463, 2.6112289428710938, 2.7288074493408203, 2.846385955810547, 2.9639642238616943, 3.081542730331421]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 4.0, 8.0, 13.0, 7.0, 12.0, 12.0, 15.0, 15.0, 23.0, 27.0, 23.0, 29.0, 31.0, 27.0, 27.0, 36.0, 43.0, 47.0, 38.0, 46.0, 53.0, 42.0, 40.0, 32.0, 43.0, 28.0, 33.0, 25.0, 29.0, 27.0, 23.0, 20.0, 17.0, 20.0, 18.0, 11.0, 12.0, 9.0, 12.0, 2.0, 5.0, 5.0, 0.0, 5.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.9159272909164429, -0.8853943943977356, -0.8548614978790283, -0.824328601360321, -0.7937957048416138, -0.7632628083229065, -0.7327299118041992, -0.7021970152854919, -0.6716641187667847, -0.6411312222480774, -0.6105983257293701, -0.5800654292106628, -0.5495325326919556, -0.5189996361732483, -0.488466739654541, -0.45793384313583374, -0.4274009168148041, -0.3968680202960968, -0.3663351237773895, -0.33580222725868225, -0.305269330739975, -0.2747364044189453, -0.24420352280139923, -0.21367062628269196, -0.18313772976398468, -0.1526048332452774, -0.12207193672657013, -0.09153903275728226, -0.06100613623857498, -0.03047323226928711, 5.9664249420166016e-05, 0.03059256076812744, 0.06112545728683472, 0.09165835380554199, 0.12219125032424927, 0.15272414684295654, 0.18325704336166382, 0.2137899547815323, 0.24432285130023956, 0.27485573291778564, 0.3053886294364929, 0.3359215259552002, 0.36645442247390747, 0.39698731899261475, 0.427520215511322, 0.4580531120300293, 0.4885860085487366, 0.5191189050674438, 0.5496518611907959, 0.5801847577095032, 0.6107176542282104, 0.6412505507469177, 0.671783447265625, 0.7023163437843323, 0.7328492403030396, 0.7633821368217468, 0.7939150333404541, 0.8244479298591614, 0.8549808263778687, 0.8855137228965759, 0.9160466194152832, 0.9465795159339905, 0.9771124124526978, 1.0076453685760498, 1.0381782054901123]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 4.0, 6.0, 20.0, 28.0, 35.0, 43.0, 55.0, 124.0, 149.0, 228.0, 378.0, 565.0, 966.0, 1739.0, 3484.0, 7865.0, 21546.0, 79546.0, 345421.0, 431516.0, 109036.0, 27529.0, 9451.0, 3891.0, 2012.0, 1116.0, 676.0, 378.0, 248.0, 159.0, 106.0, 81.0, 49.0, 35.0, 21.0, 19.0, 9.0, 9.0, 4.0, 7.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.20703125, -0.20113372802734375, -0.1952362060546875, -0.18933868408203125, -0.183441162109375, -0.17754364013671875, -0.1716461181640625, -0.16574859619140625, -0.15985107421875, -0.15395355224609375, -0.1480560302734375, -0.14215850830078125, -0.136260986328125, -0.13036346435546875, -0.1244659423828125, -0.11856842041015625, -0.1126708984375, -0.10677337646484375, -0.1008758544921875, -0.09497833251953125, -0.089080810546875, -0.08318328857421875, -0.0772857666015625, -0.07138824462890625, -0.06549072265625, -0.05959320068359375, -0.0536956787109375, -0.04779815673828125, -0.041900634765625, -0.03600311279296875, -0.0301055908203125, -0.02420806884765625, -0.018310546875, -0.01241302490234375, -0.0065155029296875, -0.00061798095703125, 0.005279541015625, 0.01117706298828125, 0.0170745849609375, 0.02297210693359375, 0.02886962890625, 0.03476715087890625, 0.0406646728515625, 0.04656219482421875, 0.052459716796875, 0.05835723876953125, 0.0642547607421875, 0.07015228271484375, 0.0760498046875, 0.08194732666015625, 0.0878448486328125, 0.09374237060546875, 0.099639892578125, 0.10553741455078125, 0.1114349365234375, 0.11733245849609375, 0.12322998046875, 0.12912750244140625, 0.1350250244140625, 0.14092254638671875, 0.146820068359375, 0.15271759033203125, 0.1586151123046875, 0.16451263427734375, 0.17041015625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 4.0, 1.0, 2.0, 6.0, 5.0, 7.0, 18.0, 14.0, 17.0, 12.0, 17.0, 17.0, 18.0, 27.0, 34.0, 38.0, 27.0, 33.0, 35.0, 46.0, 36.0, 47.0, 42.0, 43.0, 34.0, 26.0, 43.0, 38.0, 48.0, 24.0, 29.0, 34.0, 27.0, 19.0, 9.0, 22.0, 13.0, 18.0, 10.0, 7.0, 11.0, 10.0, 4.0, 7.0, 3.0, 6.0, 3.0, 5.0, 3.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0], "bins": [-0.09228515625, -0.0894479751586914, -0.08661079406738281, -0.08377361297607422, -0.08093643188476562, -0.07809925079345703, -0.07526206970214844, -0.07242488861083984, -0.06958770751953125, -0.06675052642822266, -0.06391334533691406, -0.06107616424560547, -0.058238983154296875, -0.05540180206298828, -0.05256462097167969, -0.049727439880371094, -0.0468902587890625, -0.044053077697753906, -0.04121589660644531, -0.03837871551513672, -0.035541534423828125, -0.03270435333251953, -0.029867172241210938, -0.027029991149902344, -0.02419281005859375, -0.021355628967285156, -0.018518447875976562, -0.01568126678466797, -0.012844085693359375, -0.010006904602050781, -0.0071697235107421875, -0.004332542419433594, -0.001495361328125, 0.0013418197631835938, 0.0041790008544921875, 0.007016181945800781, 0.009853363037109375, 0.012690544128417969, 0.015527725219726562, 0.018364906311035156, 0.02120208740234375, 0.024039268493652344, 0.026876449584960938, 0.02971363067626953, 0.032550811767578125, 0.03538799285888672, 0.03822517395019531, 0.041062355041503906, 0.0438995361328125, 0.046736717224121094, 0.04957389831542969, 0.05241107940673828, 0.055248260498046875, 0.05808544158935547, 0.06092262268066406, 0.06375980377197266, 0.06659698486328125, 0.06943416595458984, 0.07227134704589844, 0.07510852813720703, 0.07794570922851562, 0.08078289031982422, 0.08362007141113281, 0.0864572525024414, 0.08929443359375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 5.0, 6.0, 1.0, 6.0, 6.0, 11.0, 13.0, 22.0, 21.0, 27.0, 46.0, 57.0, 87.0, 120.0, 179.0, 343.0, 577.0, 1137.0, 2652.0, 8290.0, 41535.0, 590465.0, 355327.0, 35229.0, 7199.0, 2508.0, 1168.0, 568.0, 343.0, 198.0, 130.0, 87.0, 53.0, 34.0, 34.0, 20.0, 11.0, 12.0, 10.0, 6.0, 4.0, 1.0, 3.0, 3.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.322998046875, -0.31375885009765625, -0.3045196533203125, -0.29528045654296875, -0.286041259765625, -0.27680206298828125, -0.2675628662109375, -0.25832366943359375, -0.24908447265625, -0.23984527587890625, -0.2306060791015625, -0.22136688232421875, -0.212127685546875, -0.20288848876953125, -0.1936492919921875, -0.18441009521484375, -0.1751708984375, -0.16593170166015625, -0.1566925048828125, -0.14745330810546875, -0.138214111328125, -0.12897491455078125, -0.1197357177734375, -0.11049652099609375, -0.10125732421875, -0.09201812744140625, -0.0827789306640625, -0.07353973388671875, -0.064300537109375, -0.05506134033203125, -0.0458221435546875, -0.03658294677734375, -0.02734375, -0.01810455322265625, -0.0088653564453125, 0.00037384033203125, 0.009613037109375, 0.01885223388671875, 0.0280914306640625, 0.03733062744140625, 0.04656982421875, 0.05580902099609375, 0.0650482177734375, 0.07428741455078125, 0.083526611328125, 0.09276580810546875, 0.1020050048828125, 0.11124420166015625, 0.1204833984375, 0.12972259521484375, 0.1389617919921875, 0.14820098876953125, 0.157440185546875, 0.16667938232421875, 0.1759185791015625, 0.18515777587890625, 0.19439697265625, 0.20363616943359375, 0.2128753662109375, 0.22211456298828125, 0.231353759765625, 0.24059295654296875, 0.2498321533203125, 0.25907135009765625, 0.268310546875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 6.0, 1.0, 6.0, 1.0, 3.0, 4.0, 9.0, 12.0, 15.0, 10.0, 23.0, 18.0, 27.0, 40.0, 37.0, 41.0, 52.0, 60.0, 62.0, 63.0, 63.0, 60.0, 58.0, 51.0, 40.0, 48.0, 42.0, 22.0, 21.0, 30.0, 14.0, 18.0, 15.0, 5.0, 6.0, 4.0, 4.0, 8.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.58056640625, -0.5652580261230469, -0.5499496459960938, -0.5346412658691406, -0.5193328857421875, -0.5040245056152344, -0.48871612548828125, -0.4734077453613281, -0.458099365234375, -0.4427909851074219, -0.42748260498046875, -0.4121742248535156, -0.3968658447265625, -0.3815574645996094, -0.36624908447265625, -0.3509407043457031, -0.33563232421875, -0.3203239440917969, -0.30501556396484375, -0.2897071838378906, -0.2743988037109375, -0.2590904235839844, -0.24378204345703125, -0.22847366333007812, -0.213165283203125, -0.19785690307617188, -0.18254852294921875, -0.16724014282226562, -0.1519317626953125, -0.13662338256835938, -0.12131500244140625, -0.10600662231445312, -0.0906982421875, -0.07538986206054688, -0.06008148193359375, -0.044773101806640625, -0.0294647216796875, -0.014156341552734375, 0.00115203857421875, 0.016460418701171875, 0.031768798828125, 0.047077178955078125, 0.06238555908203125, 0.07769393920898438, 0.0930023193359375, 0.10831069946289062, 0.12361907958984375, 0.13892745971679688, 0.15423583984375, 0.16954421997070312, 0.18485260009765625, 0.20016098022460938, 0.2154693603515625, 0.23077774047851562, 0.24608612060546875, 0.2613945007324219, 0.276702880859375, 0.2920112609863281, 0.30731964111328125, 0.3226280212402344, 0.3379364013671875, 0.3532447814941406, 0.36855316162109375, 0.3838615417480469, 0.399169921875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 6.0, 0.0, 2.0, 3.0, 5.0, 14.0, 18.0, 22.0, 48.0, 72.0, 128.0, 227.0, 421.0, 825.0, 1903.0, 4791.0, 13562.0, 52784.0, 558532.0, 345092.0, 49111.0, 12910.0, 4508.0, 1820.0, 778.0, 414.0, 231.0, 134.0, 69.0, 39.0, 36.0, 22.0, 15.0, 9.0, 5.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.131591796875, -0.12782955169677734, -0.12406730651855469, -0.12030506134033203, -0.11654281616210938, -0.11278057098388672, -0.10901832580566406, -0.1052560806274414, -0.10149383544921875, -0.0977315902709961, -0.09396934509277344, -0.09020709991455078, -0.08644485473632812, -0.08268260955810547, -0.07892036437988281, -0.07515811920166016, -0.0713958740234375, -0.06763362884521484, -0.06387138366699219, -0.06010913848876953, -0.056346893310546875, -0.05258464813232422, -0.04882240295410156, -0.045060157775878906, -0.04129791259765625, -0.037535667419433594, -0.03377342224121094, -0.03001117706298828, -0.026248931884765625, -0.02248668670654297, -0.018724441528320312, -0.014962196350097656, -0.011199951171875, -0.007437705993652344, -0.0036754608154296875, 8.678436279296875e-05, 0.003849029541015625, 0.007611274719238281, 0.011373519897460938, 0.015135765075683594, 0.01889801025390625, 0.022660255432128906, 0.026422500610351562, 0.03018474578857422, 0.033946990966796875, 0.03770923614501953, 0.04147148132324219, 0.045233726501464844, 0.0489959716796875, 0.052758216857910156, 0.05652046203613281, 0.06028270721435547, 0.06404495239257812, 0.06780719757080078, 0.07156944274902344, 0.0753316879272461, 0.07909393310546875, 0.0828561782836914, 0.08661842346191406, 0.09038066864013672, 0.09414291381835938, 0.09790515899658203, 0.10166740417480469, 0.10542964935302734, 0.10919189453125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 8.0, 6.0, 1.0, 6.0, 3.0, 10.0, 7.0, 19.0, 21.0, 43.0, 38.0, 38.0, 67.0, 73.0, 113.0, 102.0, 82.0, 84.0, 77.0, 42.0, 40.0, 34.0, 24.0, 15.0, 10.0, 9.0, 8.0, 5.0, 4.0, 6.0, 2.0, 2.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.68952751159668e-05, -3.5715289413928986e-05, -3.4535303711891174e-05, -3.335531800985336e-05, -3.217533230781555e-05, -3.099534660577774e-05, -2.981536090373993e-05, -2.8635375201702118e-05, -2.7455389499664307e-05, -2.6275403797626495e-05, -2.5095418095588684e-05, -2.3915432393550873e-05, -2.273544669151306e-05, -2.155546098947525e-05, -2.037547528743744e-05, -1.9195489585399628e-05, -1.8015503883361816e-05, -1.6835518181324005e-05, -1.5655532479286194e-05, -1.4475546777248383e-05, -1.3295561075210571e-05, -1.211557537317276e-05, -1.0935589671134949e-05, -9.755603969097137e-06, -8.575618267059326e-06, -7.395632565021515e-06, -6.215646862983704e-06, -5.035661160945892e-06, -3.855675458908081e-06, -2.6756897568702698e-06, -1.4957040548324585e-06, -3.157183527946472e-07, 8.642673492431641e-07, 2.0442530512809753e-06, 3.2242387533187866e-06, 4.404224455356598e-06, 5.584210157394409e-06, 6.7641958594322205e-06, 7.944181561470032e-06, 9.124167263507843e-06, 1.0304152965545654e-05, 1.1484138667583466e-05, 1.2664124369621277e-05, 1.3844110071659088e-05, 1.50240957736969e-05, 1.620408147573471e-05, 1.7384067177772522e-05, 1.8564052879810333e-05, 1.9744038581848145e-05, 2.0924024283885956e-05, 2.2104009985923767e-05, 2.328399568796158e-05, 2.446398138999939e-05, 2.56439670920372e-05, 2.6823952794075012e-05, 2.8003938496112823e-05, 2.9183924198150635e-05, 3.0363909900188446e-05, 3.154389560222626e-05, 3.272388130426407e-05, 3.390386700630188e-05, 3.508385270833969e-05, 3.62638384103775e-05, 3.7443824112415314e-05, 3.8623809814453125e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 6.0, 4.0, 19.0, 25.0, 39.0, 70.0, 168.0, 354.0, 874.0, 3299.0, 19379.0, 286796.0, 703163.0, 28185.0, 4348.0, 1128.0, 381.0, 140.0, 83.0, 49.0, 18.0, 12.0, 11.0, 4.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.164794921875, -0.15822601318359375, -0.1516571044921875, -0.14508819580078125, -0.138519287109375, -0.13195037841796875, -0.1253814697265625, -0.11881256103515625, -0.11224365234375, -0.10567474365234375, -0.0991058349609375, -0.09253692626953125, -0.085968017578125, -0.07939910888671875, -0.0728302001953125, -0.06626129150390625, -0.0596923828125, -0.05312347412109375, -0.0465545654296875, -0.03998565673828125, -0.033416748046875, -0.02684783935546875, -0.0202789306640625, -0.01371002197265625, -0.00714111328125, -0.00057220458984375, 0.0059967041015625, 0.01256561279296875, 0.019134521484375, 0.02570343017578125, 0.0322723388671875, 0.03884124755859375, 0.04541015625, 0.05197906494140625, 0.0585479736328125, 0.06511688232421875, 0.071685791015625, 0.07825469970703125, 0.0848236083984375, 0.09139251708984375, 0.09796142578125, 0.10453033447265625, 0.1110992431640625, 0.11766815185546875, 0.124237060546875, 0.13080596923828125, 0.1373748779296875, 0.14394378662109375, 0.1505126953125, 0.15708160400390625, 0.1636505126953125, 0.17021942138671875, 0.176788330078125, 0.18335723876953125, 0.1899261474609375, 0.19649505615234375, 0.20306396484375, 0.20963287353515625, 0.2162017822265625, 0.22277069091796875, 0.229339599609375, 0.23590850830078125, 0.2424774169921875, 0.24904632568359375, 0.255615234375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 6.0, 4.0, 5.0, 17.0, 12.0, 20.0, 25.0, 51.0, 68.0, 100.0, 129.0, 172.0, 131.0, 78.0, 61.0, 33.0, 22.0, 20.0, 12.0, 11.0, 6.0, 7.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1607666015625, -0.1559600830078125, -0.151153564453125, -0.1463470458984375, -0.14154052734375, -0.1367340087890625, -0.131927490234375, -0.1271209716796875, -0.122314453125, -0.1175079345703125, -0.112701416015625, -0.1078948974609375, -0.10308837890625, -0.0982818603515625, -0.093475341796875, -0.0886688232421875, -0.0838623046875, -0.0790557861328125, -0.074249267578125, -0.0694427490234375, -0.06463623046875, -0.0598297119140625, -0.055023193359375, -0.0502166748046875, -0.04541015625, -0.0406036376953125, -0.035797119140625, -0.0309906005859375, -0.02618408203125, -0.0213775634765625, -0.016571044921875, -0.0117645263671875, -0.0069580078125, -0.0021514892578125, 0.002655029296875, 0.0074615478515625, 0.01226806640625, 0.0170745849609375, 0.021881103515625, 0.0266876220703125, 0.031494140625, 0.0363006591796875, 0.041107177734375, 0.0459136962890625, 0.05072021484375, 0.0555267333984375, 0.060333251953125, 0.0651397705078125, 0.0699462890625, 0.0747528076171875, 0.079559326171875, 0.0843658447265625, 0.08917236328125, 0.0939788818359375, 0.098785400390625, 0.1035919189453125, 0.1083984375, 0.1132049560546875, 0.118011474609375, 0.1228179931640625, 0.12762451171875, 0.1324310302734375, 0.137237548828125, 0.1420440673828125, 0.1468505859375]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 8.0, 10.0, 55.0, 92.0, 208.0, 383.0, 155.0, 47.0, 28.0, 8.0, 3.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.750192165374756, -3.6341590881347656, -3.5181257724761963, -3.402092695236206, -3.286059617996216, -3.1700263023376465, -3.0539932250976562, -2.937960147857666, -2.821927070617676, -2.7058939933776855, -2.589860677719116, -2.473827600479126, -2.3577945232391357, -2.2417612075805664, -2.125728130340576, -2.009695053100586, -1.8936617374420166, -1.7776285409927368, -1.6615954637527466, -1.5455622673034668, -1.4295291900634766, -1.3134959936141968, -1.197462797164917, -1.0814297199249268, -0.965396523475647, -0.849363386631012, -0.733330249786377, -0.6172970533370972, -0.5012639164924622, -0.38523077964782715, -0.26919758319854736, -0.15316444635391235, -0.037131309509277344, 0.07890184223651886, 0.19493499398231506, 0.31096816062927246, 0.42700129747390747, 0.5430344343185425, 0.6590676307678223, 0.7751007676124573, 0.8911339044570923, 1.007167100906372, 1.1232001781463623, 1.239233374595642, 1.3552665710449219, 1.471299648284912, 1.587332844734192, 1.7033660411834717, 1.819399118423462, 1.9354323148727417, 2.0514655113220215, 2.1674985885620117, 2.283531665802002, 2.399564743041992, 2.5155980587005615, 2.6316311359405518, 2.747664451599121, 2.8636975288391113, 2.9797308444976807, 3.095763921737671, 3.211796998977661, 3.3278303146362305, 3.4438633918762207, 3.559896469116211, 3.675929546356201]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 2.0, 3.0, 5.0, 6.0, 6.0, 9.0, 12.0, 6.0, 13.0, 14.0, 24.0, 19.0, 27.0, 22.0, 28.0, 35.0, 32.0, 44.0, 45.0, 59.0, 71.0, 63.0, 67.0, 60.0, 45.0, 33.0, 26.0, 21.0, 21.0, 25.0, 21.0, 17.0, 22.0, 15.0, 8.0, 9.0, 15.0, 8.0, 14.0, 7.0, 5.0, 2.0, 1.0, 2.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-1.4265739917755127, -1.3821661472320557, -1.3377584218978882, -1.2933505773544312, -1.2489428520202637, -1.2045350074768066, -1.1601271629333496, -1.1157194375991821, -1.0713117122650146, -1.0269038677215576, -0.9824961423873901, -0.9380882978439331, -0.8936805725097656, -0.8492727279663086, -0.8048649430274963, -0.7604571580886841, -0.716049313545227, -0.6716415286064148, -0.6272337436676025, -0.5828258991241455, -0.538418173789978, -0.4940103590488434, -0.44960254430770874, -0.4051947593688965, -0.36078697443008423, -0.316379189491272, -0.2719714045524597, -0.22756358981132507, -0.18315580487251282, -0.13874801993370056, -0.09434020519256592, -0.04993242025375366, -0.005524754524230957, 0.038883037865161896, 0.08329083025455475, 0.1276986300945282, 0.17210641503334045, 0.2165141999721527, 0.26092201471328735, 0.3053297996520996, 0.34973758459091187, 0.3941453695297241, 0.4385531544685364, 0.482960969209671, 0.5273687839508057, 0.5717765092849731, 0.6161843538284302, 0.6605921387672424, 0.7049999237060547, 0.7494077086448669, 0.7938154935836792, 0.8382233381271362, 0.8826310634613037, 0.9270389080047607, 0.971446692943573, 1.0158544778823853, 1.0602622032165527, 1.1046700477600098, 1.1490777730941772, 1.1934856176376343, 1.2378933429718018, 1.2823011875152588, 1.3267090320587158, 1.3711167573928833, 1.4155246019363403]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 7.0, 10.0, 8.0, 14.0, 16.0, 37.0, 46.0, 74.0, 135.0, 179.0, 299.0, 475.0, 738.0, 1380.0, 2306.0, 4219.0, 8160.0, 16659.0, 37654.0, 97272.0, 298451.0, 1000340.0, 1762845.0, 653703.0, 190244.0, 65268.0, 26910.0, 12390.0, 6166.0, 3448.0, 1962.0, 1071.0, 722.0, 387.0, 246.0, 145.0, 102.0, 62.0, 48.0, 28.0, 22.0, 9.0, 12.0, 4.0, 3.0, 3.0, 4.0, 1.0, 5.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.1021728515625, -0.09901142120361328, -0.09584999084472656, -0.09268856048583984, -0.08952713012695312, -0.0863656997680664, -0.08320426940917969, -0.08004283905029297, -0.07688140869140625, -0.07371997833251953, -0.07055854797363281, -0.0673971176147461, -0.06423568725585938, -0.061074256896972656, -0.05791282653808594, -0.05475139617919922, -0.0515899658203125, -0.04842853546142578, -0.04526710510253906, -0.042105674743652344, -0.038944244384765625, -0.035782814025878906, -0.03262138366699219, -0.02945995330810547, -0.02629852294921875, -0.02313709259033203, -0.019975662231445312, -0.016814231872558594, -0.013652801513671875, -0.010491371154785156, -0.0073299407958984375, -0.004168510437011719, -0.001007080078125, 0.0021543502807617188, 0.0053157806396484375, 0.008477210998535156, 0.011638641357421875, 0.014800071716308594, 0.017961502075195312, 0.02112293243408203, 0.02428436279296875, 0.02744579315185547, 0.030607223510742188, 0.033768653869628906, 0.036930084228515625, 0.040091514587402344, 0.04325294494628906, 0.04641437530517578, 0.0495758056640625, 0.05273723602294922, 0.05589866638183594, 0.059060096740722656, 0.062221527099609375, 0.0653829574584961, 0.06854438781738281, 0.07170581817626953, 0.07486724853515625, 0.07802867889404297, 0.08119010925292969, 0.0843515396118164, 0.08751296997070312, 0.09067440032958984, 0.09383583068847656, 0.09699726104736328, 0.10015869140625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 2.0, 3.0, 4.0, 7.0, 9.0, 6.0, 11.0, 22.0, 18.0, 14.0, 30.0, 29.0, 28.0, 26.0, 44.0, 61.0, 35.0, 47.0, 54.0, 43.0, 42.0, 48.0, 57.0, 36.0, 36.0, 48.0, 27.0, 31.0, 24.0, 23.0, 26.0, 16.0, 17.0, 18.0, 5.0, 10.0, 5.0, 11.0, 8.0, 4.0, 5.0, 2.0, 4.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.10357666015625, -0.10036563873291016, -0.09715461730957031, -0.09394359588623047, -0.09073257446289062, -0.08752155303955078, -0.08431053161621094, -0.0810995101928711, -0.07788848876953125, -0.0746774673461914, -0.07146644592285156, -0.06825542449951172, -0.06504440307617188, -0.06183338165283203, -0.05862236022949219, -0.055411338806152344, -0.0522003173828125, -0.048989295959472656, -0.04577827453613281, -0.04256725311279297, -0.039356231689453125, -0.03614521026611328, -0.03293418884277344, -0.029723167419433594, -0.02651214599609375, -0.023301124572753906, -0.020090103149414062, -0.01687908172607422, -0.013668060302734375, -0.010457038879394531, -0.0072460174560546875, -0.004034996032714844, -0.000823974609375, 0.0023870468139648438, 0.0055980682373046875, 0.008809089660644531, 0.012020111083984375, 0.015231132507324219, 0.018442153930664062, 0.021653175354003906, 0.02486419677734375, 0.028075218200683594, 0.03128623962402344, 0.03449726104736328, 0.037708282470703125, 0.04091930389404297, 0.04413032531738281, 0.047341346740722656, 0.0505523681640625, 0.053763389587402344, 0.05697441101074219, 0.06018543243408203, 0.06339645385742188, 0.06660747528076172, 0.06981849670410156, 0.0730295181274414, 0.07624053955078125, 0.0794515609741211, 0.08266258239746094, 0.08587360382080078, 0.08908462524414062, 0.09229564666748047, 0.09550666809082031, 0.09871768951416016, 0.1019287109375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 10.0, 5.0, 9.0, 15.0, 12.0, 26.0, 33.0, 43.0, 68.0, 115.0, 238.0, 465.0, 1390.0, 6516.0, 48851.0, 902653.0, 3084150.0, 132315.0, 13540.0, 2426.0, 655.0, 272.0, 157.0, 97.0, 60.0, 48.0, 17.0, 23.0, 22.0, 12.0, 7.0, 5.0, 9.0, 6.0, 5.0, 5.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2705078125, -0.26018524169921875, -0.2498626708984375, -0.23954010009765625, -0.229217529296875, -0.21889495849609375, -0.2085723876953125, -0.19824981689453125, -0.18792724609375, -0.17760467529296875, -0.1672821044921875, -0.15695953369140625, -0.146636962890625, -0.13631439208984375, -0.1259918212890625, -0.11566925048828125, -0.1053466796875, -0.09502410888671875, -0.0847015380859375, -0.07437896728515625, -0.064056396484375, -0.05373382568359375, -0.0434112548828125, -0.03308868408203125, -0.02276611328125, -0.01244354248046875, -0.0021209716796875, 0.00820159912109375, 0.018524169921875, 0.02884674072265625, 0.0391693115234375, 0.04949188232421875, 0.059814453125, 0.07013702392578125, 0.0804595947265625, 0.09078216552734375, 0.101104736328125, 0.11142730712890625, 0.1217498779296875, 0.13207244873046875, 0.14239501953125, 0.15271759033203125, 0.1630401611328125, 0.17336273193359375, 0.183685302734375, 0.19400787353515625, 0.2043304443359375, 0.21465301513671875, 0.2249755859375, 0.23529815673828125, 0.2456207275390625, 0.25594329833984375, 0.266265869140625, 0.27658843994140625, 0.2869110107421875, 0.29723358154296875, 0.30755615234375, 0.31787872314453125, 0.3282012939453125, 0.33852386474609375, 0.348846435546875, 0.35916900634765625, 0.3694915771484375, 0.37981414794921875, 0.39013671875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 5.0, 5.0, 8.0, 6.0, 7.0, 12.0, 23.0, 20.0, 22.0, 28.0, 43.0, 40.0, 66.0, 84.0, 113.0, 144.0, 203.0, 265.0, 355.0, 469.0, 502.0, 423.0, 310.0, 235.0, 177.0, 143.0, 83.0, 66.0, 64.0, 36.0, 20.0, 27.0, 16.0, 16.0, 9.0, 9.0, 7.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.2010498046875, -0.1950206756591797, -0.18899154663085938, -0.18296241760253906, -0.17693328857421875, -0.17090415954589844, -0.16487503051757812, -0.1588459014892578, -0.1528167724609375, -0.1467876434326172, -0.14075851440429688, -0.13472938537597656, -0.12870025634765625, -0.12267112731933594, -0.11664199829101562, -0.11061286926269531, -0.104583740234375, -0.09855461120605469, -0.09252548217773438, -0.08649635314941406, -0.08046722412109375, -0.07443809509277344, -0.06840896606445312, -0.06237983703613281, -0.0563507080078125, -0.05032157897949219, -0.044292449951171875, -0.03826332092285156, -0.03223419189453125, -0.026205062866210938, -0.020175933837890625, -0.014146804809570312, -0.00811767578125, -0.0020885467529296875, 0.003940582275390625, 0.009969711303710938, 0.01599884033203125, 0.022027969360351562, 0.028057098388671875, 0.03408622741699219, 0.0401153564453125, 0.04614448547363281, 0.052173614501953125, 0.05820274353027344, 0.06423187255859375, 0.07026100158691406, 0.07629013061523438, 0.08231925964355469, 0.088348388671875, 0.09437751770019531, 0.10040664672851562, 0.10643577575683594, 0.11246490478515625, 0.11849403381347656, 0.12452316284179688, 0.1305522918701172, 0.1365814208984375, 0.1426105499267578, 0.14863967895507812, 0.15466880798339844, 0.16069793701171875, 0.16672706604003906, 0.17275619506835938, 0.1787853240966797, 0.184814453125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 3.0, 2.0, 5.0, 2.0, 10.0, 6.0, 21.0, 42.0, 90.0, 132.0, 186.0, 217.0, 149.0, 65.0, 39.0, 22.0, 9.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.780270576477051, -4.6871161460876465, -4.593961715698242, -4.50080680847168, -4.407652378082275, -4.314497947692871, -4.221343517303467, -4.1281890869140625, -4.0350341796875, -3.9418797492980957, -3.8487250804901123, -3.755570650100708, -3.6624159812927246, -3.5692615509033203, -3.476107120513916, -3.3829524517059326, -3.2897980213165283, -3.196643590927124, -3.1034889221191406, -3.0103344917297363, -2.917179822921753, -2.8240253925323486, -2.7308707237243652, -2.637716293334961, -2.5445618629455566, -2.4514074325561523, -2.358252763748169, -2.2650983333587646, -2.1719436645507812, -2.078789234161377, -1.985634684562683, -1.8924801349639893, -1.7993252277374268, -1.706170678138733, -1.613016128540039, -1.5198616981506348, -1.4267070293426514, -1.333552598953247, -1.2403980493545532, -1.1472434997558594, -1.0540889501571655, -0.9609344005584717, -0.8677798509597778, -0.7746253609657288, -0.6814708113670349, -0.5883162617683411, -0.495161771774292, -0.40200722217559814, -0.3088526725769043, -0.21569813787937164, -0.12254360318183899, -0.02938908338546753, 0.06376546621322632, 0.15692001581192017, 0.25007450580596924, 0.3432290554046631, 0.43638360500335693, 0.5295381546020508, 0.6226927042007446, 0.7158471941947937, 0.8090017437934875, 0.9021562933921814, 0.9953107833862305, 1.0884653329849243, 1.1816198825836182]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 7.0, 3.0, 5.0, 6.0, 10.0, 9.0, 10.0, 16.0, 20.0, 31.0, 38.0, 36.0, 40.0, 38.0, 41.0, 36.0, 44.0, 44.0, 54.0, 44.0, 39.0, 49.0, 52.0, 41.0, 41.0, 43.0, 41.0, 32.0, 26.0, 26.0, 16.0, 10.0, 12.0, 8.0, 11.0, 9.0, 6.0, 6.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.13295578956604, -1.0957857370376587, -1.058615803718567, -1.0214457511901855, -0.984275758266449, -0.9471057653427124, -0.909935712814331, -0.8727657198905945, -0.8355957269668579, -0.7984257340431213, -0.7612557411193848, -0.7240856885910034, -0.6869156956672668, -0.6497457027435303, -0.6125756502151489, -0.5754056572914124, -0.5382356643676758, -0.5010656714439392, -0.46389564871788025, -0.4267256259918213, -0.3895556330680847, -0.35238564014434814, -0.3152156174182892, -0.2780455946922302, -0.24087560176849365, -0.2037055939435959, -0.16653558611869812, -0.12936557829380035, -0.09219557046890259, -0.05502556264400482, -0.017855554819107056, 0.019314467906951904, 0.05648446083068848, 0.09365446865558624, 0.130824476480484, 0.16799448430538177, 0.20516449213027954, 0.2423344999551773, 0.2795045077800751, 0.31667453050613403, 0.3538445234298706, 0.3910145163536072, 0.42818453907966614, 0.4653545618057251, 0.5025245547294617, 0.5396945476531982, 0.5768646001815796, 0.6140345931053162, 0.6512045860290527, 0.6883745789527893, 0.7255445718765259, 0.7627146244049072, 0.7998846173286438, 0.8370546102523804, 0.8742246627807617, 0.9113946557044983, 0.9485646486282349, 0.9857346415519714, 1.022904634475708, 1.0600746870040894, 1.0972447395324707, 1.1344146728515625, 1.1715847253799438, 1.2087547779083252, 1.245924711227417]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 6.0, 13.0, 15.0, 14.0, 30.0, 44.0, 66.0, 115.0, 126.0, 227.0, 374.0, 611.0, 1029.0, 1734.0, 3559.0, 7302.0, 16019.0, 39553.0, 112505.0, 335226.0, 341060.0, 116146.0, 40555.0, 16581.0, 7438.0, 3647.0, 1852.0, 1051.0, 562.0, 384.0, 238.0, 179.0, 110.0, 64.0, 44.0, 22.0, 21.0, 14.0, 8.0, 2.0, 5.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.128662109375, -0.12422752380371094, -0.11979293823242188, -0.11535835266113281, -0.11092376708984375, -0.10648918151855469, -0.10205459594726562, -0.09762001037597656, -0.0931854248046875, -0.08875083923339844, -0.08431625366210938, -0.07988166809082031, -0.07544708251953125, -0.07101249694824219, -0.06657791137695312, -0.06214332580566406, -0.057708740234375, -0.05327415466308594, -0.048839569091796875, -0.04440498352050781, -0.03997039794921875, -0.03553581237792969, -0.031101226806640625, -0.026666641235351562, -0.0222320556640625, -0.017797470092773438, -0.013362884521484375, -0.008928298950195312, -0.00449371337890625, -5.91278076171875e-05, 0.004375457763671875, 0.008810043334960938, 0.01324462890625, 0.017679214477539062, 0.022113800048828125, 0.026548385620117188, 0.03098297119140625, 0.03541755676269531, 0.039852142333984375, 0.04428672790527344, 0.0487213134765625, 0.05315589904785156, 0.057590484619140625, 0.06202507019042969, 0.06645965576171875, 0.07089424133300781, 0.07532882690429688, 0.07976341247558594, 0.084197998046875, 0.08863258361816406, 0.09306716918945312, 0.09750175476074219, 0.10193634033203125, 0.10637092590332031, 0.11080551147460938, 0.11524009704589844, 0.1196746826171875, 0.12410926818847656, 0.12854385375976562, 0.1329784393310547, 0.13741302490234375, 0.1418476104736328, 0.14628219604492188, 0.15071678161621094, 0.1551513671875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 4.0, 5.0, 11.0, 19.0, 17.0, 24.0, 32.0, 19.0, 37.0, 38.0, 24.0, 42.0, 47.0, 48.0, 46.0, 68.0, 62.0, 56.0, 43.0, 46.0, 28.0, 36.0, 34.0, 36.0, 30.0, 29.0, 23.0, 25.0, 17.0, 13.0, 13.0, 4.0, 9.0, 6.0, 2.0, 2.0, 2.0, 0.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1278076171875, -0.12385940551757812, -0.11991119384765625, -0.11596298217773438, -0.1120147705078125, -0.10806655883789062, -0.10411834716796875, -0.10017013549804688, -0.096221923828125, -0.09227371215820312, -0.08832550048828125, -0.08437728881835938, -0.0804290771484375, -0.07648086547851562, -0.07253265380859375, -0.06858444213867188, -0.06463623046875, -0.060688018798828125, -0.05673980712890625, -0.052791595458984375, -0.0488433837890625, -0.044895172119140625, -0.04094696044921875, -0.036998748779296875, -0.033050537109375, -0.029102325439453125, -0.02515411376953125, -0.021205902099609375, -0.0172576904296875, -0.013309478759765625, -0.00936126708984375, -0.005413055419921875, -0.00146484375, 0.002483367919921875, 0.00643157958984375, 0.010379791259765625, 0.0143280029296875, 0.018276214599609375, 0.02222442626953125, 0.026172637939453125, 0.030120849609375, 0.034069061279296875, 0.03801727294921875, 0.041965484619140625, 0.0459136962890625, 0.049861907958984375, 0.05381011962890625, 0.057758331298828125, 0.06170654296875, 0.06565475463867188, 0.06960296630859375, 0.07355117797851562, 0.0774993896484375, 0.08144760131835938, 0.08539581298828125, 0.08934402465820312, 0.093292236328125, 0.09724044799804688, 0.10118865966796875, 0.10513687133789062, 0.1090850830078125, 0.11303329467773438, 0.11698150634765625, 0.12092971801757812, 0.1248779296875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 4.0, 3.0, 2.0, 6.0, 7.0, 8.0, 20.0, 30.0, 32.0, 52.0, 80.0, 109.0, 167.0, 298.0, 505.0, 1014.0, 2421.0, 7933.0, 46813.0, 751485.0, 208703.0, 20823.0, 4562.0, 1634.0, 782.0, 385.0, 235.0, 146.0, 87.0, 66.0, 50.0, 37.0, 19.0, 7.0, 13.0, 8.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.309814453125, -0.2997550964355469, -0.28969573974609375, -0.2796363830566406, -0.2695770263671875, -0.2595176696777344, -0.24945831298828125, -0.23939895629882812, -0.229339599609375, -0.21928024291992188, -0.20922088623046875, -0.19916152954101562, -0.1891021728515625, -0.17904281616210938, -0.16898345947265625, -0.15892410278320312, -0.14886474609375, -0.13880538940429688, -0.12874603271484375, -0.11868667602539062, -0.1086273193359375, -0.09856796264648438, -0.08850860595703125, -0.07844924926757812, -0.068389892578125, -0.058330535888671875, -0.04827117919921875, -0.038211822509765625, -0.0281524658203125, -0.018093109130859375, -0.00803375244140625, 0.002025604248046875, 0.0120849609375, 0.022144317626953125, 0.03220367431640625, 0.042263031005859375, 0.0523223876953125, 0.062381744384765625, 0.07244110107421875, 0.08250045776367188, 0.092559814453125, 0.10261917114257812, 0.11267852783203125, 0.12273788452148438, 0.1327972412109375, 0.14285659790039062, 0.15291595458984375, 0.16297531127929688, 0.17303466796875, 0.18309402465820312, 0.19315338134765625, 0.20321273803710938, 0.2132720947265625, 0.22333145141601562, 0.23339080810546875, 0.24345016479492188, 0.253509521484375, 0.2635688781738281, 0.27362823486328125, 0.2836875915527344, 0.2937469482421875, 0.3038063049316406, 0.31386566162109375, 0.3239250183105469, 0.333984375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 9.0, 3.0, 6.0, 11.0, 4.0, 14.0, 17.0, 23.0, 28.0, 24.0, 47.0, 37.0, 51.0, 39.0, 71.0, 76.0, 74.0, 75.0, 69.0, 56.0, 53.0, 37.0, 32.0, 40.0, 24.0, 26.0, 15.0, 12.0, 6.0, 11.0, 4.0, 2.0, 3.0, 6.0, 0.0, 0.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.45751953125, -0.4389190673828125, -0.420318603515625, -0.4017181396484375, -0.38311767578125, -0.3645172119140625, -0.345916748046875, -0.3273162841796875, -0.3087158203125, -0.2901153564453125, -0.271514892578125, -0.2529144287109375, -0.23431396484375, -0.2157135009765625, -0.197113037109375, -0.1785125732421875, -0.159912109375, -0.1413116455078125, -0.122711181640625, -0.1041107177734375, -0.08551025390625, -0.0669097900390625, -0.048309326171875, -0.0297088623046875, -0.0111083984375, 0.0074920654296875, 0.026092529296875, 0.0446929931640625, 0.06329345703125, 0.0818939208984375, 0.100494384765625, 0.1190948486328125, 0.1376953125, 0.1562957763671875, 0.174896240234375, 0.1934967041015625, 0.21209716796875, 0.2306976318359375, 0.249298095703125, 0.2678985595703125, 0.2864990234375, 0.3050994873046875, 0.323699951171875, 0.3423004150390625, 0.36090087890625, 0.3795013427734375, 0.398101806640625, 0.4167022705078125, 0.435302734375, 0.4539031982421875, 0.472503662109375, 0.4911041259765625, 0.50970458984375, 0.5283050537109375, 0.546905517578125, 0.5655059814453125, 0.5841064453125, 0.6027069091796875, 0.621307373046875, 0.6399078369140625, 0.65850830078125, 0.6771087646484375, 0.695709228515625, 0.7143096923828125, 0.73291015625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 3.0, 12.0, 17.0, 20.0, 27.0, 52.0, 73.0, 107.0, 165.0, 348.0, 785.0, 1903.0, 5516.0, 19496.0, 104913.0, 758454.0, 124819.0, 22042.0, 6027.0, 2071.0, 851.0, 393.0, 182.0, 109.0, 51.0, 39.0, 26.0, 19.0, 10.0, 10.0, 7.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.09893798828125, -0.09623050689697266, -0.09352302551269531, -0.09081554412841797, -0.08810806274414062, -0.08540058135986328, -0.08269309997558594, -0.0799856185913086, -0.07727813720703125, -0.0745706558227539, -0.07186317443847656, -0.06915569305419922, -0.06644821166992188, -0.06374073028564453, -0.06103324890136719, -0.058325767517089844, -0.0556182861328125, -0.052910804748535156, -0.05020332336425781, -0.04749584197998047, -0.044788360595703125, -0.04208087921142578, -0.03937339782714844, -0.036665916442871094, -0.03395843505859375, -0.031250953674316406, -0.028543472290039062, -0.02583599090576172, -0.023128509521484375, -0.02042102813720703, -0.017713546752929688, -0.015006065368652344, -0.012298583984375, -0.009591102600097656, -0.0068836212158203125, -0.004176139831542969, -0.001468658447265625, 0.0012388229370117188, 0.0039463043212890625, 0.006653785705566406, 0.00936126708984375, 0.012068748474121094, 0.014776229858398438, 0.01748371124267578, 0.020191192626953125, 0.02289867401123047, 0.025606155395507812, 0.028313636779785156, 0.0310211181640625, 0.033728599548339844, 0.03643608093261719, 0.03914356231689453, 0.041851043701171875, 0.04455852508544922, 0.04726600646972656, 0.049973487854003906, 0.05268096923828125, 0.055388450622558594, 0.05809593200683594, 0.06080341339111328, 0.06351089477539062, 0.06621837615966797, 0.06892585754394531, 0.07163333892822266, 0.0743408203125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 2.0, 6.0, 6.0, 9.0, 10.0, 10.0, 13.0, 30.0, 38.0, 46.0, 63.0, 103.0, 117.0, 131.0, 89.0, 77.0, 50.0, 50.0, 38.0, 35.0, 20.0, 11.0, 8.0, 8.0, 6.0, 8.0, 3.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.1961669921875e-05, -4.0815211832523346e-05, -3.966875374317169e-05, -3.852229565382004e-05, -3.7375837564468384e-05, -3.622937947511673e-05, -3.5082921385765076e-05, -3.393646329641342e-05, -3.279000520706177e-05, -3.1643547117710114e-05, -3.049708902835846e-05, -2.9350630939006805e-05, -2.820417284965515e-05, -2.7057714760303497e-05, -2.5911256670951843e-05, -2.476479858160019e-05, -2.3618340492248535e-05, -2.247188240289688e-05, -2.1325424313545227e-05, -2.0178966224193573e-05, -1.903250813484192e-05, -1.7886050045490265e-05, -1.673959195613861e-05, -1.5593133866786957e-05, -1.4446675777435303e-05, -1.3300217688083649e-05, -1.2153759598731995e-05, -1.100730150938034e-05, -9.860843420028687e-06, -8.714385330677032e-06, -7.567927241325378e-06, -6.421469151973724e-06, -5.27501106262207e-06, -4.128552973270416e-06, -2.982094883918762e-06, -1.8356367945671082e-06, -6.891787052154541e-07, 4.5727938413619995e-07, 1.603737473487854e-06, 2.750195562839508e-06, 3.896653652191162e-06, 5.043111741542816e-06, 6.18956983089447e-06, 7.336027920246124e-06, 8.482486009597778e-06, 9.628944098949432e-06, 1.0775402188301086e-05, 1.192186027765274e-05, 1.3068318367004395e-05, 1.4214776456356049e-05, 1.5361234545707703e-05, 1.6507692635059357e-05, 1.765415072441101e-05, 1.8800608813762665e-05, 1.994706690311432e-05, 2.1093524992465973e-05, 2.2239983081817627e-05, 2.338644117116928e-05, 2.4532899260520935e-05, 2.567935734987259e-05, 2.6825815439224243e-05, 2.7972273528575897e-05, 2.911873161792755e-05, 3.0265189707279205e-05, 3.141164779663086e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 7.0, 5.0, 10.0, 13.0, 20.0, 19.0, 28.0, 42.0, 47.0, 96.0, 127.0, 196.0, 336.0, 552.0, 1041.0, 2103.0, 4865.0, 13082.0, 41519.0, 158794.0, 646894.0, 125512.0, 33769.0, 11069.0, 4233.0, 1841.0, 969.0, 496.0, 275.0, 171.0, 140.0, 83.0, 57.0, 41.0, 31.0, 19.0, 16.0, 7.0, 13.0, 3.0, 11.0, 7.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0679931640625, -0.06595849990844727, -0.06392383575439453, -0.0618891716003418, -0.05985450744628906, -0.05781984329223633, -0.055785179138183594, -0.05375051498413086, -0.051715850830078125, -0.04968118667602539, -0.047646522521972656, -0.04561185836791992, -0.04357719421386719, -0.04154253005981445, -0.03950786590576172, -0.037473201751708984, -0.03543853759765625, -0.033403873443603516, -0.03136920928955078, -0.029334545135498047, -0.027299880981445312, -0.025265216827392578, -0.023230552673339844, -0.02119588851928711, -0.019161224365234375, -0.01712656021118164, -0.015091896057128906, -0.013057231903076172, -0.011022567749023438, -0.008987903594970703, -0.006953239440917969, -0.004918575286865234, -0.0028839111328125, -0.0008492469787597656, 0.0011854171752929688, 0.003220081329345703, 0.0052547454833984375, 0.007289409637451172, 0.009324073791503906, 0.01135873794555664, 0.013393402099609375, 0.01542806625366211, 0.017462730407714844, 0.019497394561767578, 0.021532058715820312, 0.023566722869873047, 0.02560138702392578, 0.027636051177978516, 0.02967071533203125, 0.031705379486083984, 0.03374004364013672, 0.03577470779418945, 0.03780937194824219, 0.03984403610229492, 0.041878700256347656, 0.04391336441040039, 0.045948028564453125, 0.04798269271850586, 0.050017356872558594, 0.05205202102661133, 0.05408668518066406, 0.0561213493347168, 0.05815601348876953, 0.060190677642822266, 0.062225341796875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 2.0, 2.0, 3.0, 2.0, 1.0, 9.0, 12.0, 14.0, 18.0, 28.0, 19.0, 24.0, 27.0, 61.0, 51.0, 83.0, 84.0, 90.0, 99.0, 85.0, 72.0, 49.0, 40.0, 26.0, 25.0, 16.0, 13.0, 10.0, 9.0, 8.0, 3.0, 5.0, 2.0, 2.0, 0.0, 6.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.07183837890625, -0.06919288635253906, -0.06654739379882812, -0.06390190124511719, -0.06125640869140625, -0.05861091613769531, -0.055965423583984375, -0.05331993103027344, -0.0506744384765625, -0.04802894592285156, -0.045383453369140625, -0.04273796081542969, -0.04009246826171875, -0.03744697570800781, -0.034801483154296875, -0.03215599060058594, -0.029510498046875, -0.026865005493164062, -0.024219512939453125, -0.021574020385742188, -0.01892852783203125, -0.016283035278320312, -0.013637542724609375, -0.010992050170898438, -0.0083465576171875, -0.0057010650634765625, -0.003055572509765625, -0.0004100799560546875, 0.00223541259765625, 0.0048809051513671875, 0.007526397705078125, 0.010171890258789062, 0.0128173828125, 0.015462875366210938, 0.018108367919921875, 0.020753860473632812, 0.02339935302734375, 0.026044845581054688, 0.028690338134765625, 0.03133583068847656, 0.0339813232421875, 0.03662681579589844, 0.039272308349609375, 0.04191780090332031, 0.04456329345703125, 0.04720878601074219, 0.049854278564453125, 0.05249977111816406, 0.055145263671875, 0.05779075622558594, 0.060436248779296875, 0.06308174133300781, 0.06572723388671875, 0.06837272644042969, 0.07101821899414062, 0.07366371154785156, 0.0763092041015625, 0.07895469665527344, 0.08160018920898438, 0.08424568176269531, 0.08689117431640625, 0.08953666687011719, 0.09218215942382812, 0.09482765197753906, 0.09747314453125]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 7.0, 18.0, 29.0, 129.0, 453.0, 211.0, 88.0, 30.0, 15.0, 6.0, 7.0, 3.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8410844802856445, -2.726147413253784, -2.611210584640503, -2.4962735176086426, -2.3813366889953613, -2.266399621963501, -2.1514627933502197, -2.0365257263183594, -1.9215888977050781, -1.8066519498825073, -1.6917150020599365, -1.5767780542373657, -1.461841106414795, -1.3469040393829346, -1.2319672107696533, -1.117030143737793, -1.0020931959152222, -0.8871562480926514, -0.7722193002700806, -0.6572823524475098, -0.542345404624939, -0.4274083971977234, -0.3124714493751526, -0.1975345015525818, -0.08259755373001099, 0.03233940154314041, 0.1472763568162918, 0.2622133195400238, 0.3771502673625946, 0.4920872449874878, 0.6070241928100586, 0.7219611406326294, 0.8368980884552002, 0.951835036277771, 1.0667719841003418, 1.1817089319229126, 1.2966458797454834, 1.4115829467773438, 1.526519775390625, 1.6414568424224854, 1.7563936710357666, 1.8713306188583374, 1.9862675666809082, 2.1012046337127686, 2.21614146232605, 2.33107852935791, 2.4460153579711914, 2.5609524250030518, 2.675889492034912, 2.7908265590667725, 2.9057633876800537, 3.020700454711914, 3.1356372833251953, 3.2505743503570557, 3.365511178970337, 3.4804482460021973, 3.5953850746154785, 3.710322141647339, 3.82525897026062, 3.9401960372924805, 4.055132865905762, 4.170069694519043, 4.285006999969482, 4.399943828582764, 4.514880657196045]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 11.0, 6.0, 4.0, 9.0, 11.0, 14.0, 16.0, 13.0, 15.0, 20.0, 19.0, 24.0, 23.0, 27.0, 54.0, 59.0, 77.0, 121.0, 99.0, 72.0, 51.0, 33.0, 29.0, 27.0, 18.0, 28.0, 21.0, 23.0, 10.0, 5.0, 13.0, 7.0, 8.0, 9.0, 4.0, 7.0, 5.0, 6.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.8421064615249634, -1.7893468141555786, -1.7365871667861938, -1.683827519416809, -1.6310678720474243, -1.5783082246780396, -1.5255485773086548, -1.47278892993927, -1.4200292825698853, -1.3672696352005005, -1.3145099878311157, -1.261750340461731, -1.2089906930923462, -1.1562310457229614, -1.1034713983535767, -1.050711750984192, -0.9979521036148071, -0.9451924562454224, -0.8924328088760376, -0.8396731615066528, -0.7869135141372681, -0.7341538667678833, -0.6813942193984985, -0.6286345720291138, -0.575874924659729, -0.5231152772903442, -0.4703556299209595, -0.4175959825515747, -0.36483633518218994, -0.3120766878128052, -0.2593170404434204, -0.20655739307403564, -0.15379774570465088, -0.10103809833526611, -0.04827845096588135, 0.004481196403503418, 0.057240843772888184, 0.11000049114227295, 0.16276013851165771, 0.21551978588104248, 0.26827943325042725, 0.321039080619812, 0.3737987279891968, 0.42655837535858154, 0.4793180227279663, 0.5320776700973511, 0.5848373174667358, 0.6375969648361206, 0.6903566122055054, 0.7431162595748901, 0.7958759069442749, 0.8486355543136597, 0.9013952016830444, 0.9541548490524292, 1.006914496421814, 1.0596741437911987, 1.1124337911605835, 1.1651934385299683, 1.217953085899353, 1.2707127332687378, 1.3234723806381226, 1.3762320280075073, 1.428991675376892, 1.4817513227462769, 1.5345109701156616]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 14.0, 21.0, 34.0, 64.0, 80.0, 135.0, 246.0, 416.0, 784.0, 1401.0, 2919.0, 6328.0, 15285.0, 39835.0, 121174.0, 436136.0, 1440325.0, 1486981.0, 447735.0, 124885.0, 40458.0, 15601.0, 6734.0, 3225.0, 1526.0, 842.0, 433.0, 273.0, 140.0, 95.0, 67.0, 38.0, 20.0, 7.0, 10.0, 4.0, 4.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1588134765625, -0.15314483642578125, -0.1474761962890625, -0.14180755615234375, -0.136138916015625, -0.13047027587890625, -0.1248016357421875, -0.11913299560546875, -0.11346435546875, -0.10779571533203125, -0.1021270751953125, -0.09645843505859375, -0.090789794921875, -0.08512115478515625, -0.0794525146484375, -0.07378387451171875, -0.068115234375, -0.06244659423828125, -0.0567779541015625, -0.05110931396484375, -0.045440673828125, -0.03977203369140625, -0.0341033935546875, -0.02843475341796875, -0.02276611328125, -0.01709747314453125, -0.0114288330078125, -0.00576019287109375, -9.1552734375e-05, 0.00557708740234375, 0.0112457275390625, 0.01691436767578125, 0.0225830078125, 0.02825164794921875, 0.0339202880859375, 0.03958892822265625, 0.045257568359375, 0.05092620849609375, 0.0565948486328125, 0.06226348876953125, 0.06793212890625, 0.07360076904296875, 0.0792694091796875, 0.08493804931640625, 0.090606689453125, 0.09627532958984375, 0.1019439697265625, 0.10761260986328125, 0.11328125, 0.11894989013671875, 0.1246185302734375, 0.13028717041015625, 0.135955810546875, 0.14162445068359375, 0.1472930908203125, 0.15296173095703125, 0.15863037109375, 0.16429901123046875, 0.1699676513671875, 0.17563629150390625, 0.181304931640625, 0.18697357177734375, 0.1926422119140625, 0.19831085205078125, 0.2039794921875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 7.0, 5.0, 9.0, 8.0, 9.0, 11.0, 12.0, 14.0, 10.0, 20.0, 20.0, 28.0, 25.0, 35.0, 45.0, 30.0, 37.0, 35.0, 40.0, 38.0, 49.0, 49.0, 50.0, 38.0, 43.0, 36.0, 28.0, 35.0, 38.0, 20.0, 27.0, 20.0, 30.0, 16.0, 16.0, 13.0, 11.0, 13.0, 10.0, 5.0, 5.0, 7.0, 2.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0950927734375, -0.09203910827636719, -0.08898544311523438, -0.08593177795410156, -0.08287811279296875, -0.07982444763183594, -0.07677078247070312, -0.07371711730957031, -0.0706634521484375, -0.06760978698730469, -0.06455612182617188, -0.06150245666503906, -0.05844879150390625, -0.05539512634277344, -0.052341461181640625, -0.04928779602050781, -0.046234130859375, -0.04318046569824219, -0.040126800537109375, -0.03707313537597656, -0.03401947021484375, -0.030965805053710938, -0.027912139892578125, -0.024858474731445312, -0.0218048095703125, -0.018751144409179688, -0.015697479248046875, -0.012643814086914062, -0.00959014892578125, -0.0065364837646484375, -0.003482818603515625, -0.0004291534423828125, 0.00262451171875, 0.0056781768798828125, 0.008731842041015625, 0.011785507202148438, 0.01483917236328125, 0.017892837524414062, 0.020946502685546875, 0.024000167846679688, 0.0270538330078125, 0.030107498168945312, 0.033161163330078125, 0.03621482849121094, 0.03926849365234375, 0.04232215881347656, 0.045375823974609375, 0.04842948913574219, 0.051483154296875, 0.05453681945800781, 0.057590484619140625, 0.06064414978027344, 0.06369781494140625, 0.06675148010253906, 0.06980514526367188, 0.07285881042480469, 0.0759124755859375, 0.07896614074707031, 0.08201980590820312, 0.08507347106933594, 0.08812713623046875, 0.09118080139160156, 0.09423446655273438, 0.09728813171386719, 0.100341796875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 3.0, 8.0, 9.0, 8.0, 14.0, 25.0, 33.0, 40.0, 78.0, 143.0, 270.0, 572.0, 1414.0, 6135.0, 188943.0, 3957168.0, 34109.0, 3303.0, 998.0, 435.0, 230.0, 132.0, 81.0, 47.0, 36.0, 12.0, 13.0, 9.0, 3.0, 1.0, 3.0, 3.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2666015625, -1.233551025390625, -1.20050048828125, -1.167449951171875, -1.1343994140625, -1.101348876953125, -1.06829833984375, -1.035247802734375, -1.002197265625, -0.969146728515625, -0.93609619140625, -0.903045654296875, -0.8699951171875, -0.836944580078125, -0.80389404296875, -0.770843505859375, -0.73779296875, -0.704742431640625, -0.67169189453125, -0.638641357421875, -0.6055908203125, -0.572540283203125, -0.53948974609375, -0.506439208984375, -0.473388671875, -0.440338134765625, -0.40728759765625, -0.374237060546875, -0.3411865234375, -0.308135986328125, -0.27508544921875, -0.242034912109375, -0.208984375, -0.175933837890625, -0.14288330078125, -0.109832763671875, -0.0767822265625, -0.043731689453125, -0.01068115234375, 0.022369384765625, 0.055419921875, 0.088470458984375, 0.12152099609375, 0.154571533203125, 0.1876220703125, 0.220672607421875, 0.25372314453125, 0.286773681640625, 0.31982421875, 0.352874755859375, 0.38592529296875, 0.418975830078125, 0.4520263671875, 0.485076904296875, 0.51812744140625, 0.551177978515625, 0.584228515625, 0.617279052734375, 0.65032958984375, 0.683380126953125, 0.7164306640625, 0.749481201171875, 0.78253173828125, 0.815582275390625, 0.8486328125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 7.0, 4.0, 4.0, 3.0, 12.0, 12.0, 24.0, 25.0, 21.0, 36.0, 56.0, 70.0, 107.0, 147.0, 175.0, 217.0, 301.0, 382.0, 503.0, 485.0, 347.0, 272.0, 242.0, 171.0, 130.0, 80.0, 71.0, 40.0, 39.0, 40.0, 16.0, 5.0, 6.0, 5.0, 8.0, 3.0, 2.0, 7.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.308349609375, -0.29645538330078125, -0.2845611572265625, -0.27266693115234375, -0.260772705078125, -0.24887847900390625, -0.2369842529296875, -0.22509002685546875, -0.21319580078125, -0.20130157470703125, -0.1894073486328125, -0.17751312255859375, -0.165618896484375, -0.15372467041015625, -0.1418304443359375, -0.12993621826171875, -0.1180419921875, -0.10614776611328125, -0.0942535400390625, -0.08235931396484375, -0.070465087890625, -0.05857086181640625, -0.0466766357421875, -0.03478240966796875, -0.02288818359375, -0.01099395751953125, 0.0009002685546875, 0.01279449462890625, 0.024688720703125, 0.03658294677734375, 0.0484771728515625, 0.06037139892578125, 0.072265625, 0.08415985107421875, 0.0960540771484375, 0.10794830322265625, 0.119842529296875, 0.13173675537109375, 0.1436309814453125, 0.15552520751953125, 0.16741943359375, 0.17931365966796875, 0.1912078857421875, 0.20310211181640625, 0.214996337890625, 0.22689056396484375, 0.2387847900390625, 0.25067901611328125, 0.2625732421875, 0.27446746826171875, 0.2863616943359375, 0.29825592041015625, 0.310150146484375, 0.32204437255859375, 0.3339385986328125, 0.34583282470703125, 0.35772705078125, 0.36962127685546875, 0.3815155029296875, 0.39340972900390625, 0.405303955078125, 0.41719818115234375, 0.4290924072265625, 0.44098663330078125, 0.452880859375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 10.0, 12.0, 24.0, 52.0, 103.0, 202.0, 258.0, 167.0, 86.0, 36.0, 21.0, 14.0, 5.0, 3.0, 4.0, 4.0, 2.0, 2.0, 1.0], "bins": [-11.689427375793457, -11.461386680603027, -11.233345031738281, -11.005304336547852, -10.777262687683105, -10.549221992492676, -10.32118034362793, -10.0931396484375, -9.865097999572754, -9.637057304382324, -9.409015655517578, -9.180974960327148, -8.952933311462402, -8.724892616271973, -8.496850967407227, -8.268810272216797, -8.040769577026367, -7.812728404998779, -7.584687232971191, -7.3566460609436035, -7.128604888916016, -6.900563716888428, -6.67252254486084, -6.44448184967041, -6.216440200805664, -5.988399028778076, -5.760357856750488, -5.5323166847229, -5.3042755126953125, -5.076234340667725, -4.848193168640137, -4.620152473449707, -4.392110347747803, -4.164069175720215, -3.936028003692627, -3.707986831665039, -3.479945659637451, -3.2519044876098633, -3.0238635540008545, -2.7958223819732666, -2.5677812099456787, -2.339740037918091, -2.111698865890503, -1.8836578130722046, -1.6556166410446167, -1.4275754690170288, -1.1995344161987305, -0.9714932441711426, -0.7434520721435547, -0.5154109001159668, -0.2873697876930237, -0.059328675270080566, 0.16871249675750732, 0.3967536687850952, 0.6247947216033936, 0.8528358936309814, 1.0808770656585693, 1.3089182376861572, 1.5369594097137451, 1.7650004625320435, 1.9930416345596313, 2.2210826873779297, 2.4491238594055176, 2.6771650314331055, 2.9052062034606934]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 5.0, 4.0, 6.0, 6.0, 9.0, 16.0, 13.0, 18.0, 15.0, 23.0, 30.0, 35.0, 23.0, 33.0, 25.0, 44.0, 28.0, 47.0, 51.0, 52.0, 65.0, 51.0, 52.0, 40.0, 43.0, 39.0, 17.0, 35.0, 23.0, 30.0, 17.0, 18.0, 17.0, 14.0, 5.0, 9.0, 7.0, 10.0, 8.0, 8.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.046013832092285, -1.9810378551483154, -1.9160618782043457, -1.8510857820510864, -1.7861098051071167, -1.721133828163147, -1.6561577320098877, -1.591181755065918, -1.5262057781219482, -1.4612298011779785, -1.3962538242340088, -1.3312777280807495, -1.2663017511367798, -1.20132577419281, -1.1363496780395508, -1.071373701095581, -1.0063977241516113, -0.9414217472076416, -0.8764457106590271, -0.8114696741104126, -0.7464936971664429, -0.6815177202224731, -0.6165416836738586, -0.5515656471252441, -0.4865896701812744, -0.4216136634349823, -0.3566376566886902, -0.29166164994239807, -0.22668564319610596, -0.16170963644981384, -0.09673362970352173, -0.031757622957229614, 0.0332183837890625, 0.09819439053535461, 0.16317039728164673, 0.22814640402793884, 0.29312241077423096, 0.35809841752052307, 0.4230744242668152, 0.4880504310131073, 0.5530264377593994, 0.6180024147033691, 0.6829784512519836, 0.7479544878005981, 0.8129304647445679, 0.8779064416885376, 0.9428824782371521, 1.0078585147857666, 1.0728344917297363, 1.137810468673706, 1.2027864456176758, 1.267762541770935, 1.3327385187149048, 1.3977144956588745, 1.4626905918121338, 1.5276665687561035, 1.5926425457000732, 1.657618522644043, 1.7225944995880127, 1.787570595741272, 1.8525465726852417, 1.9175225496292114, 1.9824986457824707, 2.0474746227264404, 2.11245059967041]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 7.0, 5.0, 10.0, 5.0, 10.0, 17.0, 31.0, 47.0, 74.0, 132.0, 234.0, 453.0, 857.0, 1784.0, 4133.0, 11067.0, 34835.0, 145195.0, 606868.0, 180520.0, 41037.0, 12549.0, 4658.0, 2014.0, 910.0, 496.0, 255.0, 148.0, 79.0, 55.0, 29.0, 24.0, 10.0, 6.0, 2.0, 2.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.139404296875, -0.13262557983398438, -0.12584686279296875, -0.11906814575195312, -0.1122894287109375, -0.10551071166992188, -0.09873199462890625, -0.09195327758789062, -0.085174560546875, -0.07839584350585938, -0.07161712646484375, -0.06483840942382812, -0.0580596923828125, -0.051280975341796875, -0.04450225830078125, -0.037723541259765625, -0.03094482421875, -0.024166107177734375, -0.01738739013671875, -0.010608673095703125, -0.0038299560546875, 0.002948760986328125, 0.00972747802734375, 0.016506195068359375, 0.023284912109375, 0.030063629150390625, 0.03684234619140625, 0.043621063232421875, 0.0503997802734375, 0.057178497314453125, 0.06395721435546875, 0.07073593139648438, 0.0775146484375, 0.08429336547851562, 0.09107208251953125, 0.09785079956054688, 0.1046295166015625, 0.11140823364257812, 0.11818695068359375, 0.12496566772460938, 0.131744384765625, 0.13852310180664062, 0.14530181884765625, 0.15208053588867188, 0.1588592529296875, 0.16563796997070312, 0.17241668701171875, 0.17919540405273438, 0.18597412109375, 0.19275283813476562, 0.19953155517578125, 0.20631027221679688, 0.2130889892578125, 0.21986770629882812, 0.22664642333984375, 0.23342514038085938, 0.240203857421875, 0.24698257446289062, 0.25376129150390625, 0.2605400085449219, 0.2673187255859375, 0.2740974426269531, 0.28087615966796875, 0.2876548767089844, 0.29443359375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 3.0, 7.0, 3.0, 12.0, 12.0, 22.0, 21.0, 21.0, 23.0, 33.0, 33.0, 49.0, 50.0, 57.0, 51.0, 59.0, 63.0, 67.0, 60.0, 61.0, 40.0, 39.0, 33.0, 30.0, 23.0, 18.0, 24.0, 20.0, 13.0, 13.0, 10.0, 10.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.2159423828125, -0.20929527282714844, -0.20264816284179688, -0.1960010528564453, -0.18935394287109375, -0.1827068328857422, -0.17605972290039062, -0.16941261291503906, -0.1627655029296875, -0.15611839294433594, -0.14947128295898438, -0.1428241729736328, -0.13617706298828125, -0.1295299530029297, -0.12288284301757812, -0.11623573303222656, -0.109588623046875, -0.10294151306152344, -0.09629440307617188, -0.08964729309082031, -0.08300018310546875, -0.07635307312011719, -0.06970596313476562, -0.06305885314941406, -0.0564117431640625, -0.04976463317871094, -0.043117523193359375, -0.03647041320800781, -0.02982330322265625, -0.023176193237304688, -0.016529083251953125, -0.009881973266601562, -0.00323486328125, 0.0034122467041015625, 0.010059356689453125, 0.016706466674804688, 0.02335357666015625, 0.030000686645507812, 0.036647796630859375, 0.04329490661621094, 0.0499420166015625, 0.05658912658691406, 0.06323623657226562, 0.06988334655761719, 0.07653045654296875, 0.08317756652832031, 0.08982467651367188, 0.09647178649902344, 0.103118896484375, 0.10976600646972656, 0.11641311645507812, 0.12306022644042969, 0.12970733642578125, 0.1363544464111328, 0.14300155639648438, 0.14964866638183594, 0.1562957763671875, 0.16294288635253906, 0.16958999633789062, 0.1762371063232422, 0.18288421630859375, 0.1895313262939453, 0.19617843627929688, 0.20282554626464844, 0.20947265625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 1.0, 10.0, 10.0, 18.0, 27.0, 30.0, 30.0, 43.0, 60.0, 110.0, 146.0, 260.0, 483.0, 979.0, 2443.0, 7386.0, 32771.0, 664987.0, 297607.0, 29973.0, 6668.0, 2313.0, 995.0, 419.0, 268.0, 160.0, 92.0, 54.0, 47.0, 43.0, 30.0, 26.0, 13.0, 9.0, 11.0, 9.0, 2.0, 7.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.277587890625, -0.2691688537597656, -0.26074981689453125, -0.2523307800292969, -0.2439117431640625, -0.23549270629882812, -0.22707366943359375, -0.21865463256835938, -0.210235595703125, -0.20181655883789062, -0.19339752197265625, -0.18497848510742188, -0.1765594482421875, -0.16814041137695312, -0.15972137451171875, -0.15130233764648438, -0.14288330078125, -0.13446426391601562, -0.12604522705078125, -0.11762619018554688, -0.1092071533203125, -0.10078811645507812, -0.09236907958984375, -0.08395004272460938, -0.075531005859375, -0.06711196899414062, -0.05869293212890625, -0.050273895263671875, -0.0418548583984375, -0.033435821533203125, -0.02501678466796875, -0.016597747802734375, -0.0081787109375, 0.000240325927734375, 0.00865936279296875, 0.017078399658203125, 0.0254974365234375, 0.033916473388671875, 0.04233551025390625, 0.050754547119140625, 0.059173583984375, 0.06759262084960938, 0.07601165771484375, 0.08443069458007812, 0.0928497314453125, 0.10126876831054688, 0.10968780517578125, 0.11810684204101562, 0.12652587890625, 0.13494491577148438, 0.14336395263671875, 0.15178298950195312, 0.1602020263671875, 0.16862106323242188, 0.17704010009765625, 0.18545913696289062, 0.193878173828125, 0.20229721069335938, 0.21071624755859375, 0.21913528442382812, 0.2275543212890625, 0.23597335815429688, 0.24439239501953125, 0.2528114318847656, 0.26123046875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 1.0, 6.0, 5.0, 5.0, 4.0, 6.0, 7.0, 5.0, 8.0, 15.0, 16.0, 16.0, 31.0, 25.0, 37.0, 33.0, 35.0, 61.0, 70.0, 70.0, 76.0, 76.0, 73.0, 61.0, 45.0, 36.0, 30.0, 25.0, 19.0, 22.0, 12.0, 5.0, 12.0, 9.0, 11.0, 7.0, 5.0, 9.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.83251953125, -0.8089370727539062, -0.7853546142578125, -0.7617721557617188, -0.738189697265625, -0.7146072387695312, -0.6910247802734375, -0.6674423217773438, -0.64385986328125, -0.6202774047851562, -0.5966949462890625, -0.5731124877929688, -0.549530029296875, -0.5259475708007812, -0.5023651123046875, -0.47878265380859375, -0.4552001953125, -0.43161773681640625, -0.4080352783203125, -0.38445281982421875, -0.360870361328125, -0.33728790283203125, -0.3137054443359375, -0.29012298583984375, -0.26654052734375, -0.24295806884765625, -0.2193756103515625, -0.19579315185546875, -0.172210693359375, -0.14862823486328125, -0.1250457763671875, -0.10146331787109375, -0.077880859375, -0.05429840087890625, -0.0307159423828125, -0.00713348388671875, 0.016448974609375, 0.04003143310546875, 0.0636138916015625, 0.08719635009765625, 0.11077880859375, 0.13436126708984375, 0.1579437255859375, 0.18152618408203125, 0.205108642578125, 0.22869110107421875, 0.2522735595703125, 0.27585601806640625, 0.2994384765625, 0.32302093505859375, 0.3466033935546875, 0.37018585205078125, 0.393768310546875, 0.41735076904296875, 0.4409332275390625, 0.46451568603515625, 0.48809814453125, 0.5116806030273438, 0.5352630615234375, 0.5588455200195312, 0.582427978515625, 0.6060104370117188, 0.6295928955078125, 0.6531753540039062, 0.6767578125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 7.0, 6.0, 13.0, 7.0, 8.0, 9.0, 9.0, 28.0, 29.0, 53.0, 61.0, 93.0, 159.0, 228.0, 388.0, 766.0, 1595.0, 3891.0, 11011.0, 43135.0, 776931.0, 170505.0, 26236.0, 7699.0, 2879.0, 1216.0, 625.0, 361.0, 191.0, 119.0, 78.0, 57.0, 36.0, 26.0, 28.0, 10.0, 13.0, 10.0, 11.0, 6.0, 10.0, 3.0, 1.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.05914306640625, -0.0573420524597168, -0.055541038513183594, -0.05374002456665039, -0.05193901062011719, -0.050137996673583984, -0.04833698272705078, -0.04653596878051758, -0.044734954833984375, -0.04293394088745117, -0.04113292694091797, -0.039331912994384766, -0.03753089904785156, -0.03572988510131836, -0.033928871154785156, -0.03212785720825195, -0.03032684326171875, -0.028525829315185547, -0.026724815368652344, -0.02492380142211914, -0.023122787475585938, -0.021321773529052734, -0.01952075958251953, -0.017719745635986328, -0.015918731689453125, -0.014117717742919922, -0.012316703796386719, -0.010515689849853516, -0.008714675903320312, -0.006913661956787109, -0.005112648010253906, -0.003311634063720703, -0.0015106201171875, 0.0002903938293457031, 0.0020914077758789062, 0.0038924217224121094, 0.0056934356689453125, 0.007494449615478516, 0.009295463562011719, 0.011096477508544922, 0.012897491455078125, 0.014698505401611328, 0.01649951934814453, 0.018300533294677734, 0.020101547241210938, 0.02190256118774414, 0.023703575134277344, 0.025504589080810547, 0.02730560302734375, 0.029106616973876953, 0.030907630920410156, 0.03270864486694336, 0.03450965881347656, 0.036310672760009766, 0.03811168670654297, 0.03991270065307617, 0.041713714599609375, 0.04351472854614258, 0.04531574249267578, 0.047116756439208984, 0.04891777038574219, 0.05071878433227539, 0.052519798278808594, 0.0543208122253418, 0.056121826171875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 4.0, 4.0, 3.0, 9.0, 12.0, 8.0, 13.0, 10.0, 22.0, 21.0, 19.0, 33.0, 24.0, 37.0, 64.0, 76.0, 88.0, 79.0, 74.0, 84.0, 61.0, 52.0, 44.0, 28.0, 19.0, 25.0, 20.0, 15.0, 8.0, 9.0, 3.0, 9.0, 3.0, 4.0, 7.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.5987625122070312e-05, -2.5277957320213318e-05, -2.4568289518356323e-05, -2.385862171649933e-05, -2.3148953914642334e-05, -2.243928611278534e-05, -2.1729618310928345e-05, -2.101995050907135e-05, -2.0310282707214355e-05, -1.960061490535736e-05, -1.8890947103500366e-05, -1.818127930164337e-05, -1.7471611499786377e-05, -1.6761943697929382e-05, -1.6052275896072388e-05, -1.5342608094215393e-05, -1.4632940292358398e-05, -1.3923272490501404e-05, -1.321360468864441e-05, -1.2503936886787415e-05, -1.179426908493042e-05, -1.1084601283073425e-05, -1.037493348121643e-05, -9.665265679359436e-06, -8.955597877502441e-06, -8.245930075645447e-06, -7.536262273788452e-06, -6.8265944719314575e-06, -6.116926670074463e-06, -5.407258868217468e-06, -4.697591066360474e-06, -3.987923264503479e-06, -3.2782554626464844e-06, -2.5685876607894897e-06, -1.8589198589324951e-06, -1.1492520570755005e-06, -4.3958425521850586e-07, 2.7008354663848877e-07, 9.797513484954834e-07, 1.689419150352478e-06, 2.3990869522094727e-06, 3.1087547540664673e-06, 3.818422555923462e-06, 4.5280903577804565e-06, 5.237758159637451e-06, 5.947425961494446e-06, 6.6570937633514404e-06, 7.366761565208435e-06, 8.07642936706543e-06, 8.786097168922424e-06, 9.495764970779419e-06, 1.0205432772636414e-05, 1.0915100574493408e-05, 1.1624768376350403e-05, 1.2334436178207397e-05, 1.3044103980064392e-05, 1.3753771781921387e-05, 1.4463439583778381e-05, 1.5173107385635376e-05, 1.588277518749237e-05, 1.6592442989349365e-05, 1.730211079120636e-05, 1.8011778593063354e-05, 1.872144639492035e-05, 1.9431114196777344e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 3.0, 2.0, 8.0, 9.0, 5.0, 12.0, 17.0, 24.0, 30.0, 56.0, 95.0, 183.0, 324.0, 684.0, 1595.0, 4056.0, 12376.0, 50714.0, 803435.0, 139194.0, 24168.0, 6936.0, 2549.0, 1032.0, 465.0, 232.0, 136.0, 66.0, 59.0, 26.0, 20.0, 15.0, 5.0, 7.0, 3.0, 7.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.068603515625, -0.06637287139892578, -0.06414222717285156, -0.061911582946777344, -0.059680938720703125, -0.057450294494628906, -0.05521965026855469, -0.05298900604248047, -0.05075836181640625, -0.04852771759033203, -0.04629707336425781, -0.044066429138183594, -0.041835784912109375, -0.039605140686035156, -0.03737449645996094, -0.03514385223388672, -0.0329132080078125, -0.03068256378173828, -0.028451919555664062, -0.026221275329589844, -0.023990631103515625, -0.021759986877441406, -0.019529342651367188, -0.01729869842529297, -0.01506805419921875, -0.012837409973144531, -0.010606765747070312, -0.008376121520996094, -0.006145477294921875, -0.003914833068847656, -0.0016841888427734375, 0.0005464553833007812, 0.002777099609375, 0.005007743835449219, 0.0072383880615234375, 0.009469032287597656, 0.011699676513671875, 0.013930320739746094, 0.016160964965820312, 0.01839160919189453, 0.02062225341796875, 0.02285289764404297, 0.025083541870117188, 0.027314186096191406, 0.029544830322265625, 0.031775474548339844, 0.03400611877441406, 0.03623676300048828, 0.0384674072265625, 0.04069805145263672, 0.04292869567871094, 0.045159339904785156, 0.047389984130859375, 0.049620628356933594, 0.05185127258300781, 0.05408191680908203, 0.05631256103515625, 0.05854320526123047, 0.06077384948730469, 0.0630044937133789, 0.06523513793945312, 0.06746578216552734, 0.06969642639160156, 0.07192707061767578, 0.07415771484375]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 3.0, 19.0, 11.0, 17.0, 25.0, 20.0, 34.0, 57.0, 71.0, 108.0, 168.0, 161.0, 77.0, 68.0, 41.0, 34.0, 17.0, 19.0, 11.0, 10.0, 6.0, 3.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1407470703125, -0.13667869567871094, -0.13261032104492188, -0.1285419464111328, -0.12447357177734375, -0.12040519714355469, -0.11633682250976562, -0.11226844787597656, -0.1082000732421875, -0.10413169860839844, -0.10006332397460938, -0.09599494934082031, -0.09192657470703125, -0.08785820007324219, -0.08378982543945312, -0.07972145080566406, -0.075653076171875, -0.07158470153808594, -0.06751632690429688, -0.06344795227050781, -0.05937957763671875, -0.05531120300292969, -0.051242828369140625, -0.04717445373535156, -0.0431060791015625, -0.03903770446777344, -0.034969329833984375, -0.030900955200195312, -0.02683258056640625, -0.022764205932617188, -0.018695831298828125, -0.014627456665039062, -0.01055908203125, -0.0064907073974609375, -0.002422332763671875, 0.0016460418701171875, 0.00571441650390625, 0.009782791137695312, 0.013851165771484375, 0.017919540405273438, 0.0219879150390625, 0.026056289672851562, 0.030124664306640625, 0.03419303894042969, 0.03826141357421875, 0.04232978820800781, 0.046398162841796875, 0.05046653747558594, 0.054534912109375, 0.05860328674316406, 0.06267166137695312, 0.06674003601074219, 0.07080841064453125, 0.07487678527832031, 0.07894515991210938, 0.08301353454589844, 0.0870819091796875, 0.09115028381347656, 0.09521865844726562, 0.09928703308105469, 0.10335540771484375, 0.10742378234863281, 0.11149215698242188, 0.11556053161621094, 0.11962890625]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 8.0, 12.0, 22.0, 83.0, 414.0, 313.0, 68.0, 37.0, 20.0, 9.0, 7.0, 7.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.763082981109619, -2.6244237422943115, -2.485764741897583, -2.3471055030822754, -2.208446502685547, -2.0697872638702393, -1.9311280250549316, -1.7924689054489136, -1.6538097858428955, -1.5151506662368774, -1.3764915466308594, -1.2378323078155518, -1.0991731882095337, -0.9605140686035156, -0.8218548893928528, -0.6831957101821899, -0.5445365905761719, -0.4058774411678314, -0.26721829175949097, -0.1285591423511505, 0.010100007057189941, 0.148759126663208, 0.28741830587387085, 0.4260774850845337, 0.5647366046905518, 0.7033957242965698, 0.8420549035072327, 0.9807140827178955, 1.1193732023239136, 1.2580323219299316, 1.3966915607452393, 1.5353506803512573, 1.6740102767944336, 1.8126693964004517, 1.9513285160064697, 2.0899877548217773, 2.228646755218506, 2.3673059940338135, 2.505965232849121, 2.6446242332458496, 2.7832834720611572, 2.921942710876465, 3.0606017112731934, 3.199260950088501, 3.3379201889038086, 3.476579189300537, 3.6152384281158447, 3.7538976669311523, 3.892556667327881, 4.031215667724609, 4.169875144958496, 4.308534145355225, 4.447193145751953, 4.58585262298584, 4.724511623382568, 4.863170623779297, 5.001830101013184, 5.140489101409912, 5.279148578643799, 5.417807579040527, 5.556466579437256, 5.695125579833984, 5.833785057067871, 5.9724440574646, 6.111103057861328]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 6.0, 5.0, 9.0, 4.0, 10.0, 10.0, 10.0, 7.0, 15.0, 14.0, 13.0, 16.0, 30.0, 41.0, 92.0, 175.0, 190.0, 82.0, 43.0, 35.0, 34.0, 21.0, 22.0, 23.0, 15.0, 21.0, 11.0, 10.0, 8.0, 14.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.523611545562744, -2.449512004852295, -2.375412702560425, -2.3013131618499756, -2.2272136211395264, -2.153114080429077, -2.079014778137207, -2.004915237426758, -1.9308156967163086, -1.856716275215149, -1.7826167345046997, -1.70851731300354, -1.6344177722930908, -1.5603183507919312, -1.4862189292907715, -1.4121193885803223, -1.3380199670791626, -1.263920545578003, -1.1898210048675537, -1.115721583366394, -1.0416220426559448, -0.9675226211547852, -0.8934231400489807, -0.8193236589431763, -0.7452241778373718, -0.6711246967315674, -0.5970252156257629, -0.5229257345199585, -0.44882628321647644, -0.374726802110672, -0.30062735080718994, -0.2265278697013855, -0.15242838859558105, -0.07832891494035721, -0.004229441285133362, 0.06987002491950989, 0.14396950602531433, 0.21806898713111877, 0.29216843843460083, 0.3662679195404053, 0.4403674006462097, 0.5144668817520142, 0.5885663628578186, 0.662665843963623, 0.7367652654647827, 0.8108648061752319, 0.8849642276763916, 0.959063708782196, 1.0331631898880005, 1.1072626113891602, 1.1813621520996094, 1.255461573600769, 1.3295611143112183, 1.403660535812378, 1.4777600765228271, 1.5518594980239868, 1.6259589195251465, 1.7000583410263062, 1.7741578817367554, 1.848257303237915, 1.9223568439483643, 1.996456265449524, 2.0705556869506836, 2.144655227661133, 2.218754768371582]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 0.0, 4.0, 5.0, 7.0, 2.0, 17.0, 7.0, 12.0, 20.0, 14.0, 8.0, 28.0, 28.0, 44.0, 32.0, 45.0, 50.0, 121.0, 172.0, 90.0, 46.0, 41.0, 37.0, 35.0, 27.0, 17.0, 18.0, 11.0, 12.0, 14.0, 7.0, 11.0, 3.0, 4.0, 6.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20849609375, -0.2016143798828125, -0.194732666015625, -0.1878509521484375, -0.18096923828125, -0.1740875244140625, -0.167205810546875, -0.1603240966796875, -0.1534423828125, -0.1465606689453125, -0.139678955078125, -0.1327972412109375, -0.12591552734375, -0.1190338134765625, -0.112152099609375, -0.1052703857421875, -0.098388671875, -0.0915069580078125, -0.084625244140625, -0.0777435302734375, -0.07086181640625, -0.0639801025390625, -0.057098388671875, -0.0502166748046875, -0.0433349609375, -0.0364532470703125, -0.029571533203125, -0.0226898193359375, -0.01580810546875, -0.0089263916015625, -0.002044677734375, 0.0048370361328125, 0.01171875, 0.0186004638671875, 0.025482177734375, 0.0323638916015625, 0.03924560546875, 0.0461273193359375, 0.053009033203125, 0.0598907470703125, 0.0667724609375, 0.0736541748046875, 0.080535888671875, 0.0874176025390625, 0.09429931640625, 0.1011810302734375, 0.108062744140625, 0.1149444580078125, 0.121826171875, 0.1287078857421875, 0.135589599609375, 0.1424713134765625, 0.14935302734375, 0.1562347412109375, 0.163116455078125, 0.1699981689453125, 0.1768798828125, 0.1837615966796875, 0.190643310546875, 0.1975250244140625, 0.20440673828125, 0.2112884521484375, 0.218170166015625, 0.2250518798828125, 0.23193359375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 8.0, 6.0, 1.0, 2.0, 3.0, 4.0, 0.0, 3.0, 10.0, 6.0, 15.0, 17.0, 25.0, 27.0, 44.0, 83.0, 149.0, 253.0, 599.0, 1613.0, 4864.0, 28140.0, 8319679.0, 25565.0, 4759.0, 1555.0, 546.0, 239.0, 142.0, 69.0, 44.0, 24.0, 30.0, 16.0, 11.0, 10.0, 5.0, 5.0, 5.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0], "bins": [-0.9834104180335999, -0.9500563144683838, -0.916702151298523, -0.8833479881286621, -0.849993884563446, -0.81663978099823, -0.7832856178283691, -0.7499314546585083, -0.7165773510932922, -0.6832232475280762, -0.6498690843582153, -0.6165149211883545, -0.5831608176231384, -0.5498067140579224, -0.5164525508880615, -0.48309841752052307, -0.4497442841529846, -0.41639015078544617, -0.3830360174179077, -0.34968188405036926, -0.3163277506828308, -0.28297361731529236, -0.2496194839477539, -0.21626535058021545, -0.182911217212677, -0.14955708384513855, -0.1162029504776001, -0.08284881711006165, -0.04949468374252319, -0.01614055037498474, 0.01721358299255371, 0.05056771636009216, 0.08392179012298584, 0.11727592349052429, 0.15063005685806274, 0.1839841902256012, 0.21733832359313965, 0.2506924569606781, 0.28404659032821655, 0.317400723695755, 0.35075485706329346, 0.3841089904308319, 0.41746312379837036, 0.4508172571659088, 0.48417139053344727, 0.5175255537033081, 0.5508796572685242, 0.5842337608337402, 0.6175879240036011, 0.6509420871734619, 0.684296190738678, 0.717650294303894, 0.7510044574737549, 0.7843586206436157, 0.8177127242088318, 0.8510668277740479, 0.8844209909439087, 0.9177751541137695, 0.9511292576789856, 0.9844833612442017, 1.0178375244140625, 1.0511916875839233, 1.0845458507537842, 1.1178998947143555, 1.1512540578842163]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 5.0, 2.0, 2.0, 3.0, 6.0, 3.0, 2.0, 4.0, 1.0, 3.0, 4.0, 5.0, 5.0, 3.0, 4.0, 10.0, 0.0, 7.0, 4.0, 8.0, 3.0, 1.0, 3.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4420177936553955, -2.377901792526245, -2.3137857913970947, -2.2496697902679443, -2.185553550720215, -2.1214375495910645, -2.057321548461914, -1.9932055473327637, -1.9290895462036133, -1.864973545074463, -1.8008575439453125, -1.7367414236068726, -1.6726254224777222, -1.6085094213485718, -1.5443933010101318, -1.4802772998809814, -1.416161298751831, -1.3520452976226807, -1.2879292964935303, -1.2238131761550903, -1.15969717502594, -1.0955811738967896, -1.0314650535583496, -0.9673490524291992, -0.9032330513000488, -0.8391170501708984, -0.7750009894371033, -0.7108849287033081, -0.6467689275741577, -0.5826529264450073, -0.5185368657112122, -0.4544208347797394, -0.3903048038482666, -0.3261887729167938, -0.26207274198532104, -0.19795671105384827, -0.1338406801223755, -0.06972464919090271, -0.005608618259429932, 0.05850741267204285, 0.12262344360351562, 0.1867394745349884, 0.2508555054664612, 0.31497153639793396, 0.37908756732940674, 0.4432035982608795, 0.5073196291923523, 0.5714356899261475, 0.6355516910552979, 0.6996676921844482, 0.7637837529182434, 0.8278998136520386, 0.892015814781189, 0.9561318159103394, 1.0202479362487793, 1.0843639373779297, 1.14847993850708, 1.2125959396362305, 1.2767119407653809, 1.3408280611038208, 1.4049440622329712, 1.4690600633621216, 1.5331761837005615, 1.597292184829712, 1.6614081859588623]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 4.0, 3.0, 12.0, 15.0, 10.0, 13.0, 19.0, 29.0, 19.0, 53.0, 50.0, 61.0, 67.0, 73.0, 66.0, 73.0, 61.0, 72.0, 52.0, 37.0, 41.0, 33.0, 23.0, 27.0, 19.0, 20.0, 8.0, 7.0, 4.0, 6.0, 8.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.252197265625, -0.2451915740966797, -0.23818588256835938, -0.23118019104003906, -0.22417449951171875, -0.21716880798339844, -0.21016311645507812, -0.2031574249267578, -0.1961517333984375, -0.1891460418701172, -0.18214035034179688, -0.17513465881347656, -0.16812896728515625, -0.16112327575683594, -0.15411758422851562, -0.1471118927001953, -0.140106201171875, -0.1331005096435547, -0.12609481811523438, -0.11908912658691406, -0.11208343505859375, -0.10507774353027344, -0.09807205200195312, -0.09106636047363281, -0.0840606689453125, -0.07705497741699219, -0.07004928588867188, -0.06304359436035156, -0.05603790283203125, -0.04903221130371094, -0.042026519775390625, -0.03502082824707031, -0.02801513671875, -0.021009445190429688, -0.014003753662109375, -0.0069980621337890625, 7.62939453125e-06, 0.0070133209228515625, 0.014019012451171875, 0.021024703979492188, 0.0280303955078125, 0.03503608703613281, 0.042041778564453125, 0.04904747009277344, 0.05605316162109375, 0.06305885314941406, 0.07006454467773438, 0.07707023620605469, 0.084075927734375, 0.09108161926269531, 0.09808731079101562, 0.10509300231933594, 0.11209869384765625, 0.11910438537597656, 0.12611007690429688, 0.1331157684326172, 0.1401214599609375, 0.1471271514892578, 0.15413284301757812, 0.16113853454589844, 0.16814422607421875, 0.17514991760253906, 0.18215560913085938, 0.1891613006591797, 0.1961669921875]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 0.0, 4.0, 3.0, 2.0, 1.0, 9.0, 8.0, 10.0, 14.0, 23.0, 39.0, 44.0, 72.0, 87.0, 172.0, 287.0, 504.0, 897.0, 1760.0, 3382.0, 6829.0, 14535.0, 31699.0, 69050.0, 132932.0, 133537.0, 68603.0, 30965.0, 14308.0, 6928.0, 3462.0, 1791.0, 913.0, 542.0, 297.0, 214.0, 118.0, 63.0, 47.0, 40.0, 28.0, 18.0, 8.0, 9.0, 12.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.884765625, -0.8601913452148438, -0.8356170654296875, -0.8110427856445312, -0.786468505859375, -0.7618942260742188, -0.7373199462890625, -0.7127456665039062, -0.68817138671875, -0.6635971069335938, -0.6390228271484375, -0.6144485473632812, -0.589874267578125, -0.5652999877929688, -0.5407257080078125, -0.5161514282226562, -0.4915771484375, -0.46700286865234375, -0.4424285888671875, -0.41785430908203125, -0.393280029296875, -0.36870574951171875, -0.3441314697265625, -0.31955718994140625, -0.29498291015625, -0.27040863037109375, -0.2458343505859375, -0.22126007080078125, -0.196685791015625, -0.17211151123046875, -0.1475372314453125, -0.12296295166015625, -0.098388671875, -0.07381439208984375, -0.0492401123046875, -0.02466583251953125, -9.1552734375e-05, 0.02448272705078125, 0.0490570068359375, 0.07363128662109375, 0.09820556640625, 0.12277984619140625, 0.1473541259765625, 0.17192840576171875, 0.196502685546875, 0.22107696533203125, 0.2456512451171875, 0.27022552490234375, 0.2947998046875, 0.31937408447265625, 0.3439483642578125, 0.36852264404296875, 0.393096923828125, 0.41767120361328125, 0.4422454833984375, 0.46681976318359375, 0.49139404296875, 0.5159683227539062, 0.5405426025390625, 0.5651168823242188, 0.589691162109375, 0.6142654418945312, 0.6388397216796875, 0.6634140014648438, 0.68798828125]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 10.0, 3.0, 8.0, 20.0, 29.0, 33.0, 45.0, 59.0, 70.0, 85.0, 102.0, 100.0, 95.0, 84.0, 55.0, 59.0, 51.0, 34.0, 28.0, 14.0, 7.0, 13.0, 4.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.39404296875, -0.3847827911376953, -0.3755226135253906, -0.36626243591308594, -0.35700225830078125, -0.34774208068847656, -0.3384819030761719, -0.3292217254638672, -0.3199615478515625, -0.3107013702392578, -0.3014411926269531, -0.29218101501464844, -0.28292083740234375, -0.27366065979003906, -0.2644004821777344, -0.2551403045654297, -0.245880126953125, -0.2366199493408203, -0.22735977172851562, -0.21809959411621094, -0.20883941650390625, -0.19957923889160156, -0.19031906127929688, -0.1810588836669922, -0.1717987060546875, -0.1625385284423828, -0.15327835083007812, -0.14401817321777344, -0.13475799560546875, -0.12549781799316406, -0.11623764038085938, -0.10697746276855469, -0.09771728515625, -0.08845710754394531, -0.07919692993164062, -0.06993675231933594, -0.06067657470703125, -0.05141639709472656, -0.042156219482421875, -0.03289604187011719, -0.0236358642578125, -0.014375686645507812, -0.005115509033203125, 0.0041446685791015625, 0.01340484619140625, 0.022665023803710938, 0.031925201416015625, 0.04118537902832031, 0.050445556640625, 0.05970573425292969, 0.06896591186523438, 0.07822608947753906, 0.08748626708984375, 0.09674644470214844, 0.10600662231445312, 0.11526679992675781, 0.1245269775390625, 0.1337871551513672, 0.14304733276367188, 0.15230751037597656, 0.16156768798828125, 0.17082786560058594, 0.18008804321289062, 0.1893482208251953, 0.1986083984375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 5.0, 7.0, 3.0, 6.0, 9.0, 19.0, 70.0, 171.0, 124.0, 30.0, 16.0, 9.0, 9.0, 2.0, 3.0, 7.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.052302837371826, -2.983961343765259, -2.9156198501586914, -2.847278356552124, -2.7789368629455566, -2.7105953693389893, -2.642253875732422, -2.5739126205444336, -2.505570888519287, -2.4372293949127197, -2.3688879013061523, -2.300546407699585, -2.2322049140930176, -2.16386342048645, -2.095521926879883, -2.0271806716918945, -1.9588391780853271, -1.8904976844787598, -1.8221561908721924, -1.753814697265625, -1.6854732036590576, -1.6171317100524902, -1.5487903356552124, -1.480448842048645, -1.4121073484420776, -1.3437658548355103, -1.2754243612289429, -1.2070828676223755, -1.1387414932250977, -1.0703999996185303, -1.002058506011963, -0.9337170124053955, -0.8653757572174072, -0.7970342636108398, -0.7286927700042725, -0.6603513360023499, -0.5920098423957825, -0.5236683487892151, -0.4553268849849701, -0.3869854211807251, -0.3186439275741577, -0.25030243396759033, -0.18196097016334534, -0.11361949145793915, -0.04527801275253296, 0.023063480854034424, 0.09140494465827942, 0.15974640846252441, 0.2280879020690918, 0.2964293956756592, 0.3647708594799042, 0.43311232328414917, 0.5014538168907166, 0.5697953104972839, 0.6381367444992065, 0.7064782381057739, 0.7748197317123413, 0.8431612253189087, 0.9115027189254761, 0.9798441529273987, 1.0481855869293213, 1.1165270805358887, 1.184868574142456, 1.2532100677490234, 1.3215515613555908]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 1.0, 4.0, 8.0, 4.0, 5.0, 1.0, 2.0, 12.0, 6.0, 12.0, 20.0, 47.0, 112.0, 107.0, 71.0, 23.0, 11.0, 6.0, 3.0, 7.0, 1.0, 2.0, 2.0, 4.0, 0.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0941205024719238, -1.0543020963668823, -1.0144836902618408, -0.9746652841567993, -0.9348468780517578, -0.8950284719467163, -0.8552101254463196, -0.8153917193412781, -0.7755733132362366, -0.7357549071311951, -0.6959365010261536, -0.6561180949211121, -0.6162997484207153, -0.5764813423156738, -0.5366629362106323, -0.4968445301055908, -0.4570261240005493, -0.4172077178955078, -0.3773893117904663, -0.3375709354877472, -0.2977525293827057, -0.2579341232776642, -0.21811573207378387, -0.17829734086990356, -0.13847893476486206, -0.09866053611040115, -0.05884213745594025, -0.01902373880147934, 0.020794659852981567, 0.06061306595802307, 0.10043145716190338, 0.1402498483657837, 0.18006813526153564, 0.21988654136657715, 0.25970494747161865, 0.29952332377433777, 0.3393417298793793, 0.3791601359844208, 0.4189785122871399, 0.4587969183921814, 0.4986153244972229, 0.5384337306022644, 0.5782521367073059, 0.6180705428123474, 0.6578888893127441, 0.6977072954177856, 0.7375257015228271, 0.7773441076278687, 0.8171625137329102, 0.8569809198379517, 0.8967993259429932, 0.9366177320480347, 0.9764361381530762, 1.0162545442581177, 1.0560729503631592, 1.0958912372589111, 1.1357097625732422, 1.1755281686782837, 1.2153465747833252, 1.2551649808883667, 1.2949833869934082, 1.3348017930984497, 1.3746201992034912, 1.4144384860992432, 1.4542568922042847]}, "eval/loss": 0.3589690625667572, "eval/wer": 0.09641015470051567, "eval/runtime": 570.6282, "eval/samples_per_second": 4.63, "eval/steps_per_second": 0.58, "train/train_runtime": 51756.4072, "train/train_samples_per_second": 5.514, "train/train_steps_per_second": 0.043, "train/total_flos": 0.0, "train/train_loss": 1.290548439615828} \ No newline at end of file